#==== BC4488 family
ALIGN - ---EEEE------------------------------------------------HHHHHHHHH-EE--E-------------------------HHHHH------------------------------------------EEEEE-------------HHHHHHHHHHHHH------------------------------HHHHHHHHH--------H-------------------HHHHH-----------------------------------HHHHHHHHHH---------
HMM - --EEEEEE-----------EEE-------------------------------EEEEEEEEEEEEEE--EE----------------------HHHHHHH------------------------------------------EEEEEE----------HHHHHHHHHHHHHHHH-----------------------------HHHHHHHH----------EEEEEE----------------HH-----------------------------------HHHHHHHHHH----HHHH-
FREQ - --EEEE-------------------------------------------------EEEEHHEEE--E--EE-----------------------HHHHHH-------HHHHHHH-----------------------------EEEEE------------HHHHHHHHHHHHHHH---------------------------HHHHHHHHHH--------HHH-----------------HHHHH-----------------------------------HHHHHHHHHHH---HHHH-
PSSM - -----E---------------------------------------------------EE--HE-------------------------------HHHHH---------------------------------------------EEE--------------HHHHHHHHHHHHHH---------------------------HHHHHHHHHH----------EEE-------------------H-----------------------------------HHHHHHHHH----------
FINAL - --EEEEE-------------E---------------------------------EEEEEEEEEEEEE--EE----------------------HHHHHHH---------HHHH-----------------------------EEEEEE------------HHHHHHHHHHHHHH----------------------------HHHHHHHHHH----------EEEEE--------------HHHH-----------------------------------HHHHHHHHHH----HHHH-
#-- # # -- -- - - - - # -
ROSINTL182_09631_Rint_240147581 49 EKALEVSSKSE----VRVGKEIGAFS------LEL-DG------------------IFLENVFQAAK--QY-----------------ENGGPYLDLLNV-------SPKQAKRDERHCN-------------------SGKLVGFVRNDEI---WTLEPKTAFYDYIYISALIK--------------------------FNGYDLNISEY--------QWFTDIEFNP-------QKSINCQA-----------------------------------RAVAIYVALQKTALFNSLK 196 240147581 bacteria>firmicutes
ROI_18700_Rint_291535823 49 EKALEVSSKSE----VRVGKEIGAFS------LEL-DG------------------IFLENVFQAAK--QY-----------------ENGGPYLDLLNV-------SPKQAKRDERHCN-------------------SGKLVGFVRNDEI---WTLEPKTAFYDYIYISALIK--------------------------FNGYDLNISEY--------QWFTDIEFNP-------QKSINCQA-----------------------------------RAGSDWIGRW--------- 185 291535823 bacteria>firmicutes
Sca_2305_Scar_224477787 53 DKLLEVSSKSE----KSIGVKASAFN----LKISTVKG----------------HHLSVEQIFQSSK--VY-----------------KKAGNQNYLLEEG-----YNSKEMKQKLREIDK------------------DDYMIKYSSFHQD---FPLEPKTLFYNWIYINALNQ--------------------------NEEVAKEILKY--------EAFTDIEFNP-------KRSFNCQA-----------------------------------EACAIYVSLVKQKNLDEAL 208 224477787 bacteria>firmicutes
pIL105p2_Llac_60461911 54 KKVLEISTKSP----TDLGVELSAFN----LKIQTKQ----------------EIYFTVESAFQSSK--VF-----------------ENGGPYDDLLLK-------GSREAKKDIRLKS-------------------SGKVIGFKYLNRE---FPSEPKTFFYNWLYVNALDK--------------------------NKKLSKELLSY--------DSFTDIEFNP-------EKSINCQA-----------------------------------EAAALYVSLSHKKLLTTAL 206 60461911 bacteria>firmicutes
HMPREF9383_1770_Ssan_325694076 58 LKVLEVSTASE----EEFGKECSAFN----LQLTLRNG----------------SKYSVESLFQSSK--VF----------------KNYGRVNQDLDL--------DAKAVKRQVRSIEV------------------NDKLIEFDFLGVK---FPLLPRTYFYNWLYVNALFQ--------------------------NTELSNFILQY--------DAFTDINFNP-------NKSINCQA-----------------------------------EACSIFLYLAKNSLLNDSI 211 325694076 bacteria>firmicutes
SSA_1883_Ssan_125718681 50 KKILEVSSKSI----DQVGRAASAFN----LKVTLKSG----------------KVYSVEQIFQGSK--VF----------------KKNGSQLKLLDSM-------TSKELKKIVGKLHQ------------------VDKLVEFESFGQH---FPLEPQTFFYNWLYINSLNQ--------------------------HKSLANQIIKY--------DAFTDIEFNP-------EKSKNCQA-----------------------------------EACSIYIFLYKSGLLDFAL 204 125718681 bacteria>firmicutes
HMPREF9382_1113_Ssan_325690155 58 LKVLEVSTASE----EEFGKECSAFN----LQLTLRNG----------------NKYSVESLFQSSK--VF----------------KNYGRVNQDLDL--------DAKAVKRQVRSIEV------------------NDKLIEFDFLGVK---FPLLPRTYFYNWLYVNALFQ--------------------------NTELSNFILQY--------DAFTDINFNP-------NKSINCQA-----------------------------------EACSIFLYLAKNSLLNDSI 211 325690155 bacteria>firmicutes
CBFG_01593_Cbac_239627871 60 ANILEISSKST----SALGVSLSAFN----LNIQTAK-----------------RAFSVECAFQSSK--VF-----------------ESGGPYTDLLDR-------SSIEAKKDPRLHD-------------------SGKLIAFQYFNVK---FPLEPKDYFYNWLYINALKL--------------------------NTELTSEIITY--------DSFSDIEFNP-------QKSINCQA-----------------------------------KAAAIFVSLSNQHLIEEAL 211 239627871 bacteria>firmicutes
bcere0015_42140_Bcer_229129773 46 ESVLEVSSKSE----SDLGRALSAFN----LKIELKNG----------------KNFSVENAFQASK--VF-----------------EFGGPFLDLLYC-------TAKEAKKDVRLKN-------------------SGNLISFRYFNRE---WPLCPKTAFYDWLYINALAR--------------------------QQKLGSCVLEY--------SAFSDIEFNP-------KKSINCQA-----------------------------------RALALYVSLHKADKLQYVL 198 229129773 bacteria>firmicutes
BC4488_Bcer_30022569 32 ESVLEVSSKSE----SDLGRALSAFN----LKIELKNG----------------KNFSVENAFQASK--VF-----------------EFGGPFLDLLYC-------TAKEAKKDVRLKN-------------------SGNLISFRYFNRE---WPLCPKTAFYDWLYINALAR--------------------------QQKLGSCVLEY--------SAFSDIEFNP-------KKSINCQA-----------------------------------RALALYVSLHKADKLQYVL 184 30022569 bacteria>firmicutes
Ilyop_1055_Ipol_310778851 52 ANILEISSKSL----ENLGIKLSAFN----LMIQTKKG----------------KAFSVECAFQGSK--VF-----------------KKGGPYIDLFHK-------TSREAKKDPRIKN-------------------SGPLVKFEYNKNE---WSLEPKTFFYDWLYINSLYR--------------------------KNELAQEIIKY--------DSFTDIEFNP-------EKSINCQA-----------------------------------RAAALFVLLKKLNIIDNAM 204 310778851 bacteria>fusobacteria
OA238_4610_Oant_254453984 34 HPILEISTKSL----VEVGRRLSAFN----LKIDV-NG----------------TLKSLESVYQSSK--VF-----------------AHSGQHEHLMDL-------EPFMAKREVHSLG-------------------QGPIVAFRLLGEE---FPTEPKNAFYDWLYLKAITP--------------------------HEEWIKKNLHY--------AAYSDIEFNP-------SKSINCQG-----------------------------------RAVAEFHALSLRNSTMDCV 185 254453984 bacteria>proteobacteria>alphaproteobacteria
ED21_31874_Esp._149186578 34 EKILEISSKSL----EDLGVRSSAFN----LKWLSSVA---------------NFPISVECAFQGSK--VF-----------------LNGGPFTDLYEA-------RPIDAKRDVRLRS-------------------SGNLKAFDFDGGN---WPIEPQTAFYDWLYISALRE--------------------------NPEIADAILSF--------DGFTDIEFNP-------KKSINCQA-----------------------------------YSAALFCSLYKQGMVDEVL 187 149186578 bacteria>proteobacteria>alphaproteobacteria
CAP2UW1_1710_CAcc_257093308 52 AHILEISSKSE----DPLGVKLSAFN----LPFVMPNG----------------LRTTVENAFQSGK--VF-----------------RHGGPYLDLLNK-------TPREAKKDSRLSG-------------------SGDLVGFRLDGED---WPTRPLTAFYDWIYLSALKQ--------------------------SPALAEQLLRF--------DGFTDIEFNP-------ERSLNCQA-----------------------------------ASAALFVALTKRGEIDAAT 204 257093308 bacteria>proteobacteria>betaproteobacteria
GBP346_A3087_Bpse_237813318 23 NDLLEISSKSP----NPDGVALSAFN----LKFTTLKY---------------NRTFSVEIAFQASK--VF-----------------EHGGPYRELLEV-------DSRTAKRDVRLKT-------------------SGRLLKFSFLKTE---FPLRPVTYFYDWLYINALVK--------------------------NRHLWPALSRA--------EGFTDIVFNP-------SKSLNCQA-----------------------------------YSAALFASLVRADKLSKAL 176 237813318 bacteria>proteobacteria>betaproteobacteria
BCAM1881_Bcen_206563730 53 DRVLEISSKSK----DEYGVKLSAFN----LMIKTPR-----------------REYSLECAYQASK--VF-----------------ERGGPFTDLLNA-------KSIDAKRDPRLTQ-------------------FGRMIRFQWYGKE---WPLQPRTAFYDWLYINALHR--------------------------PQELAKIVLTY--------RAFSDIAFNP-------ERSINCQA-----------------------------------YAAALYVSLHERGLLRDEI 205 206563730 bacteria>proteobacteria>betaproteobacteria
NEISUBOT_05210_Nsub_261381097 53 GKVLEISSKSK----SELGIALSAFN----LMIKSAKG----------------KRVSVECVFQSSK--VF-----------------EGDIQYLDLLEV-------SSREAKKDSRLKS-------------------SGMVIAFRTYGKKDKEWGTKPITAYYDWLYVNALNQ--------------------------HTEFHEELLEY--------SAFSDIEFNP-------EKSLNCQA-----------------------------------YSVALFCALYRRGILQDVL 208 261381097 bacteria>proteobacteria>betaproteobacteria
Glov_2583_Glov_189425639 53 TNLLEISSKSK----TTLGVDLSAFN----LMITTIKY---------------NKTFSVESAFQSSK--VF-----------------EKGGPYLDLLDK-------TSREAKKDGRLQT-------------------SGRLKCFKFFGIE---WGLEPQTAFYDWLYINALKK--------------------------NSDYAEQVMEY--------SAFTDIEFNP-------ERSINCQA-----------------------------------YSAALYVSLCHRDLLEYAT 206 189425639 bacteria>proteobacteria>deltaproteobacteria
HWAG_01373_Hwin_237752248 56 AKILEISKASP----NQLGQKLSAFN----LKLKVFNGIQ-------------DITASVERFFQGSK--VF-----------------NNGGPFEEIIFN-------ENIHPKKYDKLKK-------------------GCNFQGFKLFGKC---YSTEPVTFFYDWLYINALKQ--------------------------NSILATELENY--------DIFTDIEFNP-------NKSLSCQA-----------------------------------ATVALFLSLKKAGTLDKAT 211 237752248 bacteria>proteobacteria>epsilonproteobacteria
CAMGR0001_0616_Cgra_257460202 53 EKILEISKASP----NPLGKALSAFN----LKLRLKDEEQN------------LIEASVERFFQGSK--FF-----------------ERGGPFEEIIFS-------AKVHPKKYPPLKN-------------------SGNFCGFELFGER---FSTEPKTYFYDFLYLSALKQ--------------------------NPNLADEVLRY--------DYFSDIEFNP-------KKSFSAQS-----------------------------------RAAALFVGLSRNGIFKEIF 209 257460202 bacteria>proteobacteria>epsilonproteobacteria
Psyc_0321_Parc_71064897 53 DKILEVSSKSK----EDLGVALSAFN----LMIADKAT---------------KEKYSVECAFQSSK--VF-----------------ENGGAYTDLLKV-------TSKQAKKDERLRN-------------------SGKLIGFEFYNTK---WQLNPLTAFYDWLYVNALNQ--------------------------NVQLHDRLMQY--------QTFTDIEFNP-------KKSINCQA-----------------------------------YSIAMFVALAKRNMLESIR 206 71064897 bacteria>proteobacteria>gammaproteobacteria
ACICU_00103_Abau_184156423 53 FNILEISSKSE----VELGVALSAFN----LMMFDKKT---------------HQKFSVECAFQSSK--VF-----------------QNGGPFLDLLNV-------TSREAKKDERLKT-------------------SGQLKKFTFYGID---WALDPLTAFYDWLYINALNF--------------------------NAEYHQELLAY--------EAFTDIEFNP-------EKSINCQA-----------------------------------YSIAMFVALSKRNLLDKVR 206 184156423 bacteria>proteobacteria>gammaproteobacteria
HMPREF0198_1779_Chom_258545510 63 KNILEASSKSE----QPLGLPLSAFF----LK--DEDG------------------VPVENLFQSSK--VF-----------------ENGGAFLDLRHV-------SPRAAKKDLRLKE-------------------SGAMLKFLFNGKE---FPLEPKSLFYDWLYSKILYG------------------------NNNIELKNQLINE------VFDAFSDIEFNP-------KKSFSCQA-----------------------------------RTLALFISLHSTNCLKEFI 216 258545510 bacteria>proteobacteria>gammaproteobacteria
Pcryo_0891_Pcry_93005719 60 NHVLELSSKSG----NKLSFLLSPLS----LKLTNENG---------------GEQYSVENAFQSSM--VF-----------------EDGGPYIDLLSA-------PPRQAKKDERLIN-------------------SGELIGYNYFGME---WSVEPLTTFYDWLYVNALKQ--------------------------NPHLHEEVMQY--------QAFTDMEFNP-------KKSIHGAA-----------------------------------YALAMFVALHKRELLDNIE 213 93005719 bacteria>proteobacteria>gammaproteobacteria
Psyc_0844_Parc_71065404 67 NHVLELSSKSG----NKLSFLLSPLS----LKLANEHG---------------GEQYSVENAFQSSM--VF-----------------EDGGPYIDLLTA-------PPRQAKKDERLIT-------------------SGELIGYNYFGME---WSVEPLTTFYDWLYVNALKQ--------------------------NPQLHEEVMQY--------QAFTDMEFNP-------KKSIHCAA-----------------------------------YALAMFVALNKRELLDNIE 220 71065404 bacteria>proteobacteria>gammaproteobacteria
GPB2148_1261_Mgam_254482777 24 EGILEISTKSP----ESLGVSLSAFN----LTYQPENS---------------DKRYPLESLFQSAK--VF-----------------TDGGPYRDILSK-------PAREAKSDPRLTT-------------------SGRLVAFSSRDTT---WPLVPRTAFYDWLYLNVLGH--------------------------YPRLAEPLSMF--------GGFTDIEFNP-------KKSINCQA-----------------------------------YSAALFVALSERKLMAKAM 177 254482777 bacteria>proteobacteria>gammaproteobacteria
XAUC_02590_Xfus_294664143 60 DRVLEISSKSP----DSLGVDLSAFN----LMIKTVKH---------------EREFSLECAFQASK--VF-----------------ENGGPYKDLLNA-------RSLDAKRDPRLKE-------------------SGRLIKFRFFNVD---WELEPRTAFYDWLYINALHK--------------------------PQDLAEKVLTY--------RAFSDIAFNP-------DKSVNCQA-----------------------------------YAAALYVSLQERGLLSETM 214 294664143 bacteria>proteobacteria>gammaproteobacteria
V12B01_14190_Vspl_84392320 54 GSILEVSSKSL----DELGVSLSAFN----LCITTKLK---------------KQSFTVETAFQGSK--VF-----------------EQGGPYLDLIGM-------DSRAAKKDLRLKE-------------------SGNLIYFEFFGKK---FPNTPRTFFYDWLYINALVQ--------------------------NQDLAIQVEAY--------DAFSDIEFNP-------KKSINCQA-----------------------------------YAIALYVSLAKNGLLEQAL 207 84392320 bacteria>proteobacteria>gammaproteobacteria
A5C_A0388_Vcho_153817467 52 NNILEISSKSL----DELGILLSAFN----LSFVTKKH---------------NHKITVESAFQGSK--IF-----------------KRGGPYKDLYLA-------DSRTSKKDIRIKD-------------------SGQLVGFKFFNTE---FPLIPRTYFYDWLYIKALVS--------------------------NPQLVDQLYKF--------DGFSDIEFNP-------KKSINCQA-----------------------------------HAAALYVSLNSAGVLEEAL 205 153817467 bacteria>proteobacteria>gammaproteobacteria
PsycPRwf_1182_Psp._148652988 60 KNVLELSSKSG----NKLSFPLSPVS----LKITNEED---------------GQQYSVENAYQASK--VF-----------------KGGGPFVDLLDA-------APRQAKKDERLMS-------------------SGEITGYDYFGMV---WGLEPLTVFYDWLYVNALKQ--------------------------PNHLHQEVLQY--------QAFTDISFNP-------KKNVHCPA-----------------------------------YSLAMFVALHKRELLEGIE 213 148652988 bacteria>proteobacteria>gammaproteobacteria
FPR_02440_Fpra_295103146 48 VSILEVSSASA----QPEGEAVSSLR----LLLRLNSV---------------AQDVPISTVFEAAK--VF-----------------EHGGPFADLLTC-------APSKVHKDTRLRT-------------------NGKLLRYSLEGSEY--PIEPHPDSFFEWLYCRALKQ--------------------------PFEKAAQLSRY--------NAFSDIAAAA-----DSKKYYGDSS-----------------------------------RAAAIYVGLAAAGKLPCID 204 295103146 bacteria>firmicutes
_Fpra_160945657 72 VSILEVSSASV----QPEGEAVSSLR----LLLHLDSV---------------AQDVPISTVFEAAK--VF-----------------EHGGPFADLLTC-------APSKVHKDTRLRT-------------------NGKLLRYSLEGSEY--PAEPYPDSFFEWLYCRALKQ--------------------------PFEKAAQLSRY--------NAFSDIAAAA-----DSKKYYGDSS-----------------------------------RAAAIYVGLAAAGKLPCID 228 160945657 bacteria>firmicutes
KSE_10250_Kset_311894452 22 AVIVDTTSKAP-----DPWVRLSPFYPHGGIPVPFSPG---------------VTAQSVEGIWQALK--VF-----------------ESVDTDPAKLDV------TTMKGLKRTVRRFG-----------------PVRGHRAGLDGTELL---PYQEARRRIYLPAYRWTLEH--------------------------VRPDLLERLRA-----EEHLVLLDYTTNG-------DVADTGSP-----------------------------------LSHAALIRRHLEGRWPDEG 186 311894452 bacteria>actinobacteria
OSCT_1675_Otri_309791192 22 ATLLDVTSQGP-----APWVRFSPFYPHGAIPVPLSPG---------------MTAASVEGIWQGLK--VF-----------------THANIDLNTMTN------TTMRGLKRTTRRFG-----------------AVQGHRAGVAGTTLL---DYATARQRIYLPAYRWVLDH--------------------------LCQPELDDLRQ--RASQGLVVLLDYETNT-------DLADLRRP-----------------------------------LSHAGLIIRYLDGTWPVS- 184 309791192 bacteria>chloroflexi
Tcur_0355_Tcur_269124625 22 ALILDVTSRAE-----RPWARFSPFYPHGGIPVPFSPG---------------VTAQSVEGIWQALK--VF-----------------ANADVDPAKLEI------TTMKGLKRTVRKHG-----------------PVRGHRAGLTGEVLL---PYEQARRQIYLPSYRWVLEH--------------------------VRADLMDRLKE--LSSRGDIVLLDYTTNG-------DVTDLSAP-----------------------------------LSHAALIRCHIEDRWP--- 182 269124625 bacteria>actinobacteria
HCH_04340_Hche_83647036 29 YAIIDVTSKAS-----APWVKFSPFYPHSGIPIPFSS----------------ETAQSVEGIWQGLK--VF-----------------EGQDIDPSRFDI------TDMKGIKRTVRRYG-----------------RVLGHRKGPGGE-LI---PYIEARKQIYLPAYHWTLTH--------------------------LRQAELSQLSE-LLARHEGLVLLDYETNT-------DINDPRKP-----------------------------------LSHAALIRRFLQP------ 185 83647036 bacteria>proteobacteria>gammaproteobacteria
Caci_4610_Caci_256393748 22 ARIIDVTSKGP-----QPWVRMSPFFPHSGIPVPLSDG---------------AVSQSVEGIWQALK--VF-----------------PGSDVDPRKLDV------ASMTGLKRTVRKHG-----------------PVLGHRAGLNGQDLL---PYEQARRRIFLPAYRWVLEH--------------------------VNTDLIAELRA----ADGDIVLLDYTVNG-------DVTDTSSA-----------------------------------LSHAALIRLYVEDRWP--- 180 256393748 bacteria>actinobacteria
M23134_02260_Mmar_124004845 21 YKIIDVTSKAP-----TPFVKLSPFYPIGDIPVPLSEG---------------HFAQSVEGIWQGLK--VF-----------------ETASIDLKKLEV------TTMKGLKRTVRKFG-----------------NVKGHQAGVNNHNLL---PYIIARKQIYLPAYRWVLDH--------------------------VKSDVLQLIKN--EAEQHPIILLDYETNG-------DVENASKP-----------------------------------LSHAYLVKYYLENNFP--- 181 124004845 bacteria
_Krac_298250178 22 VQVIDVTSRGA-----DPWVRFSPFYPHGDIPVPFSPG---------------YTSWSVEGVWQGLK--VF-----------------EQAGVDVSKFRI------ANMKGIKRSGRSLG-----------------GVLGHREGVDGERLL---GYREARSAIYLPTYRWVLEH--------------------------LEQPELETLRQ--LSAQASVILLDYETNA-------NIDDLRRP-----------------------------------LSHAALIKAYLTAPED--- 182 298250178 bacteria>chloroflexi
GobsU_010100001512_Gobs_168698168 22 ATVADVTSKGP-----EPWVRFSPFFPHGGIPIPNTPD---------------ETAASVEGLWQGLK--VF-----------------EKEDIDPKKWAI------TDMRNIKRAGASRG-----------------AVRGHRFGVGSGTLL---GYREARFRIYLPAYAWVLER--------------------------LCAREVEQLRG--IARAGTVVLLDYETNT-------DAEDLSRP-----------------------------------LSHAALVRHFLEETWP--- 182 168698168 bacteria>planctomycetes
GobsU_010100034385_Gobs_168704676 25 SVVYDVSSYAE-----PPHCELSPMWVHGGVPVPGAPG---------------ETSDTVEGVWQGLK--VI------------------RGQTAPRYFR---------GPGAKRGG---------------------KPSGHRFGTR---LL---GVVEARRLIYVPTYEWVIEN--------------------------TRSPEQIRAFIDAAFAGVTQHFHDVGDNG-------DPNDATQP-----------------------------------LAQAAVLVRYLNRKCAERA 182 168704676 bacteria>planctomycetes
BXY_40670_Bxyl_295087466 21 AVILDITSNSE----TRYAKILSPFYPHGNIPIPFTDG---------------LKATCVEAVWQGLK--VF-----------------EGVGVDFATFKN------DTMRDLKRTVRKYG-----------------VPKGHSKGAYSKELL---GYFEARMLIYLPTYKWVLDN--------------------------PVEVHHVVERIKEQSKIQDIVLLDYNTNI-------DFRDISKP-----------------------------------MSHAGLVKLYIEGKYPDNM 191 295087466 bacteria
HMPREF0665_01551_Pori_299141967 21 ADILDITSNSE----TRYAKILSPFYPHGNIPIPFTNE---------------LKATCVEAVWQGLK--VF-----------------DSVDVDFSTFKN------DTMRNLKRTVRKFG-----------------KPKGHRKGAYGKELL---NYFEARMLIYLPTYKWVLDN--------------------------PVEVHRVVERIKEQSKKRDIVLLDYNTNT-------DFRDISKP-----------------------------------LSHAGLVKLYIEGNYPEGM 191 299141967 bacteria
Bfra3_010100013815_Bfra_255010211 21 AVILDVTSNST----MRYAQILSPFYPHGNIPIPFTPD--------------TLKATCVEAVWQGLK--VF-----------------ENADVDFSTFKN------DTMHNLKRTVRKFG-----------------IPLGHRKGAYGKELL---GYFEARMLIYLPTYKWILDN--------------------------KIEVYHVVERIKAQSIKQDIVLLDYNTNI-------DFRDITKP-----------------------------------LSHAGLVKLYIEGKYPNEV 192 255010211 bacteria
Bcep1808_6822_Bvie_134288349 18 AVVVDTTSRSA----TSWSRAFSPFYL---GPADLYDG---------------HVARTVENGWQYAK--VY----------------ADQLGADGNPNEAYWAWAKAGWGKMRADRYPRG-----------------KGAKPVFCWWNGTKL---GYIEARLKVYFPLYRDAV-R--------------------------TQEAFNQLVRL---ARDRTIVLWDFDGF--------DHQTIGLS-----------------------------------LANVLLDDSRPMGHA---- 179 134288349 bacteria>proteobacteria>betaproteobacteria
bthur0002_58540_Bthu_228982721 89 LNVLECSTKGD--------KRFSALS----AKVSVHDV-----------------FDTIENHYQKSK--VF-----------------QDESGFYYTCKKW------ENAKGKKPVA---------------------------CKIGNTIL----SIEYLSMFYELLWYKYLKS--------------------------ENYLEEVLAKF--------DEYHDMFKS--------KKSMVCQA-----------------------------------DTIREYMKNENDEWY---- 221 228982721 bacteria>firmicutes
MexAM1_META2p0262_Mext_240141986 7 APFLECSSRGD--------QRFSAFS----ARLR-SQG-----------------GRSIEEVYQAAK--VF------------------EDGSTGLGWR---------DAKGKRAVN---------------------------------------MPEVRR-LYSRLWDAYIDE--------------------------PNELLALIQVQ--------SGLSDVFG---------QQGNACQA--------------------------------------TELWRIRAERAAVGGV 125 240141986 bacteria>proteobacteria>alphaproteobacteria
16-3p043_BP16-3_195546573 7 APFLECSSRGD--------RRLSAFH----ARIR-SRG-----------------NKSIEDIYQAAK--VF------------------ADGSSGLSWR---------EAKGKRAVN---------------------------------------MAEVRE-LYARLWDEYIGE--------------------------PNALLDVVRAA--------SGLSDMFG---------QSGSACQA--------------------------------------TELWRIRNKEQA---- 121 195546573 dsdna viruses, no rna stage>caudovirales
MAR_ORF111_MV_284504143 1 ------------------------MAL---GPVEHVHPA-------------LPPAKNIENFYQGSK--VF--------------VQEVDKDQNPTSLFYENRERLFSDEIPKRHKYKGMGKN--------------KNIPLYFLWTDKCGK----EHRLDYIQSRQTYCNFFER--------------------------ALSDTEDYRKL--------CRLQDKGYNLIFCGY--DAHDIPEDTPKI-------------------IEEAYLDPSVPF-GHERVLFAMLALRDTPEE 169 284504143 dsdna viruses, no rna stage
LAU_0089_LV_327409634 109 FPNFRHQKRKD----GFGCSNLSPMTL---GPVKHTCPG-------------LEPAKNIENFFQGSK--VF--------------SEEVDKHKNPSSLFYENREMLFADPVPKRHKYKGVGKN--------------KNIPLYFLWTDSEGK----EHRLSYIESRQTYCNFFER--------------------------ALSETKDYRKL--------CRLQDKGYNLIFCGY--DAHEITGS-----------------------IEDAYLDPSVPF-GHERVLYAMLALRDTPEE 284 327409634 dsdna viruses, no rna stage
NAEGRDRAFT_46602_Ngru_290997341 83 YKNVNCCSGAS----GI-FKELSPMKL---GPYEYEHGSE------------KCTITNLENLWQFSK--VF-----------------PGEEEQVRN---------DNGQLTKVPNSEFF-------------------ERRTKGWKDEKAH---RHVKREKPLYSWWKGEKFNY--------------------------QMARRKIYCPL------YAEKVVETEAYK-------KLEEMVNS------------------------------------GMNIQILGFDGYNYDGKT 240 290997341 eukaryota>heterolobosea
consensus/100% - ...hp.sp..............ush.................................lp..hb..b...b.........................................p...................................................h...b...h.................................................h.c............p.............................................................
consensus/95% - ...lphoo.............hSsh.......h........................slp.hab..K..hh.........................................+p.................................................ha...h...l.................................................h.-............p......s......................................................
consensus/90% - ..hl-hoo.u...........hSsh.......h........................slE.haQu.K..la...................ss.....b..............K+.................................................ha...a...l.p...............................................h.Dh...........p....s.s......................................sh..b...........
consensus/85% - ..ll-loo.u...........hSsh.....h.h........................slEshaQu.K..VF...................ss.....h.............hK+..p.......................s........s...........p.hY..hY...l.p...........................p...................h.Dh..s........p....s.s......................................shhhb..b........
consensus/80% - ..lL-loSpu........s..hSsF.....l.h........................slEshaQu.K..VF.................p.ss...pbh.........s...hK+s.c.......................s....h...s.p.......sbp.hY..hY..hL.p...........................p.....l.ph.........sh.Dhp.N........p.s..sps......................................shhhb..l........
consensus/75% - .plL-lSSpS........u..hSsF.....l.l..ps....................oVEshaQu.K..VF.................ppuss..pbh.........s.bphK+ssR..s....................s....h...s.p......psbp.hY.bhY..hL.p...........................pph...lbph.........sh.Dhp.Ns.......cbs.ssps......................................uhhhbh.l........
consensus/70% - .plL-lSS+S........u..lSsF.....l.l..ps....................oVEshaQuuK..VF.................cpuss..shhp........ssbphK+ssRbbs...................ssp...h.h.spp.....bpsbp.hYpbhY.phLpp...........................pph..plbph.........shsDhp.Ns.......cbs.sspu......................................uhhlhh.Lp.p.....
#==== YbiA-like family
#== gp30.3
_Bpar_33595978 4 ASRLNISSTSD----DWRGLALSNFPL----SPFVLDG---------------ELFASVEGFIQGIK---FR----------------EDDPRRATAFLS-------SGWDAKHLGD--------------------TVDRSGAYWGGARIRY---GSAEHHQLIERAIRARIKQ--------------------------CEGLRRTLRAT------EGMTLVHDTGKP-------EAPHTSLPAT-------------------------------------VFCRILETLRREILA 152 33595978 bacteria>proteobacteria>betaproteobacteria
_Bbro_33601359 4 ASRLNISSTSD----DWRGLALSNFPL----SPFVLDG---------------ELFASVEGFIQGIK---FR----------------EDDPRRATAFLS-------SGWDAKHLGD--------------------TADRSGAYWGGARIRY---GSAEHHQLIERAIRARIKQ--------------------------CEGLRRTLRAT------EGMTLVHDTGKP-------EAPHTSLPAT-------------------------------------VFCRILETLRREILA 152 33601359 bacteria>proteobacteria>betaproteobacteria
30.3_BPRB43_66391541 1 M-DIGSGSQY-------PSCALSNFAP----HPFTFDG---------------VECASMEGFLQSLK---F-----------------SNPDMQAHVCTL-------VGKAAKFKGKKKK-----------------WWTTQTLYWKGIPIHR---ESEAYQILIENAYNALFL---------------------------NEGFRRALKAT------GKSTLTHSMGKN-------KMNETVLTER-------------------------------------EFVRNLTRLRDLL-- 146 66391541 dsdna viruses, no rna stage>caudovirales
BMS_2150_Bmar_301167374 62 EGEVILSKRN-------ELGILSNFAA----TDFVYKG---------------TLYKSVEGFWQSLK---YP-ESQDDMRATF--EGIEWPYSRAEVELM-------TGFLAKKAGGYAN-------------ANMREMGIDWVTFQGKKIKFWTVSKGVHYRLIKDALRTKAIQ--------------------------NPKVMEILLST------GDLKLLPDHIMG-------DAPPAWFYNK-------------------------------------IWMELRKEFRE---- 228 301167374 bacteria>proteobacteria>deltaproteobacteria
PT7_2661_Psp._332285914 5 DTHLNVAYTST----DWRGVALSNFSL----SPFVFDD---------------QLFASVEGFIQGLK---FP----------------EGDARREQAFQS-------CAWEAKKIGE--------------------QADKSAAYWAGECMAF---GSTEHHRLVGRAVRVRIEQ--------------------------SQGLCQVLIST------KGLELVHETGHG------PEPAITSLPAA-------------------------------------VFCRVLTDLRGELLA 156 330429867 bacteria>proteobacteria>betaproteobacteria
Gbem_1485_Gbem_197117872 1 M-DVGGYTTG-------IAGRLSNFTP----RAFVLDG---------------FHCACLEGALQAFK---F-----------------DDPEMQKRICMM-------SGKEAKTIGQTRN---------------EAWQSCQTLWWQGKAYDR---LSPEYQQLLDRLYEAALL---------------------------SADFADDLLAT------GDEVLSHSIGEH-------DPRKTVLTEE-------------------------------------EFCSRLMANRSKVKK 150 197117872 bacteria>proteobacteria>deltaproteobacteria
gp30.3_BPSP18_308814565 1 MSELEIRSNF-----PWPSCALSNFAK----WPFVMDG---------------IQFGGLEGFLQGCK---V-----------------RNCEQQKRIFGM-------SGLTAQQTGRAYA----------------RAADRGTLFWLGIPFSR---YSTSWKELYTNAYFEAALQ--------------------------NKGFRDALQAT------KGKVLKHSMASH------LTVHDTILTEQ-------------------------------------EFIDILNQLRDAL-- 152 308814565 dsdna viruses, no rna stage>caudovirales
30.3_BPIME08_299779149 4 MSELEIRSNF-----PWPSCALSNFAK----WPFVMDG---------------IQFGGLEGFLQGCK---V-----------------KNVEQQRRIFGM-------SGLAAQQAGRAYA----------------RAQDRGTLFWLGTPFSR---YSTAWKELYESAYFEAALQ--------------------------NKGFRDALQAT------KGKVLKHSMASH------LTECDTILTEK-------------------------------------EFIDILNKLRDLL-- 155 299779149 dsdna viruses, no rna stage>caudovirales
30.3_BPAeh1_38640191 1 MLDIHIGTAY-------PGNVLSNLAH----NAFVFDD---------------IRCGGMEGLLQSLK---F-----------------QDVNKQIQIAAM-------SGTAAKFRGAKKK-----------------WYNGQTLYWKGVPFSR---HTDAYQNLLDNAYDEMFVQ--------------------------NESFRKALTDS------KNTVLCHSIGHT-------DPFRTILTVE-------------------------------------EFLCRLNRLRSLLLV 150 38640191 dsdna viruses, no rna stage>caudovirales
phiAS5_ORF0053_BPphiAS5_310722519 1 MLDISVSALY-------PANELSNLAK----HEFIFDG---------------VRCGSMEGLLQSLK---F-----------------QDVEKQIAIAAM-------WGTGAKFRGAKKA-----------------WYNDQTLYWKGVPFSR---HSEAYQNLLDNAYDELFVQ--------------------------SESFRKALTSS------GNTVLCHSIGHN-------DPMRTILTVE-------------------------------------EFLCRMKRLRSLLLA 150 310722519 dsdna viruses, no rna stage>caudovirales
30.3_BPKVP40_34419305 1 M-DIKSGAGY-------PASALSNFAP----HAFVVRG---------------VECASMEGFLQSLK---F-----------------KNPEMQREVCKL-------VGKVAKARGSKKN-----------------WQRTQTLYWQGEPIQR---ASVGYQTLLDDAY-AALAQ--------------------------NVKFQKALLAT------GKATLTHSIGRK-------KQAETVLTVQ-------------------------------------EFCSRLTVIREHLQN 148 34419305 dsdna viruses, no rna stage>caudovirales
30.3_BP65_326536778 1 VIDI-YSGSS-----NWIERELSNFTE----HTFTFDG---------------VYYRTIEAFLQSLK---Y-----------------ENPPDINGLRGH---------EVYRFCHNHIG-----------------WKKDLTMWYKGRPIHR---LSDAYSNLIYNAYLSMAEQ--------------------------NKSFLEALVHS------KPHILAHTMGCK-------DPHHTILTEK-------------------------------------EFCDILTEIRELI-- 149 326536778 dsdna viruses, no rna stage>caudovirales
#== YbiA
ALIGN - ---EEEE--------------------------EE----------------------HHHHHHHHHH-----------------------HHHHHHHHH----------HHHHHH---------------------------------HHHHH---HHHHHHHHHHHHHHHHH-----------------------------HHHHHHHHH----------EEEEE------------------H-------------------------------------HHHHHHHHHHHHHH---
HMM - ---EEEEE-------------------------EEEE----------------EEE-HHHHHHHHH------------------------HHHHHHHHHH--------HHHHHHHHHH-------------------------HEEH-HHHHH---HHHHHHHHHHHHHHHHHH---------------------------HHHHHHHHHH----------EEEE------------HHHHHHHH-------------------------------------HHHHHHHHHHHHHHHH-
FREQ - --EEEEE--------------------------------------------------HHHHHHHHHH-----------------------HHHHHHHHH----------HHHHHH---------------------------H-HHHH-----------HHHEHHEHH-HHHH-----------------------------HHHHHHHHH---------EEEEE--------------EE------------------------------------------HHHHHHHHHHHHHH--
PSSM - ----------------------------------EE----------------------HHHHHHHHH-----------------------HHHHHHHHH---------HHHHHHHH-----------------------------------------HHHHHHHHHHHHHHHHHH--------------------------HHHHHHHHHH---------EEEEE--------------EE-----------------------------------------HHHHHHHHHHHHHH---
FINAL - --EEEEE---------------------------EE-----------------EE--HHHHHHHHHH-----------------------HHHHHHHHH---------HHHHHHH---------------------------HHHHHHH-------HHHHHHHHHHHHHHHHHHH--------------------------HHHHHHHHHH---------EEEEEE-------------EE-----------------------------------------HHHHHHHHHHHHHHHH-
PDB(2b3w) - --EEEE-----------HHHHH-----------EEE-----------------EEE--HHHHHHHHH-----------------------HHHHHHHHH---------HHHHHHHHH----------------------------H-----------HHHHHHHHHHHHHHHHHH---------------------------HHHHHHHHHH---------EEEE----------------------------------------------------------HHHHHHHHHHHHHHHH
# # # #
IIV6gp151_IiV6_15078868 19 -DTIVLKHEE-----DKPFGPLRNDYK----SDLYIDG---------------KRWNSVDNYVFSNL---L----------------PSIDFRKQTIEHL-------NPHQVEKTYYDV-----------------------KFEIN----------KSTLSSAIKIGIESKLIA--------------------------DPQFRQALLNT------AGSSIMYLSKNN-------YLGYGNGKWF-----------------------------------VNTYGIWLEHFRTGMLW 159 15078868 dsdna viruses, no rna stage
ORF234_BP0305phi8-36_156564215 7 SNAIRFYSGS------DNYSEFSCMSK----HPVVIAG---------------TEYPTLEHYYHAQK---F-----------------IDLEPVEEILAT------NNPFEARRLGQRTD-------------------YPIHEDW-----------DVMKEHVMFVGLIHKFKQ--------------------------HEWLRTLLLST------GDKELIHHSDR--------DRYWGQSVTG---------------------------------KGKNRLGIMIMNVRERIKN 151 156564215 dsdna viruses, no rna stage>caudovirales
Deipr_2488_Dpro_325284428 43 QEVTSFTG---------PFSFLGNFHS----EKAVRYG--------------ALQFQTLEAAFQAAK---T-----------------GDVDIQRRIAAA------PSPKEAKAIGRALQ---------------------LREDW-----------EDMKEQVMLDLLREKFS---------------------------HRVYREQLLGT------GLVPLIHNNAHK-------DAFWGVYKGE----------------------------------GQNRLGKLLMQVREEIRA 182 325284428 bacteria>deinococci
TVAG_227690_Tvag_123462122 1 --MINIYYSTN------ENAELSNFAI----RPFIING---------------VRYDSVEQYFQIMK---FKIEAVYTYDKDSEEGRKSKEKIDSLIQKMQNT---KSGSLLKKLGNTRI----------------KNAKFNSGLW-----------TQESQNVMREGIFESFKQ--------------------------NPPFLKKLLET------GDATLTHNQDK------------------------------------------------SRW-GK-LFPKILMEVREQLKE 157 123462122 eukaryota>parabasalia
Mmc1_1181_Masp_117924481 22 PTMVALLPPI-------WYSCFSNFSD----HPFELDG---------------KLWFTVEHYFQAAK---F-----------------ADPQQRARIYAC------PSPMTAALMGKDRS-------------------IPIRADW-----------DAIKLDVMRQALNAKFDT--------------------------HQQIHDFLQAT------HPYPLLNYTAF--------DPFWGQDKRG---------------------------------HGQNQLGKLLMERRSRML- 164 117924481 bacteria>proteobacteria
Msp_0486_Msta_84489297 69 DAQELIKSTLK----PLFIKLWTRDGK----PKYNIDFN--------------EDKNYIQMYDTIYK----------------------DTTHHIHIGT-------KTYDSAKEIISLIE---------------NDLKSKSPELW-----------NELKYTLYLNALYYKIVT--------------------------DINFTKELIKT------KDRCIVFKSDN---------LEWGVTIDD------------------------------GKLIGQNLFGFAMMEIRDVLCD 219 84489297 archaea>euryarchaeota
SrosN15_010100002350_Sros_239939813 220 QLYQSYPNKPVA---DPGHRGLRNDYP----APITVGE---------------VLHPSVAHAYWALS---V-----------------AQPEVSSAITAA------DTAAAARKLAAAAP---------------------RREGW-----------EHSRTAVMTGLLRAKYDQ--------------------------HPELAEILLAT------DDATLIYDDME--------SAFWGDNAGR----------------------------------GRNWTGRLLELVRSELHL 364 239939813 bacteria>actinobacteria
LbrM06_V2.0110_Lbra_154331017 12 QNVVTFCEAH-----DPQYGVLSPLSP----SPLVVRH---------------VQYPSLHHYFLCER---F-----------------KGSPAEQWVTEA------TTVWSLDRLVKAAE-----------------AEGYQRSNW-----------NKVKVDVMLLGTYLKFKQ--------------------------NEAARAVLLST------HPSLLLYHTPK--------DDFWGDGGDG---------------------------------TGKNVLGVVTMTARARLHS 159 154331017 eukaryota>euglenozoa>kinetoplastida
LinJ06.0130_Linf_146070759 8 QNVVTFSEVH-----DPLYGVLSPLSP----SPLVVRH---------------VQYPSLHHYFLCER---F-----------------KGSPAEQWMAEA------TTVWSLERLVKTAE-----------------EEGYQRHNW-----------NKVKVDVMLLGTYFKFKQ--------------------------NEAARAVLLST------QPSLLLYHTPT--------DDFWGDGGDG---------------------------------KGKNVLGVVNMAVRARLHS 155 146070759 eukaryota>euglenozoa>kinetoplastida
Tc00.1047053507521.60_Tcru_71654521 3 KGVVRFHDVH-----EVPYGVFSPLSP----HPIVIRH---------------KQYPSVHHYFLTER---F-----------------RDAPVTAALRSA------TSVWELDRLVKEAE-----------------RTGSQREDW-----------NRVKVDVMLLGNYMKFKQ--------------------------NEAVRSLLLET------GDKLIIDHTTS--------DDFWGDRGDG---------------------------------SGKNLLGVILMAVRDRLRR 150 71654521 eukaryota>euglenozoa>kinetoplastida
Tb927.7.4780_Tbru_72391614 3 KGVVRFHDSR-----EKPYGVFSPLSP----HPVTIHH---------------TQFPSLHHYFLTER---F-----------------GGLPDAAPFQSA------ASVWELDRLVRVAE-----------------REGRQRGDW-----------DRLKVDVMLLGNYMKFKQ--------------------------NENAREILMNT------GTRLIVDHTEE--------DDFWGDAGDG---------------------------------TGHNLLGVILMAVRDRLHR 150 72391614 eukaryota>euglenozoa>kinetoplastida
TTHERM_00998900_Tthe_118397133 37 EQVIKFTHKLH-----DKYGFLSNLFQ----SKIMIDK---------------LQFMSVEHYYQAMK---F-----------------EGTKKFEVIRRA------GKAIDAHKLAQKKD-------------------TPKNRDW-----------QDLKVAYMKKAIQAKFQQ--------------------------NKALKKQLIET------YPNKLVDVTPG--------DKFWGIGDKE---------------------------------EGKNMNGQILMEIRE-LCM 181 118397133 eukaryota>alveolata>ciliophora
OSTLU_35648_Oluc_145348536 4 LPPVKFYKAW------DEYGALSNFSP----FPVSVDG---------------VEWPTVEHYYQAQK---FAGVH-----------NDIARESFEKIKLA------ESPEAAAKIGRSAQ---------------AAHPESVRKDW-----------DDVKVDVMRRALTEKLVR--------------------------YEGPRTLLMESVCTD--GRVRVIEDSPV--------DGVWGAGRDG---------------------------------TGQNLLGALLVNIREDLVS 162 145348536 eukaryota>viridiplantae>chlorophyta
Plabr_0990_Pbra_325107565 1 --MILIRKVK------DEYGWLGNMSS----FPVLYEG---------------KKYRTTEALFQALR---F-----------------DHEKIIESIREQ------KSPMSAKMKAKKHR------------------NRMVVVPL-----------SEADLDNMRLVLRLKLLQ--------------------------YPKLRTLLLAT------GDQEIVEDCTKRPR---GSGLFWGAANRD------------------------------GKWIGENWLGRLWMELRTELTQ 152 325107565 bacteria>planctomycetes
PRU_0382_Prum_294673143 23 DKCACIRKTT------EEWGIFGNFFY----APIIVEG---------------VTIDCTERLFHLMK---FNA---------------NGEEGIKSEYAA------KRGMAIKMHMKPIY---------------KSHPEWLRNDW-----------GAMVVDAMRFCLQTKYEQ--------------------------CEAFRKELERS------KGLFIVEDETKRNEKKKADADSWGTNLVG------------------------------NEYVGPNLLGRLLMELRDNGKL 184 294673143 bacteria
DICPUDRAFT_22458_Dpur_330798615 1 ---IKFFNNG------DPYYEFTNFYE----ACFNLDG---------------LYWKTSEHYYQAQK---FS----------------PNKAIMEQVRHL------PNPREAFKFGNFKG-----------------HKHFIRKDW-----------HDIKEEIMEKAIRAKFEQ--------------------------NSKLQNLLFKT------KGSELIENSPF--------DDYWGIGINN---------------------------------NGQNRLGVILMKVRDSL-- 143 330798615 eukaryota>amoebozoa>mycetozoa>dictyosteliida
DICPUDRAFT_35661_Dpur_330802814 24 SGELKFYSQG------QDFYEFTNFYE----SPFNLDG---------------KLWTTSEHYFQAQK---FS----------------PDQALIELVRNL------PSPREAFNFTRIPD-----------------LQKDIRKDW-----------QEVKYTIMCDALFAKFTQ--------------------------NNHLRKLLLST------DDMKLIENSPV--------DYYWGEGKDG---------------------------------TGENKLGEILMELRRNLKT 171 330802814 eukaryota>amoebozoa>mycetozoa>dictyosteliida
DICPUDRAFT_42446_Dpur_330843562 24 SGELKFYNQG------QDFYEFTNFYE----SPFYLDG---------------KLWTTSEHYFQAQK---FS----------------PYQSLIEHVRNL------PSPREAFNFTKKPD-----------------LQIDIRKDW-----------HEIKDIIMYNALFAKFTQ--------------------------NHYLRQLLLST------GDMKLIEDSPI--------DNYWGVGKDG---------------------------------TGKNKLGETLMDLRRSLNM 171 330843562 eukaryota>amoebozoa>mycetozoa>dictyosteliida
SELMODRAFT_413953_Smoe_302783817 153 STVIYFYKSW------DPYGAFTNFTA----HSIKLPGSS-------------ETWKSVEHYYQAQK---FSGVK-----------DELAMQAIENIRNA------ESPEEAARIGRRLA---------------RERPDLVRPDW-----------ENSKMDVMEEALVAKFSS--------------------------YPQLRSLLLST------AGCVLIESSPQ--------DYFWGSGKDG---------------------------------TGQNQLGRLLMKLRAAILT 309 302783817 eukaryota>viridiplantae
NPH_6632_Dpro_301059840 13 IDSVVFRKTI------EKFGGLSNMAP---GFPLQIGD---------------ISVRTSEALYQACR---FP----------------YAEEIQKMIISQ------KSPMTAKMKSKPFR-------------------SQTRPDW-----------DHVRVKVMRWSLRVKLAC-------------------------NWDKFRNLLLLT------ADKQIVEDSRR--------DRFWGAVAND-----------------------------EDYLEGENVLGRLLMEIREELKS 164 301059840 bacteria>proteobacteria>deltaproteobacteria
PSYMP_06728_Psyr_330874307 12 SNSIVFLKTS------DEFGGLSNMAG---GFPLFVNE---------------RKILTSEALYQVCR---FP----------------HLPEVQCLIVSQ------TSPMTAKMRSKPFR-------------------SESRPDW-----------MRVRVRVMRWCLRAKLVQ-------------------------NWDRFSKLLLMT------EGLPIVEQSSK--------DKFWGASPQN-----------------------------DNKLVGANVLGRLLMELREDIVS 163 330874307 bacteria>proteobacteria>gammaproteobacteria
PE36_21039_Msp._149908726 2 IDEIQFYEPN------DDFGFLSNFAL----AAVKIDG---------------VVWPSSEHFYQAQK---F-----------------NDPQLQDFIRTA------TTPDEAFSLSREYA-------------------QLVKSDW-----------MAVRDGVMRDVVMEKFSQ--------------------------NPFYAYQLVAT------GEQVLTEHSHK--------DAYWGDGGDG---------------------------------QGRNELGKILMNVRHQLAS 146 149908726 bacteria>proteobacteria>gammaproteobacteria
VME_08600_Vhar_269960099 2 VDQILFYEPD------ESHGFLSNFCQ----AQIKVST---------------QSWPTSEHYYQAQK---F-----------------SDRELQDKILTA------KSPDEAFALSRKYQ-------------------HLVREDW-----------DDDKLSVMAFIVREKFLQ--------------------------NPQLAKQLMET------GNACLTEHSHK--------DAFWGDGGDG---------------------------------SGENHLGEILMNVRAELKH 146 269960099 bacteria>proteobacteria>gammaproteobacteria
VPA0006_Vpar_28899861 17 VDQILFYEPD------EPHGFLSNFCH----APVEISS---------------QSWPTSEHYYQAQK---F-----------------VDAQLQTKIQKA------QSPDEAFALSRQYE-------------------HLVRSDW-----------DNMKLSVMAFIVREKFLQ--------------------------NPKLAQKLMRT------GNACLTEHSHK--------DAFWGDGGDG---------------------------------KGLNHLGEILMNVRAELRH 161 28899861 bacteria>proteobacteria>gammaproteobacteria
VSWAT3_18363_Vbac_148975384 8 AEEVLFYEPE------DPNGYLSNFAA----CPIKVDG---------------QVWATSEHYYQAMK---F-----------------SSPSLRNMILEA------CTPAEAFSLSRQYE-------------------EQVREDW-----------YDIRVEVMRFIVTEKFTQ--------------------------NPQFALFLTST------GDSVIKEHSHK--------DHFWGDGGDG---------------------------------TGENHLGKILMAVRQQLRS 152 148975384 bacteria>proteobacteria>gammaproteobacteria
GobsU_010100009074_Gobs_168699662 6 PRVINFYSVA------AEYGCFSNFSR----HPVFLRG---------------KRWPTTEHFFQAMK---F-----------------EGTEHEEQVRLA------KRPMDAASMGRDRK-------------------RPLRRDW-----------ESVKERIMMDGLRAKFTQ--------------------------HEELKAVLLGT------GDATLVEQTAN--------DSYWGDGGDG---------------------------------SGKNRLGYLLMRLREELRA 150 168699662 bacteria>planctomycetes
HCH_06997_Hche_83649602 4 KKTINFYLAN------GEYGCFSNFSR----DPVYLKD---------------KRWPTSEHYFQAQK---F-----------------AGTEHEEAVRMA------SKPMEAANMGRERT-------------------RPLRPDW-----------EAVKDDIMREAVMAKFVQ--------------------------HEKLTSILLGT------GDAELVEHTAN--------DRYWADGGDG---------------------------------SGLNMLGKILMEVREAIQQ 148 83649602 bacteria>proteobacteria>gammaproteobacteria
sce3364_Scel_162451636 1 MTVIRFYRSG------DAHGFFSNFSR----HPVTLKG---------------KVWPTSEHYFQAQK---F-----------------PGTEHEEVIRNA------PGPGEAARMGRQRS-------------------RPLRPDW-----------EQVKDDVMREVVLAKFTQ--------------------------HEDLRRALLDT------GDAELVEHTAN--------DAYWADGGDG---------------------------------SGRNMLGVILMEVRAQLRR 145 162451636 bacteria>proteobacteria>deltaproteobacteria
M23134_02266_Mmar_124004851 2 DNLIKFYSIG------APYGEFSNFAP----YPIKLKG---------------KVWATTEHYFQAQK---F-----------------VGTPHETKIRKA------ASPMKAAELGRTRK-------------------VRIRDNW-----------DHIKDNVMMEAVKAKFTQ--------------------------HADLQTLLLDT------GGATLIEHTEN--------DAYWGDGGDG---------------------------------KGKNRLGKILMKVREELKD 146 124004851 bacteria
PM8797T_20343_Pmar_149175186 5 NQPVLFYSVS------EAYGEFSNFAE----YPIQVDG---------------KRWPTSEHYFQAQK---F-----------------TEVQHREAIRKA------PSPMQAARMGRDRK-------------------RPLRKDW-----------ESVKVAVMRTAVLSKFAQ--------------------------YEKLCMLLIST------GQRKIVEHTTN--------DSYWGDGGDG---------------------------------SGKNMLGRILMEVRSQLRE 149 149175186 bacteria>planctomycetes
HCH_04109_Hche_83646809 18 VEVIKFYSVN------DEFGEFSNFAQ----YPIKLKG---------------KVWPSSEHYFQAMK---F-----------------EEEKDRSDIRKA------KSPLEAARKGRDRK-------------------RKLRNDW-----------ESVKLNIMREAILAKFTQ--------------------------HDALRERLLST------GSAKIVEHTDN--------DDYWGDGGDG---------------------------------SGQNMLGRILEEVRAQLSE 162 83646809 bacteria>proteobacteria>gammaproteobacteria
_Rbal_32471506 31 SDPIKFYSTG------DEHGEFSNFAG----YPIKIGK---------------KVWPTSEHYFQAMK---F-----------------QEGSDQEEIRKA------NSPMQAARMGRDRK-------------------RKLRRDW-----------ESVKVNIMREAILAKFTQ--------------------------HEDLRELLLAT------GDAKIIEHTTN--------DDYWGDGGDG---------------------------------RGKNMLGRILMDTRTKLRE 175 32471506 bacteria>planctomycetes
YbiA.2b3w_Ecol_82407990 14 DTIINFYSTS------DDYGDFSNFAA----WPIKVDG---------------KTWPTSEHYFQAQK---F-----------------LDEKYREEIRRV------SSPMVAARMGRDRS-------------------KPLRKNW-----------ESVKEQVMRKALRAKFEQ--------------------------HAELRALLLAT------APAKLVEHTEN--------DAYWGDGGHG---------------------------------KGKNRLGYLLMELREQLAI 158 82407990 bacteria>proteobacteria>gammaproteobacteria
VspiD_010100021915_Vspi_171913880 1 MEPILFYSTK------GTYGAFSNFSA----HPFVLNN---------------KRWPTTEHYFQAQK---F-----------------VGTEHEEAIRMI------ASPMVAARMGRSRQ-------------------RPLRKDW-----------DSAKDDVMRKALRAKFTQ--------------------------HQDLQSLLLST------GEAQLIEHTKN--------DSYWADGGDG---------------------------------SGKNRLGILLMELRDRLRS 145 171913880 bacteria
Namu_1431_Nmul_258651665 1 MRIIEFYLHT------DPWGELSNFHP----APIHLDG---------------QRWPTTEHYFQAAK---F-----------------PGTPHAELIRLA------ATPDRAKQLGGDRA-------------------APLRADW-----------LAVRDEVMRTALRAKFTQ--------------------------HEQLRALLLDT------ADAQLVEHTVN--------DHYCGDGGDG---------------------------------SGVNRLGLLLMQVRAELS- 144 258651665 bacteria>actinobacteria
TTHERM_00486130_Tthe_118401008 12 NGHIYFYREY------EHNGIFSNFYA----SPIALKE---------------KQWPTTEHYFQAQK---F-----------------SGTEKEELIRLA------STPSESFKLGRQRD-----------------DEYPLRKDW-----------ESVKDEVMYEALKAKFTQ--------------------------HKDLQKFLLST------GDAKIIEHTQK--------DKYWADGGDG---------------------------------SGKNMLGILLMNLRNELKA 158 118401008 eukaryota>alveolata>ciliophora
TTHERM_00289300_Tthe_118370894 18 GNTIKFYGAK------NKNGLFSNFYI----SPIKLKG---------------KIWQTTEHYFQAQK---F-----------------AGTVKEEQVRNA------SGPGIAFRLGRKKS-----------------NDYPLRSDW-----------LKVKDDVMYEAIKAKFTQ--------------------------HDNLKKILLST------KNHKLIEHTKR--------DAYWGDGGDG---------------------------------KGKNMLGILLMKLRKELSE 164 118370894 eukaryota>alveolata>ciliophora
PTSG_01145_Ssp._326434983 1 MGAIRFYGHT------KPFGFMSNFYP----AKVVIDG---------------HTWPTTEHYFQAMK---F-----------------HDKDYQAQIRKY------SSPSTAKKLGQTRA-------------------VKLRSDW-----------EDVKYDVMYKACLAKFTQ--------------------------HADLRKQLLDT------GDAKLIEHTRN--------DRVWGDGGDG---------------------------------TGQNKLGQVLMEVRRELRE 145 326434983 eukaryota>choanoflagellida
PPL_02864_Ppal_281209628 3 RPTIYFYRAA------DAYGCFSNFSD----HPVMMDG---------------YIWPTSEHYYQAMK---FKT---------------TDIEYYHQIRDA------ESPARSFKMGNTYA-------------------HDKRRDW-----------NQIKDQVMYDVVLNKFLQ--------------------------NKDIQRN---T------GISKIVEHTRC--------DDYWGDGSDG---------------------------------NGRNQLGKTLELVREFIKN 146 281209628 eukaryota>amoebozoa>mycetozoa>dictyosteliida
DDB_G0281625_Ddis_66812724 4 NNIISFYRST------DAYGCFTNFSW----FKVHFKN---------------HTFKTSEHAFQAFK---FE----------------HEQKIFFQILNS------KTASESKRIAHLNN-------------------DKKRKDW-----------ETIKDQIMYEICFEKFNQ--------------------------NDHLKLILLDT------GNLKIVESSEK--------DFYWGIG-DG---------------------------------SGRNQLGITLMKIREDLRK 148 66812724 eukaryota>amoebozoa>mycetozoa>dictyosteliida
DICPUDRAFT_85573_Dpur_330846708 3 DNVINFYRAG------SGYGCFSNFSR----HTVFYKG---------------QKWPTSEHAFQAMK---F-----------------EGTDHFLNVLKT------KTPGDAAKMGRNRS-------------------LPLRKDW-----------EGVKDEIMYEVCLAKFQQ--------------------------HQDIQLTLIET------NDAKLVEHTTN--------DSYWGDGGDG---------------------------------SGRNQLGITLMRVRETIRN 147 330846708 eukaryota>amoebozoa>mycetozoa>dictyosteliida
DDB_G0283925_Ddis_66810169 5 EHVINFYRPN-----EIPYGPFSNFSR----HTVFYNN---------------VLAKTSEHIFQAMK---F-----------------EGTQHFNDVLNT------KTPGDSAKMGRDRK-------------------RPLRKDW-----------EGVKDELMYEICLAKFSQ--------------------------HKDIQKILLET------GDATLVEHTGN--------DSYWGDGGDG---------------------------------SGRNQLGKTLMRVRETIKN 150 66810169 eukaryota>amoebozoa>mycetozoa>dictyosteliida
FP2309_Fpsy_150026339 10 MNIIKFYKVN------EPYGFFSNFSP----HPIYINN---------------ERWNSVEHYFQASK---F-----------------DNIEIREKIQAI------ESPMQVAIEGRDKK-------------------NIIRDDW-----------EMVKEEIMYSALLCKFYQ--------------------------HPKLMKELLLT------KDSLIIEHTKN--------DNYWGDGGDG---------------------------------KGKNRLGLLLMKVREEIAK 154 150026339 bacteria
PaecuDRAFT_4172_Pcur_304407843 1 MTQIKFYETN------KPYGCFSNFSK----HPIELNN---------------KRWATVEHYFQAMK---F-----------------ENTSFEEEIRLL------RTPMEAAIAGRDRN-------------------KPLRKDW-----------EEMKEIIMRRAIEAKCEQ--------------------------HESVRDILVST------GNCLLIEHTKN--------DSYWADGGDG---------------------------------SGQNKLGQLLMEVRSEQPE 145 304407843 bacteria>firmicutes
XNC1_2895_Xnem_300723771 4 IDVIKFYRTN------DPYGCFSNFSK----YGFLGEDD--------------FFWPTVEHYFQAKK---F-----------------IDENTQENIRLL------NSPMDAATAGRDRK-------------------KPLRPDW-----------EVIKDDIMRFAVLEKFKQ--------------------------NLDIQNILLST------HNAQLIEHTSN--------DFYWADGGDG---------------------------------SGNNMLGIILMETREILQK 149 300723771 bacteria>proteobacteria>gammaproteobacteria
ybiA_Rden_311112847 5 MTEIKFYRVN------DAYGYLSNFAP----YPFEING---------------LIWSTSEHYFQAQK---F-----------------LDKAIQEKIRRL------KSPMDAALEGRNRE-------------------NPLRSDW-----------EVVKDDIMRLAVFEKFRQ--------------------------NPAIRRELLAT------GHATLIEHTKN--------DNYWADNGDG---------------------------------TGKNMLGIILMETRKRLKA 149 311112847 bacteria>actinobacteria
ybiA_Spar_296876279 1 MKEIKFYKVH------DEYGFMSNFAP----YPFSDGS---------------KIWPTSEHYFQAQK---F-----------------LVPEIQEKIRQI------ASPMDAALEGRNRQ-------------------NPLRSDW-----------EEVKDEVMHQALRMKFRQ--------------------------NPDIAKELLAT------GDAIIIEHTQN--------DAYWADGGDG---------------------------------SGNNKLGLLLMHVRQELKN 145 296876279 bacteria>firmicutes
ybiA_Ssan_325693558 1 MKEIKFYKVN------DAYGYMSNFAP----YPFSDGN---------------KIWPTSEHYFQAQK---F-----------------LVPEIQEKIRLL------ESPMDAALEGRNRH-------------------NPLRKDW-----------EDVKDDIMRYAVREKFRQ--------------------------NTVIMEDLLET------GDSIIIEHTKN--------DSYWADGGDG---------------------------------TGKNMLGKILMEVRAELR- 144 325693558 bacteria>firmicutes
CORMATOL_00583_Cmat_225020576 1 MNEIRFYRAH------DDYGFLSNFAA----YPFELDG---------------KRWPTSEHYFQAMK---F-----------------LNPETQNLIRSL------DTPGRAAKVGR-RE-------------------KPLRKDW-----------ESVKDQVMFDAVLAKFTQ--------------------------NPDIARKLLST------GDAYLIEHTKN--------DFYWADGSDG---------------------------------SGKNRLGEVLMAVRDSLRA 144 225020576 bacteria>actinobacteria
Deima_1776_Dmar_320334379 1 MKAIRFYRQG------DAYGTFSNFSA----HPIHVDG---------------VTWPTTEHYFQAQK---F-----------------LDPELQAMIRAL------PTAGDAAKTGRRRD-------------------LPLRADW-----------EAVKEDVMRTALHAKFTQ--------------------------HEDARTLLLST------GDASLIEHTRN--------DTYWADGGDG---------------------------------HGLNRLGLLLMDLRAALRH 145 320334379 bacteria>deinococci
AM1_2731_Amar_158335874 1 -MTIFFYKVQ------DPYGCFSNFSL----HSIDLQG---------------QTWPTSEHYYQAQK---YQGT--------------PHQALCDKIRQA------STPEAAAALGRNPL-------------------YTEQADW-----------DVIKPEIMYAAVRTKFLT--------------------------HPTIQAELLST------GDELIVENSPL--------DPYWGCGADG---------------------------------KGQNQLGKILMQVRQEIRQ 147 158335874 bacteria>cyanobacteria
MC7420_6514_Mcht_254412559 1 -MTIYFYKVE------EPYGCFSNFSP----HPIQIDG---------------WCWQTVEHYYQAHK---FVGT--------------TDEALIRTIKNV------STPMEAALLGRDRT-------------------RNHRPDW-----------EQVKQQIMWRGVLTKFLT--------------------------HPDIQQILLNT------GEDVIVEDSPT--------DYYWGCGEDQ---------------------------------TGENHLGKMLMNVRQHIRQ 147 254412559 bacteria>cyanobacteria
all5029_Ana_17232521 1 -MTIYFYKVW------QPYGCFSNFSP----HSIEIQG---------------TYWLTVEHYYQAQK---FVGS--------------VDAAIIPAIRAS------KTPEEAAALGRCTS-------------------RQLRQDW-----------DLVKTIVMREAVLKKFLT--------------------------HTDIREILLST------GNEILVEDSSC--------DYFWGCGADK---------------------------------TGQNHLGKILMSVREEIRK 147 17232521 bacteria>cyanobacteria
N9414_00365_Nspu_119509756 1 -MTIYFYKVW------QPYGCFSNFSP----HGIQIHG---------------TYWSTVEHYYQAQK---FVGT--------------VDAVIIPVIHAA------ETPEEAAALGRCRT-------------------RQLRPDW-----------EMVKTKVMREAVLNKFLS--------------------------HLEIKDILLST------GNETLVENSPN--------DYFWGCGAEK---------------------------------TGQNHLGKILMGVRAEIRK 147 119509756 bacteria>cyanobacteria
CRD_01664_Rbro_282897552 1 -MTIYFYKVW------EPYGCFSNFSP----HPIEIHG---------------VYWATVEHYYQAQK---FVHT--------------EDNVIIPLIRSA------PTPEMAAALGRCET-------------------RKSRPDW-----------NLIKIDVMKTAVWQKFLS--------------------------HQEIQEVLLGT------GDETLVENSPI--------DYFWGCGADK---------------------------------TGENHLGKILMGIRNQIRF 147 282897552 bacteria>cyanobacteria
OSCI_3190004_Osp._300866977 1 -MTIYFYKVE------EPYGCFSNFSP----HSIYLNG---------------QDWLTVEHYYQAQK---FVGS--------------VDEQLIYLIHAS------ETPQQAAKLGREPS-------------------RQLRPDW-----------EEVKTEIMREAVLTKFIT--------------------------HSDIQAILLST------GDRLIVEDSPT--------DYYWGCGCDR---------------------------------TGQNHLGKILMSVRLEISQ 147 300866977 bacteria>cyanobacteria
SYNPCC7002_A1948_Syn_170078553 7 -EPIYFYKAH------DPYGCFSNFSL----HPIHCEA---------------LDWPTVEHFYQAHK---FLPT--------------HQQDLIDKIRAA------STPEIAAALGRDPQ-------------------HPKRPDW-----------EDIKRTVMWQGVWTKFKT--------------------------HPDIAQILLAT------GDAAIIENSPV--------DYYWGCGADG---------------------------------SGRNYLGKVLMRVRSQLRQ 153 170078553 bacteria>cyanobacteria
tlr2465_Telo_22300007 1 -MTIYFYRVK------DAYGSFSNFSP----HGFTLEG---------------YYWPTAEHYYQAHK---FFGT--------------PYEAFGHAIRIA------PTPEAAAQLGRSGR-------------------YPVHPQW-----------DQLKQAVMWRALVAKFTT--------------------------HAELRELLLAT------VDEELVEDSPV--------DSYWGCGGDR---------------------------------QGSNYLGRLLMHLRHCLRQ 147 22300007 bacteria>cyanobacteria
Cyan7425_0270_Csp._220905714 1 -MVIYFYKVE------GPYGCFSNFSP----HGFELEG---------------QRWQTVEHYYQAHK---FVGT--------------PDHHLCTQIQQC------QTPAQAAALGRNPC-------------------HCPRSDW-----------EEIKQQVMRTAVLAKFKT--------------------------HPQIRTILLET------GEAWLVEDSPV--------DFYWGCGADR---------------------------------SGQNHLGRILMSVRQELRS 147 220905714 bacteria>cyanobacteria
_Krac_298249651 1 -MTIYFYTAR-----EEPYGCFSNFSR----HGIDLDG---------------AWWPTVEHYFQAQK---F-----------------AGTPYANKIRIA------FTPKQAADLGRSRQ-------------------HPLRPDW-----------EQVKDEIMLKAVRRKFEL--------------------------HTQLRKLLLAT------GSEELIENAPS--------DYYWGCGSDG---------------------------------SGQNKLGQLLMRVRLELSS 145 298249651 bacteria>chloroflexi
Tery_2448_Tery_113476072 1 -MTIYFFDET-----EQPYGCFSNFSP----HGFELDG---------------LWWPTSEHYFQAQK---F-----------------LGVQHLEEIRWA------KTPAGAAKMGRERS-------------------RPLRKDW-----------EEIKEDVMERGLLCKFQS--------------------------HKDIGEILLST------KDELIVENAPE--------DYYWGCGKDG---------------------------------SGKNRLGEILMKVRNRLQN 145 113476072 bacteria>cyanobacteria
Cyan7822_3925_Csp._307153746 1 -MAIYFYSTR-----EQPYGCFSNFSQ----HGFELEG---------------FWWPTSEHYFQAQK---F-----------------PNHPWQDQIRKA------KTPKDAAKMGRDRR-------------------YPLRSDW-----------EEIKDEIMKRAVWQKFTT--------------------------HADIREILLQT------GDELIVENSPI--------DYYWGCGADG---------------------------------TGKNRLGEILMAVREILRA 145 307153746 bacteria>cyanobacteria
L8106_12950_Lsp._119486659 1 -MTIYFYSSR-----EEQYGCFSNFSY----HGFVLDE---------------LWWPTNEHYFQAQK---FVS---------------TDPEWFTKIQTA------KTPAQSARMGRSRE-------------------HPLRSDW-----------EEVKDEIMQKVVLCKFQT--------------------------HADIREILLST------GDEFIVENSPI--------DYYWGCGQDG---------------------------------SGKNKLGEILMAVREILRQ 147 119486659 bacteria>cyanobacteria
MC7420_678_Mcht_254413191 24 -MPVYFYSTR-----EKPYGCFSNFSR----HGFELDG---------------CWWATSEHYFQAQK---FVE---------------TDHPWFDKIREV------KTPKDAAKMGRSRE-------------------HPIRSDW-----------EQVKDEIMKRGVLQKFET--------------------------HADIREILLAT------GDELIVENSPS--------DYYWGCGKDG---------------------------------SGKNRLGEILMAVREILCQ 170 254413191 bacteria>cyanobacteria
ybiA_Osp._300869472 1 -MTIYFYSTR-----EEPYGCFSNFSA----HGFELEG---------------VYWLTSEHYFQAQK---F-----------------VGTPHVEQIRQV------KTPKDAAKMGRERK-------------------RPLRQDW-----------EEVKDDIMRKAVLCKFET--------------------------HANIREVLLST------GDEEIVENSPI--------DYYWGCGKDG---------------------------------SGKNKLGLILMEVREILRQ 145 300869472 bacteria>cyanobacteria
Haur_0354_Haur_159896886 1 -MTIYFYAVS------AEFGCFSNFSA----HGFKLDG---------------HYWPTSEHYFQAQK---F-----------------TGTDYATTIRLA------KSPAIAARLGRSRK-------------------QPLRRDW-----------EAIKDAVMRRALLAKFRS--------------------------HAEIRAILLAT------DDQPLVENAPN--------DYYWGCGIDG---------------------------------SGKNMLGQLLVEIRQTLRD 144 159896886 bacteria>chloroflexi
AM1_3712_Amar_158336844 1 -MAIYFYSSR-----EKPYGCFSNFSA----HGLTLDG---------------VWWPTSEHYFQAQK---F-----------------VGTPHADQIRQV------KLPKDAARLGRQRT-------------------RPLRPDW-----------EAVKDDVMRQAVLCKFET--------------------------HADIQDILLST------GNQDLVENAPG--------DYYWGCGQNG---------------------------------TGKNMLGKILMEVRERLRA 145 158336844 bacteria>cyanobacteria
PM8797T_29763_Pmar_149176205 1 -MTIYFYTK------NDTYGEFSNFSP----HGVERDG---------------LWWPTVEHYFQAQK---F-----------------AEADYRERIRNA------HNAKQAANLGRSRK-------------------IPLRADW-----------EEVKDEIMYQGVLQKFQT--------------------------HAELKILLLST------GDQEIVENAPG--------DYYWGCGKEG---------------------------------TGLNRLGEILVRVRGELRE 144 149176205 bacteria>planctomycetes
TM1040_1897_Rsp._99081738 6 PDTIYFYAQ------TDPYAEFSNFAP----YGVCFED---------------IWWPTVEHYFQAMK---F-----------------HDAAYRTRIRRC------QKPKDAKALGMTRK-------------------IPLRADW-----------EEVKDDIMYAAVLCKFRT--------------------------HGAPRQLLLGT------GDAPLVENAPM--------DAYWGCGPDG---------------------------------LGLNKLGRILMRVRGELAE 150 99081738 bacteria>proteobacteria>alphaproteobacteria
Jann_2797_Jsp._89055288 6 LNTIYFYAQ------TDAYAEFSNFAP----FGVEMEG---------------VYWRTVEHYFQAMK---F-----------------DDATHRERIRTA------RKPKDAKASGMTRA-------------------VALRADW-----------DEVKDAIMQAAVFRKFQT--------------------------HAVPRDLLLGT------GSAQIVENAPM--------DAYWGCGPDG---------------------------------RGLNKLGRILMDVRDSLAS 150 89055288 bacteria>proteobacteria>alphaproteobacteria
SCH4B_1850_Sisp_259416444 5 PEPIYFYAQ------TDPYAEFSNFAP----YGVAFEG---------------TWWRTVEHYFQAMK---F-----------------HDADHRERIRRC------HKPKAAKALGMTRA-------------------IPLRADW-----------EEVKDGIMLTAVRCKFQT--------------------------HAAPRQLLLST------GDAPLIENAPM--------DAYWGCGPDG---------------------------------RGLNKLGQILMTVRSKLSG 149 259416444 bacteria>proteobacteria>alphaproteobacteria
Sde_0405_Sdeg_90020054 9 EKALSFSR-------FDASHWLSPCVL----RPFQLDG---------------HTWPTAEHYLQANL---V-----------------ASAALADKIRQA------ASGEQAHALGSPWY-------------------RRKRKDW-----------KNLRRVLMTRALYTQTMT--------------------------HPDIKDALLET------GDQHIVETSLY--------DHYWGIARDQ---------------------------------RGENILGKVWMGVRDKIRA 152 90020054 bacteria>proteobacteria>gammaproteobacteria
TERTU_3943_Ttur_254787804 9 ENAVRFSR-------FDPESLFSTVSA----HPLELEA---------------EVWPSAEHYFQAQL---A-----------------GSDSWREKIKAA------PTPAQAYKLGCVWY-------------------KRKVRGW-----------KNLRRVMMTRALYTKVQM--------------------------YPAVRDALLST------GDETILETSLY--------DHYWGIGRDQ---------------------------------RGDNMLGKVWMDIRRKLRE 152 254787804 bacteria>proteobacteria>gammaproteobacteria
HP15_2779_Mbac_311695670 10 ENDLFMSR-------TDPENPLGTHAP----YSFELEG---------------KIWPTVEHYFQGMK---F-----------------TDDNRQEKVRSA------DTPGKAGKLGRKRH-------------------KSLRRDW-----------KQVRETVMTRGIYVRCRT--------------------------HPELAEALLDT------GDTKIVENSNF--------DYFWGCGRDR---------------------------------RGENRYGKVLMNVRARLRE 153 311695670 bacteria>proteobacteria>gammaproteobacteria
RED65_02704_Bmar_94501287 9 EDAIFFSR-------LDEEEMLGSRIH----QPFLLDD---------------YNWPTAEHYTQALL---F-----------------KDAKIQQQIRES------EEPVEAAKQYKWRF-------------------WLKHKDW-----------KKRGPILMTRAIYTQCKT--------------------------YPVKAQALLDT------EDRLLMENSLY--------DYFWGCGRDR---------------------------------RGDNRYGKVMMSVRGRLRK 152 94501287 bacteria>proteobacteria>gammaproteobacteria
GP2143_10137_Mgam_119476904 11 QDAMYFTR-------SDVNEDFGSFSK----HPFQLED---------------KEWPSVEHYYQAMK---F-----------------DDQAYQETIRCA------DHPKKARKLGRNRF-------------------RSIRKDW-----------RDVKVVYMTRAVYTMCRT--------------------------YPDIATKLLTT------GSNRLVENSQY--------DYFWGCGRDR---------------------------------RGDNHFGKVLMNVRDKLHT 154 119476904 bacteria>proteobacteria>gammaproteobacteria
SCHCODRAFT_258660_Scom_302674850 60 RPQIFFYDR------DKPHYGFTNFSP----HPVKYKD---------------AIYPTSEHLFQAFK---FME---------------HQPQLAEHIRRQ------PRPRDALSEARRFD-------------------NEKRRDW-----------FKVNIDKMDEALHLKFTQ--------------------------HKDLQEELLST------GSAELIEDSPV--------DAFWGIGKDG---------------------------------RGRNELGKALGRLRKKLKR 206 302674850 eukaryota>fungi>basidiomycota
LACBIDRAFT_318005_Lbic_170095960 159 RPRILFYNK------SDPHYGFTNFSA----HSVVYKG---------------KRYPTSEHLFQSFK---FQK---------------HRPNLAEHIRTCS-----ERPSVAFSEARRFQ-------------------PEVRTDW-----------KQVNIEKMDEALWCKFTQ--------------------------HSDLKAELLST------GDAELVEDSDK--------DAFWGVGADR---------------------------------RGRNELGKALERLRAKLRE 306 170095960 eukaryota>fungi>basidiomycota
LACBIDRAFT_316770_Lbic_170117768 78 PSPIFFYHK------HDLHYGFTNFSD----HPVCYER---------------EMYPTSEHLFQSFK---FLP---------------HRPDLAKHIRSC------SCPSDALAKARRFK-------------------AYVRPDW-----------RRINIQIMDQVLLLKFTQ--------------------------HQDLKDELLAT------GNAELIEDSYK--------DSFWGVGADG---------------------------------QGRNELGKALMDLQDKLHR 224 170117768 eukaryota>fungi>basidiomycota
SCHCODRAFT_258659_Scom_302674848 103 AQRILFYHK------HDPHYGFTNFSD----HPVKYQG---------------KVYPTSEHLFQALK---FMP---------------HKSQVAEHIRTSS-----PSPRAAFTEAHRYQ-------------------SEVRKDW-----------SKVNVKMMEIALEHKFDQ--------------------------HPALREELLAT------GEAELVEDSAQ--------DAFWGVGPNG---------------------------------KGRNELGKALMRLRTQLRQ 250 302674848 eukaryota>fungi>basidiomycota
MGL_3049_Mglo_164657874 61 TNKIEFFSK------DLPFFWLNNASD----HPVVLDG---------------VRYPTAEHLFQAQK---FID---------------HRPDIANKIRKA------SNAVEAIHIARTFS-------------------RDVRADW---------IKDGVNVSTMRMVLLTKFMQ--------------------------YSDLRLALLET------GDAEIVHASPN--------DAFWGSAAAP-----------------------------NSVGRGRNMLGRTIMQTRE-LLR 212 164657874 eukaryota>fungi>basidiomycota
SCHCODRAFT_36431_Scom_302693411 1 --QIRFCNR------DTSYNSFCNFAR----YSVAYNG---------------ETYPTAEHLFHASK---FLP---------------VNGDIARRIRNT------KDVGEVARLADRFQ-------------------ARVPQEW-----------WNNMVETMHGILLDKFLQ--------------------------HEDLQAALLST------GDAELVFDSVE--------DGFWGVDKDE---------------------------------TGNNILGRTLERVREELR- 144 302693411 eukaryota>fungi>basidiomycota
HMPREF9488_03196_Csp._319937960 7 KIIDSFHG---------EYAFLSNYYD----SPIFYDG---------------ILYPTVEHAFQAAK---T-----------------TVFIQRIIIANK------KTPGQAKCAGRKV---------------------TLRDNW-----------DDIKLYIMKELIILKF-T--------------------------NPKLKSALLNT------KDAELIERNTWN-------DTYWGICN-G---------------------------------IGENHLGKILMEVREMLRG 145 319937960 bacteria>firmicutes
mru_1967_Mrum_288561223 3 DEIDRFDG---------KYLFLSNFYI----CDVEYDG---------------ILYPHTEAAFHAQK---V-----------------FDDETKMKFTNV-------TPKQSKRLGRKV---------------------KLREDW-----------NEVKDNIMYEVCKAKFEQ--------------------------NPDIRKLLLET------GDATLIEGNTWN-------DQYWGVCR-G---------------------------------KGRNQLGKTLMRIREELRE 141 288561223 archaea>euryarchaeota
DORFOR_01894_Dfor_166032191 27 TQINEFRG---------DYAFLSNFYP----APVSYMG---------------QTYANNEAAFQAQK---T-----------------LSAREQRKFCIFRM----HNPSDAKKLGRDL---------------------TLRPDW-----------EKVKVRLMYEICMCKFMQ--------------------------NPELRDKLLAT------GESTLIEGNNWG-------DYFWGKVN-N---------------------------------CGENQLGIILMDVRAKLQW 168 166032191 bacteria>firmicutes
RUMGNA_01423_Rgna_154503599 12 QTIDHFHG---------AYAFLSNFYP----SRIYYRG---------------YWYANNEAAFQAQK---T-----------------ISPKEQLQFTKL------RNPKDAKKLGREV---------------------QLRSDW-----------ESVKLMYMYEICMCKFMQ--------------------------NPTLCKALLAT------GNCHLVEGNNWG-------DYFWGSVN-G---------------------------------HGENHLGKILMDIRAKLQF 151 154503599 bacteria>firmicutes
CCU_25310_Csp._295094771 3 TTINSFRG---------DYFFLSNFYE----CPVTYQG---------------ITYPNNETAFQAQK---C-----------------INDSDKTKFISL-------NPSAAKKLGRRV---------------------ALRKDW-----------ESIKFSVMKNLVKAKFTQ--------------------------NPDLAEKLLAT------DNAHLEEGNTWG-------DRIWGTVN-G---------------------------------TGANKLGIILMQVRDELNL 141 295094771 bacteria>firmicutes
Rumal_1634_Ralb_317056301 1 -MIDRFTD---------EYFFLSNFYE----SKVTFEG---------------ITYLNNEAAFQAMK---T-----------------LDESERRSFAGL-------DPDSAKRAGRKV---------------------SLRSDW-----------EEVKTDLMYEICKAKFTQ--------------------------NKDLAEKLLAT------GGEELVEGNDWN-------DRIWGKVN-G---------------------------------QGENRLGIIFMKVREELRL 138 317056301 bacteria>firmicutes
nadE_Ralb_325680741 1 -MIDSFKG---------DYCFLSNFYE----AKVTYEG---------------ITYLNNEAAFQSIK---T-----------------TDMAKRRDFADL-------DPAEAKKAGRNV---------------------SLRGDW-----------EDIKINVMYKICKAKFTQ--------------------------NSDIAEKLLAT------GDEELVEGNDHG-------DKIWGKVN-G---------------------------------EGANNLGKILMRVREELKM 138 325680741 bacteria>firmicutes
99_BPphiW-14_282599036 1 -MIDNFKT--------PETEWLSNMYP----CRVLYEG---------------VVYPSAEHAYAAQK---A-----------------VDWLDREEIAQA------KTGYLAKQMGAAV---------------------QKRADW-----------DQVKMRVMLEVLRAKFFN--------------------------NDFLGDKLLAT------GSQELVEGNWWH-------DTFWGVCE-G---------------------------------VGENHLGKLLMQVRRELEA 140 282599036 dsdna viruses, no rna stage>caudovirales
Pmar_PMAR024558_Pmar_294875527 18 NVIRAFRG---------EFGFLSNFSD----DPVRMDDG--------------ILYPTAEHAFQAQK---V-----------------VDVEKRRCMVEKC-----GTAKSAKAWGKRAK--------------------PLRADW-----------NDIRVDVMREVIGAKFKGG-------------------------SEELREMLVAT------GERELVEGNVWN-------DTFWGVSLRT--------------------------------GKGQNQLGKILMEVREELKK 163 294875527 eukaryota>alveolata
_BP1_308516893 13 KPIMGFQG---------EYRWLSNFWT----APIVVTG---------------FEYQNTEAAYQAAK---T-----------------INVAHRMQFKNM-------TGGEAKRAGRSV---------------------IMRHDW-----------DFVKLEIMELVLRAKFMA--------------------------HADLALKLIET------GDRDIVELNTWG-------DTHWGQIKDK-----------------------------EGNLVGENVLGKLLMNIRSDINK 156 308516893 dsdna viruses, no rna stage>caudovirales
Mpe_B0288_Mpet_124262828 3 AAPISFYRAS-----ERPFGAFSNLFR----REILIAG---------------RTFATTEHAYQALK---P-----------------RDARVRDWLLAA------PAPSLLAIAAHTLPSESADPTEIMARTADALLGFHTRPGW-----------SRLRFPWMLRCLDAKFDQ--------------------------HPDLAELLLST------GDSAIIEAGRIDDDA----GRRWGIVN-G---------------------------------RGSNYLGRMLQRVRHRLGG 170 124262828 bacteria>proteobacteria>betaproteobacteria
bgla_2p0770_Bgla_330822167 19 LNEIRFYRAN-----EKPYGAFSNLYK----RPIEFEG---------------VTYPTSEHAYQAGK---A-----------------VKPAVRQWILSA------PTPALAAMAAHGLY------------------VWDVVPDW-----------AQIKFDRMRAVLRAKFDQ--------------------------HADLRELLLST------GEARLVEAGTVNNAV----NRLWGEVD-G---------------------------------KGENMLGVMLMELRAAYAK 168 330822167 bacteria>proteobacteria>betaproteobacteria
PSPA7_3050_Paer_152987782 1 MQEIRFYRAN-----EKPYGAFSNLYK----REVLFEG---------------VVYPTSEHAYQAGK---P-----------------RKEAVRDWILSA------PSPALVAMAAHGLY------------------WWDIRPGW-----------SKIKFDRMRAILLAKFTQ--------------------------HEDLKALLLST------EQARLVESATVDNEV----NRTWGEVN-G---------------------------------KGKNMLGVLLMEVREELLH 150 152987782 bacteria>proteobacteria>gammaproteobacteria
Tgr7_1771_Tsp._220934941 20 KESAVFYKTK------ETFGALSNMAS---GYPLRVNC---------------VRILTSEALYQACR---FP----------------HLPEVQRVIIDQ------KSPIAAKMKSKPHR-------------------KDSRPDW-----------DQVRVGVMRWCLRVKLAQ-------------------------NYKEFGRWLLVT------KDKEIVEQSKK--------DAFWGAKVID---------------------------DDGEILVGQNVLGRLLMELRELYRN 173 220934941 bacteria>proteobacteria>gammaproteobacteria
GSTUM_00011304001_Tmel_296424705 50 TGPVYFWKPH-----EVPFGIFSQWYE----DEFTAPFDGEQ-----------MRFGTAEQYMMYSKAVLF-----------------NDPDTAAEIMKT------MNPSTQRALGRKVR-------------------NFTDVTW-----------AENRSRIVEEGSYWKFKK--------------------------DP---SRLLET------GDREMVEASPR--------DRIWGIGFGP----------------------KNADAGKRDKW-GMNLLGKALMEARDRLRR 209 296424705 eukaryota>fungi>ascomycota
R617_APMV_311978014 4 DKYVFFHGAN---KNQAGVHIFSQWFP----VNFKEYLNGEE----------FAEYVSAEQYMMAHKALLF-----------------GDMFHFKKIMEC------SKQCKIKYLGRRVR-------------------NFNPTIW-----------DKHKFDIVTEGNRLKFSQ--------------------------NPDLMKRLLET------GNKTIVEASPS--------DKIWGIGLTA----------------------QQAVNIPENKWPGKNLLGKVLMKIREEN-- 168 311978014 dsdna viruses, no rna stage
Esi_0071_0113_ESV_298714411 57 EGMVLFWK---------EPACFVQWTP----CSFELDG---------------ERYCNAEQWMMASKARLF-----------------NDRTALQQIMAT------ADPRRQKALGRQVR-------------------GFDPAMW-----------DKKGYDVVVRGNLAKFKQ--------------------------NPGFRDELLAT------GDRILAEASPY--------DSEWGIGLHA----------------------NDADALIQARWPGRNKLGEALMDVRSQL-- 210 298714411 eukaryota>stramenopiles
Esi_0017_0056_ESV_298707265 134 DTMVLFWN---------PPCVFTQWEP----ALFEVDG---------------VKYCSAEQYMMACKANVF-----------------GDTDIWNKIMST------SDPAQQKRLGKEVA-------------------NYDHGIW-----------NLCKVQFVLTGNYSKFTQ--------------------------NPGMCDQLLAT------GDKMLAEASQH--------DKVWGIGMDA----------------------FDPNVERHECWRGQNLLGKILMYVRNKI-- 287 298707265 eukaryota>stramenopiles
Esi_0345_0025_ESV_298711392 58 PDLLFFWQ---------PPSVFSQWTP----SVFVVDN---------------VQYSCAEQYMMAEKAKLF-----------------GDNSSWQKIMAT------PSPREHKDLGRGVS-------------------GYDQNVW-----------DQHKMRIVARGNYAKFTQ--------------------------NEMMGQRLLDT------GEKLLAEASPY--------DRVWGIGLRA----------------------DNPAARTPSSWRGQNLLGDILQEVRTR--- 210 298711392 eukaryota>stramenopiles
NAEGRDRAFT_31328_Ngru_290996009 18 QKYEFFWK---------DKSVFSNWHA----ASYVLDG---------------IQFANTEQGMMYGKAKLF-----------------GDDEVAKDILAN------TSPSNAKQLGRMVS-------------------NFTDDMW-----------NQNRELIMKRHLYAKFSQ--------------------------NEDIKQTLLST------GDKILAEASPN--------DAIWGIGMRE----------------------HEAIETHPSKWPGLNLLGKLLTEVKQELRN 173 290996009 eukaryota>heterolobosea
NAEGRDRAFT_36485_Ngru_290990814 20 SKFHFFWG--------TKGGYYSQWVK----APMKIDG---------------KTFVTCEQYMMYQKAQLF-----------------NDHEMAEKILKT------SDPKQCKEFGRKVK-------------------NFDTNQW-----------EANRDRIVYEGNYAKFTQ--------------------------NEEMRRDLLSR------LDVEYVEASPY--------DKIWGIGLEE----------------------KDQRAHDRSQWKGLNLLGRIITQIRDDLIN 176 290990814 eukaryota>heterolobosea
NAEGRDRAFT_31151_Ngru_290996214 26 SKFFFFWN---------EETCFSQWVK----APMKVND---------------QTFSNCEQFMMYQKALLF-----------------NDQEIAKRILQS------TNPKNTKALGRKVS-------------------NFNEKIW-----------EDNKVRIVYEGNYAKFAQ--------------------------NDDLRKDLLSR------PDVEYVEASPY--------DKIWGIGLEE----------------------KDPRAKQRNEWQGQNLLGRIITQVRDDLMM 181 290996214 eukaryota>heterolobosea
PRU_0345_Prum_294673111 5 DKHICFWN-----------EWPSNWHP----AEFDVEVNGV-----------KCHFYNTEQYFMYMKAIVF-----------------GDEEIAKQILEV------SDPKKVKALGRKVQ-------------------NYDEAVW-----------NEKRYQVMLKANVAKFSQ--------------------------NEDLKQLLLSPEY----EGHGFVEASPY--------DKVWGVRMFE----------------------SNPDIDDETKWKGLNLLGKVLDETRRIVSL 164 294673111 bacteria
Fisuc_1361_Fsuc_261415758 7 DKHVFFYH-----------EWLSNFWN----APFEYKG---------------RTFFCNEQAFMWEKAVLF-----------------GDKVMEEKILVA------STPQEAKRLGRKVT-------------------PFDKEKW-----------DSVRYQVMLDINYAKYSQ--------------------------VEDCKNRLLDPEF----DGHAFVEASPR--------DRIWGIGLSV----------------------TNPNIDDPANWRGRNLLGKVITEVRDRLVQ 162 261415758 bacteria
KgORF4_BPK_48696395 5 REYIMFWG---------KEDIYSNFYP----IKFKHQG---------------RTFNNSEQAFMWRKARYF-----------------NDFQIAGEILNA------KNPNHAKSLGRKVR-------------------NFNEEQW-----------NKVRYNIMVEVVKDKFMT--------------------------THLKQRILDTD------VRKDFVEASPY--------DKIWGVGLKA----------------------NDPKILEQSNWKGQNLLGKVMEDVRVHCIY 160 48696395 dsdna viruses, no rna stage>caudovirales
bgla_4p0890_Bgla_330814539 5 GNFTAFFG---------AEDVLSNWHP----SRFTYHD---------------VEFNCVEQFMMYAKAMLF-----------------DDHGTASKILTA------QSPKRQKELGRDVS-------------------GFDEQTW-----------IKSRESIVFVGCREKFRQ--------------------------NPSQGTVLSGT------GSTILVEASRS--------DKIWGAGIGQ----------------------FDSRITDPTKWPGLNLLGYTLMRVRDRPFS 160 330814539 bacteria>proteobacteria>betaproteobacteria
bgla_3p0420_Bgla_330818849 5 NNMTLFFG---------AEDALSNWHQ----CRFEYHG---------------VAFTCVEQFMMYAKAKLF-----------------EDHATAAAILAT------TDPHKQKQLGREVK-------------------GFNDAVW-----------VEKREAIVTVGCREKFQQ--------------------------NPALRDTLLAT------GDTVLVEASPY--------DRIWGVGFAW----------------------NDPLILDPKNWRGTNLLGKTLTTVRQLLKD 160 330818849 bacteria>proteobacteria>betaproteobacteria
Rpic12D_5003_Rpic_241589866 5 LGMTLFFG---------AEDALSNWHP----ARFTYRG---------------VEFSSVEQFMMYSKARLF-----------------NDDQTARKILSA------SEPREQKRLGREVR-------------------GFDEAVW-----------IIKRKPIVTVGCREKFWQ--------------------------NQPLGEVLLGT------DDTLLVEASPY--------DRIYGVGLAW----------------------NDPRIRDVSQWQGLNLLGEVLMEVRTWLPK 160 241589866 bacteria>proteobacteria>betaproteobacteria
GobsU_010100015693_Gobs_168700969 3 ETFTFFWK-----------HRLSQWHR----APFVICG---------------VTFTHAEQYMMYAKALLF-----------------GDRETAGKLLAA------ETPREQQALGRAVR-------------------GFDESVW-----------VLFREGIVFAGNYARFGQ--------------------------NPDQRELLFST------RGTTLVEASPH--------DRVWGIGLSA----------------------DDPRARDRSRWLGLNLLGATLTRVREALLF 156 168700969 bacteria>planctomycetes
M23134_00353_Mmar_124010457 5 EQFTFFWE---------TRSPLSQWHP----SDFTVDG---------------VAFNCAEQYMMYQKAKLF-----------------EDEQIAAQILRT------KKPRDQKALGRKVR-------------------NFDATTW-----------NNHCKKIVYDANYAKFTQ--------------------------NETLKASLLAT------TGTTLVEASPY--------DKIWGIGLAV----------------------DHPDVQDKSKWQGTNWLGEVLTQLRDDLIS 160 124010457 bacteria
PPE_02438_Ppol_308069201 2 EKFTFFYR---------SHSPFSQWYP----SDFVADG---------------LEFNCAEQYMMLKKAQLF-----------------GDEEAALKIMQV------PTPREQKARGRSVR-------------------GFDQSLW-----------EGNCRQFVYDGNYAKFTQ--------------------------NPNLLKYLLKT------KGTTLVEASPT--------DTIWGVGLAE----------------------SDARIRNRKLWRGTNWLGEILTNLREDVLQ 157 308069201 bacteria>firmicutes
AceceDRAFT_2244_Acel_303240378 2 EKFTFFWR---------SHSPFSQWYI----AKFIING---------------IEFNCAEQYMMYMKAVLF-----------------KDEEISQKILEA------KMPSQHKSLGRKVK-------------------HFNQEVW-----------ESNCKKIVYDGNYAKFTQ--------------------------NPELKQKLLET------KG-TIVEASPV--------DSIWGVGLSE----------------------DDPRIQDRKTWRGKNWLGEVLTQLRDDLLK 156 303240378 bacteria>firmicutes
Sterm_3136_Ster_269121732 2 EKFEFFWK---------SDSPFSQWYK----KGFKVKG---------------KSFNCAEQYMMYMKAVLF-----------------GDEIIAAKILEA------KSPREQKDLGRKVK-------------------NFNKDIW-----------ERQCKNIVYNGNYAKFTQ--------------------------NEGLKSALLET------KGKTLVEASPY--------DTIWGIGLSE----------------------ENPDSKRRSKWRGKNYLGEILTQLREDILK 157 269121732 bacteria>fusobacteria
MXAN_5330_Mxan_108762267 7 QRFTFFWQ---------AHSPFSQWHP----SDFTVDG---------------VRYVCAEQYMMAGKARLF-----------------GDNEALASILSS------KSPKTHKALGRKVR-------------------DFDNTRW-----------EKARERIVYEGNRAKFTQ--------------------------SPELLKALLAT------AGTELVEASPV--------DRIWGVGLDE----------------------EDPRILHPAKWRGLNLLGKVLTKLREDLLA 162 108762267 bacteria>proteobacteria>deltaproteobacteria
Bresu_2709_Bsub_302383816 19 EGFHPFIK-----------GVFSQWHP----TPFAIDG---------------LSFHTAEQWMMFAKARLF-----------------ADDQQADLILAT------PDPATQKRLGQRVQ-------------------NFDQATW-----------DASKINIVYAGNRAKFEQ--------------------------NEGAYRQLKST------SGLMLVEANPR--------DWIWGAGLAI----------------------DDPCLSQPQEWRGVNLLGRILTKVRSDLS- 171 302383816 bacteria>proteobacteria>alphaproteobacteria
C08E8.4_Cele_212646224 12 QTYVLFYE---------DESVFSNFHP----SNFEAETAKKLVNSGMFKEEEMLKFNCSEQYFMYHKALLV-----------------GDVDSAKVIITA------KHPMVMKMTGRQLN-----------------MNRHDIDNW-----------TQKSRDIMYLACLAKFSQ--------------------------NVELRKMLFRT------QDMYLVEASGN--------DAIWGNGIWK----------------------EDKRSDDVANWHGTNYLGEILDRIRGELIG 184 212646224 eukaryota>metazoa>nematoda
T24A6.7_Cele_17564644 13 KQFVFFYK---------FDCVFSNFYP----CEFSAQEFENDVEKN-------VNFNCSEQYFMYHKALLV-----------------GDSEIAGKILKE------TDPRKMKRLGRQLS-----------------MSKKQLEEW-----------SQNSKEVMYNGCLEKFSQ--------------------------NNVCRENLFRT------HGMRLVEASPM--------DRIWGIGLSH----------------------HDKRCENEQTWRGTNWMGSVLDKVREELWT 178 17564644 eukaryota>metazoa>nematoda
LOC588539_Spur_72168255 9 DRYTFFYG--------EKSAPFSQFRA----ANFEVDG---------------VQYTCAEMYMMHQKAVLF-----------------GDHEIAEQILLG------TKPMAMKALGRKVR-------------------NFDEEVW-----------KQNRRQIVKKGNLAKFSQ--------------------------NPDIRAELMAT------RGTTLVEASPR--------DKIWGIGMGK----------------------DNPHAKNKSKWRGQNLLGYILTEVREELEK 165 72168255 eukaryota>metazoa>echinodermata
DR_1263_Drad_15806282 68 TEYLFFYR---------TAHPFSNFHP----SPFSASG---------------RQFHTAEQYIMHRKAEEF-----------------GDHASAKAILQA------RTPAECKALGRRVQ-------------------GFSESHW-----------AQVRGQVAFDAAWHKFRS--------------------------SRRLREFLLDT------GELILVEAAPN--------DRIWGIGYSE-----------------------QDAWEHRDQW-GENLLGQALMQVRERLRD 221 15806282 bacteria>deinococci
Pc16g08100_Pchr_255940726 25 VDTIFFWKI------NSDFGEFSQWYR----SDFVCDD---------------EAFATAEQYMMYKKAMMF-----------------GDSNMSERILCS----SSADPRKHKSMGRKVA-------------------NFNEVIW-----------ESRNMNVAINGNYCKFAQ--------------------------NIDLMKLLLGT------GDKMIVEASPM--------DRIWGIGFDS-----------------------KLAMSNVGRW-GQNRLGKSLMTVRSMIKD 183 255940726 eukaryota>fungi>ascomycota
FG02760.1_Gzea_46111757 7 PGPVYFWKES-----DPEAGYLSQWYY----CPFRDDK--------DER----IRYKTAEHYMMFQKAMLF-----------------KDEHTAIEVLKA------ATPRKVKALGRKVK-------------------NFNEATW-----------LKHRCDIVRHGNILKFTRAISEKGYKKGSPSG---------NPLEGSLLDTLLRT------GDRELVEASPF--------DPVWGIGFKA-----------------------ADAEAARGSW-GENLLGKELMAVRSILRK 184 46111757 eukaryota>fungi>ascomycota
NECHADRAFT_29138_Nhae_302884348 5 SNPLYFWRET-----DPVSGYLSQWYY----CPFRDDG--------DEK----KTYKTAEHYMMHHKALLF-----------------NDEKVALQILRA------GHPREVKSLGRKVS-------------------NFDEATW-----------NAHRREIVRRGNLLKFTNAVSEEGFQKGTPAKGKSAVKRKYEPIEGSLREMLLST------GEREIVEASPF--------DRIWGIGFKA-----------------------ADAEAARESW-GQNLLGLELMEVRRILRE 191 302884348 eukaryota>fungi>ascomycota
PMAA_059590_Pmar_212541268 10 DNPVYFWKP------EGDYGFLGQWWP----SSFSWKT-------DDEE----YTYASAEQYMMHRKALLFAG---------------PEDPITLQIQTG----WKLRPSVIRDLGRQIP-------------------NFSEEAW-----------QQNRYEIVLEGNYLKFSQ--------------------------NEELKEKLLET------GARELVEASPR--------DRIWGIGFGA-----------------------RHAGANRREW-GLNLLGKVLMETRERLVR 174 212541268 eukaryota>fungi>ascomycota
TSTA_012120_Tsti_242799239 9 SNPVYFWRP------EGEYGFLGQWWP----SSFSWKN-------GDEE----FTYANAEQHMMHRKALLFAG---------------PSHPITHQLQKA----WKLEPGTIRDLGRQIP-------------------DFSEQMW-----------QQNRYAIVLEGNYLKFSQ--------------------------NGDLRRELLAT------EDRELVEASPR--------DRIWGVGFGA-----------------------AYASENRREW-GLNLLGKALMETRERLRR 173 242799239 eukaryota>fungi>ascomycota
MGYG_00619_Agyp_315054313 3 SEPIFFWKP------EQEHGYLGQWWK----SDFTVPA-----EDGGKE----LKYENCEHYMMHQKGVLFA----------------PDDPVTQEILAPSG--PVPDPKTIKALGRKVP-------------------NFDDAVW-----------KKERFRIVVQGNYYKFTQ--------------------------NPELKAQLLET------GDRELVEASPR--------DRIWGVGFGA-----------------------KNAPAKRANW-GLNLLGKALMEVRERIRR 170 315054313 eukaryota>fungi>ascomycota
HCAG_05480_Acap_154278399 6 SEPVYFWKP------ESENGYLGQWYT----SDFTWAR-NAADAHGDVEI---VKYDNAEQFMMHRKGLLFA----------------PDDPITQEILARDS--PSPHPRDLRSLGRQIP-------------------NFDDAVW-----------KTHRYAIVVEGNYLKFTQ--------------------------NPQLKEELLAT------GDRELVEASPR--------DRIWGVGFGA-----------------------KNAGARRKHW-GLNLLGKALMEVRERIRK 178 154278399 eukaryota>fungi>ascomycota
LACBIDRAFT_252516_Lbic_170107053 5 DDYVFFWKT------NEKYGWASQWYS----SPFTVKL-KL-EEEGEEEE---VTFASAEHWMMVQKALLF-----------------GDYGKAREILGVEG-VSSSDMAHVKALGRQVS-------------------GFDEAKW-----------VDARQDIVLQGNMHKFSQ--------------------------NGELLEKLMLT------GDKKMVEASPR--------DRIWGIGFGE-----------------------KNALNQRERW-GLNLLGIALEGTRRKLNK 176 170107053 eukaryota>fungi>basidiomycota
PTRG_08392_Ptri_189204778 24 TKPVFFWKP---------NSYLSQWYW----SKFTVDG---------------DTYATAEMWMMVQKARLF-----------------NDEKTAKQMLAT------TKPHEHKALGRQVK-------------------GFEARVW-----------DQHKVQIVTQGNYHKFTIS-----------------------TDAENLRKMLLAM------GERELVEASPV--------DRIWGIGFAE----------------------REAERM-RHKW-GQNLLGKALVKVRGSLRA 180 189204778 eukaryota>fungi>ascomycota
GCWU000342_00580_Ssat_229828516 1 MTVIGFHNP------DEKYGFLSNWYL----SHFTVHG---------------TEFSSVEQYMMYQKAACF-----------------YDEDIASQIMKT------DDVAEIKQLGRAVN-------------------GYDDHVW-----------NGIRQIVVYEGLMAKFSQ--------------------------NQELKEQLMDT------GGAILAECAVR--------DRIWGIGLSM----------------------TDPDRFDRSKWKGQNLLGYALMMVRDRL-- 157 229828516 bacteria>firmicutes
RflaF_010100008155_Rfla_268609453 14 MNVICFHNP------DEENGYLSNWYL----SDFTVDG---------------VKFTSMEQYMMYRKAMCF-----------------HDSDIAAQILET------SDVEQIKALGRLVR-------------------NYDDHHW-----------NGVRQIVIYEGLKAKFSQ--------------------------NPDLLKMLKDT------GDALIAECAVK--------DRIWGIGLSM----------------------TDPDRFDRTKWNGQNLLGYALMMVRNILTV 172 268609453 bacteria>firmicutes
HOLDEFILI_02959_Hfil_223985602 2 MKIVCFHNP------DEENGYLSNWYP----SRFIVKN---------------RVFSSMEQFMMVRKAVCF-----------------HDDSAAAQILAT------EDVARIKELGRHVS-------------------NYDDHHW-----------NGIRQIVVYEGLLAKFSQ--------------------------NEDLKEQLKAT------GDAVLAECAVK--------DRIWGIGLSM----------------------SDPDRMNREKWQGQNLLGYALMMVREQL-- 158 223985602 bacteria>firmicutes
GCWU000341_01684_Osp._291459520 1 MNVIGFHNP------EEENGFLSNWYL----SAFRSDN---------------IDFSSLEQFMMYRKAVCF-----------------RDDESAARILST------DDTAKIKALGRLVS-------------------GYDGHIW-----------NGIRQLVVYEGLLAKFSQ--------------------------NESLKRDLLDT------GDALLAECAVK--------DCIWGIGLSM----------------------TDPKRFDPSQWRGQNLLGYTLMMTRSKLAA 159 291459520 bacteria>firmicutes
_Bado_154487137 2 TDIICFHNP------DEENGYLSNWYP----SRFVVVD---------------VEFSSMEQYMMYRKACCF-----------------NDAETAARILRT------SDVAEIKRLGRLVA-------------------GYDDHVW-----------NGVRQIEVYEGLLAKFSQ--------------------------NAELGAQLVAT------GNAILAECAVK--------DRIWGIGLSM----------------------HDPARLDPAQWRGQNLLGYALMLTRKKLNR 160 154487137 bacteria>actinobacteria
ROSINTL182_08410_Rint_240146453 1 MDILCFHNP------DEENGYLSNWYM----SQFDVNG---------------IGFSSMEQYMMYKKAVCF-----------------RDDVIAEKILET------DEVGSIKELGRMVA-------------------GYNENYW-----------NGIRQIVVYEGLIAKFSQ--------------------------NDKLREGLLHT------KDQILAECAVK--------DRIWGIGLSM----------------------KDPDRMDLSKWRGQNLLGYTLMMIRDRL-- 157 240146453 bacteria>firmicutes
M23134_07250_Mmar_124009340 129 DEKFYFFSS--------SDSPFSTLYK----AKFIIQG---------------ITYNSVIQYIAHHKARLF-----------------LDRGIEKGILKS------DSQKEIYQLSLQVK-------------------NYDKVTW----------HNMYLGQHISFAYQQQFLQ--------------------------NEYLKDVLFST------EGKTIVLSDKN--------DEKWGIGLSQ----------------------LNSKALQRNTWLGKNFLGEILTRLRIELMG 286 124009340 bacteria
PSPA7_5219_Paer_152985284 16 FKYLYFWGHRPAADDQVGKSCFSQWYE----ASFKLGG---------------VRYASAEHYMMAAKARLF-----------------DDRKLLERILAA------RSPGEAKALGREVA-------------------GFDEALW-----------SAERMGIVIEGNLGKFGQ--------------------------NASLKKYLLGT------ADRVLVEASPV--------DAIWGIGLAA----------------------TDPQATEPAAWRGLNLLGFALMEVRRRLAQ 180 152985284 bacteria>proteobacteria>gammaproteobacteria
MDS_1227_Pmen_330502141 20 FDYLYFWGHSRAAGAPVGKSCLSQWYP----SAFTLDG---------------IHYATAEHFMMAGKARLF-----------------DDAEALERILAA------RAPNEVKAIGRQIR-------------------GFDEARW-----------RESRQAIVFEGNLGKFSQ--------------------------DPELARYLLDT------APRVLVEASPV--------DPVWGIGLAE----------------------GDSNVRTPATWRGLNLLGFALMQVRECLLN 184 330502141 bacteria>proteobacteria>gammaproteobacteria
_Kora_238022350 20 LKYVYFWGHTPKQKGIADEAVFSQWYP----APFELDG---------------ERYATAEHYMMAEKARLF-----------------GADDIRCQILQA------GSPAQAKALGRQII-------------------GFQDDIW-----------NAHRFDIVCRANHAKFSQ--------------------------HPDLKTFLLQT------GERILVEASPV--------DSIWGHRLGA---------------------RRPPRRKPVAMARLEPARLRADESARPIAGS 188 238022350 bacteria>proteobacteria>betaproteobacteria
BBR47_45420_Bbre_226314127 19 VKYLFFWGHTQKDSGTTDKSCFSQWYP----AAFVEDG---------------ITYLTAEHYMMAKKAELF-----------------GDLAIRDEILRK------NHPKQAKDLGRKVH-------------------SFDEAVW-----------NANKTAIVRQANLLKFSQ--------------------------HADLKAYLLDT------GDRIIVEASPY--------DRIWGIGMAQ----------------------DHPHAEQPEKWRGENLLGFALMAVREQLRS 183 226314127 bacteria>firmicutes
ABSDF2913_Abau_169634335 21 FKYLYFWGHIPKKANLIDKSCFSQWFP----AQFNVEG---------------IEYFTAEHYMMAQKAKLF-----------------NDKEIFAQILQV------KHPNEAKQLGRKVR-------------------NYDEQIW-----------REKRFDIVVQANFAKFSQ--------------------------HPELKKFLLAT------KDRILVEASPV--------DKIWGVGMAQ----------------------DHPHIQDPSLWQGLNLLGFALIHVRELLLT 185 169634335 bacteria>proteobacteria>gammaproteobacteria
HMPREF0012_02967_Acal_262281016 20 FKYLYFWGHTPKQVDLIDKSSFSQWYP----VQFKDEG---------------IEYLTAEHYMMAQKAKLF-----------------NDEGIFAQILQV------KHPNEAKQLGRKVR-------------------NYDEKIW-----------QEKRFDIVVQANFVKFSQ--------------------------HPELKNFLLAT------KDHILVEASPV--------DKIWGIGMAQ----------------------DHLHTQDPSQWQGLNLLGFALMHVRDQLLA 184 262281016 bacteria>proteobacteria>gammaproteobacteria
LMHCC_1724_Lmon_217965001 18 LKYIFFWGHQPAEDGKISKSCFSQWWI----CSFKVDG---------------VEYNCAEQFMMAEKAKLF-----------------NDMEMREKILAA------KHPKQAKDFGRLIS-------------------GFQEDIW-----------LKNRFNIVMRANQAKFSQ--------------------------NEELKKFLMQT------KNRILVEASPV--------DKIWGIGMAT----------------------DNKNVENPLYWKGLNLLGFALMVVRDELEN 182 217965001 bacteria>firmicutes
PROPEN_00827_Ppen_226326967 16 IKYIYFWGHQ-SKGNDITKSCFSQWYP----APFILDD---------------VRYASAEHYMMAEKAKLF-----------------NDIDVRKRIITA------SNPGSAKALGREVK-------------------GFDQDIW-----------EQHRMDIVIRANIAKFSQ--------------------------NKELGNFLIST------GNRVLVEASPV--------DKIWGVGLSE----------------------QDNEINNPLLWKGLNLLGFALMKVRSILIE 179 226326967 bacteria>proteobacteria>gammaproteobacteria
EHI_017590_Ehis_67472915 30 HQYTYFWKP--SIEEEVNKSCLGNWYP----SEFDYDG---------------IHYYFCEQFLMGCKAKLF-----------------GDDQIFKLILDS------RNPYEMKKLGKKVK-------------------GFNQEVW-----------DEYKAAVMFEGGLAKFTQ--------------------------NPQLRRFLMET------GDDILVEASKF--------DAVWGIKMEE----------------------SDERANDPHQWCGENILGFTLMSIRDYLLV 192 67472915 eukaryota>amoebozoa>entamoebidae
CCC13826_2022_Ccon_157165319 106 DKFLLFWGHQKSA--NLSASCLSQWFN----SIFWQDE---------------TKYICAEQYMMAKKALCF-----------------GDKEALKQILSA------KDPAQMKGLGRQVR-------------------GFDAKVW-----------DEVKFGVVLNASYLKFSQ--------------------------NAPLRDFLLQT------GSKILVEASPV--------DKIWGIGLGA----------------------SDENAQNPMKWRGQNLLGFALMRARDEIAK 268 157165319 bacteria>proteobacteria>epsilonproteobacteria
ANACOL_01151_Acol_167769817 19 CRFLFFWGHTPPADGHVNESCLSQWWM----CRFSAGG---------------VEYNCAEQYMMAEKARIF-----------------GDNEMLEKIMAS------KFPKEMKAYGRAVR-------------------NFDQAVW-----------DSRCYDRVLTGNLAKFGQ--------------------------NADLWEFLAGT------KGHILVEASPR--------DRIWGIGMGK----------------------QNPNAPNPTLWRGKNLLGFALTEAR-ELLQ 182 167769817 bacteria>firmicutes
GYMC10_6272_Psp._261410041 18 FKYVFFWGHTPPKDGSVDKSCFSQWWM----CPFTVEG---------------TEYSCAEQFMMAEKARLF-----------------GDNEMLESILTA------KHPKEMKAYGRAVR-------------------NFDKDTW-----------DKECYGIVKRASLAKFSQ--------------------------NPELGDYLKST------KNRILVEASPR--------DRIWGIGMGQ----------------------SNPDAENPVKWRGRNLLGFALTEARDELLQ 182 261410041 bacteria>firmicutes
HMPREF1977_0666_Coch_315224011 151 LKFLFFWKPNAD---AIDESCFSQWQL----SPFNVNA---------------NEYSCTEQYMMAEKARLF-----------------DDEEVEKEIMNT------TDPKLIKALGRKVR-------------------NFDPAVW-----------DKVKYSIVLNGNYYKFTQ--------------------------NQAMMDFLLST------GDKILVEASPL--------DTIWGIGLGK----------------------DNEKAFNIASWRGKNLLGFALMEVRDELRK 312 315224011 bacteria
HMPREF9071_1307_Csp._326335654 113 LKFVFFWKPNCK---VVDESCFSQWQP----SSFCIDG---------------DEYSCTEQYMMAEKARLF-----------------GDKEVEEEIMNT------SDPKLMKALGRKVR-------------------NFDPQVW-----------DKAKYSIVLNGNYYKFTQ--------------------------NKEMMDFLLST------GDKILVEASPM--------DTIWGIGLSK----------------------DNEKSQNIAAWRGKNLLGFALMEVRDEIRK 274 326335654 bacteria
Cbei_3546_Cbei_150018370 104 LEYIYFWGHHPKKDGGITKSCFSQWWK----SRFNIGH---------------TEYLFMEQYMMAEKARFF-----------------GDKEIEEKIMNS------YDPKEIKIFGRKVR-------------------GFDEEIW-----------NRAKYSIVINGNYNKFMQ--------------------------NERLKTFLLST------GDKILVEASPY--------DNVWGIQMSE----------------------EDVNIKNPELWRGENLLGFALMEVRNEIKR 268 150018370 bacteria>firmicutes
_Fpra_160945914 125 RELCLFWGHQPAKDGQLTKSCLSQWWT----EDFWFVA---------------NTYLCMEQYMMAGKAELF-----------------GDQEIREQILKC------SDPKQIKALGRKVR-------------------GFDQKVW-----------DKFKYAIVLNGNWCKFSQ--------------------------NRDLREFLLST------GDSVLVEASPY--------DNIWGIRLSA----------------------NSPEAQDPMKWRGQNLLGFALMEIRDELRR 289 160945914 bacteria>firmicutes
LMHCC_1997_Lmon_217965272 94 YNFNQMKNENQPELYLFENCYFSHCWM----EEFSVST---------------QKYCCMEQFMIEQKAELF-----------------NDTTTKQKVLET------NSLEQIQALDKEVQ-------------------SFDQDIW-----------DKFKYAIALYGNWNKFNQ--------------------------KRILRDYLLST------GYSILVETNPS----------------------------------------GSPNMPNPLKRHGQNLLGLALMELRDELRR 248 217965272 bacteria>firmicutes
BHWA1_00589_Bhyo_225619532 82 IDFLFFYGHT-NDKKEVTKSSLSQWYI----KDFRDND---------------LVFNCMEKYMMYNKALLF-----------------DDKDIANEILNN------NQPKAIKELGRKVK-------------------NFNDEIW-----------DKMKYKIVFTGNYYKFSQ--------------------------NTDLRNFLIST------KNKVLVEASPY--------DKVWGIKMKY----------------------DDENIENPFYWKGENLLGFALMEVRDEIKR 245 225619532 bacteria>spirochaetes
Bmur_0365_Bmur_296125416 85 IDFLFFYGHS-NDKKEINKSSLSQWYI----KDFREND---------------LTFNCMEKYMMYNKALLF-----------------DDKNIADEILNT------NQPKAIKELGRKVK-------------------NFNDNIW-----------NNMKYKIVFIGNYYKFSQ--------------------------NTDLRNFLLST------KNKVLAEASPY--------DKVWGIKMKY----------------------DDENIENPFCWKGENLLGFALMQVRDEIKR 248 296125416 bacteria>spirochaetes
CPR_0151_Cper_110802054 18 LEFLFFWGHTKNKNGKITKACFSQWYL----SDFTVNG---------------VLYNCAEKYMMAEKARLF-----------------KDYETLEEILSA------ENQKEIKDLGRKIK-------------------NFNEELW-----------NREKYEIVKRGNLAKFSQ--------------------------NENLKEFLLNT------GDKIIVEASPY--------DSIWGIGMGA----------------------KDENIEDPTAWKGENLLGFALMEVRDLLNK 182 110802054 bacteria>firmicutes
FSDG_00336_Fsp._237744336 18 LKFLFFWGHTENG-AETTKACFSQWYS----CKFVVDE---------------IIYHTAEQYMMAQKTLLF-----------------NDNEIFHKIMSS------KSPKEYKELGRKIK-------------------NFSDSKW-----------NENKYQIVLKGNIAKFSQ--------------------------NEKLKVFLLNT------DTKILVEASPY--------DKIWGIGLSA----------------------DQENIKNPLTWNGENLLGFALMEVRDLLNK 181 237744336 bacteria>fusobacteria
AceceDRAFT_0731_Acel_303238852 110 IKYLFFWGHQPSVDGSITKTCFSQWWK----SDFTIDI---------------EDYCCMEQYMMAEKARLF-----------------EDKEILEEIMKS------KHPKQIKELGRKVR-------------------NFDEEVW-----------KKKRYSIILNGNYAKFLQ--------------------------NEELRQFLIQT------QNRVLVEASPY--------DKIWGIGMSA----------------------DDEHIENPLEWQGLNLLGFALMEVRDELIR 274 303238852 bacteria>firmicutes
Fjoh_0750_Fjoh_146298513 12 SKFLFFWGHQPSKDGTITKNCFSQWWL----SSFKVNE---------------VTYKTAEHWMMAKKAELF-----------------NDQEILEKIIQC------NSPAEAKKLGRKVK-------------------NYDDKIW-----------LENRFEIVKEGNYHKFSQ--------------------------NSDLKTFLLNT------NDRVIVEASPV--------DPIWGIGMAG----------------------DHKDALNPEKWKGLNLLGFALMEVRDELR- 175 146298513 bacteria
KAOT1_16128_Kalg_163754439 29 LKFLFFWGHQPSKDGSITKSCFSQWWE----DAFTVNN---------------EIYKTAEHWMMAEKARIF-----------------NNSEIRKEILMA------SHPHDAKKLGRKVK-------------------NFDPIIW-----------DEHKFNVVVEGNYHKFSQ--------------------------HEDLKQFLLNT------KNRILVEASPR--------DRIWGIGMSE----------------------KNEKATNPNLWRGQNLLGFALMEVRDHLKK 193 163754439 bacteria
Cpin_0074_Cpin_256419128 18 LNFTFFWGHK-GEPGNVTKSCFSQWWP----SAFTDGT---------------HTYATAEHWMMAGKARLF-----------------KDPAMEQEILQT------SDPATAKKLGRKVA-------------------NFDTALW-----------DVEKFSLVVQGNLLKFSQ--------------------------YPKMKEFLLST------GDSIIVEASPL--------DRIWGIGMGA----------------------NHEHAANPLLWKGQNLLGYALMEVRDQLKQ 181 256419128 bacteria
HMPREF0204_10236_Cgle_300774513 18 IKFLFFWGHT--TKDTITKSCFSQWFP----GKFEENG---------------TIYKTAEHYMMAGKARLF-----------------NDPETEEKILKA------NTSNQAKALGRKVK-------------------NFDPKQW-----------DEHKFEIVTRGNLLKFSQ--------------------------NQKFKDFLLST------GDKVLVEASPY--------DRIWGIGMLD----------------------TDSRAENPLLWNGENLLGFALMEVRDELRG 180 300774513 bacteria
EcSMS35_3361_Ecol_170684265 21 VKYLWFWGHQPAANHEITASCFSQWWQ---GSPFTYDG---------------ITYATAEHWMMAGKARLF-----------------NDSKTLARILAA------ATPAEAKKLGRQVT-------------------NFDEQCW-----------QACCFDLVCEGNYHKFSQ--------------------------HSALKTFLLNT------QPRILVEASPV--------DKIWGIGLAK----------------------DHPHAGVPSHWKGKNLLGFALMVVRDRLA- 185 170684265 bacteria>proteobacteria>gammaproteobacteria
CIT292_10857_Cyou_283836396 21 FDYLFFWGHRPSSSGAITASCFSQWWP----SPFEVDG---------------ITYASAEHWMMAEKARLF-----------------GDESTLLRILSA------KSPAEAKAFGRQVS-------------------GFNQQVW-----------EENCFESVCKGNVHKFSQ--------------------------HPELGEFLIST------RTLVLVEASPV--------DRVWGIGLAQ----------------------DDERAGDPLRWNGSNLLGFALMVVRDRIAN 185 283836396 bacteria>proteobacteria>gammaproteobacteria
Slin_1821_Slin_284036735 18 IKYLFFWGHQKSKSGDLTASCFSQWWT----SPFIIDK---------------VKYNTAEHWMMAQKALLF-----------------GDKEVYDKIIVA------KSPAEAKSLGRQVR-------------------NFDEATW-----------SAKRSGIVVQGSLQKFTQ--------------------------HPDLKEFLLNT------KERVLAEASPV--------DKIWGIGLAA----------------------DSDKAENPKRWNGLNLLGFALMEVRDILRK 182 284036735 bacteria
Ndas_4523_Ndas_297563442 23 AEYLCFWGHQPPASGGVSASCLSQWWP----ADFTVEG---------------VGYRTAEHYMMAAKARLF-----------------GDAEAEERILAA------GHPRDAKVIGRQVR-------------------GFDEREW-----------EAARFGIVVEGGLGKFGQ--------------------------NPELREFLLGT------GGRVLVEASPR--------DRVWGIGLGA----------------------ENDDARVPERWRGLNLLGFALMETRARLAA 187 297563442 bacteria>actinobacteria
AMED_1633_Amed_300783556 23 PEYLLFYGHTPSKSGRVTASCLSQWWV----DPFEADG---------------VEYPTAEHYMMAGKAALF-----------------GDHEKAELIRTT------PDPKAAKVLGREVA-------------------GFDAAIW-----------ERHRFDIVVDGNLAKFRA--------------------------HRDLRRFLLGT------GDAVLVEASKK--------DLVWGTGLAR----------------------EEKNATKPDYWRGLNLLGFALMEVRDQLRA 187 300783556 bacteria>actinobacteria
Caci_2927_Caci_256392113 28 PKWRLFFGHRARIPGVVDEACLSQWWP----AEFRIGS---------------ITYFTAEHWMMVSKAQLF-----------------GDSDAWARVLST------RDPAVAKRAGRNAC-------------------DFDETTW-----------AAVRFGLVVAGNYAKFAQ--------------------------NSDLRAFLAGT------AGEVLVEASPY--------DRVWGVGLAA----------------------SHRDVRDPAAWPGLNLLGFALMRVREELMA 192 256392113 bacteria>actinobacteria
Plim_2199_Plim_296122446 17 IEFLYFWGHTPPENGEVNHACLSQWYP----SPFTIDG---------------VVYPTAEHWMMASKARLF-----------------GDFATLAEIRAT------ISPKEAKAAGRKVR-------------------DFDEARW-----------EAHRFRFVVDGNWAKFTQ--------------------------NHTLRQYLLGT------GTKVLIEASPT--------DHIWGIGLSE----------------------QEARNSSPEHWPGLNLLGFALMEVREQISE 181 296122446 bacteria>planctomycetes
Kfla_1718_Kfla_284029681 20 YKYVFFWGDTPSADGQADASCLSQWYR----APFTVGE---------------VRYPTAEHWMMAAKARLF-----------------GDRDAERDVLAA------GHPQQAKAIGRTVR-------------------GFDTEVW-----------QQHRFDLVVEGNVRKFEQ--------------------------NPVLRDYLLGT------GERVLVEASPV--------DRIWGIGLAA----------------------DDERAEHPDQWRGLNLLGFALMQVRDQLTT 184 284029681 bacteria>actinobacteria
SSGG_05341_Sros_291448123 25 VKYLPFWGHRPRPDGRIGASCLSQWWP----SPFTVDG---------------VTYASAEHWMMAGKARLF-----------------DDPEAEAAAVTA------KSPAAAKKAGRLVR-------------------GFDEDVW-----------IGERFALVVAGSVHKFGQ--------------------------DPELAGYLLGT------GDRVLVEASPR--------DRIWGIGLAA----------------------DDERAERPQEWRGLNLLGFALMEARERLRA 189 291448123 bacteria>actinobacteria
SGM_1884_Sgri_329936685 21 VKYLYFWGHQERPGGRLGASCLSQWWP----SPFIVDG---------------VEYATAEHWMMAGKARLF-----------------GDADAERLALAA------PHPAQAKKAGRQVR-------------------GFDEAVW-----------RRERFRIVVEGSVHKFGA--------------------------DEELREFLLGT------GERVLVEASPL--------DRVWGIGLAA----------------------DDEAAGDPERWRGDNELGFALMVARERLRE 185 329936685 bacteria>actinobacteria
SSRG_01621_Sgri_302558106 33 VRYLHFWGHRPGPDGRVGASCLSQWWP----SPFTVDG---------------VEYATAEHWMMAAKARLF-----------------ADPEGERRVLAA------EHPAQAKKAGRLVR-------------------GFDEAIW-----------RRERFGVVVEGSVHKFAA--------------------------HDDLRAFLLGT------GDRVLVEASPV--------DQVWGIGLAA----------------------HDEGAADPERWRGPNLLGFALMEARARLRA 197 302558106 bacteria>actinobacteria
KSE_25370_Kset_311895942 113 PKYLCFWGHRPQRDGQIGPGALSQWWP----SPFTVDG---------------VRYDTAEHWMMAGKARLF-----------------GNEEIVPRILGA------RTPAEAKNLGRLVT-------------------GFDEDRW-----------VEHRFELVVTGSTAKFGQ--------------------------DERLRTYLLRT------GERVLVEASPL--------DRIWGIGLAA----------------------DDQRANSPAQWQGSNLLGFALMEARARLAG 277 311895942 bacteria>actinobacteria
_Ctes_221067792 23 PKYLCFWGHQAERNGSVGKGCLSQWFS----APFTVEG---------------DRFATAEHFMMAGKARLF-----------------GDEEARAQVLAA------PSPASAKQIGRSVR-------------------NFDEARW-----------KAECFDIVVSANVAKFTQ--------------------------NPAMGEFLLRT------GERVLVEASPR--------DRIWGIGLGA----------------------THPDAEQPRKWHGQNLLGFALMAARTQLRA 187 221067792 bacteria>proteobacteria>betaproteobacteria
PFL_5821_Pflu_70733106 86 PDCLMFWGHQPTRDGRISQSCFSQWFD----AGLELDG---------------IQYPSAEHFMMAGKALLF-----------------GDQETHGRILKA------VTPADVKQLGREVR-------------------GFDDARW-----------TEARLDIVVQGNLAKFSQ--------------------------HQALGEYLLST------GDQVLVEASPV--------DRIWGIGLAA----------------------EDARASRPEQWRGLNLLGYALMEVRDRLRI 250 70733106 bacteria>proteobacteria>gammaproteobacteria
Daci_5761_Daci_160901192 23 PRFLPFWGHQPAADGSIGKTCMSQWFE----AGFEVEG---------------QHYPTAEHFMMAGKARLF-----------------GDEAAHAAIVRC------RTPGEAKKLGRGIQ-------------------GFDEAAW-----------VAARMDIVVRANEAKFSQ--------------------------NPALARYLLNT------GDRVLVEASPV--------DAIWGIGLAA----------------------DDVRATDPARWQGLNLLGFALMQVRARLRS 187 160901192 bacteria>proteobacteria>betaproteobacteria
Amir_3505_Amir_256377585 7 MGHLFFWGHTPHRDGELGRECLSQWWE----RPFELDG---------------RVHPTAEHAMMTGKALLF-----------------GDERTAGRVAEA------RTPGEAKSLGRQVR-------------------GFDEDTW-----------ARERLELVARLNEAKFGQ--------------------------HDDLRAYLLGT------GGRVLVEASPV--------DRIWGIGLAA----------------------DDPRATDPDQWRGLNLLGEALMLARARLAA 171 256377585 bacteria>actinobacteria
Caci_5873_Caci_256395008 3 VKYLFFWGHTPNRPGTVGAECLSQWYP----APFEVDG---------------LRFATAEHSMMWGKAQLF-----------------GDEQAAARIVAA------GHPKEAKDLGRTIR-------------------KFDEDTW-----------VAERVAIVTAGNVEKFRQ--------------------------NPDLLAFLLTT------GERVLVEASPM--------DRIWGIGLAS----------------------DDERAQDPARWRGLNLLGEALMAARKTLRG 167 256395008 bacteria>actinobacteria
Sros_2401_Sros_271963927 26 LRYLFFWGHRPPRGGGVGAGCLSQWWE----VAFTVDG---------------HLFRSAEHYMMAHKAWLF-----------------GDGETAVRILAA------GHPGEAKKLGREVR-------------------GFDESVW-----------NEHRYEIVVGANIAKFGQ--------------------------HPELGDFLLGT------RGRVLVEASPV--------DRIWGIGLTA----------------------DDERAASPATWQGLNLLGFALMDARDALDT 190 271963927 bacteria>actinobacteria
FRAAL2340_Faln_111221771 24 LRFRYFWGQRQAVADGTGAGCLSLRWP----ARFAVDG---------------VDYPSAQHYVLARKAGLF-----------------GDQAAAEAVLAL------PAPISLAAVGRRIR-------------------GFDEAVW-----------DRHRYAVALAANSAKFAQ--------------------------NAILRTYLAGT------AGLVLADISPR--------DRVWGIGCDR----------------------DDDRAGRPSAWPGRNLLGFALMEVRDALLA 188 111221771 bacteria>actinobacteria
FrEUN1fDRAFT_4219_Fsp._288920206 31 LAFRYFWGHRRPAGGGIGPGCLSQWWA----VEFTVEG---------------RRYASAEHFMMERKARLF-----------------GDDETAEEILAA------PDPGRAKALGRRVR-------------------GYDDARW-----------ERHRHGVVVAGNTAKFGQ--------------------------HDDLRGYLLST------GSDILVEASPL--------DAIWGIGLAA----------------------SDERAGRPARWPGLNLLGFALMDVRAALAN 195 288920206 bacteria>actinobacteria
FraEuI1c_6936_Fsp._312200713 33 LSFRFFWGHRPPAGGGVGASCLSQWYP----SPFTAEG---------------QRYATAEHFMMAGKARLF-----------------GDDKTVDAILGA------PDPGRVKALGRRVA-------------------GFDEATW-----------ERHRYDIVVAGNLAKFGQ--------------------------HDRLRGFLLAT------GDDVLVEASPL--------DTVWGIGIAA----------------------GDPRAEHPIDWPGLNLLGFALMDVRAALRS 197 312200713 bacteria>actinobacteria
VAB18032_22000_Vmar_330468357 21 VKFLFFWGHQPQRDGSVGAGCLSQWWS----APFTIDG---------------LRFATAEHYMMWRKATLF-----------------DDHATAARVLAA------AHPHAAKMLGRQVT-------------------GFDQHVW-----------EQHRYDIVLTGTVAKFDE--------------------------HPALRTYLIGT------GERVLVEASPL--------DRIWGIGLAA----------------------DHPHATDPARWRGLNLLGFALMQARDILTG 185 330468357 bacteria>actinobacteria
Micau_3582_Maur_302868047 29 VKYLHFWGHRPRPDGSVGASCLSQWWP----AAFTVDG---------------REFATAEHWMMWHKATLF-----------------GDHAIAERVLAA------GHPHRAKALGRQVR-------------------DFDEATW-----------TARRYEIVVAGSVAKFGR--------------------------HEPLRRFLLGT------GDRVLVEASPT--------DRIWGIGLTA----------------------DDPRAADPATWRGDNLLGFALMEARATLAG 193 302868047 bacteria>actinobacteria
MCAG_03098_Msp._238062132 50 VKYLFFWGHRPQPDGSIGPGCLSQWWP----APFVVNE---------------VRYATAEHYMMVGKARLF-----------------GDEATAARMLTV------PSPGAVKALGRQVQ-------------------GFDQTVW-----------DAHRFDLVVAGNVAKFGQ--------------------------HPELRKYLART------GNRILAEASPV--------DRIWGIGLAA----------------------TDPRTCNPAQWRGLNLLGFALMHARAQLAT 214 238062132 bacteria>actinobacteria
NBCG_01909_Nbac_326330475 37 PRYVHFWGHTPKGPG-VGMHVLSQWWP----KVFADAD--------------GRSFASAEHYMMWRKAVLF-----------------GDDRTAARILDA------ASPGAAKALGREVS-------------------GFEDEVW-----------LEHRWRIVVEGSTLKFGS--------------------------DPALRDYLLAT------RGRVLVEASPR--------DRIWGIGLGK----------------------SSPYAEEPARWNGLNLLGFALMEARNRL-- 199 326330475 bacteria>actinobacteria
EFP_gp169_BPphiEF24C_158079465 2 SKYILFWGHTPSKRNKLGKECLSQWYP----SQFTAPI---------EGLGEDIIFPTAEHYMMVRKAMLF-----------------NDVDTAKRILKT------ESPKDAKRLGRQVK-------------------NFEEDLW-----------VKHRKSIVLDGNTYKFTQ--------------------------NDSLRNFMLSIP-----KGTKFAEASPF--------DKVWGIGLRE----------------------SDPRSRDMSKWEGLNLLGEVLTEVRENLN- 172 158079465 dsdna viruses, no rna stage>caudovirales
SS1G_05618_Sscl_156053544 46 LFELGFSR---------HTPFTSNPLC--------------------------KRTSTIFTYFQAVKAWVV-----------------KDRSKFMQIAHT------RSGLEAKKLGNAIK-------------------DLPVARW-----------DQISRHVMADALYFKFNH--------------------------NADIRNELIST------GSKVLIEARD---------DRVWASGIKT---------------------VKATAKTPISEWQGQNKLGEELMRLRHFFR- 193 156053544 eukaryota>fungi>ascomycota
GSTUM_00003347001_Tmel_296414614 4 NPPIYFREDDLRY----YPFCLSHTCTF--TSSPTGPG-------NTAPPGVCCYFTSLTQYLQYRKALFF-----------------YDHRAAEDILTT------SDVSLIMSISRRIN-------------------GLQVEVW-----------NGMRNTLVREGLMLKFGQ--------------------------NEELRRLLLDT------GDRELVYASG---------TRDWGVGFAP----------------------TDAGKS-RDSW-GLNLLGQALMDVRRRLRE 171 296414614 eukaryota>fungi>ascomycota
F44E2.8_Cele_32565136 54 DNVVYFNG---------PTHYLSALYP----CTVVVDG---------------NEYNSVEHYYQACKLYVL-----------------TGEQSAAQLKAS------ETPIEVKKATKNILKEAK-------------IPAKKISAW----------KDKDSIAVLKHVIYHKFNQ--------------------------NDELKVKLLDT------GDKILIQTYIG--------DTYFAAGANAKYTSTWVDRHVNQSLKYPENVVVDNVQYLPLVANGKNVLGWILMQVRDELRM 238 32565136 eukaryota>metazoa>nematoda
consensus/100% - ....................................................................................................................................................................h.........................................................h......................................................................b.....
consensus/95% - .....h...............hsph........h.....................h.s.-.hhb..+...h.........................h..........ps......s.............................W..................h......bh.p.............................h...L..o..........lhp............s..au.........................................s.hs..h...R..h..
consensus/90% - .....F...............hoph........h.h...................a.s.E.hhb..K...h.........................l..........ps......up............................W..............p..hh..s...Ka.p..........................p..h...Lh.T..........lhc.s..........D.hWu.......................................G.N.LGb.L..hR..l..
consensus/85% - .....F.............s.hSpa........h.hps.................a.ssEphhbh.K...F..................s......lb.........ps..h..hu+.........................p..W...........p..p..lh..s.b.KF.p..........................p..h...Lh.T.......s..llE.s..........D.hWG.s.....................................G.NbLGbhL..hR..l..
consensus/80% - ...l.Fa............s.hSpa........h.hps.................a.ssEpahbh.K...F..................s......lb.s.......ps..h..hG+p........................p..W...........p..+..lh..u.b.KF.p..........................p..h.pbLl.T.......s..llE.ss.........D.hWG.u.....................................GbNbLGbhLhplRp.l..
consensus/75% - ...lbFa............uhhSpa.......sh.hps.................asosEpahbh.K...F..................s.....pIb.s.......sP.ph..hGRp.p......................c..W...........p..+.plh.pu.b.KF.Q..........................p.plbpbLLsT......ss..llEsos.........D.hWG.G.s..................................pGbNbLGbhLMplRppL..
consensus/70% - .p.lbFa..........s.uhhSpa.......sh.hcu.................asosEpahbu.K...F..................c.p..ppIb.s.......sP.phb.hGRp.p......................c..W...........pp.+.plhbpu.b.KFpQ..........................p.plbphLLsT......ss..LlEsos.........D.hWGhG.s..................................pGbNbLGbhLMplRppL..
#====== global.consesus
consensus/100% - ....................................................................................................................................................................h.........................................................h............................................................................
consensus/95% - .....h...............hs.h........h.......................s.c.hhb..+...h..........................................................................h.................hh.......h...................................l.............h.c............p.............................................s.h.............
consensus/90% - .....h...............ho.h........h.......................s.E.hhb..K...h.........................h..........ps......sp............................a.................hh.......h.p..........................p..h...l.............h.-............c...s.........................................s.h.b.....p..h..
consensus/85% - ...h.h...............hS.h........h..ps.................h.s.E.hhb..K...F.........................hb.........ps..h...s+............................a..............p..hh.......h.p..........................p..h...Lh............h.-.p..........c..hs.........................................s.h.bhhb..+..l..
consensus/80% - ...l.h...............hS.a........h.hps.................h.ssEphhbs.K...F..................s......lb.........ps..h...s+............................a..............p..hh....b.bh.p..........................p..h.p.Lh.s..........lh-.s..........-..hs.......................................u.s.hsbhhhp.R..l..
consensus/75% - ...l.h.............s.hSpa........h.hps.................a.osEphhbu.K...F..................s.....plb.s.......ss.phb..uR............................W...........p..+..lh..s.b.+h.p..........................p.pl.pbLl.T..........lh-.s..........D.hau.s.....................................GbNbLGbhlhphR..l..
consensus/70% - .p.lbF.............s.hSpa.......sh.hpu.................a.osEphhbu.K...F..................s.....plb.s.......ss.phc.huRp.p......................b..W...........pp.+..lh..s.b.KFpp..........................p.plbpbLl.T.......s..ll-.ss.........D.hWGhs.....................................GbNbLGbhLhphRpbL..
Back to Contents
ALIGN ---EEEEE----HHHHH-H----------------------HHHH-------------------EEEE--------------EEEEE-------------------EEEEEE--HHHH-----------EEE-----------------------HHH-HHHHHHHHHH-----------------------HHHHHHHHHHH-----HHHHHHHHH---------HHHHHHHHHH------------EEE------
HMM -HHHHHHHHH--HHH-------H--HHHHHHH-----HHHHHH----------------------HHHHHHHHHH------H--EEE---EE--------------------E-----E-------EEEEE---------HH-------------------------EEE--------E---HH-------EHH---EEEEEE------EEEEEEE-----------------EEE--E----H----EEEEEE---
FREQ --EEEEE-----HHHHH---------HHHH----------HHHHHHHH----------------EEEE------H-------HHHHH-------------------EEEEEE--HHHH----------EEE---------HHH-----------H-HH-HHHHHHHHHH-----------------------HHHHHHHHHH-------EEEEEEE-----------HHHHHHHHH-----------EEEE------
PSSM ---EEEE----HHHHHH-H-----HHHHHH---------HHHHHHHH-----------------EEEEE---------------HHHHH-----------------EEEEEE-----------------EEE----------------------HHHH-HHH-----------------------------------EEEE----------EEEEEE---------HHHHHHHHHH-------E---EEEE------
FINAL -EEEEEE----HHHHHH-H------HHHHHH--------HHHHHHHHH----------------EEEE---------------HHHHH------------------EEEEEE----------------EEEE-------HHHHH-----------HHH-HHHHHHHHHH-------------------------HHHEEEEE-------EEEEEEE-----------HHHHHHHHH-----------EEEEE-----
225620246 KLIYHLTAINNFESIIRN--GLCPRNKIKP----NIDVADNEILNGRNKY-N---------LLDYVPFHFFINTP-------FDGAVKKKY-----------KTTDFIYICLEREIAKM-------NEFKIIPCHPLSNRLINYENI---LFDYDKGF-DLIEWDKIDSDN-------------RNYVDQDIKNACMAECLYKGVISCRIFSSISVKD-----VESFKKIDKILLK----F-G------FISDKNKY
307823107 KLLYHLTSIKNIGPILAD--GLKPRAELKN----FDDVADSEIIVNRRHL-S---------LENFVPFHWFARNP-------FDGRVQADR-----------PNDLFVLITVERTLAVS-------RNWKVIPYHPLSAGNIEL-------MDYSKGF-AAIDWDTMNRR---------------DYHDPLCKSICMAECLSPITVSPDDFFNIFVYC-----DDSVSYVRRFDRQ--I-------KITKNERMFLP
104779561 RFLYHLTSVANVSSIFQR--GLLPRTVLDEE--EFADIADAEIILGRRQQ-G---------LEQYVPFHWFAKNP-------FDGRVYQDR-----------PDEEFVLIAVERSHAQT-------QNWSVIARHPLSGSRFEL-------LGYDEGF-EAIDWDLMDRR---------------DYHDQECKHVCMAECLAPGPVPVSQFAKIYTPS-----DEIFGYVRAQAVA--AGFRN---LWIDANRNMFP
269140414 QFLYHLTDLNNLEDIFSE--GLKSRSLLRG----FSDVADPEIIASRSAL-R---------LEEYVPFHFFARNP-------FDGRVHRNN-----------PNKTFVLITVRRSHAQT-------NSWSVIPRHPLSGSTITL-------LDYEAGM-ATIDWETMNRR---------------EYGDDNCKCVCMAECLSPTSVPASDFNSIFVPD-----AETEATVNNLKRT--YGL-N---MYVNNSPHMFP
299141966 RFLYHFTDKRNIPSIKRHG-GLFSWHYCET-----NNINIPRQGGDYDSR-ELD-KKYG--LQDYVRLSFCDDHP-------MKYRLQQ-------------SGSDMVVLRIKIDVALL-------KDTLFSDINAADRLHTH--------GGSLLDL-KRVNFDATKRH-------------FVSKNDEDFKP-HQAEVMVKTFVPLKYIVNI-------------------------------------------
268609383 NGFYNIMPISNLASVLKY--GILSNELAERI--PHRSVAMSIIQDRRDQV---LIPNGLM-LHQYANLYIDARNP-------MLYKRKD----------------EDVIVLKVDCRILD------LPDVVVSDQNASSSYVRFY--------EPEEAM-NKLDFNMIFAR--------SWESDNQ-FEYWRKKSAKCAEVLVPGKIEPSYVIAAAVK---------NDADKEKIIA--LGF-D---KRIYVNGDLFF
254410814 KYLYHMTAISNLRSILQH--GLLSHKEAHRLELVMMDISDPEVQRRRDDK--KDTIYSRL-LHDYVPLYFSPRNP-------MLYRRREI--------------QENIVILGIKPEVIF------KANTVFSDGNAASKGTIFY--------NDVAML-DSLCWNIINAL--------NW------SDFPEGKRIKCAEVLVYPKIDVKNIVSIFCYS-----GNQLSTIHETIRYF-RAIPLSLTISVQVKPELFF
302864537 QELHFITPISNLESVLRH--GILSHNAARRL--PHLSVADEDVQSRRRQK---RVPGGMQ-LHDYANLYFDARNP-------MMYRIKGN--------------GTPLAVVCVNPSILD------LPGVVITDGNAASDGTRFA--------ASPGGI-AILDEGLVYAH--------SWTSSDR-WDYIERKRARCAEVLVPNCVDPSYIDKAKVI---------RQSHVISCHA--AGL-R---GEVF--ANVFF
297618118 TELHYITHIENMKSIMRF--GLLSNRRASRT--RHNSVAMQVIQERRAGK---RVPGGLL-LHDYVNLYLCARNP-------MMYKLRGR--------------HKELCVLRIDVGVLN------IPGTIVTDRNASSDWACFY--------PSPVGL-KHVDLELVCAQ--------SWVHNDE-IETFKHKSIKCAEVLVPHHVPTSFFKGVYVSC----AESMSRLHCLAGDG--K-L-E---IEVY--PHMFF
315652379 TGIYNIQAIDNIPSIIRR--GLLSNERAVSI--KHKSIAMDEVQARRDNI---IIPNGLK-LHQYANLYFDPRNP-------MLFKRKSQ--------------NEEICILKFDRVILD------FNGVVLSDRNASSSYAAFY--------EAKYGL-ENIDFKLVYAR--------YWTDDNY-FEQCRRKSIKCAEVLVPYGISYDYVVFAAVV---------NDAAADRLRL--NGF-D---KNIFIEPKIFF
91215317 GGLFYITHLDNVASILKL--GILSHNLAHSNGFVSTDISNQQVNARRNRI---DPNLGGN-IHDYTPLYFNHKNP-------MLYTLCKN------------TDRNKLILLKVNPHILL------AENVSFSDGNASVRSTKFY--------NNIEEF-NNINWTLINSG--------SWNHYEF-NIKREQSRIMCSEVLAKEKIPSYYINEIFVYS-----EETLEQILPMFPN---HL-G---IKTSINKSLYF
163847525 KRLYHITHIDNLASILQY--GILSHRQVESQNVSFTPIYNENIVHNRKER---LTPDQRS-LWDYANLYFQPRNP-------MLYKVLSEK-----------STREIVILGVKPQVLDT-------KGAFIALGNAAHSQTEIVD-----VATGRKVI-TGEFWPIIHSD--------WW------KPEDGTKRKIMAECLIPHVIVPEAIHSIFVAH-----PSVADTVRSIIAE----I-PC-PVEVVTEPHLFF
161528666 QYLFYITHIDNIPSMLQN--GILSHDQIVKQKLEYTSIYDSDIVSSRREK----TANGKS-LWYFANLYFQPRNP-------MLYRVTMEK-----------SPDCIAVVAVDKKILTT-------PNTIITDGNAANGPTHFYP------NTEFKTI-ERQINRITSLQ--------WW------TDSNATKRQIMAECLVPERIPPEFIRAIYVSN-----HTLADEIRNSMSS------S---ISIIPEPSMFF
156740099 KSLFYITHINNLESIFQH--GILSHARVEEMGIPYTPIYDAQIVSNRRER-S--TPDGKS-LWRFANLYFQPRNP-------MLYRVINKI-----------DKKEVAIIGVRPEVLSY-------PGCYISTGNAASSPSEILP-----VKEGIKAI-F-EMWKIIHNE--------WW------NPDDGSKRKIMAECLVPDFVSPDMIQTIYVVN-----HDVAKDVRSRISG----A-R---VPVVPEPSMFF
295087467 RYLYHFTDRRNIPSIKRHG-GLLSWSYCEK-----HKIDIPNPGGGNLSR-N--LDEMRN-LQDYVRLSFTTEHP-------MMYVAMKDG-----------RISNPVILRIDPSVVYL-------QHTMYADMNATTTKRTPNI------GKSLEDF-KKIHFSTVKAH-------------KHFDLDENERPYFQAEVMVMTFIPKKYIINLDTF----------------------------------------
307299774 KHLYYLSPVKNIPSILEH--GVMSKMAVETLEIPYDDYSDQTVQTIRERK-S---------LHEYVPLFFNTRNA-------MTFRYQKE--------------NRDFAILRLNSDLVT------HYDCLVSDRIAACSDAEIY-------TLSEPAL-KKINIEVVLST-------RNFY------DNWLLKKRLGAEILVKIDMIEPEWIECIILD------RTAEKIKGISIR----------QLRDSGYTYYF
257093309 GHLWHFTDIRNLAPIRRAG-GLYSWAGLGA-----LGISDAYMLANDFSR-SCDARLG---RDRYVRLSFIPNS--------WFFQRVRWS-----------CPQAVWLRFSLKAVTL--------GEVDYSLGNAASGFVALRDDLPS--MGINWDM-VTPSPPHPCDKGPTRYPTLYPDQVGDPFLFRQISNAWNSEVLIKHYLPLD-FCTGVFDC----RSGEALNI---------------------------
84392321 PFLVHFTNLKNLESIFNN--GLVPRSQLDA-----SDSEYESNDDSRLDG-----------HEDSVSTSVAFPNC-------QMFYKLRRN-----------SDDKFCLLALDPELLLN-------HSSAFCKYNAADAAISSQNIET---LKTAEAF-EGMFTELATQR---------SR--EDQKLEDYDPTDVQAEILVFDTIPKGYIGAVVFP---------DKETEKQFKG--IIG-G---CKSYVHNPNKG
218779300 EEIVHYTTMNGLIGILAT--KMVKSRERVA---QESLLEYILQLNTPLRK-----DTG---WLDYVSLSISNMNS-------WLFHFSSKKWH---------TNSKFCILSFKPEILSH-------NGVFFATTNNMYPAVRRG--------EGETGF-EALFAPIVLGRY----NAPIIR--SP-TCHDSCPTCEQAEILYPGELSTDFLLRIYVEE---D--DDEDSVHGIFGG--VGH-AK--VPVEINPGKFR
125718682 HRLCHFTHVSNLSNILKG--NIFSSRSIPR--DQWNDSDRVDGYIDYVCT-S---------VELPNSYCLKN----------MVRKTQTNI-------------EEWIIFKINPYIID--------DTSLFCPLNAAKECGKYVSEG----VEAYESI---FLNEG-RTRN-------------P-KWISSVPSNLQAEVLIKGIIPINQIKGVIFHE---N--FVDDDIFKLVNQ--AN------IEIRQSTDLFD
281416943 TRLCHFTKLKMLTHILSSNEGILASA-CIRSDV-KTVIDADRYEGEPEYV-C---------CSIEYPNSWFLSE--------AQRRDTDQIF------------RDWVVLYINLRILNY-------RDAKFCPCNASKGCGRYI-------FSDLNKL-ITLYFSPTVVGR-----------LRTPNMLECCPTDDQAEILIKNSIPRDYITGIAVGN-----NDIAERVSAILKT--YSI-FG--MRIFIAPDVVS
113473935 EYLCHFTPAPNLPNIIAH--GLLCRAHLST-----AGMPAYTSIDHRLDG-----------EDQAISVSISAINH-------RMFEAKRAAS----------GRTDWIVLFLCPSILWT-------HECRFYARNAARREMLDHRG----FLGGPWAF-NRMFSESSHPNGFTG--YSYRVDT---GIADALTTYSDAEIQVLEPISPEYVIGAWANN-----MPLAEIAQSCLNR--LSG-SE--RDVQVSSPHRV
60461910 DHLVHFTNINNIDNIMRH--GLLNTQDLKE-----QNIPFIFTDEYKLDG------------RHGLSLSVQFPNY-------KMFYSKTNKS----------PQNDMVVLLLDPELINE-------KKCLYFYDNAATTELKNMSSSD---LMTDIAW-EKMFSDKVDGI---------LR--SELKIPNSFTTNPQAEVICLEPIEPKYIKNIICK---------SDDQFGRVSN--Y-------LDIVGKDEHYF
260557664 KSIFHFTRVENLNNILTN--GIIPRNNLSN-----KTSIF--NDTVRADG-----------KLDYSSFSISFPNH-------LMFYRLRCAV----------PESKWAILVFKSDLLTT-------NNCLFYPVNAASSNVSRSPVDM---FRGGQAL-ERMFTYSAESR--------------ESVLRACDPTDVQAEVMIPGIVTMENLKGCILS---------EKDLVEFFSK--RFP-N---IKFVHCHSGRQ
153817479 EYLWHFTKLENVSSIFQS--GIVPRATLEA-----NQSNVAYNDQHRLDG-----------FKTASCFSIGHPNY-------KMFYSLRQQD----------PSVEWVVFGVKAEVLWT-------KDCAFCTTNAANSSVTSVPIEQ---RKGVQAF-ESLFLPVAGKP---------SR--QELQLPDDCPTDPQAEVLVFDTILPSDIVGVIVP---------TKAKELELKP--LYP-A---HQVVYHRAHYS
239627870 EHCVHFTNVLNLPSILSY--GLLSKADLEY-----NWIEYNHNDNLRLDE-----------FEESISVSITSPNY-------KTFYQWRCDN----------PSKSWVVLILDAIQILN-------LDCAFCYTNAANIRISSIPLAE---RKTYSAF-ESMFAEKQNQA---------TR--QEMKLYPNEPTDPQAEILVFNSIPVSAIQFALFN---------DYQIMKQYAP--LLD-N---ANIPYTRDLGY
149186577 GHLVHFTQAENLASIMQN--GILSVSSLRR-----RGISFRQNDISRYDY-----------QINASSLSITHPNE-------KLFYKWRMED----------PSQDWVVLLIESSILRR-------RDLAFNIHNAADKRMSSRPLSA---RKGVDAF-EGMFAEIDGFA---------KR--AELGLRDQDTTDVQAEVLAFQKIEPRLILGAVFD---------SLGAMARYSN--ILG-N---RDISCVQPNTG
71064898 QILCHFTPINNLESILNN--GLYPRDYIDE-----NLPDAIWTDDGRFEG-----------MKNGVCLSISFPNH-------QMFYRKRMQLK---------DIESWAVIVLDARVIKL------NHDCAFFQTNSAFGDYRNKSLSE---FMTSNAF-FSLFEEKVETRN-----GVVTR--QD-YLTDEFPTDVQAEVVVFDHIPPDSIEACYLQ---------SEKYLKYFEE--KFS-K---FTFIEDSNDNS
294664142 KALFHFTREENLASILSR--GLLRRDQL-S-----SSEGAVFNDDLRLDR------------TSAICLSVGFPNY-------KMFYPLRINN----------PDTKWVVIAVMPSVLWM-------LPCAFCTTNAASNAVTASTLAQ---RMGLAPF-QNMYGDCSGKI----------R--SSLGIPNDYPTDPQAEVLVLNDIPPAYLMGLATH---------TREGKDRILS--RHA-G---THVIHAPTLFS
237813317 RNIVHFTRLSNLASIIAN--GIVPRSTLVA-----KNLLFEYNDAYRHDG-----------YLNASCFTIGWPNY-------KMFYPIRCSN----------PDVNWAVIECSPAILWE-------KPCIFSAQNAASNAARLVPLEQ---RTGLSGI-TGIFAEIPGKP---------TR--AEMGVHESFPTNPQAEVLVCDIVEPRYFVRVHIE---------DWASRNKLAA--EY------HPLPFVTGWEG
189425638 SHLVHFTRLENLEGIMRQ--GIRTRYDLDN-----SGTGYIYNDDLRLDG-----------YPNAASISVSYPNY-------KMFYSYRCAD----------HNVPWVVLRLRPDILWE-------KNCAFCWENAASTNVTCIPIEN---RRGREAF-LDLFVNKSGYP---------TR--ETTLIPRSYPTHPQAEVLVFGTIEPAYITRVDLP---------TRFNPNSVFS--SIN-RH--CEFWYDDDLFW
206563731 KYLVHFTRLSNLASILAH--GLVCRNRLDG-----RNVIGAVNDQYRLDR------------TDAVCVSIGFPNY-------RMFYRYRQEN----------RGENWVVVGIDPSALWK-------LRCAFCITNAAAGRVSAIPLDQ---RTGLPAF-QAMYGDFDDKV----------R--ANLHLADQFPTNPQAEVLMLDGVPAAYFLGVAVQ---------NDMMKAQVEA--LHP-G---LHVVRHEEFYS
260590817 EFLIHFTPTINLYSILEQ--GKLMSRKTLE---NLDIEQFDILDYAQFTD-NV---RCD--DKGFINLSISGPNT-------FLFSKFQERTKD---D----MTIDWCILKIDPKYIYE-------KETKFSVTNAASNVAKAIGV-----TGDLDKF-KMLFANSINIP---------YG--IRGKINSKYPTNVQAEVLVKKDIPVESIIEVCFNSIE------SFASAKAALS--EFD-T---SNFVVDMEIFS
258545511 KYLCHFTPQNNLEHIKNY--GLLLRNEMPC--------GATITDSTRADN-----------VRSAICMTISKPNR-------WMLEQ-KQREG-----------HHLALLLISPDVLFM-------RKCLFYPHNAATASLRRRPIED---FMGIDAF-KEIFAEEVEYKK-SGKESQIIR--RSSHLSAAETTSDQAEVQCLEQISPQHIMRIITY-----NIPLDYQDVQILAG-----------KLFLNPQRYR
229129771 TRLCHFTNSRSFIHIIQNDLGVVANNFLGD---EEEIGIMSKNDNLRLDG-----------KEDYISCSIEYPNT-------WYLDKVKLRDP---------NFRDWVVLFIDPLVMLE-------ENTLFCHRNAAAGEGKYL-------KSGNEGL-RGMFAQTVDGK-------FKIN--RAYNMLSCCPTDGQAEVMVYKNIPKESIKGVCVSSMEQVKIEMLKISHLNLLE--GEL-N---FDWIISPELFS
30022567 TRLCHFTNSRSFIHIIQNDLGVVANNFLGD---EEEIGIMSKNDNLRLDG-----------KEDYISCSIEYPNT-------WYLDKVKLRDP---------NFRDWVVLFIDPLVMLE-------ENTLFCHRNAAAGEGKYL-------KSGNEGL-RGMFAQTVDGK-------FKIN--RAYNMLSCCPTDGQAEVMVYKNIPKESIKGVCVSSMEQVKIEMLKISHLNLLE--GEL-N---FDWIISPELFS
224477788 TRLCHFTKSKNLPFILGEGVDSDNGILANN-----FISDTSFLNKTDENR-FD-------NHEDFICTSIQYPNC-------YYFSTVVKKNQ--TE-----IFNEWTILGISPEIID--------DSTKFCPVNAATKGGRMI-------GNGAEAF-EEVFSERVEGKR-------IF--VRNQNYPDNVPTNVQAEVLIYNKIPKENITSLIFPT---EAIAEKECLRLELCG--VNV-SQ--YDIIVSSDLFE
237800583 ESILHFTSNSGALGVFAS--RALKSRQRLN---ADQQLKHIFQPNARFRD-KD------VAWLDYANLSISQINT-------AFFKTCSGSWH--KE-----KDFFWCILDFSPSIMLH-------DDVWFTTTNNIYTGVKRA--------CGVEGL-EAVFQPT-THQY----QANYVR--RPADHPSNLPTCYQAEILYPQELSTDYLQRIYVRC---D--NDTDELAGQMAA--TRH-PQ--VEVVVRPELFE
325690156 TRLCHFTKSSNLPYILGGTDEEANGIISNK-AIRDSECKFLKLNDIHRYD----------NRPELICLSVEYPN--------FFFFEKSIEKE--KES----LLNDWVVLLISPSIIN--------EETYFCPVNAAKNRGAHIG------KGSQKFM-ELFNTEVLGLNR-------------SVSMLPNIPTNNQAEVLSPDMIPKDKIIGLVFSS---KKQARDEVLRLKLCQ--IEL-RN--LKIYYSHEWFK
148821249 WIVWHFTHADNLPGIITAG-RLLADSAVT---PTTEVAYNPVKELRRHKVVAPDSRYPASMASDHVPFYIAARSP-------MLYVVCKGHSG--YSG----GAGPLVHLGVALGDIID-----ADLTWCASDGNAAASYTKFS--------RQVDTLGTFVDFDLLCQR--------QW---HNTDDDPNRQSRRAAEILVYGHVLFELVSYVCCYN-----T-ETMTRVRTLLD--PVG-GV--RKYVIKPGMYY
15607201 WIVWHFTHADNLPGIITAG-RLLADSAVT---PTTEVAYNPVKELRRHKVVAPDSRYPASMASDHVPFYIAARSP-------MLYVVCKGHSG--YSG----GAGPLVHLGVALGDIID-----ADLTWCASDGNAAASYTKFS--------RQVDTLGTFVDFDLLCQR--------QW---HNTDDDPNRQSRRAAEILVYGHVPFELVSYVCCYN-----T-ETMTRVRTLLD--PVG-GV--RKYVIKPGMYY
90419305 ALIFRIVHRDNVEWILDN--GLHCKKAHVS-DPNYVAIGNLELIDRRTNH-PVPCHPNG-TLGDYVPFYFTPFSP-------MMLNIKTGYGG-IRKR----ANEEIVVLVSSLHKLNE-----AGLPIVFTDRHAYLQAARFY--------TDMQRL-NEIDWAILRAK--------DFK--RNAEDPGKF-ERYQAEALVHRSLPCAGLLGIACY-----NEAVMASVKRQTER--RGL-N---MRVIAQRKYYF
307823108 ALIWRIVHRDNLSWILDN--GLHCANSKTL-SPNYINIGNSDLIDKRRHR-VVPIAPSG-TLADYVPFYFTPFSV-------MMLNIHSGRGG-VPRR----RNEEIVILVSNLHHVHS-----IGLPFLFTNAHAYPNWTNYY--------SNLAQL-YNIDWDILQRR--------DFK--RDPDDLRKM-ERYQAEALIFKHLPINGILGIVCY-----TEQLKHDIEQQVQD--RNL-M---LEVYARTKWYF
228911570 TFIYHMTHYRNLSKILSSN-GLVCVSNIMNNGQTYCNIANNDIQSRRASY-SVPVEPFG-TLHKYVPFYFAPKSP-------MLYSIYKGNVI-QYNE----GQEPLIYFVSSAQKIKQ-----NGVPFCFTDGHGIMHFTEYY--------NDLTEL-HNIDWDIMKSK--------YWHDT---IEDNDRKRRRMAEFLVYQYVPLDCIIGIAVYS-----QKYKEETEKILTE--HNV-S---LPVKLKPNWYY
309811906 PGIVHFTRVEHLGTIVQQ--GLLSDHAVGS--ALQHEIGNRNIKAQRTRR-VVPIPPGG-VVADYVPFYFAARSP-------MMYSIAMGNVP-GYAE----GTARIVYLVSDVGRVLT-----DGMRVVISDRNAALHVAAFRP-----PTVELFAG-DFIDWDLMRAR--------YWGQYDDGSTRADGRERRMAECLVHQKVSWGCITHVVAKS-----EAVAREARLLLGD--RLP-P---GGVVVRPEWYF
326943719 TFIYHMTHYRNLSKILSSN-GLVCVSSIMNNGQTYCNIANNDIQNRRAYY-SVPVEPFG-TLHKYVPFYFAPKSP-------MLYSIYKGNVT-QYNE----GQGPLIYFVSSAQKIKQ-----NGVPFCFTDGHGIMHFTEYY--------NDLKEL-HNIDWDIMKSKY-----------WHDTIEDNDRKRRRMAEFLVYQYVPLDCIIGIAVYS-----QKYKEETEKILTE--HNV-S---LTVKLKPNWYY
292493384 GLIFRITHRDNILWILDH--GLHCPNGTVF-DHNFVPIGNPELIDRRHHR-EVPIPPGG-VLGDYVPFYFTPYSP-------MMYNIKTGYGG-VKKR----RNDEIVVLVSSLHQVAK-----EQRKFVFTDRHAYLRAANFY--------NNINDL-NLVDFKLLRSR--------DFS--RDVEDPEKI-ERYQAEALVHQSLPVQALLGIVCY-----TKAVADEVQSVLRV--RKI-T---MRTLVKPSWYF
257455836 GLIWRIVHIANLPWIFAN--GLHSGNSPIQ-SPNWQHIGNPELIQKRANH-PVPVGRQG-YLNDYVPFYFTPFSP-------MLLNIKSGRG--VMQR----PMQDIVILVSSIDTVES-----QHLDYVFTNSHAYYQWTNFF--------TDRKDL-DKIDWALLQRR--------DFS--RDPNDLAKF-ERYQAEFLIYQHCPISAIIGICCY-----NDNVKQSIQQLINM--SGI-T---LDVHSRPNWYL
215486216 ALIWRIVHRDNIPWILDN--GLHCGNSLVQ-AENWINIGNPELIGKRAGH-PVPVGTGG-TLHDYVPFYFTPFSP-------MLMNIHSGRGG-IKRR----PNEEIVILVSNLRNVAA-----HDVPFVFTDSHAYYNWTNYY--------TSLNSL-DQIDWPILQAR--------DFR--RDPDDPAKF-ERYQAEALIWQHCPISLLDGIICY-----SEEVRLQLEQWLFQ--RNL-T---MSVHTRSGWYF
256023435 ALIWRIVHRDNIPWILDN--GLHCGNSLVQ-AENWINIGNPELIGKRAGH-PVPVGTGG-TLHDYVPFYFTPFSP-------MLMNIHSGRGG-IKRR----PNEEIVILVSNLRNVAA-----HDVPFVFTDSHAYYNWTNYY--------TSLNSL-DQIDWPILQAR--------DFR--RDPDDPAKF-ERYQAEALIWQHCPISLLDGIICY-----SEEVRLQLEQWLFQ--RNL-T---MSVHTRAGWYF
304560215 ALIWRIVHRDNIPWILDN--GLHCGNSQVQ-AVNWINIGNPELIGKRAGH-PVPVGTGG-TLHDYVPFYFTPFSP-------MLMNIHSGRGG-ITQR----PNEEIVILVSSLRSVAA-----QNAPFVFTDSHAYYNWANYY--------TRLEDL-NQIDWSILQAR--------DFR--RDPDDPAKF-ERYQAEALIWQHCPITLLVGMICY-----NDGVRLQLEQWLSQ--RNL-T---MPVHARAGWYF
238921299 ALIWRIVHRDNIPWILDH--GLHCGNSPVQ-AANWINIGNPELIGKRAGH-PVPVGMGG-TLHDYVPFYFTPFSP-------MLMNIHSGRGG-ITQR----PNEEIVILVSNLRNVAA-----QNIPFVFTDSHAYYNWVNYY--------TRLDDL-NQIDWSILQAR--------DFR--RDPDDPAKF-ERYQAEALIWKHCPITLLVGMICY-----NDGVRLQLEQWLSQ--RNL-T---MPVHARAGWYF
269140415 ALIWRIVHRDNIPWILDH--GLHCGNSPVQ-AANWINIGNPELIGKRAGH-PVPVGMGG-TLHDYVPFYFTPFSP-------MLMNIHSGRGG-ITQR----PNEEIVILVSNLRNVAA-----QNIPFVFTDSHAYYNWVNYY--------TRLDDL-NQIDWSILQAR--------DFR--RDPDDPAKF-ERYQAEALIWQHCPITLLVGMICY-----NDGVRLQLEQWLSQ--RNL-T---MPVHARAGWYF
253687260 ALIWRIVHRDNIPWILDN--GLHCGNSPVQ-AGNWINIGNPELIGKRAGH-PVPAGAGG-TLHDYVPFYFTPFSP-------MLMNIHSGRGG-IKQR----PNEEIVILVSSLRTVAA-----QNVPFVFTDSHAYYNWANYY--------TDLNNL-NQIDWPILQAR--------DFR--RDPDDPGKF-ERYQAEALIWRHCPITLLSGMVCY-----NDSVKLQLEQWLSQ--RNL-T---MPVHARAGWYF
104779562 ALIWRVVHRDNLPWLLDN--GLCAVSRGNL-SSGYVGIGNPDLISKRSRR-AVPIHPGG-TLADYVPFYFTPFSV-------MMKNIHSGRG--VQQR----RNEEIVILVSSLYHVRS-----LGLPFVFTDAHAYPDWAGYY--------SDLEHL-DKIDWQILQSR--------DFK--RDPDDPRKM-ERYQAEALIHGHVPVAGLLGIVCY-----NEALQRRVDQEVRQ--RQL-D---LPVHARPGWYF
206579710 ALIWRIVHRDNIPWILDN--GLHCGNSPVQ-AANWINIGNPELIDKRAGH-PVPAGTGG-TLHDYVPFYFTPFSP-------MLMNIHSGRGG-IKQR----PNEEIVILVSSLRHVAT-----QNVPFVFTDSHAYYNLANYY--------TDLNNL-HRIDWPILQAR--------DFR--RDQDDLAKF-ERYQAEALIWQHCPITLLVGMICY-----NDGVRLQLEQWLSQ--RNL-T---MPVHARAGWYF
288457846 ALIWRIVHYSNLPWILDN--GLYCGNSKIK-SPNWFNIGNPELIQKRADH-SVPLPPSG-MLNDYIPFYFTPFSP-------MLRNISTGWGG-IPQL----PNEKIIILVSSLHHIAD-----LGLPFLFTDSHAYSPCANYY--------SNLSDL-NQIDWPILQHR--------DFK--RDPDDPAKF-ERYQAEALIYQHLPINGLYGIICY-----TELLKQRIEQEICA--RNL-N---LRVYARPEWYF
146305602 ALIWRIVHRDNLVWILDN--GLHCASANVQ-APNYVVIGNVDLISRRRER-TVPVAPGG-TLSDYVPFYFTPFSP-------MMYNIHTGRGE-VQQR----HNEEICILVSSLRRVHE-----LGLGFAFTDRHAYTPLARYF--------NELDLL-EQLDWPLLQAR--------NFS--RNPDDPEQI-ERYQAEALVHRYLPIEGLLGVVCF-----TQAVKDRLDAQAQA--KGL-K---LDIRVMPQWYF
209527878 TYIYHITHLKNLPSILRSE-GLLANNHLKSQPINYVDIAHETIQNKRAQI-NIPCSRGG-TLHDYVPWYFAPRSP-------MLYAISRGNVQ--GYE----QGQSPVIHLVATAEDIA----AASLPFAFTDGHAIVRYSEFY--------DNLDSL-NAIDWEIMNAG--------YWA--DTLEDGDRK-RRRQAEFLVYEFFPWTLVREIGVI-----DAGRKAEVEEILQN--FTI-S---TPVKVFREWYY
209527890 TYIYHITHLKNLPSILRSE-GLLANNHLKSQPINYVDIAHETIQNKRAQI-NIPCSRGG-TLHDYVPWYFAPRSP-------MLYAISRGNVQ--GYE----QGQSPVIHLVATAEDIA----AASLPFAFTDGHAIVRYSEFY--------DNLDSL-NAIDWEIMNAG--------YWA--DTLEDGDRK-RRRQAEFLVYEFFPWTLVREIRVI-----DAGRKAEVEEILQN--FTI-S---TPVKVFREWYY
300868768 TFIYHITHINNLESIVKAG-GLLACNAMYEANAEYTNIAYDGIQDRRART-SVPCSVGG-VLHDYVPFYFAPRSP-------MLCAINNKGKVK-GYS----EGQTPIIYLVSEVEKIA----DSNLHFAFTDGHAVMTFTDFF--------DNLEYLDEAIDWEVMESR--------YWF--DTDEDNDRK-RKRQAEFLVYKFFPWQLVTEIGVK-----NYQIKTEVDKILEKN-TTH-Q---PPVKTRTAWYY
119483244 TPIYHITHIDNLVSIISSG-GLIACSQLRQQQVRYTDIAHQNIQDRRANK-PVPCSVGG-LLHDYVPFYFGPRSP-------MLYAIYRRNVQ--GYQ----GSQSSIIHLVTEIETIA----NSDLDFAFTDGHAIMDYSDFY--------DDLWQLGEVIDWGLMEER--------YWS--DTEEDRNRK-WRRQAEFLVHRFYPWRFITAIGVI-----NDSIKTKVQSILQK--KQH-Q---PLVRVCSNWYY
307154521 PSIYHITHLNNLASILRAG-GLIANSRLRQQQINYTDIAHEQIQDRRARK-RLPCGAGG-TLHDYVPFYFAPRSP-------MLYAIHTGNVR--GYQ----DGQDSIIHLVTDIEAPFF---EEENAFVFTDGHAIMDYSDFY--------DDLNALDFVIDWELMKSK--------YWF--DTEDYPDRK-WRRQAEFLVYERCPWDLITEIGVI-----NSTIQLRVQNILKN--FSD-L---TPVRVYPNWYY
218295754 TLIYHITHLNNLQGILQRG-GLLPYSQRPPTQ-QNVAYGHIQAHRAQVVV-PVGPR--G-KLHDYVPFYFCPRSP-------MLYAIHTQQT---DYQ----GDQRPILHLVSSAQKVA----EARIPFVFTDRHAAVQYVCFF--------HKLEHL-KALDWQAIQAS--------YWA--------NVR-EKKQAEFLVKDFFPWELVEEIGVI-----DKTIQAQVESILAQFPDLH-H---PPVRVRRSWYY
310818319 PLIFHITHVDNLPNILREG-GLWCDAQRIARGLSSTNIGHLHIKQRRLLR-PVTTTAGG-TLGDYVPFNFCSRSV-------MLYAVHCGHQ---DYK----GGQESIVHMVSSVSRATA----LGRAWAFTDRHAELAHALHF--------DDLGKL-GEVPWQVMPLQ--------YWS--------EVK-EERQAEFLVREFFPWEAVTEVAAM-----TPAASARVQQALRG--AAH-H---PPVTTQAGWYY
30249340 PKLYHIVHVDRLSSILKDG-FLWCDVHMAQHIPVGTTIGMNNIKQRRLQNC-LNSYPDL-HVGDCVPFYFCPRSV-------MLYLIYRQNT-ELDYK----GGQGPIIHLEADLNAVTTWAKTQSARWVFTLTNAGSFYFEDR--------NDLTCL-KEVNWTAVHAL--------NWK--------EHK-EGKQAEFLIEQCFPWNLVERIGVQ-----SEVIYNHVVNALPV--NGH-R---PKVEIKPEWYY
38505777 PKIYHIVHVDRLPSIIADG-CLWCDAAISQRNPAGTTIGMNKIKQRRLKELTLTSHPSL-YVGQCVPFYFCPRSI-------MLFLIHKKNT-ELTYQ----GGQEPIIHLEGDLIQAVNWADQNNLRWAFTLSNAGSSYFEDR--------NSLAQL-HEIDWAAVQAT--------NWQ--------TCK-EGKQAEFLVESTFPWHLVERIGVK-----SRVIYDQVIKALPT--GGH-H---PQVEVRPDWYY
120608868 PKLYHICHVDRLPSIIASG-GLLSDAAVVQVAAPGTVIGMNHIKQRRMTELQLTSHPGL-YVGQCVPFYFCPRSV-------MLYLIHRQNA-DLAYK----GGQGPIVHLEADLHTTVAWANGQGLRWAFTLSNAGARYFEDR--------ADLGRL-GEVDWDAVAAR--------NWS--------AQK-EGKQAEFLLERGFPWQLIERIGVL-----SQPIATQVAHALPV--GGH-R---PPVQLMPAWYY
217979677 PKIYHIIHSDRLASIIADG-FLWPDAAMAQRQGVGTTIGMSNIKARRLNELTLSCHPHL-RVGHCTPFYFCSRSV-------MLYLIYRRNE-ELTYK----GGKSRSSIWKLISTRRLL-GRNRTIGAGRLLCRMPVRITLRT-------GRTLRSL-A-INWDAVQAR--------QWS--GNAVSRSVK-EGKQAEFLIERAFPWRLVERIGVF-----SQGYVQPVSQAMQG--AAH-R---PEIEIRRDWYY
189425258 PKIYHIVHVDRLTSIIASN-GLLCDAEIVRSKPPGTTIGMGTIKQRRLNELFLSSHFGL-NVGDCVPFYFCPRSV-------MLYLIWRANDPELTYR----GGQAPIVHLEADLHQTVAWAESQNLRWAFTLSNAGAYYFEDR--------SNLDRL-GDIDWQAVEAT--------NWQ--------KCK-EGKQAEFLIEQRFPWELVTRIGVM-----TTQTHAQASAAIAA--STH-K---PRVELMQNWYY
154253368 PKIYHIVHVQNLASIVTDG-HLWSDATMVNRPPGGTVIGMGGIKLRRLRL-PVTCHQGT-HVGDFVPFYFCSRSI-------MLYVLHCANHAELTYR----GGQQPIVHLEADLYRSVRWAEENGSRWAFSLSNAGAAYTQFR--------SKREQL-SEVNWEAVRAT--------DFR--PA----DVK-EGKQAEFLVERSFPWHLVERVGVH-----SQAVVDQVSTAMRG--VRH-R---PQIEIRKDWYF
146294612 PKIYHIVHVDRLAPILASN-ALLCDAEIIAQQAAGTTIGMNTIKQRRLNELTLDSYPDL-YVGQCVPFYFCPRSI-------MLYVIHRADSAELVYR----GGQGPIIHLQADLHATVQWAQQQGRRWAFTLSNAGSYYFEDR--------NDLARL-NELDWQAIGAR--------QWQ--------GCK-EGKQAEFLMEHSFPWHLVEEIVVQ-----SPIIHQQVVNTLQR--VGH-R---PPVRINPNWYY
251788569 PKIYHILHIDRLHSIIAE--GLLSDEQISVRHGAGTMIGMSSIKQRRLHELTLTNHPNL-YVGQCVPFYFCPRSV-------MLYLIYRANHPELAYR----GGQEPILHLEADLYTTIAWAEQHRQRWAFTLSNAGSLYFEDR--------CQQSQL-GELNWEAIQSN--------QWS--GGN---GTK-EAKQAEFLIERCFPWHLIERIGVH-----SPLIYQQVANMIPL--DGH-R---PPVEVKREWYY
153872688 PKIYHIVHIDRLASIIAAG-ELWCDAQIVAQNPGGTTIGMTSIKQRRLYELSLNSHPNL-HVGDCVPFYFCPRSI-------MLYLIYQANHPKLAYY----GGQEPIVHLQADLHASVAWAHKQKRCWAFTLSNAGSYYFEDR--------CDLAQL-NELDWAAIQSN--------QWQ--------HCK-EGKQAEFLMEASFPWNLIERIGVF-----SQPIYQQTMNILQT--GVY-R---PPITISREWYY
257095819 PKLYHIAHVDRLPSIVTDA-CLWCDSEVSRRGPAGTMIGISSIKQRRLSELTLSSHPGL-HVGDCVPFYFCARSV-------MLYLIHQANHPELAYR----GGQSPIIHFEADLGAVVDWADRQGRRWAFTLSNAGSRFFEDR--------CDLAQL-GEIDWNAVQAR--------DWR--------QCK-EGKQAEFLLEHSLPWHLVERIGVQ-----SRPIFQQVSNALPA--SGY-R---PAVDIVSDWYY
284119730 PKIYHIMHIDRLASIVADD-YLWCDAKMATRTSSGTTIGMNGIKERRLTN-PLHSHSGL-RVGDCVPFYFCPRAV-------MLYVIYKANHPELDYR----GGQGPIVHLEADLRQTVVWAERQQRRWAFTTSNAGSRFFDDY--------ADLADL-DKIDWDAVHAT--------DWR--------QCQ-DGKQAEFLVQDSFPWAMVSRIAVN-----SKEIYAKVQLVLRE--ARH-R---PPVEVKPDWYY
148654473 PKIYHITHVDNIRNIVSTG-GLLSDARILQQGGPTQMIGLSNIKRRRIEELEVRCHPGT-KVGEYVPFYFCPRSI-------MLYVIHRADHPELMYR----GGQDSIAHLEADLHQVVDWADNNGVRWAFSLSNAGARYTQFR--------SNLRYL-HELDWDAIAAT--------DFR--DS----DVK-EGKQAEFLVHGFFPFDLVERIGVH-----RANIWNKVRSVLAG--SGY-T---PRVEVRDDWYF
126667035 PKVYHIVHVDRLASIIADQ-VLWSDAQVIARAPAGTTIGMSGIKQRRLNELTLTSHPDL-YVGACVPFYFCPRSI-------MLYLIYQGNHPDLGYK----GGQGPIIHLEADLNDSVAWAEANQQRWAFTLSNAGSCYFEDR--------SDLFRL-NEINWTAVGAR--------NWM--------SCK-DGKQAEFLLENCYPWHLVERVGVC-----SQAIYTQVANILAG--VPH-R---PDLQIKPDWYY
254245305 PKIYHIVHVDRLASIIRSG-ALWCDARVIRDGADGTTIGMSSIKRRRLQELQLDSHADL-YVGQCVPFYFCPRSV-------MLYLIYRGNHSELTYR----GGQGPIVHLEADLRQSVAWANANRHRWAFTLSNAGSYYFEDR--------CDLRHL-GDINWDAVQTR--------QWQ--------SDR-EGKQAEFLMEDSFPWGLIERIGVS-----SAQAYQQVVNALPA--GGH-R---PTVEVKHDWYY
261344446 PKIYHIVHVDRLSSIFASN-GLLCDAEVIFQNLSGTNIGISNIKKRRLTELQLSSHSNL-YVGQCVPFYFCPRSI-------MLYVIHRGTNTNLTYQ----GGQNSIIHLQADLYASVQWAKKHKNRWAFTLSNAGSYFFEDR--------CDLSQL-NQLVWQDIQAT--------QWQ--------NCK-ENKQAEFLMERYFPWHLVEQIVVH-----SQDIQQKVIQLLRM--EEH-R---PPVTIKSDWYY
46309426 FYLIHETSFEALSKILQGS-FLLTSSKTQKLKVRGQGSSNRRLASDPRV-----------SLTDSEFFNKYDEVD-------GVYMRLQPKMHSIRYS------KSDCVLVLRMNLLKYC------KFVINSEENFGFYIAEEC-------VIGTSQFSGEPGFTTTSFE-------KLALLK-------DTTDYSSTEVLILQDVPVSFIKFIFLV-----RDTKADTIFKPLAR--YNI-KC--FNIL-------
192290492 TAIFHITAIANLDSIAKQG-ALLSKNEAAARGLVAANIAYDHIQGRRAVR-TVPIAPGG-TLHDYVPFYFAPRSP-------MLFTINQGNVPDCIYR------QDDIVHLATTAQTVAD----TGQQIVFSDIHAALDYARFF--------SDLGSL-TEIDWRIFFEPPRLEGYCKFWQNRQIPIHHLRRLEIRQAEFLVHGELPIAAISEIGVK-----TAQAAAQVEQAVAG--SGW-T---PTVRVVPGWYF
74317508 VRLFHITAIANLPAICAAG-ALLSKNQGATNGIAYQNIAHQGAQGARSIK-SVPNPPGG-LVHDFVPFYFAPRSP-------MLLAINGGRVAGCDWR------QADIAHFETTVEHVTA----AGEDFVFYDLNATLAWSTPY--------TGLANLD-KVAWDLICESPALDGYCKYWQSKLDHARYSDRMERRQAEFLVKGMVPLVRFTRIGAI-----DRGHADVVRAILDQ--AGV-K---LPVVVKPEWYF
237654251 TRLFHITAIANLPAIFAAG-ALLSKNGGAAAGINYQNIAHAGAQGARAVR-AVPNPPGG-LVHDFVPFYFAPRSP-------MLFAINGGRVAGCQWR------QTDIVHFETTVQCLVA----RGRPFVFYDRNATLAFSTPY--------TDLAHLDTAVAWDLMTEAPQLDGYCKFWQNNPAVARYADRMERRQAEFLVRDNVPLDCMTRLGVI-----DAARQAQVLALLAQ--AGV-A---LTVDIMPAWYF
317126949 RFLLHFTRAENLNSIFRYG-ILSVSKQKSL------SLEVSRNDPNRYDE-----------FLNATSVSIHLPNN--------ILLYKYKNKFNC-----------EWVVLGIKPDIIWE------KRCGFCNENAASSNVSKIPLNK---RMSVESL-NGLFNNISGKPSR----SKLNIDK------SLT-TSPQAEVLVFEDIEPSYIWGVAFE---------SNYAKNKYKE--NIP-SS--IKIEIVPELFR
255010210 TCFYHFTDRRNLLSIKKQR-GLLSWHYCKT-----HGIVIPNQGGDADSE-NLDMRYG---LQDYVRLSFCDDHP---------MTWRLKQS------------GSNLVLLRIKIDVAWF------KETLFSDINAADQLHSHG--------GDLCHL-QKVNFAATKRH--------YVNRND-----ED-FKPHQAEVMVKTFIPLEYIINIDNPILI-------------------------------------
328871094 TQLYHFTDKSNLDSIKQN--GLFSWDHIDQ------NGIQSVMGSNEDSR-RLDKRKG---LEDYVRLSFVQNHP-------MMHAAYKRDSI----K------QPIILVIDIMVVDLL--------DVKFSDVNATSNNVIIQ--------NDT----NHIQFSIFKKD--------YFKLST-----NE-KQYFQAEVLIRNNVPASYIKRSITPNMGRKST---------------------------------
282881570 KYAFRIVHIDNIPYILEN--GIVNAAKSTKKDDSYISIGDESLIEVRRNQ-NIIHTESC--IGDYIPFYFGPRTP-------MLYTIQHGYNG---VK------KCDATNLVYLVLKISDIIKS-GFQGYFTDGHARNICSHTYE------IDKLNQL-NELVHYENVYR-------TYWSIR--EDNSGEYKRLKSAELLIENNIPTTMIAGYVVY-----DKAAHDKLVSFGID------N---EKIIINNNYYF
310778852 FNLLHITEFDNIKSILETG-GLISLRKLEV-----ENVCPKFMTS-EASR-SLDRCKG---LDAYVRLAYTTWYD-------MIPTAVFYNNL----K------NPAVIIVNCELLNKK-------RDILFTTKNAVANDAIYY--------KQ-NEIGDHINWEKVFSE--------RNY----DTQSQEYKDARQSEVMVQDIVEKDYFVCIFVETGS-----DLKDLNG--YG--VEI-KE--DNIKSIINRFG
262039223 MWIHHLTHIDNLESILER--GLISRNQLKQFNIKFNDTADKRIIGERND------------LNNYIPFHINYLQKKY-----SIPYNWKVLKNQ---S------SENMIFLNYNIDDFSN------NELDFYLYHPISKSQNNA--IK---INDLMGF-KEKLLKEEKKLQ--------NDMGYLDFSDNKTQQFLMSEVLIKDRIYLSEKWKIGVFS-----FAQKQIVEKKLEK--NNL-K---IEVFIDDKRYF
88856595 QRVYHVTHISNLENILLTG-QLVAAAQIES---PILDVSSPLTREMRGTA----SLSTGETVDRYVPFSLVPESNTWRELRDGAGEPRWSDAAR-AAS------SSDFVFLVTTIRALGT-------DAVLADGDAAAGETIFA--------TDEGAM-TRMLGNLRA-----------------------DELTEDAEVLIHGSFAFDEVQLVGVAS-----DKARDRVKELLDA--ASF-V---TKVAVYPPWFI
222529646 FGIYHYTDFTNLESIFKEG-FLYSRVDCIKKGLQFTDGADHNVLSIAPYD-----------VKNKVRFYFRPNTPTLFE-NEGIKLPAYIGK----AH------MPIPVCLLFDDELILL------DTTEFSNGNATSVKYTQI-------GCTYAFF-KSMEWDLIFHEG-----------YIEPFERNKIVNRRNSELLSTTPVSLKYLKKVIFRT-----KADFKRASNLF-G--MN------KKFCVDINYFS
126652604 RYIYHFSDIQNIVSILKCG-YVASRNFAIENGLMKNENACLDVIDKTTHD-----------NKNLARFYFRPKTPTQYH-NEGIKSKFREYEND--AH------IPVPVFLVFDAVGMFS-----KNQSMFVERNLVYSPPIK---------KHISEL-EKFDFDKIYHS-----SSLYGYSS---YDKQEIIEKRHAEVVFKDFCSLDCLRSIVCRS-----SAEKDTLIHLLRF--EGV-DVSKYRIVTNGNELL
328958126 RYCYHFSHIDNIISILNTG-KVYSRSKSKELKLMQNDNASQDVINQTNIL-----------VKDYVRLYFRPKTPTQYH-NEGLRNLRTTTTLN--AH------CPFPVFLLFDL------------KQVLTSENSFFCKHSLAHSSEYHLCNTPLEL-ANFPFSKIYHD--------RSFSGAQR---NEIISHRQAEIVVPNEMSLNTLKKIMVRSIA-----EKETLMYMLSA--DSK-KKYNELIQIDSKKIV
262383473 PKAYHFTHMDNALKIIRSM-KLQSRNLA--TGC-FSNSAGTNVLRTSK-------------AHRFARFYFVPQSPTQFY-NECLGKDSSDIRYYQKALNLGLPKCPMPVFLIFDVEELLMAM---PDKCYYSNGNMQKDASRSF--------KVVDNP-NMIKAKEIYTD--------SFS----------TKNERQQEFLIDGELDFSYLTKVQIRCY---DEYQAATLRKELLG--TKW-E---NCIKVDRSLYT
MARKUP ..........!**???....*.....*...............................................!**...............................................................*....<--------------------.ARTT.loop.-------------------->....**!....................................................
STRUCT .....S1..........................................................S2.........................................S3...................S4...................................................................S5............S6..................................S7.......
consensus/100% ..h........h..h.......................................................................................................................................................................................Eh.....h...................................................
consensus/95% ..hh.h....ph..l......h...............................................h......................................h.....................h...ps.....................h.......................................uEhhh...h....h..............................................
consensus/90% ..lh+hs..ppl..Ih.....l.s......................p..................s...h............h........................hh.....................h...ps.....................h...h...............................p...AEhlh...h....h..h...........................................
consensus/85% ..lh+hsp.ppl..Ih.....l.s......................c..................s.h.h....s.......hbb......................hh.h...................hs..pu.....................h...h...............................p..pAEhLh...hs.p.l..h.h.................h..............h......h.
consensus/80% ..lh+hsp.psl..Ih....slhs.s...........hs.......R................pbssh.hs..ps.......hhb.h....................lh.h..s..............hhhs..pA.....p..........ps...h...h.h..h............b.............p..pAEhLl.p.hs.phl..h.h.................h..............h.....ba.
consensus/75% .blaHhsp.pNl..Ilp...ulhs.s.h.........hs......pR.p..............phssh.as.pps.......hhh.hpp................p.ll.h.ss..............hhas..pA.....p.b........ps...h.p.l.hp.h..........p.b..........p..p..pAEhLl.p.hs.phl..l.h.............h...h..............l.....ha.
consensus/70% .blaHhschsNlssIlp...GLhspsph.........ls..ph..pR.p............h.phsshhasspss.......Mhh.hpp.p.............pp.ll.l.ss...h..........hhFss.pAh....p.b........ssh..h.p.l.hphhp.........p.hp.........p.bp.bQAEhLlbp.hs.phl..l.h......p.....ph.p.l........p.....l.hp..hab
Back to Contents
PDB:1wfxA - - HHHHHHHHHH--------------------EEHH--HH--HHHHHHH--------------HHHHHHHHHHHH----EEEEE-------------------------------------------------------------------------------------------------------------------------------------------------------------------EEEEEE--------------------------------------------------------------EEEEE---HHHH-HHHHHH-----------EEEEEHH------------------------HHHHHHHH-----EEEEEEEHHHHHH-H--------------EEEEE--EEEEE-----------------EEEEEEEE--
DOMAINS - - <---------------------------------------------------------------------------------------------Helix-Turn-Helix-------------------------------------------------------------------------------------------------------------------------------------------------------------------->......................................<---!**--------*---*-------R++h!**-----------Catalytic core-------**-----------------------------------------*------------------------------->
118430933 314 40 SKTLAGILRHH--PGR-YGVR--LTRE-GWARVS--EV--VEGLRKA---------gWSWVEEWHIVGVALHDP-KGRYELRN------------------------------------------------------------------------------------------------------------------------------------------------------------------GEIRARYGHS--IP----------VNVEP------------------------------LPGEPP---PILYHGTTEEAL-PLIMERG--IMRGRRLKVHLTSSL------------------------EDAVSTGRRHGNLVAVLLVDVECLRR-R------------GLKVERMSKTVYTVD-----------WVPPECIAEVRRESL 208 Aeropyrum pernix K1 archaea>crenarchaeota
154496777 381 5 SIYLCRLLRHA--PED-AGLD--MDIH-GWVSTQ--QL--IDNVNKAg---------RHHLTMPQLEQLVATDS-KGRYRFSPD----------------------------------------------------------------------------------------------------------------------------------------------------------------KSRIKACQGHS--IPw---------VEPEL------------------------------TPAAPP---AYLYHGTTERAW-NAIQDSG-YISRMSRHAVHMQADEs-----------------------KAWQSACRWRQ-APVVLKIDAQAMAA-D------------GIPFGVSDNGVWCTE-----------QVDRKYVCTEQVDRK 179 Pseudoflavonifractor capillosus ATCC 29799 bacteria>firmicutes
268610712 382 5 SKYLCLLLRHQ--PEK-AGLD--MDEH-GWVSIE--QL--INGVNCHs---------SYKLDRELLEQIAAEDN-KGRYRFDEK----------------------------------------------------------------------------------------------------------------------------------------------------------------HEKIKCCQGHS--IPw---------VEPEL------------------------------EYCEPP---EFLYHGTTAKAL-EAIEESG-AIKKMKRHAVHMQADIg-----------------------KAWQSAERWHK-TPVVLKIAASEMNK-D------------GYKFGVTENEVWCTE-----------EVPVKYICTEEVPVK 177 Ruminococcus flavefaciens FD-1 bacteria>firmicutes
116252353 384 11 SKYMSYVLRHA--PDA-AGLT--LDSG-GWVSFD--EL--EKALASK-----------YDVSRAEIIEIVENNP-KKRFTLA------------------------------------------------------------------------------------------------------------------------------------------------------------------HNRIRANQGHS--VD----------IDLAL------------------------------NQAEPP---AALFHGTSLTNW-QSIEREG--LKKMQRHHVHLSADVe-----------------------TAKIVAARRKG-EHIILRVDAARMFS-E------------GHSFFVSDNGVWLAE-----------SVPVQYLLAESVPVQ 177 Rhizobium leguminosarum bv. viciae 3841 bacteria>proteobacteria>alphaproteobacteria
124003655 387 1 SKRLSYVLRHR--PEE-IELI--MDEE-GWVEVD--LL--LDRFSNN----------YFPITLADLQKVVAQND-KKRFAFSDD----------------------------------------------------------------------------------------------------------------------------------------------------------------EAYIRASQGHS--IQ----------IDLGY------------------------------EAIKPP---AQLYHGTATRFV-HSIREQG--LKKRNRHHVHLSADI------------------------DTATKVGGRHG-QPVILTVNALDMQQ-D------------GYKFFQSENGVWLTD-----------QVPVQYLEFPEENVQ 181 Microscilla marina ATCC 23134 bacteria
338211687 389 6 SKFLSLVLRHN--PAL-IGLD--LDAN-GWAPVK--EL--LAKMKAK----------GHGISMEELKHIVETNS-KKRFAFSEN----------------------------------------------------------------------------------------------------------------------------------------------------------------FEKIRANQGHS--VE----------VDLGY------------------------------EKQVPP---AVLFHGTAEKNF-DLILKDG--IKKMSRHHVHLSQDI------------------------TTARKVGMRHG-KPVVLSVDAKGMAD-G------------GFDFYLSNNGVWLID-----------FVPAEFIKVDDCFAE 176 Runella slithyformis DSM 19594 bacteria
312888255 390 2 SKFLSLVLRHQ--PEL-IGIE--MDEQ-GWVKVT--DL--LEKANAH----------GKALNMDVLKYVVDTNA-KKRFAFDES----------------------------------------------------------------------------------------------------------------------------------------------------------------QTYIRASQGHS--VE----------VELGY------------------------------LPQIPP---EILYHGTGSQSV-DAILKTG--LEKRARQHVHLSHDV------------------------ETATKVGSRHG-KPVILKVLAADMHQ-Q------------GYAFYLSENKVWITD-----------GVPAQFLEVFGVPAQ 180 Mucilaginibacter paludis DSM 18603 bacteria
110638931 391 14 SKFLSLVLRHQ--PEL-IGLQ--LNEQ-GWAHIE--TL--LEKSAAY----------GVSFDKQTLKYLVATNS-KKRFAFSPD----------------------------------------------------------------------------------------------------------------------------------------------------------------AEYVRASQGHS--VD----------IELGY------------------------------KNQKPP---EILYHGTAEKFM-QSILETG--LEKCRRQHVHLSSTI------------------------ETAIHVGQRHG-KPVVFTVLAQQMYA-N------------DFSFYLSDNGVWLTD-----------HVPVIYLTINPVPVI 191 Cytophaga hutchinsonii ATCC 33406 bacteria
146298511 395 1 SKFLSLVLRHS--PEK-IGLK--LDEN-GWADVN--EL--IEKCTKK----------GNRLDAELLDYVVENND-KKRFAYNED----------------------------------------------------------------------------------------------------------------------------------------------------------------KTKIRASQGHS--IS----------VELNL------------------------------AETEPL---EYLYHGTVGKFM-ESIQKEG--LKKMSRQHVHLSKDK------------------------ETAVKVGSRRG-VPQILTVRSGAMYR-D------------GFKFYLSENNVWLTD-----------EVPPKYIEFKSVPPK 180 Flavobacterium johnsoniae UW101 bacteria
256419129 396 1 SKFMSLVLRHQ--PET-IGIT--LDEN-GWTDVE--EL--LTRMSQH----------KHPITLAQLQEVVETND-KKRFAFSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GTKIRASQGHS--VD----------VSLGL------------------------------DPVTPP---EYLYHGTVARFL-DSIKKEG--LQKMSRQHLHLSKDR------------------------ETAVNVGSRRG-APYILTIRTGQMHR-D------------GFLFYLSDNGVWLTD-----------HVPPAYIEIDHVPPA 180 Chitinophaga pinensis DSM 2588 bacteria
163754445 398 6 SKFLSYVLRHN--PDK-LGIT--FDSN-GWTSVA--IL--LEKINVE----------PYSLSMEELEYVVATNN-KKRFAFNED----------------------------------------------------------------------------------------------------------------------------------------------------------------KTMIRASQGHS--VN----------IDLAL------------------------------QPKEPP---SYLYHGTVEKFI-TSIQEKG--LIKGTRQHVHLSADK------------------------ETAINVGSRRG-KPIILTIRSGEMYA-Q------------HHTFYQSENGVWLTE-----------EVPTEFIEFEEVPTE 179 Kordia algicida OT-1 bacteria
300774500 399 1 SKFLSLILRHQ--PES-IGLT--LDEN-GWADVE--EL--REKSAKR----------RIHFTPEELDEVVETNN-KKRFAFNED----------------------------------------------------------------------------------------------------------------------------------------------------------------KTMIRASQGHS--VN----------IDLAL------------------------------EALQPP---DFLYHGTAETNI-ASILEKG--IEKRTRQHVHLSADK------------------------ETAAKVGMRHG-KPVILTIRTGTMYQ-D------------GLAFFQSANGVWLTD-----------FVDAKYISKDFVDAK 178 Chryseobacterium gleum ATCC 35910 bacteria
333381571 400 1 GKFLSLVLRHD--PAK-IELE--LDEN-GWANVK--EL--IEKCRKH----------RYHFSMEDLIEIVETND-KQRYSFNEK----------------------------------------------------------------------------------------------------------------------------------------------------------------RNKIRANQGHS--ID----------IDLGL------------------------------SAVEPP---EYLYHGTATRFL-SSIMEQG--IVKGSRRHVHLSKDK------------------------ETAIKVGARHG-KPVILTIMSGKMYQ-D------------GILFYQSDNGVWLTN-----------YVDVKYILKQIVDVK 178 Dysgonomonas gadei ATCC BAA-286 bacteria
213962768 404 13 SKFLSLVLRHH--PEA-IGIS--LDTH-GWAEVN--VL--IKNMKRK----------FPVFSLKILEEIVATDS-KQRYAFSED----------------------------------------------------------------------------------------------------------------------------------------------------------------NTKIRANQGHS--LA----------VTLEL------------------------------QPQTPP---ECLYHGTASRFV-ESILKSG--LQKQTRQHVHLSMDI------------------------ATATKVGARHG-KPVIFKVNTIAMHK-A------------GYVFYLSANGVWLTD-----------EVPPKFLNLIVNNPK 181 Capnocytophaga sputigena ATCC 33612 bacteria
163814521 405 4 SRFMSLILRHR--PES-IGIS--LDEH-GWANVD--EL--LSGIGEQ-----------HPIDMDMLEEIVRADK-KQRYSFNED----------------------------------------------------------------------------------------------------------------------------------------------------------------KTLIRANQGHS--IP----------VDVEL------------------------------DEVSPP---EELWHGTGEKYV-QDIETEG--LLPKSRLYVHLSNDR------------------------DTAFKVGQRHG-KPVLYIVRSGEMYR-D------------GYKFYLSKNGVWLTK-----------AVPVKYLQKQAVPVK 179 Coprococcus eutactus ATCC 27759 bacteria>firmicutes
323140426 406 3 GRFLALVLRHK--PQA-VGIE--LDAH-GWAQVE--AL--LAAFNR-----------IEAFNMLMLEQIVAEDG-KQRFAFSED----------------------------------------------------------------------------------------------------------------------------------------------------------------KKRIRANQGHS--VK----------VDVEL------------------------------WEVAPP---ELLYHGTGVKYV-ASINRQG--LIARQRLYVHLSANV------------------------ETAHNVGKRHG-EPFIYVVLAGEMAR-A------------GYKFYLSANGVWLTE-----------SVPKKFLRELEGALD 176 Phascolarctobacterium sp. YIT 12067 bacteria>firmicutes
154497918 407 11 SKYMSLILRHK--PQV-IGIH--LDAH-GWADVN--AL--LAGISRK-----------YSINRDILDEIVSRDE-KQRYSFSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GTKIRANQGHS--IQ----------VDVEL------------------------------TLTEPP---EMLCHGTARRFA-ASIEAQG--LLSGSRLYVHLSPDQ------------------------ETAEKVGRRHG-EPVIYLVDAGQMHR-D------------GYCFYLSANGVWLTK-----------VVPATYLKRLEDRLT 183 Pseudoflavonifractor capillosus ATCC 29799 bacteria>firmicutes
167749542 410 7 SRYMALLLRHK--PEI-AGLV--LDKQ-GWADVD--ML--LKCISEN----------MEPVSFERLCEIVKNDS-KQRYSLSED----------------------------------------------------------------------------------------------------------------------------------------------------------------KSRIRANQGHS--VN----------VDVGL------------------------------KATVPP---EYLYHGTATRFV-ESIDSGG--IIRKTRLYVHLSRDT------------------------ETATQVGMRHG-KPFIYRVKSGEMAR-D------------GYVFYLSENGVWLTE-----------NVPVKYLEKTWQDDA 176 Eubacterium siraeum DSM 15702 bacteria>firmicutes
210621794 412 4 SRFISLILRHK--PET-IGIT--LDEH-GWANVE--EL--IVGVNKK-----------YPIDMQILEKIVDEDD-KNRYSFNED----------------------------------------------------------------------------------------------------------------------------------------------------------------KTMIRANQGHS--IS----------VDVEL------------------------------KKLNPP---DILYHGTGEKYV-ESIEKQG--LIRKNRLYVHLSNDI------------------------ETAEKVGKRHG-KPIIYEIDCKKMVE-N------------GIEFLKSENNVWLVE-----------SVPVKYLKKLSVPVK 175 Clostridium hiranonis DSM 13275 bacteria>firmicutes
336428119 414 1 ---MSYLLRHD--KDF-------IDEH-GWAPVT--EV--IHTLKKE----------WPEFNEECLSEIVRTDE-KGRYSYDEA----------------------------------------------------------------------------------------------------------------------------------------------------------------GVRIRANQGHS--VP----------VDVEL------------------------------KEAEPP---EILYHGTADRFL-NAIMEEG--LTGRSRIYVHLSSTT------------------------ETAVNVGKRHG-KPVVLKIYAGRMRD-A------------GYKFYLSQNQVWLTQ-----------KVPVEYIETLYPEQG 163 Lachnospiraceae bacterium 3_1_57FAA_CT1 bacteria>firmicutes
225388916 415 1 SVLISLVLRHK--PEA-AGIS--LDEH-GWADIE--TM--MAGMNAS----------GHRIDREMLEEIVRTDE-KGRYSLSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GTKIRANQGHS--VP----------VDVEL------------------------------SPVQPP---EILYHGTAERFA-HAIREGG--LLPMGRLYVHLSKDV------------------------ETVVKVGSRHG-KPVVFEVESGRMYR-D------------GIPFYLSCNGVWLTK-----------AVKPRYLKGREVKPR 178 Clostridium asparagiforme DSM 15981 bacteria>firmicutes
317056274 418 13 GRFISLVLRHE--PSA-AGIV--LDAE-GWADVD--EL--IHGICNT----------GRKLDMETLERIVRENN-KQRYSFNED----------------------------------------------------------------------------------------------------------------------------------------------------------------KTKIRANQGHS--IN----------VVINM------------------------------KIMSPP---EVLYHGTSEAFI-ESIKEKG--ISKMSRQYVHLSEDM------------------------DSAVKVGSRHG-KPAVLVIDTAKMSA-D------------GFVFRISENGVWQSD-----------DIPWKYVTEIKYPWK 180 Ruminococcus albus 7 bacteria>firmicutes
167769835 419 12 GRFLSLVLRHN--PAA-AQIT--LDEH-GWADVE--AL--LAGCARA----------GRRIGRDTLERIVRENS-KQRYSFNGD----------------------------------------------------------------------------------------------------------------------------------------------------------------HTKIRANQGHS--IA----------VDVEL------------------------------RQAQPP---ARLYHGTAMRFL-ESIRAQG--ITRQSRQHVHLSADY------------------------PTALAVGSRHG-RPVVLAIDAAAMAR-D------------GYVFYRSENGVWLCE-----------RVPWSYVLEDGAGLA 179 Anaerotruncus colihominis DSM 17241 bacteria>firmicutes
260889106 421 2 GKFISLILRHK--PEM-IGIE--LDRN-GWANVD--EL--INGINRS---gdvengkEERINFEILEEIVRNNS-KKRYEFNED----------------------------------------------------------------------------------------------------------------------------------------------------------------FTKIRACQGHS--ID----------VDLEL------------------------------KAVKPP---RILYHGTADRFL-EQIKKEG--LKKKSRQFVHLSETE------------------------ETAYSVGQRHG-KPFIIKVLAEKMYE-D------------GKEFFISKNGVWLTD-----------DIEVKYLEFDDIEVK 186 Leptotrichia hofstadii F0254 bacteria>fusobacteria
225620034 422 12 SKFVSLVLRHK--PEY-IGLE--LSKD-GWANVY--EL--IEKIKSK----------GRNINKDILERVVLYND-KKRFRFNEN----------------------------------------------------------------------------------------------------------------------------------------------------------------HTLIRANQGHS--IN----------VDLQF------------------------------EEKEPP---EILFHGTSINNI-DSIKHEG--IKKMNRLHVHLSLAE------------------------ETAKKVGERHG-KPTIIKINSKQMYE-D------------GIKFYLSENKVWLCD-----------YVDPKYIIEVIVDPK 182 Brachyspira hyodysenteriae WA1 bacteria>spirochaetes
167757534 423 8 GKFISLILRHK--PEL-IGLK--LDYH-GWAKVD--EL--LLGINNS----------GRFINRTLLDEIVMTNN-KQRYQYNED----------------------------------------------------------------------------------------------------------------------------------------------------------------HTKIRANQGHS--IK----------VDIEL------------------------------IEKIPP---EYLYHGTAFKYL-NKIEQEG--IKKMKRLYVHLSKDI------------------------ETAFKVGSRHG-KAIVLVIDTKAMCE-D------------GCKFYYSQNGVWLTE-----------DIDYKYVMEVIKDYK 176 Clostridium ramosum DSM 1402 bacteria>firmicutes
237742025 426 5 GRFISLILRHK--PET-IDLK--LDKN-GWANTK--EL--IEKISKS----------GREIDFEILERIVNENN-KKRYSFNED----------------------------------------------------------------------------------------------------------------------------------------------------------------KTKIRAVQGHS--ID----------VNLEL------------------------------KEVVPP---AILYHGTAFKNL-ESIKKEG--IIKMSRQYVHLSADV------------------------ETAKNVATRHSGKYIIFEIDTEAMLK-E------------NYKFYLSENKVWLTD-----------FVPCKFIKFDFVPCK 179 Fusobacterium sp. 4_1_13 bacteria>fusobacteria
110800227 428 7 SKYISLILRHK--PEE-IGLK--LDEH-GYLGVL--DL--IEGLNKS----------YEGFSMDDLERIVREDS-KGRYSFNED----------------------------------------------------------------------------------------------------------------------------------------------------------------KSKIRANQGHS--IK----------VDLGL------------------------------EPIKPP---KVLYHGTGRKYL-ESILKNG--LIKKERNYVHLSKDI------------------------ETASIVGKRHG-DLVILEVDSESMFN-D------------GIKFYLSKNNVWLCN-----------YVPKKYIKELNLEEV 177 Clostridium perfringens ATCC 13124 bacteria>firmicutes
150018230 429 10 SKFISLILRHK--PEE-IGLT--LDEY-GYISTP--DL--IKGLNKK----------GYKVTISDIERIVAEDG-KQRYSFNND----------------------------------------------------------------------------------------------------------------------------------------------------------------KTKIKANQGHS--IK----------VNLEL------------------------------QAIKPP---KVLYHGTASRFI-DSICKEG--IKKQNRQYVHLSADI------------------------ETATKVGKRHG-ELVIFKINSEQMNK-D------------GYKFFLSENKVWLTD-----------YVPVKYFEVFRTNVK 179 Clostridium beijerinckii NCIMB 8052 bacteria>firmicutes
224542154 431 1 SRRLSYILRHC--PES-IDLE--LDDH-GYGDVN--KI--LEAL---------------NITIEDLDMIVREDE-KQRYSYNGD----------------------------------------------------------------------------------------------------------------------------------------------------------------HTRIRANQGHS--IP----------VNVDL------------------------------KEVQPH---DILYHGTATRFV-PSILEEG--ILSQTRIYVHLSQDI------------------------ETAMTVGSRHG-EPYVFTIDTKQMYE-D------------GYKFYLSENNIYLTK-----------IIPAKYLKASTIPAK 168 Catenibacterium mitsuokai DSM 15897 bacteria>firmicutes
255103268 433 6 SIFISLILRHK--PET-IGIK--LDDY-GYADVN--EL--IEKINNT----------GRNINIEILEQIVKEDN-KQRYSFNDD----------------------------------------------------------------------------------------------------------------------------------------------------------------RSKIRANQGHS--IN----------VNVEL------------------------------RELEPP---KYLYHGTATRFL-DNIKNEG--IIKQSRLYVHLSRDI------------------------DIAVKVGKRHG-TPVILKINTGKMYE-N------------GYKFYLSENNVWLCE-----------YIPFKYVEIFEIPFK 177 Clostridium difficile QCD-63q42 bacteria>firmicutes
149175185 443 1 SKFLSLILRHQ--PET-VGIT--LDES-GWVDVD--IL--LAAMSQQ----------GKGMSRATLNTVVQSND-KQRFSFNAE----------------------------------------------------------------------------------------------------------------------------------------------------------------GTRIRANQGHS--IS----------VDLGY------------------------------TTAVPP---EILFHGTPEKFI-EPISREG--LKKMNRHHVHLHVDE------------------------QTSIAVGRRRG-RPVLLQVRAREMHQ-A------------GCEFFVTPNQVWLTE-----------SVPVEYIDFPSVPVE 181 Planctomyces maris DSM 8797 bacteria>planctomycetes
87311897 444 4 SKFLSLVLRHQ--PDK-IGIE--LDEQ-GWVEVA--TL--LAAIRRE----------SRPLTLAQLQEVVTRND-KQRFMFSSD----------------------------------------------------------------------------------------------------------------------------------------------------------------GLRIRAVQGHS--IE----------VELGY------------------------------EAAAPP---EYLLHGTPEQSV-AIILETG--LKKMKRHHVHLHHDR------------------------QTASAVGQRRG-KPVLLQIAAGRMHA-D------------GYSFYVTPNQVWLTD-----------EVPPAYLSILEVPPA 183 Blastopirellula marina DSM 3645 bacteria>planctomycetes
163849264 446 25 SKFLSLVLRHR--PEQ-IGLS--LDQH-GWAEVD--EL--IRCANRH----------GLPLSRAQLEQVVAEND-KQRFAFSAD----------------------------------------------------------------------------------------------------------------------------------------------------------------GRRIRANQGHS--LP----------VDLQL------------------------------TPAQPP---PVLYHGTAERFV-ESIKRDG--LLPGKRQYVHLSQDE------------------------TTALTVGQRHG-RPVVLTVHAAAMTA-A------------GYVFYVSANGVWLTK-----------QVPARFIEFPAVPAR 205 Chloroflexus aurantiacus J-10-fl bacteria>chloroflexi
171913881 447 4 SKFLSLVLRHK--PEE-IGLV--LDEA-GWASTD--KL--IDACNRH----------GPGLDLPTLQLLVNTNE-KKRFEFNAD----------------------------------------------------------------------------------------------------------------------------------------------------------------GSRIRASQGHS--VE----------VDLGY------------------------------TPQVPP---AVLHHGTVEDFL-DPIRSQG--LVKGERHHVHLSADP------------------------AIARIVGTRHG-KPVVLTVQASTMHT-A------------GHPFYLSTNGVWLTD-----------HVPARFIDFPSVPAR 183 Verrucomicrobium spinosum DSM 4136 bacteria
223939130 449 7 SKFLSLVLRHE--PGR-IGIQ--LDSA-GWVDVD--EL--LRACTAH----------QFPFSRDELNQVVATND-KKRFAFSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GKRIRANQGHS--VE----------VELQY------------------------------EPSVPP---EILYHGTADRFL-ASIQQDG--LIKGNRHHVHLSTEL------------------------STAISVGQRHG-RPLVFRVLAGQMHR-S------------GHQFFVSANGVWLAD-----------HIPANFLQIHTGEQN 177 Pedosphaera parvula Ellin514 bacteria
196229950 451 1 SKFLSLVLRHE--PEK-VGLE--LDSA-GWVEVE--ML--LAACRQH----------GVAIERAELEEIVVTNE-KKRFAFSDD----------------------------------------------------------------------------------------------------------------------------------------------------------------GRRIRANQGHS--IE----------VSLGY------------------------------TPQVPP---ARLFHGTATRFL-DSIRSDG--LKKMERHHVHLSADE------------------------ETAHKVGQRHG-KPLILLIKADAMHA-A------------NHSFFLSENGVWLTD-----------AVPVAFIEFPEDKTL 181 Chthoniobacter flavus Ellin428 bacteria
284038905 453 4 SKLLSLALRHK--PET-TGII--LDKN-GWTDVD--LL--IAKLQAQ----------SYPVNFEQLCYIVDTNN-KSRFAFNND----------------------------------------------------------------------------------------------------------------------------------------------------------------KSKIRANQGHS--VE----------VDLGY------------------------------MTEEPP---HFLYHGTATRFI-NQIIIEG--LKKMSRHHVHLSADE------------------------LTALRVGERHG-EPIVLTVKAKEMAA-N------------GHVFHRSENGIWLTD-----------FVPPSYLIYEFVPPS 181 Spirosoma linguale DSM 74 bacteria
118591032 454 6 SKRLSFWLRHK--PED-AGLT--LSHD-GWADVS--AV--LKAFSTL----------KLDCNRDQLERVVETND-KKRFEFSDD----------------------------------------------------------------------------------------------------------------------------------------------------------------GKRIRARQGHS--VD----------IDLGL------------------------------TALTPP---EILFHGTATRFL-PLILTEG--LKPMARHHVHLSPDR------------------------STALKVGSRHG-KPAVLQVAASAMQA-D------------GHTFYRTENGVWLTD-----------SVPATFLTQTETVST 176 Labrenzia aggregata IAM 12614 bacteria>proteobacteria>alphaproteobacteria
256394652 458 5 SKRMSSWLRHH--PEA-IGLE--MDGA-GWVRVD--EL--LAKAAAR----------GQAFSRAQLEEVVAENT-KKRFEFDET----------------------------------------------------------------------------------------------------------------------------------------------------------------ETLIRARQGHS--IP----------VELGY------------------------------ATAEPP---EVLFHGTAQNTL-TLIWRDG--LLPMKRHAVHLSPDK------------------------ETAVKVGSRHG-KPAVLAVAAARMHA-E------------GYTFFVTGNGVWLTD-----------AVPAEYLREVPALGE 173 Catenulispora acidiphila DSM 44928 bacteria>actinobacteria
257063188 459 1 SRHLSYLLRHH--PEA-AGLH--MDEH-GWVRVD--EL--VAAVAQK-----------HSFDQTTLERIVATDK-KGRYSFNED----------------------------------------------------------------------------------------------------------------------------------------------------------------RTLIRANQGHS--IP----------VDVEL------------------------------ACVTPP---DRLFHGTATRFA-ESIERQG--LLPQNRLYVHLSPDP------------------------ETAMVVGARHG-KPMVYVVDAKAMSA-A------------GHRFFLSVNGVWLVK-----------TVPPEYLTRMTVPPE 177 Slackia heliotrinireducens DSM 20476 bacteria>actinobacteria
149919906 460 1 GKRLAWLLRHE--PEA-WGLR--VDAH-GWMEVE--AL--LAAFAER----------GHALSRAELETHVAADG-KQRFILSSD----------------------------------------------------------------------------------------------------------------------------------------------------------------GARIRAVQGHS--IA----------VDLEL------------------------------DERPPP---AQLFHGTPRRFV-DSILREG--LIPKARHHVHLSADE------------------------ATARQVGARRG-PPVILLVDAATMAA-D------------GHRFFVSANGVWLCE-----------RVPPEHLRVANVPPE 173 Plesiocystis pacifica SIR-1 bacteria>proteobacteria>deltaproteobacteria
302525419 463 1 SKRLSRHLRHD--PGG-LGLT--LAPG-GWVPVD--EL--LAALARN----------RFPVSRAELDEVVANCA-KQRFAFDGT----------------------------------------------------------------------------------------------------------------------------------------------------------------GTLIRASQGHS--VR----------VDLEL------------------------------SDAVPP---EILYHGTATRFL-PSIRAEG--LRPMKRHAVHLSATR------------------------ETAWKVGSRHG-KPVVLTVAAGEMAA-R------------GHVFQVSDNGVWLAP-----------AVPAEFLTVAEVPAE 178 Streptomyces sp. AA4 bacteria>actinobacteria
300784169 464 5 SKRLSRHLRHD--PAA-LGLT--LTSD-GWAPVD--AL--VRALA---------------ITRAQLDEVVEKNS-KRRFAFDET----------------------------------------------------------------------------------------------------------------------------------------------------------------GTRIRASQGHS--VP----------VELGL------------------------------PDTTPP---DVLYHGTVAKYL-DAIFREG--LRPMNRHAVHLSATV------------------------ETAGIVGARRG-KPVILRVDAAAMAA-E------------GHPFQISANEVWLTP-----------SVPPHHLASLTVPPH 168 Amycolatopsis mediterranei U32 bacteria>actinobacteria
297564265 466 1 SKLLSRVLRHD--PAR-VGVR--LDPR-GWAGVD--EL--LAGCRRA----------GVRLSRAALQEVVDTND-KKRFVLSPD----------------------------------------------------------------------------------------------------------------------------------------------------------------GTRIRAQQGHS--VR----------VDLGL------------------------------EPSTPP---ALLYHGTVGRLL-PAITAEG--LRPMRRHDVHLSPDT------------------------ATARRVGARRG-APVVLTVASGRMHG-D------------GHVFRVTGNGVWLVP-----------AVPPEYLGEPVVPPE 181 Nocardiopsis dassonvillei subsp. dassonvillei DSM 43111 bacteria>actinobacteria
256379719 467 1 SKRMSRCLRHD--PGR-YGLA--LDAA-GWVDLG--GL--VRALR---------------TSREAVLEVVERNN-KRRFTVR------------------------------------------------------------------------------------------------------------------------------------------------------------------GDRIRADQGHS--VA----------VELGL------------------------------AQVEPP---GVLFHGTNAKAL-PDVLVEG--LRPMNRHAVHLSTDL------------------------ATATQVGARRG-RPVVLEVDAARMHA-E------------GHAFSVSENGVWLVA-----------AVPPDYLRQRAVPPD 171 Actinosynnema mirum DSM 43827 bacteria>actinobacteria
182437433 468 1 SKYLSKHLRHQ--PER-IGLT--LDEN-GWVAVE--EL--LRAAARH----------GFAFSRAELDHVVAAND-KRRFTVENG--------------------------------------------------------caadgvh-------------------------------------------------------------------------------------------------GDRIRANQGHT--VA----------VDLDL------------------------------PPAEPP---AHLYHGTVARVM-DAIRTEG--LRPMARHHVHLSPDR------------------------ETATRVGARRG-RPLVLTVDAGAMHR-A------------GHVFRVSANGVWLAD-----------AVPPRFLLADAVPPR 185 Streptomyces griseus subsp. griseus NBRC 13350 bacteria>actinobacteria
284988800 471 1 SKRLSYVLRHA--PGS-VGLT--LDAA-GWADVD--AL--LAALG---------------WTRAELERVVATND-KRRFALDGT----------------------------------------------------------------------------------------------------------------------------------------------------------------GTRIRASQGHS--VA----------VDLGY------------------------------AAQTPP---PVLFHGTAERNV-PAIEAGG--LRPGRRHAVHLSPDE------------------------VTARRVGARHG-RPVVLRVDAAGMAA-V------------GAVFTRSANGVWLVD-----------AVPPAFLTVVGVPPA 173 Geodermatophilus obscurus DSM 43160 bacteria>actinobacteria
311899069 473 7 SKTLSRILRHD--PGA-VGIT--LDAA-GWVEVD--AL--LAALARH----------GRRLSRAELDHVVATND-KRRFAYSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GRSIRASQGHT--VE----------VDLGL------------------------------PAATPP---DTLFHGTAERTL-RHVLAEG--LRPMSRRDVHLSADT------------------------ETAVKVGSRHG-RPVVLAVDAAAMAR-D------------GYEFRASANGVWLTD-----------AVPVGYLRRTPVPVG 184 Kitasatospora setae KM-6054 bacteria>actinobacteria
296130288 477 5 SRFLSYVLRHR--PDA-AGLT--LDAA-GWVDVD--VL--LAALAAH----------GHTATPEDLRYLAEDVPGKKRLELRD-----------------------------------------------------------------------------------------------------------------------------------------------------------------G-RVRAAQGHS--VR----------VDLGL------------------------------APVVPP---ATLFHGTATRFL-DRILVDG--LRPMSRQHVHLSADR------------------------ATATDVGSRHG-RPVVLLVDAAAMHA-G------------GAAFYRAANGVWLTD-----------AVPPEHLRREVVPPE 172 Cellulomonas flavigena DSM 20109 bacteria>actinobacteria
330469061 478 3 SKFLSYVLRHR--PDA-VGVT--LDEA-GWVPVD--VL--LAALARH----------GRPVTPALLDQLVGNTD-KQRFEVRE-----------------------------------------------------------------------------------------------------------------------------------------------------------------G-RIRAAQGHT--IA----------VDLQL------------------------------APAVPP---TVLYHGTVARFL-PGIRVEG--LTSGERTHVHLSSDL------------------------DTAARVGARRG-KPVVLRIDAAGMHV-A------------GLVLYRAANGVWLTR-----------HVPPRFITLPSVPPR 178 Verrucosispora maris AB-18-032 bacteria>actinobacteria
159038434 479 5 GKALAYVLRHR--PDA-VGLQ--LDSA-GWVEIP--AL--LSAMADA----------GHTIGEADLDRIVAGSD-KKRYEVRA-----------------------------------------------------------------------------------------------------------------------------------------------------------------R-RIRAAQGHS--VR----------VELGL------------------------------EPTIPP---AVLYHGTVARFL-EAIRREG--LRPGERTHVHLSADA------------------------STARQVGERRG-APVVLEIEAKRMYA-D------------GHSFLLAANGVWLVA-----------HVPPDYLALTDVSPD 175 Salinispora arenicola CNS-205 bacteria>actinobacteria
159901400 482 1 SKYLSKHLRHQ--PER-LGLT--LEPG-GWVGVE--QL--LAACAAN----------NVAISLAELHEVVEQNN-KQRFGFDPT----------------------------------------------------------------------------------------------------------------------------------------------------------------GQKIRAHQGHS--VT----------VDLGL------------------------------VAQQPP---IILYHGTAKHNL-AIILRDG--LRPMQRQHVHLSRDR------------------------ATALQVGARHG-QAVILIVQADELFQ-A------------GQAFFCSDNGVWLTT-----------AIDPAYLALERIDPA 178 Herpetosiphon aurantiacus ATCC 23779 bacteria>chloroflexi
67921554 483 20 SRFLSYHLRHA--PEK-LGLE--LEPG-GWISTE--KL--LKACQNT----------KFTLTFSDLETVVKDND-KQRFSFNEA----------------------------------------------------------------------------------------------------------------------------------------------------------------KTKIRANQGHS--VN----------IDLQL------------------------------EPLIPP---VILYHGTHQKVV-KTILKEG--LKKMARHHVHLSERK------------------------ETALKVGSRRG-KPVIFVIKAQQMSE-D------------GCIFYCSDNGVWLVD-----------YIDPKYLTIKYIDPK 197 Crocosphaera watsonii WH 8501 bacteria>cyanobacteria
300868996 484 1 SKYLSRHLRHT--PER-LGIE--LSPG-GWVAVD--RL--LAASSDR----------NFPIQLAELKEVVAKND-KQRFSFDST----------------------------------------------------------------------------------------------------------------------------------------------------------------GTLIRANQGHS--IT----------VDLQL------------------------------EPAVPP---DVLYHGTGKGAV-ESILKSG--ICKMSRHHVHLSVNI------------------------KTAQKVGARHG-LPVVFTIAAEAMHD-R------------GYTFYCSENGVWLVE-----------YVPPEYLKLTYVPPE 180 Oscillatoria sp. PCC 6506 bacteria>cyanobacteria
307150228 485 1 SKYLSYHLRHH--PEE-LGLE--LAPG-GWVEVE--KL--LAACLEA----------QFPLTREELEEVVTNND-KQRFSFDQT----------------------------------------------------------------------------------------------------------------------------------------------------------------KTLIRANQGHS--VP----------VDLQL------------------------------TSLAPP---EILYHGTSTKAV-PSILSQG--LLKMARHHVHLSTTI------------------------EAARKVGQRQG-KPVVFELDAAAMYQ-A------------GYQFFVSENGVWLVE-----------TVPPAYLRQIYPLLV 178 Cyanothece sp. PCC 7822 bacteria>cyanobacteria
168698114 489 1 SKFLSKVLRHE--PES-AGLT--LERG-GWVPIV--DL--LSGLARS----------GTRISREDLDVVVSECE-KQRFAIDDT----------------------------------------------------------------------------------------------------------------------------------------------------------------GTKIRANQGHS--AE----------VELQF------------------------------EPVEPP---TELYDGTTETNI-SSVLRDG--LLKMARHHVHLSADG------------------------TTARKVGGRHG-KPVVITVHAAQMSA-D------------GYIFYRSANGVWLVD-----------HVPPQYLRLDHVPPQ 178 Gemmata obscuriglobus UQM 2246 bacteria>planctomycetes
302868056 490 1 SKRLSLALRHR--PDT-FGLR--LDRA-GWVPVA--DV--LAGLR---------------ISRAQLDAVVAGND-KQRFAVEAGpd-------------------------------------------------------------------------------------------------------------------------------------------------------------gADRIRANQGHS--VP----------VDLGL------------------------------TPAAPP---PRLFHGTGEAVL-DAIRAQG--LRRGGRHHVHLSPDV------------------------ATARRVGARRGGAVVVLTVDAAAMAE-A------------GYLFYRSANGVWLTD-----------TVPPPYLLTDTVPPP 177 Micromonospora aurantiaca ATCC 27029 bacteria>actinobacteria
320333790 491 1 SRRLSYLLRHA--PHE-AGLT--LEPG-GWVRVD--DL--LAGLRRL----------GVAATREAVETVVRTND-KRRFSLDGA----------------------------------------------------------------------------------------------------------------------------------------------------------------GERIRANQGHS--VP----------VDLEL------------------------------TPSVPP---DALYHGTVRAAT-GDIFREG--LRPMARHHVHLSPDT------------------------ATAVRVGARRG-RPVVLRVDAAGMHA-A------------GHRFYCSENGVWLTD-----------TVPPAFLSVLPADGT 177 Deinococcus maricopensis DSM 21211 bacteria>deinococci
226355053 492 1 LSYL---LRHA--PQK-AGLT--LEPG-GWAPLA--PV--LAHLN---------------VTRAQVERVVATNN-KQRFTLN------------------------------------------------------------------------------------------------------------------------------------------------------------------GERIRANQGHS--VE----------VDLRL------------------------------PLTVPP---ARLYHGTHPGVL-AAIQHEG--LRPMQRHHVHLSSDP------------------------ETARQVGARRG-TPVILTVQSGAMYD-A------------GHSFYRSDNGVWLTE-----------AVPPEFLNFPAVPPE 171 Deinococcus deserti VCD115 bacteria>deinococci
325283812 495 1 SKRLAYLLRHA--PHE-AGLT--LARG-GWVPLA--PL--LAHLR---------------VTRGQVERVVREDE-KGRFGLSEG----------------------------------------------------------------------------------------------------------------------------------------------------------------GDKIRATQGHS--VP----------VDLGL------------------------------EPQVPP---ATLYHGSHQGAR-VGITRHG--LKAMSRHHVHLSADT------------------------DTALKVGLRRG-WPLLFAVDAARLHA-D------------GFTFYRSENGVWLVD-----------AVPPAYLSELPTPGQ 170 Deinococcus proteolyticus MRP bacteria>deinococci
291300690 1 6 SKKLSYVLRHD--PAS-IGVT--VDAA-GWIDID--TL--LAALTRH----------GTTVSRQQLDAVVATND-KQRFTIDA------------------------------------------------------------------------------------------------------------------------------------------------------------------ERIRANQGHS--IT----------VDLGL------------------------------KARVPP---ARLFHGTATTRL-ASILDTG--LRRGTRHHVHLSTDT------------------------ATAAKVGSRHG-IPAVLTIDAAGMHD-H------------GHEFFVSANGVWLVD-----------SVPATYLTAQSVPAT 181 Stackebrandtia nassauensis DSM 44728 bacteria>actinobacteria
258545015 2 12 SKRLSFILRHQ--PQS-IGIT--LDAQ-GWVDVA--IL--LQQLNAH----------GTAIDRALLDHVVATNP-KQRFSYDAS----------------------------------------------------------------------------------------------------------------------------------------------------------------GTKIRANQGHS--VA----------IDLAY------------------------------TPCVPP---ETLYHGTARSTF-AAIRESG-GLDKRTRHHVHLSSDV------------------------ETAMKVGQRHG-KPLVLRIAAGEMQR-D------------GHVFYQSDNGVWLTE-----------HVPLAYISADAVPLA 181 Cardiobacterium hominis ATCC 15826 bacteria>proteobacteria>gammaproteobacteria
226330224 4 8 SRFLSYILRHA--PES-IGLT--LDDQ-GWGEIS--TL--ISLAQKN----------GTPLTLKLIKDVVETND-KKRFAISED----------------------------------------------------------------------------------------------------------------------------------------------------------------GFFIRAVQGHS--LK----------TTVDY------------------------------QAITPP---KILYHGTATRFI-TSIFDQG--LIPNGRQYVHLSQDY------------------------KTAVNVGNRHG-KAVVLTVDSEKMFS-E------------GFEFYQADNGVWLTL-----------SVPAKYLKIDENEAK 176 Proteus penneri ATCC 35198 bacteria>proteobacteria>gammaproteobacteria
225075180 5 3 SKFLSFILRHH--PEQ-IGIT--LDKD-GWVDID--TL--LTQVNHP-----ergftGNPLTYEVLLEVVENND-KKRFTLSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GKRIRAAQGHS--TA---------QVQVEH------------------------------KVATPP---QILYHGTAERSV-PSIMEQG--LHSASRHFVHLSADA------------------------ATAVNVGSRHG-KPVVLTIDTVAMLA-A------------GHQFYLADNGVWLTE-----------NVPPQFILTENVPPQ 186 Neisseria flavescens NRL30031/H210 bacteria>proteobacteria>betaproteobacteria
308446799 6 4 SKFLSLVLRHQ--PET-IAIQ--LDSE-GWTDVH--IL--LQQMIKH----------KRPLKLVELIEVVESSD-KKRFQLSPD----------------------------------------------------------------------------------------------------------------------------------------------------------------QSKIRAVQGHS--SA---------QVQREY------------------------------AAITPP---DTLFHGTATRFV-NSILEKG--LISGERHHVHLSADL------------------------VTAQKVGQRHG-KVIIFILDTKQMHQ-D------------GFRFYCAENGVWLTE-----------QVPIKYLKLFESNQK 183 Caenorhabditis remanei eukaryota>metazoa>nematoda
225023628 9 9 SKFLSYILRHH--PEA-IGLT--LDGE-GWADVD--EL--LTQAAAH----------GRNISLPLLHEVVATNN-KKRFTLSAD----------------------------------------------------------------------------------------------------------------------------------------------------------------GGKIRAEQGHS--TA---------QVDIAY------------------------------TETEPP---EILYHGTAQRFA-EAIEEQG--LLPGSRHYVHLSGDV------------------------ETAVSVGSRHG-KPLVLEVQAGLMRQ-Q------------GFVFYLTANKVWLIK-----------EVPSQFLRRMEVPSQ 178 Eikenella corrodens ATCC 23834 bacteria>proteobacteria>betaproteobacteria
15891357 11 6 SKFLSYVLRHA--PES-IGLV--LDSQ-GWADVA--DL--LAKANAS----------GTPLDEAGLRAVVAESD-KKRFTLSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GRRIRAAQGHS--VK----------VDLGQ------------------------------PPVEPP---PQLFHGTATRFL-EPILREG--LRPGERQQVHLSADR------------------------TTALAVGQRHG-KPVVLIVDAGQMFA-D------------GCRFYLADNGVWLTD-----------AVPFSYLTVSADSSA 174 Agrobacterium tumefaciens str. C58 bacteria>proteobacteria>alphaproteobacteria
213966822 12 1 SKLLSYVLRHA--PES-MGLT--LDRD-GWCEVD--EL--VGKANAN----------GHSFDRQALKEVVETNE-KKRFTLSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GQRIRAAQGHS--TR---------LVQVQH------------------------------IEKEPP---ARLYHGTASRFM-ASIETQG--LIAGSRHHVHLTEDP------------------------ETALSVGKRYG-QPVLLAVDAKGMFE-A------------GVQFFQADNGVWLVE-----------AVPIEWLTKVADTVS 179 Pseudomonas syringae pv. tomato T1 bacteria>proteobacteria>gammaproteobacteria
32476856 36 4 SKFLSLVLRHQ--PGV-IGMT--LDEQ-GWLEID--GL--IANANTR----------GKKLTLELIHEVVATND-KKRFVLSDD----------------------------------------------------------------------------------------------------------------------------------------------------------------GLRIRASQGHS--VA---------GVDLNL------------------------------TEANPP---ATLYHGTVDAFL-PRIREQG--LQKRSRNHVHLSADE------------------------ATATNVGSRRG-KPKLLLIAAQRMHQ-D------------GHIFYLSENEVWLVD-----------SVPPTYLTFPTVPPT 183 Rhodopirellula baltica SH 1 bacteria>planctomycetes
325928686 16 7 SKFLSYVLRHA--PQS-IGLT--LDRE-GWADID--AL--IAAATAA----------GRALDADLIRAVVSSND-KQRFALSAD----------------------------------------------------------------------------------------------------------------------------------------------------------------GRQIRAVQGHS--TA---------TVALVH------------------------------MPRTPP---SMLYHGTATRFL-EAILAQG--LQPGQRHHVHLSADP------------------------KTATTVGARHG-APSVLRVHSLQMHE-D------------GHVFYQADNGVWLTR-----------HVPPNYLHLVQVPPN 180 Xanthomonas perforans 91-118 bacteria>proteobacteria>gammaproteobacteria
170683612 18 5 SKFLSFVLRHK--PES-IGIV--LDRE-GWADID--KL--ILCAQKA----------GKRLTRALLDTVVATSD-KKRFSYSSD----------------------------------------------------------------------------------------------------------------------------------------------------------------GRCIRAVQGHS--TS---------QVAISF------------------------------AEKTPP---QFLYHGTASRFL-DEIKKQG--LIAGERHYVHLSADE------------------------ATARKVGARHG-SPVILTVKAQEMAK-R------------GLPFWQAENGVWLTS-----------TVAVEFLEWPFMPAG 185 Escherichia coli SMS-3-5 bacteria>proteobacteria>gammaproteobacteria
260554979 19 1 SQYLSFILRHK--PEE-IGLT--LDRE-GWANIE--EL--ISKSQPV---------kNVALDEEIIKNIVSNSD-KKRFQISDD----------------------------------------------------------------------------------------------------------------------------------------------------------------GKLIRAVQGHS--TT---------SVDITL------------------------------NKLKPP---TYLYHGTAQRFI-DSIKEQG--LISKDRQYVHLTENR------------------------DTALTVGARYG-KPEILVIDALKMHD-S------------GFEFFQAENGVWLSK-----------HVPIEFIAFKHVPIE 179 Acinetobacter baumannii ATCC 19606 bacteria>proteobacteria>gammaproteobacteria
330977809 21 1 SKFLSYVLRHE--PEA-IGLE--LSRD-GWADID--ML--IACAAKN----------EQVFDRDFLERVVAESE-KKRFLISED----------------------------------------------------------------------------------------------------------------------------------------------------------------RRYIRAAQGHS--NS---------SVSIQY------------------------------TQVVPP---EFLYHGTATRFL-ESIFKEG--LVAGARHYVHLSESK------------------------ETARSVGLRYG-KPIVLEIEALHMHN-L------------GFKFFQAENNVWLID-----------KVPASWLVLKGVPAS 179 Pseudomonas syringae pv. aptata str. DSM 50252 bacteria>proteobacteria>gammaproteobacteria
172064765 25 29 SKFLSFVLRHA--PES-IGLQ--LDRE-GWASID--SV--LAGAITQ----------PFTLNREILHIVVSESD-KKRFEISAD----------------------------------------------------------------------------------------------------------------------------------------------------------------DQWIRAVQGHT--SS---------SVRREY------------------------------VEKQPP---EFLYHGTVERFL-DSILEQG--LHQGTRHHVHLSASI------------------------ETAISVGKRRG-KPVVLKIDSSRMYR-Q------------GFKFFLTENGVWLTG-----------AVPVDFIEILTVPVD 208 Burkholderia ambifaria MC40-6 bacteria>proteobacteria>betaproteobacteria
322832748 27 1 SKFLSYILRHK--PDT-IGLQ--LDVE-GWADIN--SL--ILGAAKE----------GRVLDQAIIQTVVNSSD-KKRFTLSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GQRIRAVQGHS--TP---------DVNLQH------------------------------MEKKPP---EFLYHGTATRFL-ESILQQG--LIAGSRHHVHLSQDI------------------------TTAVAVGQRYG-KPAVLKVEALRMHQ-Q------------GFNFFQAENGVWLTN-----------HVPNFFIYQEHVPNF 179 Rahnella sp. Y9602 bacteria>proteobacteria>gammaproteobacteria
107099046 29 1 SKFLSYVLRHQ--PEA-IGLT--LDGE-GWADID--AL--IAGAARD----------GRALDRVLLGAVVENND-KKRFALSAD----------------------------------------------------------------------------------------------------------------------------------------------------------------DQRIRAVQGHS--HA---------AVAIAY------------------------------APAVPP---AVLYHGTASRFL-DSIRERG--LVPGSRHHVHLSARR------------------------ATALEVGRRYG-SPVLLEIDARDMHL-A------------GHLFHQAENGVWLTE-----------RVPVRFIREARVPVR 179 Pseudomonas aeruginosa PACS2 bacteria>proteobacteria>gammaproteobacteria
70733133 30 1 SKFLSYVLRHE--PQA-IGLE--LDSE-GWGDID--AL--ISGAAKN----------GRQLSRELIELVVEGND-KKRFALSAD----------------------------------------------------------------------------------------------------------------------------------------------------------------SRRIRAVQGHS--NK---------AVQLQL------------------------------EAKQPP---AVLFHGTATRFM-DSINEKG--LIPGSRHHVHLSQEI------------------------DTARAVGQRYG-KVVILQIDAQAMQA-Q------------GFTFYQAENGVWLTD-----------QVPVGFIKALQVPVG 179 Pseudomonas fluorescens Pf-5 bacteria>proteobacteria>gammaproteobacteria
53718401 35 10 SKFLSYVLRHR--PDS-IGVT--LDAQ-GWADVS--EL--LTKAAAA----------GMALTLDELKQVVAEND-KKRFVLNDD----------------------------------------------------------------------------------------------------------------------------------------------------------------ATRIRAAQGHS--VD----------VDLQL------------------------------PVKAPP---PVLYHGTVGKSM-ADIRKQG--LTPMNRHDVHLSPDR------------------------ETATRVATRRG-KPVILVIETYPLLR-D------------GYQFRVSDNGVWLVP-----------EVPAKYIKFPGVPAK 183 Burkholderia pseudomallei K96243 bacteria>proteobacteria>betaproteobacteria
307946056 39 6 SKFLSYVLRHK--PEA-IGLS--MDEA-GWVAID--EI--LEKAN-------------RPISRELIEQIVAEND-KQRFAISSD----------------------------------------------------------------------------------------------------------------------------------------------------------------GRQLRANQGHS--VS----------VDLKL------------------------------KPKEPP---AELFHGTASRFL-DSIFEKG--LVPGTRQHVHLSANV------------------------ETALKVGQRHG-KPVILAVPALEMHQ-S------------GHFFFLSENGVWLTH-----------AVPANKLVLHDNNAN 176 Roseibium sp. TrichSKD4 bacteria>proteobacteria>alphaproteobacteria
329847506 41 1 SKFLSLVLRHQ--PET-IGLT--LDAH-GWTSVD--DL--LKRMAAH----------GKFLTREKLERVVAEND-KKRYTLSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GLRIRAAQGHS--VK----------VDLAL------------------------------LPALPP---DILYHGTATRFV-ESIMTEG--LKPQSRQQVHLSLDY------------------------ATASKVGQRHG-KPYIFRVEAGRMQA-D------------GHLFFRADNGVWLTD-----------AVPPQYLIAPDSAAQ 178 Asticcacaulis biprosthecum C19 bacteria>proteobacteria>alphaproteobacteria
296114887 43 15 SKFLSLVLRHA--PER-IAIS--LDPQ-GWVETT--IL--IRQARRH----------GQTFDLPSLQRVVRDND-KQRFTLSPD----------------------------------------------------------------------------------------------------------------------------------------------------------------GKRIRAAQGHS--IA----------VDLAL------------------------------PPAIPP---AVLWHGTARTSL-ESIFRDG--LLPGRRRHVHLSNDE------------------------ATAMTVGTRHG-RAVVMRVAAGRMHD-D------------GLTLWRADNGVWLTD-----------GVPPCYLSFAGVPPC 188 Gluconacetobacter hansenii ATCC 23769 bacteria>proteobacteria>alphaproteobacteria
84499293 45 1 ------------------------------------------------------------MSRGHLVRLVADDN-KRRFTLSEG----------------------------------------------------------------------------------------------------------------------------------------------------------------GERIRAAQGHS--LA----------VDLTL------------------------------APQSPP---AVLYHGTNRQSL-DSIFQSG--LLSGRRQFVHLSADV------------------------DTALDVGTRHG-KPIVLSVEAGAMSR-G------------GHQFWVADNGVWLTR-----------QVPAQFLAFAPRHDP 131 Oceanicola batsensis HTCC2597 bacteria>proteobacteria>alphaproteobacteria
84499284 42 1 SKFLSRVLRHE--PEL-IAIQ--LDPQ-GWVSVD--DL--LRRLKKV----------GHGMSREQLREIVETND-KRRFTLSAD----------------------------------------------------------------------------------------------------------------------------------------------------------------GRRIRAAQGHS--VD----------VDLGL------------------------------TPLVPP---EFLYHGTAAQNL-DAIFETG--LNPGRRRQVHLSPEP------------------------ETANRVGQRHG-KPTVLRVEASKMHA-D------------GFVFTCSDNGVWLTD-----------SVPAAYLGFGVMLAA 175 Oceanicola batsensis HTCC2597 bacteria>proteobacteria>alphaproteobacteria
84501233 44 1 SRFLSLILRHK--PEE-VGLK--LGPG-GWVRID--EL--LVAMKRA----------GRRLTRDHLIEIVEQND-KKRFTISSD----------------------------------------------------------------------------------------------------------------------------------------------------------------GERIRAAQGHS--LD----------VDLGL------------------------------PAQDPP---DELFHGTARAHL-DEIFSAG--IIPGRRRLVHLSVDI------------------------ATALTVGGRHG-KPVVLTVAAKAMHQ-D------------GHKFYRADNGVWLTD-----------HVPTSYLSFATIRTS 175 Oceanicola batsensis HTCC2597 bacteria>proteobacteria>alphaproteobacteria
221067794 50 35 SKFLSLVLRHS--PET-IGLT--LDEA-GWARTD--EL--LACLARS----------GRPTRLEELQRIVADNN-KQRYSFSAD----------------------------------------------------------------------------------------------------------------------------------------------------------------GKHIRANQGHS--IK----------VELGL------------------------------EASSPP---AVLYHGTATRFL-DAIFHEG--LNRQSRHHVHLSDSV------------------------EVAAQVGSRHG-KLALLQVDAARMQG-E------------GHVFYRSDNGVWLTD-----------VVPVRYLLKLPSPVR 212 Comamonas testosteroni KF-1 bacteria>proteobacteria>betaproteobacteria
333912499 51 3 SKFMSLVLRHN--PGR-AGLA--LDAQ-GWVSID--AL--LRGAQAA----------GRNISPALLMEVVRSCP-KQRFAISAD----------------------------------------------------------------------------------------------------------------------------------------------------------------GLRIRASQGHS--VQ----------IDLGL------------------------------QASVPP---QRLYHGTATRFL-DSILRTG--LDRRNRHHVHLTDNL------------------------ATARSVGQRYG-RLVLLEIDAARMHA-D------------ACLFYRSDNGVWLTD-----------SVAPHYLRVLAEEEH 179 Delftia sp. Cs1-4 bacteria>proteobacteria>betaproteobacteria
158337724 53 2 SKFLSYILRHR--PEA-ISLE--LNAG-GWAAIS--EL--IQCASKH----------DHFLSEEIIKEVVVSND-KKRFKLSED----------------------------------------------------------------------------------------------------------------------------------------------------------------GQYIRANQGHS--IR----------VDLDL------------------------------LPLTPP---DVLFHGTATRFL-ASIMAKG--LLPSGRQHVHLSASY------------------------ETAIAVGRRHG-KPTVLEINAQKMQG-D------------GYLFYRSENGVWLTD-----------HVPAQYFVEVEVPAQ 177 Acaryochloris marina MBIC11017 bacteria>cyanobacteria
330983843 54 95 GRYLAAILRHKKISDN-IGLK--HDAQ-GWMSIA--DI--IEKSTAN--------rkAPPLSVEIIDLAVQHCD-KQRYAISPD----------------------------------------------------------------------------------------------------------------------------------------------------------------RCHIRAKQGHS--FP----------VDLGL------------------------------KAEIPP---VVLYHGTVDRFF-SSIMREG--LTPQKRQHVHLSHEKe-----------------------TALNVGGRRKG-EVIILEIDAKAMLA-N------------GHVFHLSENGVWLTE-----------AVPSQYINTEAVPSQ 277 Pseudomonas syringae pv. lachrymans str. M301315 bacteria>proteobacteria>gammaproteobacteria
34497880 58 35 SRFLSLVLRHQ--PET-IGLQ--LDDQ-GWADIG--EL--LARLAAK----------GRNLGRKQLEKIVLDND-KQRFAISED----------------------------------------------------------------------------------------------------------------------------------------------------------------GLRIRANQGHS--IK----------IDLGL------------------------------AACEPP---DRLYHGTASRFL-DAILAEG--LRPGQRQHVHLSADG------------------------QTARKVGARHG-KPVVLEIDARAMRQ-A------------GLAFYRSDNGVWLID-----------GVPPVFIRQTEARPV 203 Chromobacterium violaceum ATCC 12472 bacteria>proteobacteria>betaproteobacteria
83643039 59 15 SKFLSLVLRHQ--PEL-IQLP--LDAN-GWADIE--VL--LAGAARQ----------GVNISLQDVLEIVATND-KQRFALSGD----------------------------------------------------------------------------------------------------------------------------------------------------------------KRRIRASQGHS--ID----------VDLQL------------------------------TPVTPP---DELYHGSATRFT-DAILATG--LQPGQRRHVHLSADV------------------------ETAHKVGSRHG-KPVIFRIDAKALTL-A------------GHAFYLSANQVWLTD-----------AVPPQYLSLLDTSPQ 179 Hahella chejuensis KCTC 2396 bacteria>proteobacteria>gammaproteobacteria
325189229 64 17 SKKLSYALRHG--ALD-LKLD--MTTD-GYVDTS--HL--LAKSMFA------------SYTISDIERVVETND-KKRYEMRRD--------------------------------------------------------------------------------------------------------------------------------------------------------------geGKFIRATQGHS--LK--------IVNDEHLL--ALVS-----------------------DANEI----EHCIHGTLEQNW-TQIENSG--LSSMKRNHIHFTTQEf-----------------------GAQVISGMKQT-SELMVYINIRQAMQ-H------------GIKFYRSSNNVLLTRGIND-----SGTLPVRYVDSGTLPVR 198 Albugo laibachii Nc14 eukaryota>stramenopiles
254578506 68 9 SKSLSYLLRHG--ALK-EKLP--IDAN-GYVPLQ--VL--LAHNRLK----------SHRCTLEDVHRIVDSNE-KKRFHTKVSs-------------------------------------------------------------------------------------------------------------------------------------------------------------egQELICATQGHS--IK-------SVLPTEDVL--HEIR-----------------------DPKELP---PKLVHGTTVHNA-LLILQSG-AIKKLRRNHVHLSPGVtgv---------------------DAAVVSGMRAT-SNVHIYIKLGSELL-E------------QMKVYKSLNNVYLVP----------DDVPIALFDPDDVPIA 194 Zygosaccharomyces rouxii CBS 732 eukaryota>fungi>ascomycota
45198857 69 14 SKSLSYLLRHG--ALK-EQLP--IDSD-GYVPVS--AV--LAHNRLK----------SHRCSFSDLQRIVENNE-KKRFHMRPGp-------------------------------------------------------------------------------------------------------------------------------------------------------------dgQEYICATQGHT--IE-------QVLPSADVL--TQLI-----------------------DPGELP---AQLIHGTNLRNA-VLILDSG-CIKRMQRNHVHLSHGVtg----------------------KDCVISGMRLS-STVHIYLNTE-GIL-D------------HLRLYKSRNDVYLTP----------SDIPVVYLTPSDIPVS 193 Ashbya gossypii ATCC 10895 eukaryota>fungi>ascomycota
255712699 71 11 SKSLAYLLRHG--ALK-EKLP--IDPN-GYIPIS--VL--LQHNRLK----------SLHCTQQDVDRVVANNA-KKRFHIKTE--------------------------------------------------------------------------------------------------------------------------------------------------------------dnNVLICATQGHS--IA-------AVAPAGDVL--QPIT-----------------------ADDKLP---EKLVHGTNLKNC-KLIIESG-GIRKMRRNHVHLAAGItgl---------------------DGEVVSGTRTS-SNVFIFLKRE-LAF-Q------------QLRLFKSLNDVYLTA----------DDVPTELFEADDVPTE 194 Lachancea thermotolerans CBS 6340 eukaryota>fungi>ascomycota
50305581 72 15 SKALAYLLRHG--AVK-ENLP--IDSD-GYIALD--RI--LQHNRLK----------SLKATSTEIQHIVASND-KQRFHIKTDpn------------------------------------------------------------------------------------------------------------------------------------------------------------tgIMYVCATQGHT--LK-------QIAPSQHVL--KPIT-----------------------NIEQLS---SKLVHGTNVSNC-ISILHSG-FIKKMSRNHVHLSPGItgk---------------------DTDVISGMRSS-SNVYIHIKRIQEML-D------------SLNLVKSLNNVYLTS----------QDIPLKFIDFQDIPLK 204 Kluyveromyces lactis NRRL Y-1140 eukaryota>fungi>ascomycota
151945531 75 15 SKALSYLLRHA--AVK-EKLT--IDSN-GYTPLK--EL--LSHNRLK----------THKCTVDDIHRIVKEND-KQRFHIKTLga-------------------------------------------------------------------------------------------------------------------------------------------------------------dEEWICATQGHS--IK-------SIQPSDEVL--VPIT-----------------------EASQLP---QELIHGTNLQSV-IKIIESG-AISPMSRNHVHLSPGMlh----------------------AKGVISGMRSS-SNVYIFIDCHSPLFFH------------TLKMFRSLNNVYLSS-----------SIPVELILSSSIPVE 198 Saccharomyces cerevisiae YJM789 eukaryota>fungi>ascomycota
126131670 84 1 SKAMSYLLRHA--AVK-EKLA--IDED-GYVQIE--DL--LKHQRLK----------TFRTSIADLERVVQNDN-KQRYTIK------------------------------------------------------------------------------------------------------------------------------------------------------------------DNAICANQGHS--IK---------SVGSDNL--ELLT------------------------LETIP---SEVYHGTYRNKL-GLIYSSG-GLNRLRRNHIHMTSK-------------------------AYSVKSGIRYN-ANVLIYIDVAKCME-A------------GIKFYKSLNDVILSEGDEN------GYISWKYFDKVVEVKT 188 Scheffersomyces stipitis CBS 6054 eukaryota>fungi>ascomycota
156845856 76 3 SKALSYLLRHG--AQK-EKLS--INSN-GYILVK--DI--LSHNRLK----------THKCTLEDLHRIVENND-KKRFHLKIV--------------------------------------------------------------------------------------------------------------------------------------------------------------ddQEHICATQGHS--LK-------TVKPSDEVL--EPVL-----------------------SLDQLP---KRLVHGTNLQNA-ILIFKSG-QIKKMNRNHVHLSPGVige---------------------DSEVVSGMRYS-SNVHIFLKLNDSLL-E------------NLKLFKSINSVYLSA----------VDIPTDLVEAVDIPTD 201 Vanderwaltozyma polyspora DSM 70294 eukaryota>fungi>ascomycota
241952517 83 14 SKALSYLLRHG--AEK-EKLS--IDEQ-GYVKIS--DV--LSHQRLK----------SLKTTIEDIERIVREND-KKRFTIR------------------------------------------------------------------------------------------------------------------------------------------------------------------DEMICANQGHS--LK---------AVKNDNL--VPMT-----------------------IDELNQ---LRIYHGTYKTKL-PIIKSSG-GLSRMNRNHIHLTCD-------------------------QYATCSGIRYN-ANVLVYIDASKCIE-H------------GIVFYKSLNNVILTSGDKD------GKISWEFIDRIVDLEG 192 Candida dubliniensis CD36 eukaryota>fungi>ascomycota
260945038 87 36 SKALSYLLRHG--ADK-EKLP--LDEH-GWAKVS--DV--LANNRIR----------THRATQEDIRRIVAQNA-KQRFTLRER--------------------------------------------------------------------------------------------------------------------------------------------------------------sdGDYICANQGHS--LE---------RVCPEL---ELLT------------------------SETMP---REVYHGTYENKL-DTIMQHG--LNRMARNHIHLACN-------------------------EPWSRSGSRAS-STVFIYIDIDKCLS-A------------GISFYRSKNGVILTSGNAQ------GCIPSEYFAQGCIPSE 214 Clavispora lusitaniae ATCC 42720 eukaryota>fungi>ascomycota
255638634 99 101 SRLLTRILRHM--ASE-LNLN--MRSD-GYVKVN--DL--LKLNLKT-----fanipLRSHTIDHIREAVRKDN-KQRFSLLEE--------------------------------------------------------------------------------------------------------------------------------------------------------------ngELLIRANQGHT--VK--------VVETESLL--KPIL-----------------------SAKEFP----VCLHGTYRKNL-ESILGSG--LKRMKRLHVHFSCGLpt----------------------DGEVISGMRQD-VNVLIFLDVRKALE-E------------SIKLYISDNKVILTEGFD-------GVVPPKYFEDGVVPPK 289 Glycine max eukaryota>viridiplantae
148907021 100 374 -RSLSSVLRHR--ADE-LKLN--IRSD-GYVAVK--DL--LKLNVKT-----parvpLNSHSIDDIKEAVKRDN-KQRFGLLEE--------------------------------------------------------------------------------------------------------------------------------------------------------------ksVLLIRANQGHS--IN--------FIDSEELL--KPIL-----------------------SAEDVP----VCVHGTYLKNL-ELIKKNG--LNRMKRNHVHFARGLsk----------------------DSGVISGMRSD-CEVFIYLDTKKALQ-G------------GMKLFVSENGVILTEGFN-------GVVPPEYFFNGVVPPE 560 Picea sitchensis eukaryota>viridiplantae
168049051 102 9 -RCMTAILRHR--ASD-YGLE--MQND-GFVLVA--DL--LKLSKNT-----aagipLSSHSVEDVRKAVARDG-KRRFGLKEE--------------------------------------------------------------------------------------------------------------------------------------------------------------dgHLYIRANQGHS--IR--------TVESGQLL--SLVT-----------------------SPSQIP----VCVHGTYERFM-DSIWQEG--LKRMNRNHVHFATGLpe----------------------QDGVISGMRGS-AQVLIYLDVEKAME-D------------GMKLYVSDNKVVLTEGFD-------GVVPTKYFFDGVVPTK 195 Physcomitrella patens subsp. patens eukaryota>viridiplantae
302766619 103 36 -RALTKILRHR--AAE-LNLE--MRSD-GFCKVA--DL--LRLDFTT-----rskvpLSAHTVEEVLQAVEQNS-KERLATMVDe-------------------------------------------------------------------------------------------------------------------------------------------------------------sgELLIRANQGHT--LL-------DAVCSDDLL--EEIS-----------------------IDDNML---AVCVHGTFKHAL-PGILRDG--LKTMGRKHVHFAAGLpg----------------------AGEVVSGMRGS-CDALVFVNAARAMA-D------------GMKFYVSKNGVVLTEGFE-------QCVPAKYFDEQCVPAK 226 Selaginella moellendorffii eukaryota>viridiplantae
302756333 104 15 -RAMTKILRHE--AAT-FNLD--LRSD-GYCKVD--EL--LKIGMKT-----ragipLSSHSVEEVLQAVKQDN-KQRFSTTRE--------------------------------------------------------------------------------------------------------------------------------------------------------------dgTLYIRANQGHS--IK--------EVLSDHLL--REIS-----------------------STDKIP----VCIHGTYKHAL-PSILESG--LKVMGRNHVHFATGLpd----------------------ENGVISGMRSS-CQVLIYLDTEKAMA-D------------GMKFYVSDNNVVLTEGFE-------GCVPCEYFEEGCVPCE 202 Selaginella moellendorffii eukaryota>viridiplantae
302757341 106 13 ---LCRILRHQ--ATQ-LSLP--IRSN-GYVKVD--DI--LRLTIRT-----hagipMNEHSVEEVLRVVERDP-KQRYSTMVE--------------------------------------------------------------------------------------------------------------------------------------------------------------ggELFIRANQGHS--MK--------VVASDALL--TEIT-----------------------SADQVP----VCVHGTFRCFL-PSIMRTG--LNRMSRNHVHFAIGLpn----------------------EEGVISGMMDS-VEVLIYLNVAKALQ-D------------DMKLYISDNKVLLTEGFA-------GVVPCEYFEAGVVPCE 198 Selaginella moellendorffii eukaryota>viridiplantae
302796097 107 2 SKTIAWVLRHG--AVK-MDLK--IRSN-GYCSIK--DL--LEMDVKI-----gggipLSSFTVADVMSMVACDP-KQRFSTIEEe-------------------------------------------------------------------------------------------------------------------------------------------------------------ddQLYIRANQGHT--MD--------AVQTAELL--REIK-----------------------SADEVP----MCVHGTFRNNF-RGIRKTG--LKRMKRNHVHFATGLp-----------------------QDGVISGMKSK-CEVLIYLDLAKAMK-D------------GMKFFMSENGVVLTEGFD-------GVVPREYFEDGVVPRE 195 Selaginella moellendorffii eukaryota>viridiplantae
302782377 108 2 ------ILRHQ--AVE-MGLK--IRSD-GYCRMN--DL--LKLQPMR------------GHSIQDVLKVVETDL-KTRFSTNVE--------------------------------------------------------------------------------------------------------------------------------------------------------------ngILFIRANQGHS--MK--------AVVTEKLL--KEIE-----------------------SADQVPGTSKVCVHGTFKKNL-ASIRRTG--LCVMGRNHVHFATGLpr----------------------DDGVVSGMRNT-CDALIFLDVEKALD-D------------GMQLFISENRVVLTEGFG-------GVVPPRYGFGGVVPPR 179 Selaginella moellendorffii eukaryota>viridiplantae
290988948 114 32 SRALSKLLRHK--ADKTKGIN--LRAD-GYVLIR--EI--LALKDFK------------GVTQQMIEECVKNND-KQRFNMTQDat------------------------------------------------------------------------------------------------------------------------------------------------------------tgEYIIRANQGHT--IA-------VEVEMEEI---DSPS-----------------------KLGEYA---NTVMHGTYHDAY-DKIVQSG-GLSRMSRQHIHFAIGEpe----------------------EGHVISGMRKS-AEVCFFLDVQKTID-E------------GIKLLKSSNGVILSLKSSN------GVILSPGNDKGLIPMH 210 Naegleria gruberi strain NEG-M eukaryota>heterolobosea
322505025 115 365 SKFMSALLRHK--AVQ-WRVP--ITSN-GYVLLD--DV--LRQPQMR---------rKPQVSVQDVARMVRDSD-KQRFQLAYGaa------------------------------------------------------------------------------------------------------------------------------------------------------------dgRLYITATQGHS--ID---------GVEPKL---RTLT-----------------------SVEEVP----MAIHGTYWEAW-KTIQRCG-YLSAMTRQHIHFAKGLmn----------------------DAQVISGMRNN-VQLFIYLDVAAVLA-D------------GVALYESTNGVILTPGVG-----DTRQLPLKYVDTRQLPLK 560 Leishmania braziliensis MHOM/BR/75/M2904 eukaryota>euglenozoa>kinetoplastida
261334507 116 333 SKALSRILRHG--ADK-MKIT--ISDA-GYVLAD--DL--VRCAPFS----------NDKAALTHLAWVVYSND-KKRFKMAYDe-------------------------------------------------------------------------------------------------------------------------------------------------------------nrRVYIRANQGHS--LS---------GINPEL---VPIT-----------------------SETQVP----FAVHGTYYSAW-ERIRGCG-YLSTMGRQHIHFAKGMpg----------------------SDGVISGMRNT-SEVLLVLDVPLLLK-E------------SVELWESANGVLLTRGVS-----GTGRLPLKYIGTGRLPLK 526 Trypanosoma brucei gambiense DAL972 eukaryota>euglenozoa>kinetoplastida
322815443 117 372 SKTLTRILRHA--ADK-MGIP--VSSG-GFVHVD--HI--LRCKPFC----------NDPLALSHIALVVHTND-KKRFKMAYDd-------------------------------------------------------------------------------------------------------------------------------------------------------------qhRLYIRANQGHS--LA---------GIDPEL---RRIE-----------------------SATEMP----AAIHGTYYSAW-KEICACG-YLSTMTRQHIHFSRGLis----------------------DHCVISGMRSN-VEVLLYLDVAKVLA-D------------GIELWESENGVLLTPGMG-----STKRLPLTYISTKRLPLT 564 Trypanosoma cruzi eukaryota>euglenozoa>kinetoplastida
328867666 123 5 SKAMSYILRHG--CAK-ERIE--ISAD-GYVKVN--DL--LKNKNFK------------NITFQDIQHVVDTND-KKRFELKQQ--------------------------------------------------------------------------------------------------------------------------------------------------------------dnEYYIRASQGHT--IK--------TVTENDSLF-TKIT-----------------------DINQVP----GVIHGTYRKHL-VSIKEKG--LNKMDRNHIHFATGD------------------------HGDVVSGMRGN-CEIVIYIDLEKALN-D------------GIEFLLSKNGVVLCAGIQ------ TEHVLCAGIQTEHGNHY 188 Dictyostelium fasciculatum eukaryota>amoebozoa>mycetozoa>dictyosteliida
281203700 124 9 SKTLSYLLRHG--AVK-EGLT--ISND-GFVKVN--DV--LNHKQMR------------GVTLEKLREIVDTND-KKRYHLEEI--------------------------------------------------------------------------------------------------------------------------------------------------------------ggVLNIRANQGHT--LK--------HVDDVDL---KKIE-----------------------SVNDVP----SVIHGTYRKHL-ESIKSKG--LNKMDRNHIHFATGD------------------------HGDVVSGMRGN-CELVIHINLQKALD-D------------GIPFFLSKNGVVLCAGDKN------GYLLCAGDKNGYLSPI 182 Polysphondylium pallidum PN500 eukaryota>amoebozoa>mycetozoa>dictyosteliida
330795375 126 10 SKTLSYILRHS--AVK-EGLN--ISKD-GYVSVD--EL--LKHKLFS------------QYTFKDIQEVVDTND-KKRYNLKKGege----------------------------------------------------------------------------------------------------------------------------------------------------------nseKYFICANQGHS--IS--------DVDEVDL---KRIE-----------------------SVDEVE----SVVHGTYKKHL-KSILENG--LQKMERNHIHFAVGLpg----------------------EGQVISGMRGS-CDMVIYIDLQKCLD-D------------DIPMFLSKNNVVLTNGKDNN-----GILPIKYDNNGILPIK 202 Dictyostelium purpureum eukaryota>amoebozoa>mycetozoa>dictyosteliida
238496189 147 18 SKALSLLLRHA--AEK-EGLK--LDAQ-GYANVA--DV--LAWRKLK----------SLKVTFPEIVAAVATSD-KKRFALLHIpst----------------------------------eaqa-------------qqstsaeastehgipttsagqdsatetalavsesd-------------------------------------------------------------------ldpaHFLIRATQGHS--IK---------SVDAASLMEKLSL----------------------dEEAKLP---DTVVHGTFHAAW-PAILASG-GLKSMGRNQVHFATGPsvesvlaqgaqgskevtgdh----GEKVISGMRRD-AQVLIYIDLKKALA-A------------GCPFWRSENGVILSEGMVVE--GSSGIVPVEFFDSGIVPVE 272 Aspergillus flavus NRRL3357 eukaryota>fungi>ascomycota
149246000 82 23 SKALSYLLRHG--AEK-ENLA--IDNL-GYVPIV--QI--LQHQRLK----------SFKTTREDIERIVAEND-KQRFSINAE----------------------------------------------------------------------------------------------------------------------------------------------------------------EDTICANQGHS--LS---------SVSGTL---DLLT-----------------------KAQLAE---MAIYHGTYKKKL-PLILGSG-GLSRMNRNHIHFTCE-------------------------QYHTISGIRNS-ANCLIYIDTDKCID-Ey-----------GLQFFKSANNVILCAGNEHGVIPVDCFAKVVDLKGQPVKVV 189 Lodderomyces elongisporus NRRL YB-4239 eukaryota>fungi>ascomycota
254573246 80 8 SKALSWLLRHG--AQS-EKLT--IDKD-GFVPLE--EV--LNHRRIK----------GTRASFEDVQRIVDNND-KKRFTLQKR--------------------------------------------------------------------------------------------------------------------------------------------------------------ddRWFICANQGHS--IA---------NVNGHDL--KLLS-----------------------TREDLP---KEIIHGTYLSKI-PQIIASG-GLSKMTRNHVHFASGLpkv---------------------DSDVISGMRNG-CSALIYLDIDKILG-Qq-----------EIKFYISKNKVILSYISKNKVILSPGNKDGIVPTSLFLKVV 181 Pichia pastoris GS115 eukaryota>fungi>ascomycota
294657248 81 14 SKSLSYLLRHG--AVK-EKLN--IDQT-GYININ--EL--LNHNRLK----------TNKVTLDDIRRIVGNND-KKRFSIVEK--------------------------------------------------------------------------------------------------------------------------------------------------------------egEIMICANQGHS--IK---------TVNDSNL--IQLS------------------------KDTIP---EEIYHGTYKNKL-PAIFNSG-GLSKMNRNHIHFASSI--------------------------SDVSGIRNS-SNVLIYLNIEKCLQ-S------------GIVFYRSSNNVILTYRSSNNVILTSGDANGLIGSEFFGKVV 180 Debaryomyces hansenii CBS767 eukaryota>fungi>ascomycota
50290283 67 10 SKALSYLLRHG--AVK-ENLP--FDVN-GYIEVE--RV--LNHQRLK----------SHKCTLEDLHRVVDTND-KKRFNIKLS------------------------------------------------------------------------------------------------------------------------------------------------------------ddgqTELICAVQGHS--ID-------RIKPDEEVL--EVID-----------------------TAEKLP---KNIIHGTSVRNA-IQILKSG-SIKRMNRNHIHLSIGItek---------------------DKEVISGMRKS-SRVHIYILSEPKIL-E------------HLKLYRSMNSVILTYRSMNSVILTPDDINKSLFLLVKIRAA 186 Candida glabrata CBS 138 eukaryota>fungi>ascomycota
146417847 90 8 SKALSYFLRHG--AQK-SNLE--IDDR-GFIKVA--DL--LAHQNLK----------SKKTTLQDILRVVETNE-KKRFALEDR--------------------------------------------------------------------------------------------------------------------------------------------------------------ngELYICATQGHL--IH---------TVTEGNL--RPL------------------------DEASLP---KQIIHGTRKRAL-EQIRKSG-GLSKMGRNHIHCTSDH--------------------------NLVSGFRST-SDTLIYIDGVQCLR-D------------GIKFFQSSNGVILSFQSSNGVILSPGNDQGVIECKYFAKVT 174 Meyerozyma guilliermondii ATCC 6260 eukaryota>fungi>ascomycota
328769603 94 6 SKALSYLLRHG--AEK-ERLV--IESD-GFVKLK--DI--LSRKQFS------------GQTLESIQHLVESNA-KQRFALRQDpt------------------------------------------------------------------------------------------------------------------------------------------------------------tlQWSIRANQGHS--IN----------VNVEM---RTVQ-----------------------DSSEIP----LVVHGTYQQHL-ALILKQG--LRSMSRKHIHFAAGLpe----------------------HQDITSGMRNN-CNILIYVNTEKAMK-D------------GIVFVQSANNVILTEGVANNVILTEGVDGVLHPRYFSKITD 184 Batrachochytrium dendrobatidis JAM81 eukaryota>fungi>chytridiomycota
167377905 95 11 SKRLSYLLRHG--AIK-ERIP--ITKD-GWVLIK--DL--LNNRQMK------------GISEEEIKSIVAKDP-KKRYSIQGE--------------------------------------------------------------------------------------------------------------------------------------------------------------gnQIKIRANQGHS--IN----------VQVEM---KEIT-----------------------DASLYP----IVIHGTYMRNF-NSIIKNG--LQKMGRLHIHMAQGLpke---------------------IKEEKSGMRSS-CNIIIYIDIEKAMK-K------------GIKFYESENGVILSEGPIDISCFSEGPIDIS---------- 186 Entamoeba dispar SAW760 eukaryota>amoebozoa>entamoebidae
242785264 145 17 SKALSHLLRHS--AEK-ENLK--ISKE-GYVNVA--DL--LETRKVK----------SLKVTLPEIIQAVASSD-KQRFSLFYIspa----------------------------------tiesg------------nqesqeqqeavvataaseekqknatahalsvkd---------------------------------------------------------------------ndpsHFLIRATQGHS--MK---------SVDTTLFLEKLSL----------------ddtkedgAASNLP---DTVVHGTYHGAW-PLILASG-GLRSMSRLQVHFATGPtmdevypngrdapialldprs---KATVISGMRSD-AEILIYINLRRALE-A------------GCPFYRSENGVILSEGMNLGDSGEGKIVPIEFFDLKIVPIE 280 Talaromyces stipitatus ATCC 10500 eukaryota>fungi>ascomycota
119498195 146 20 SKALSLLLRHA--AEK-EGLK--MDSQ-GYANVA--DV--LAWKKLK----------SLKVTLPEIIHAVASSD-KKRFALLHIpsa----------------------------------kalgdktttgaregetpvcetepssmptsqvpttsagqenatatalavnd---------------------------------------------------------------------tdpsHFLIRATQGHS--IK---------SVDAAAFLERLTL----------------------eDESRLP---DTVVHGTYHAVW-PAILQSG-GLRCMGRNQVHFATGPslesvlpahvdgtahsamgssglnDGRVISGMRRD-AQILIYIDIKKAMA-A------------GCPFWRSENGVILSEGVDVGVILSEGVDVGENQEVGDGTSQ 276 Neosartorya fischeri NRRL 181 eukaryota>fungi>ascomycota
225682414 150 26 SKALSYILRHA--AEK-EGVK--IDSH-GYANVA--DV--LAWRKLK----------SLKVTLPEILSAVSTSD-KQRFGLLYEpls----------------------------------nspsatai----------ptdcsa----------stasrtataqaltand---------------------------------------------------------------------pepsHYLIRATQGHS--IK---------TVEASSLLQRLSLt---------------dgadaapSTPPLP---DTVVHGTYHGAW-PSILVSG-GLKCMNRNHVHFATGPplssvlpegreghvvtmapg----RGGVISGMRAD-AQILIYIDLKKALE-A------------GVPFWRSENGVILSEGLDMDVILSEGLDMDGDGRKIVGLEF 266 Paracoccidioides brasiliensis Pb03 eukaryota>fungi>ascomycota
296825168 154 19 SRELTFILRHA--AEK-EGIK--IDRQ-GYANVG--EL--LQYRKLK----------GLKATLADVLEAVSTSD-KQRFGLLYIpdq----------------------------------pslpeinake------------------eaatgdesslltatnqalaand---------------------------------------------------------------------pdpnNYLIRARQGHS--MK---------CIDSASLLTPLTLs--------------------enPSVPLP---ETVVHGTYHATW-PKILQSG-GLRCMGRNHIHFASGPpissvlpngrggevatppakshg-RDSVISGMRAD-AQILIYIDLKRALA-A------------GCPFGISENGVILSEGIENGVILSEGISSDGTDDKKIGLEF 262 Arthroderma otae CBS 113480 eukaryota>fungi>ascomycota
66807493 127 19 SKSLSYVLRHG--AEK-EGLK--IDSQ-GFIKVD--DI--LKNNLFK------------NTNFKEIQEVVDTND-KKRYHMELNds------------------------------------------------------------------------------------------------------------------------------------------------------------dgCYYIRANQGHT--LE--------NVDNVEM---TKIT-----------------------SADQVG----TVFHGTYRKHL-QSILNEG--LKKMDRNHIHCVNKIm-----------------------GQEITSGMRGS-CNMIVYIDVPLLLQ-D------------GIDLYLSQNNVALTDGLQNNVALTDGLNNTGILPPKYFIKI 190 Dictyostelium discoideum AX4 eukaryota>amoebozoa>mycetozoa>dictyosteliida
50547707 131 15 SRKLSYILRHG--ATK-EKLP--IRED-GYLSVG--VL--LNRAGIK-----------GKWNLEDTKRVVRDND-KQRYKLIFEptd------------------------------------p--------------------------------------------------------------------------------------------------------------------ndctGYWIRANQGHT--IN----------TKVEM---KALK-----------------------TPEDFPT--LEIFHATSKQVL-PIVLKEG--LSKMKRQHIHLATDLvt----------------------EGGSVAGKRLN-REVFIYINVPKALE-A------------GIEFFLSENGVVLTELSENGVVLTEGKDGKISREFFSKILD 198 Yarrowia lipolytica CLIB122 eukaryota>fungi>ascomycota
170105752 133 5 SKTLSYLLRHG--AQG-EGLP--MRKD-GYVKVA--DL--LQNPKLK----------TQGLDLDKIRDIVGKDS-KQRYDLISDst-----------------------------------------------------------------------------------------------------------------------------------------------------------dpnVWWIRARQGHS--LK---------TVELDL---KPIL-----------------------SATDIST--GVAVHGTTLAAW-ESISKQG--LSKMKRNHIHLAQGLpg----------------------HNGVISGMRSS-SQIFIYINIQAALS-S------------GIQFFFSDNGVVLTFFSDNGVVLTAGDDKGFLKPEFFLRVE 178 Laccaria bicolor S238N-H82 eukaryota>fungi>basidiomycota
336366767 134 31 SKSLSWLLRHG--AQS-DGLV--LRSD-GYARVA--DV--LANPRFR------------GVTYPMLEDIVRQDR-KQRYNLLCEags----------------------------------leas-------------------------------------------------------------------------------------------------------------------sgsdVWWIRANQGHS--IK---------TIEIEL---NPIA-----------------------SATDIP----MAVHGTNRKAW-ELISTQG--LSKMKRNHIHLAQGIa-----------------------GDSVVSGMRKS-SQILIYIDVQKAID-A------------GIKFSLSSNGVVLTELSSNGVVLTEGDETGFLAPRFFQRVE 206 Serpula lacrymans var. lacrymans S7.3 eukaryota>fungi>basidiomycota
242218580 135 2 SKTLSWVLRHG--ARS-EGLE--MRPD-GYVRVD--DLVSLKIPKMR------------EMNFDMLEQIVKADN-KSRYNLIHEpdk----------------------------------avg--------------------------------------------------------------------------------------------------------------------spsqIWWIRANQGHS--MK---------TVVLDL---QPIQ-----------------------SPADIPT--GLAVHGTSRKAW-DIICEQG--LSKMSRNHIHLAQGVp-----------------------GSGVIS-MRSS-SSILIFVDIQKALA-A------------GIRFYLSDNGVVLTDLSDNGVVLTDGDEKGFLSPQFFARVE 179 Postia placenta Mad-698-R eukaryota>fungi>basidiomycota
302686072 139 4 SKTLSYILRHG--AQK-EGIP--IRPD-GYVKVD--DL--LANNRLK----------SQAVTLEMIQQIVKDDV-KQRYDLVLEqp-------------------------------------------------------------------------------------------------------------------------------------------------------------sTWLIKANQGHS--LQ---------TVKLEL---KPIL-----------------------SRADIPT--GVTVHGTMNHAW-QSISKQG--LSKMKRNHIHLAQGKg-----------------------GKDVISGMRRS-SEVFIFVDVDRAIA-A------------GIKFELSDNGVVLTELSDNGVVLTEGDERGFLPVRFFQKVE 175 Schizophyllum commune H4-8 eukaryota>fungi>basidiomycota
296416279 156 69 SKALSYTLRHG--AVK-EGLA--LQDD-GYANVG--EL--LQLPKFR----------KMSLTFEKLRQVVSEND-KQRFSLTPTaa------------------------------------------------------------------------tatatepaataed-----------------------------------------------------------------------phTYLIRATQGHS--LP---------LTNTSTLLTPL--------------------------PPNI----TCAVHGTFYPAY-EAILACG-YLSRMGRTHIHLATG-------------------------EIGVKSGMRAD-AQVLFYVDVGRARR-Eg-----------GVEFWISENGVVLTWISENGVVLTAGDELGRLGLEFVERVV 257 Tuber melanosporum Mel28 eukaryota>fungi>ascomycota
154295249 158 4 SKALSKLLRHA--AES-EGVE--LDGE-GFARLD--LV--MQWPRLK----------SLKPTFADIRTAVTDNA-KQRFSMKPNps----------------------------------------------------------------------------lpeapspss---------------------------------------------------------------------enpaDWMIRANQGHS--IV----------IDSAALLIPITL-----------------------EAENVP---ETCAHGTYFAFY-EEILRSG-GLKKMGRTHVHFVTGIpe----------------------DGGLVSGMRGD-AELLIFVDVKRCLE-Eqp----------EMKWWISENRVVLTEGSENRVVLTEGDGEGVVGTRFWKRVE 193 Botryotinia fuckeliana B05.10 eukaryota>fungi>ascomycota
302916847 159 52 SKALSKLLRHQ--AGN-AGIQ--LDDE-GFAPLS--SV--LAWGPLR----------SLKVTLDDVQSIVTSND-KQRFTLKPNps----------------------------------------------------------------------------tnpslstts---------------------------------------------------------------------tspeDYLIRANQGHS--IK----------LESAALLAPITI-----------------------EAGNVP---DRVLHGTFFYFW-PKIVETG-GLKPMNRNHVHCSTGTp-----------------------EEGVVSGMRKD-AELVIEIDIEASLK-E------------GVKWWMSDNGVLLTEMSDNGVLLTEGDEQGILSSKFFKLAT 237 Nectria haematococca mpVI 77-13-4 eukaryota>fungi>ascomycota
322707126 160 40 SKALSRLLRHQ--AEN-AGIK--LDEE-GFAPLD--R---LSWGPIK----------SLSPSLQEVKDVVETNA-KKRFTLRPAdp--------------------------------------------------------------------------------lapep---------------------------------------------------------------------psaaGYLIRANQGHS--LK----------VDEAALFEPILL-----------------------GAADLP---GKVVHGTYFAFW-KAILESG-GLKPMSRGHIHCSDRTp-----------------------EEGAVSGMRRD-AELLVEIDIEASLK-D------------GVTWWRSDNGVILTDRSDNGVILTDGGEGGVLETKYFKMVT 220 Metarhizium anisopliae ARSEF 23 eukaryota>fungi>ascomycota
213408531 178 9 SRALSKVLRHT--ARS-CGLK--LTEE-GYARVD--DL--LKLPQFK------------GLTVDVLQQIVADND-KQRFALSTIn--------------------------------------------------------------------------------------------------------------------------------------------------------------dELHIRANQGHS--LT----------TVHVDMP-RIT------------------------DPAEIP----RVVHGTFAKFW-PAIYANG--LSRMKRQHIHCAKGLfg----------------------EPGVVSGIRKS-CDVFIFIDAARAMA-D------------GVVFYRSENGVILTEGIENGVILTEGIDGVLPRKFFLRVEN 180 Schizosaccharomyces japonicus yFS275 eukaryota>fungi>ascomycota
310792989 170 37 SKALSKLLRHQ--AEN-AGLK--LDEG-GYAPLD--KV--LAYGPIR----------SLQVSFADIQAAVTTSD-KQRFALKPNav----------------------------------------------------------------------------tnpsldeks---------------------------------------------------------------------tepsHWLIRANQGHS--IK----------VDSAGLLTPITL-----------------------DAGNVP---EVVVHGTYFAFW-RAIEESG-GLARMGRNHVHFATGLpgd---------------------EQGVVSGMRRD-AEVLVYVDVERALR-Eee----------GMRWWVSENGVVLTEGSENGVVLTEGDEEGRVPTRLFREVR 227 Glomerella graminicola M1.001 eukaryota>fungi>ascomycota
19115427 179 38 SKALSKVLRHT--AKA-NGLQ--IRED-GYIEVD--SI--LKLPQFR------------GMGMELLLSIVKGND-KKRFTMEEVe--------------------------------------------------------------------------------------------------------------------------------------------------------------gVLYIRANQGHS--IK----------AVQVPMA-RI------------------------dNASSIP----KVVHGTKKELW-PVISKQG--LSRMKRNHIHCATGLyg----------------------DPGVISGIRKS-CTLYIYIDSAKAMQ-D------------GVEFYRSENGVILTEGVENGVILTEGVNGLLSSKYFSRVET 207 Schizosaccharomyces pombe 972h- eukaryota>fungi>ascomycota
326431934 185 660 SKYLSYVLRHG--AQK-EGVS--MAPD-GSVALE--DL--LRRPQLK------------GLSSKEIKHIVETCP-KQRFVLLPGt------------------------------------------------------------------------------------------------------------------------------------------------------------gptGLRIRAAQGHT--IK---------VADESQLLTAIT------------------------DASKFP----VVVHGTYAKLV-PVIKREG--LSRMRRRHIHFATGLpg----------------------DQEVKSGMRKS-CTAFVYIDLAKCLR-D------------GIPFFVSSNNVVLSFVSSNNVVLSPGLGSTGILPPQYFTNV 832 Salpingoeca sp. ATCC 50818 eukaryota>choanoflagellida
303284891 186 69 ---LSQLLRHG--ALD-AGLGDVLTPA-GGVPLD--RV--LALPRFK------------GVTAEAIETLVANCP-KRRFELFLAek------------------ggggd------------------------------------------------------------------------------------------------------------------------------------dvtTKMIRATQGHS--IRg-------GALDDDAMLARVSV---------------------erARAELR----YAVHGTSLRAW-ETIKTEG--LLRMRRRHVHLAAALpgs---------------------ADEVTSGMRSD-AQVAVWVDVAAAVA-D------------GVAFFVAANGAVLTPGVANGAVLTPGVGRDGVLHPRYFHRA 253 Micromonas pusilla CCMP1545 eukaryota>viridiplantae>chlorophyta
255086119 187 3 SKNLSQILRHG--VVD-EGLADCLDAE-GFVPLA--RV--LALPRFR------------GVGADEIRALVAADR-KGRFELRDRt-------------------------------------------------------------------------------------------------------------------------------------------------------------dgIVHVRATQGHT--LRg-------DVLDDDAMATRLT------------------------RTSGIR----EAVHGTSMRAW-KRIRTHG--LSRMRRRHVHMATGLpg----------------------DGEVKSGVRND-CEVAVWVDVERGVA-E------------GVPFFVSANGVVLSFVSANGVVLSPG--------------- 176 Micromonas sp. RCC299 eukaryota>viridiplantae>chlorophyta
167518371 190 1 ---MTYLLRHG--AEK-EGVP--MSKD-GFVHTA--DL--RRHDKLR------------HLDDDTVREIVATDA-KGRFELRE----------------------------------------------------------------------------------------------------------------------------------------------------------------gPLRVRATQGHS--LN---------VQEDSLL-DPVL------------------------SAADWP----VVVHGTYHAAW-AQIQREG--LRTMGRQHIHFSTAEpg----------------------SREVISGMRTT-CNVWIYLDLDQVLR-D------------GIPVFISRNRVLLTFISRNRVLLTAGQDGVLHPRYFKRVVR 163 Monosiga brevicollis MX1 eukaryota>choanoflagellida
145493555 191 14 SKAMSYLLRHG--AQK-EGIP--IRQD-GFVLVQ--DL--LNWKSMA----------NLKANVQSIRNVVDNND-KKRFELKEId--------------------------------------------------------------------------------------------------------------------------------------------------------------gQLYIRCVQGHT--IE---------INEEELL----------------------------gENTQFP----VIVHGTYFQAW-ELIKNTG--LNRMARQHIHFAVGLpg----------------------NDAVISGMRNT-CEVIIEVDMERAMK-A------------GIEFYVSKNGVVLSSGIKNGVVLSSGIDGVIAPQFFKRVTT 187 Paramecium tetraurelia strain d4-2 eukaryota>alveolata>ciliophora
118362535 192 19 SKKLAWLLRHG--AEK-EGLN--MGSD-GYVLLQ--EI--MSRNDFS------------TITFDKVKSVVDNND-KKRFEMIQKeh----------------------------------------------------------------------------------------------------------------------------------------------------------ngkiEWFIRASQGHT--IS--------SINDEELL-DKISL----------------------dVASSLG----IVVHGTYKQFW-EPISKEG--LKTMQRNHIHFAIGYpg----------------------DKEVISGMRKT-CDVYIEIDLVKAIN-D------------GIDFFMSKNNVVLTSGIKNNVVLTSGINKVLPPKYFKVVKD 196 Tetrahymena thermophila eukaryota>alveolata>ciliophora
322802863 196 9 SKRLSYLLRHG--AVK-EGLN--IKPN-GFITVE--DL--LNK-SLL------------QYTIDDIKRVVKTNN-KQRFTLATId--------------------------------------------------------------------------------------------------------------------------------------------------------------gILKIKANQGHS--IP--------TINQLSL---RIL------------------------EFIDF-----DIIHGTYLKYW-PKIKTEG--LSRMKRNHIHFAKGL--------------------------NFINGLRQS-ADLFIYVNFDKAKE-D------------GLIFLESENGIVLCAGNENGIVLCAGNSKGFIETRYFLKVI 178 Solenopsis invicta eukaryota>metazoa>hexapoda
156543836 197 47 SKKLSYLLRHA--AVK-KGFN--IRPD-GFIPVQ--EI--LKETP--------------GCTVKDIERVVANND-KQRFTLSSFd--------------------------------------------------------------------------------------------------------------------------------------------------------------nVLMIKANQGHT--IS--------QVDSLNL---KLL------------------------DSVDF-----DIVHGTYHSCY-EKIRHQG--LSRMKRNHIHFAKGL--------------------------NFINGLRRN-AELFIFINYPKAKG-D------------GLKFYKSENNVILCYKSENNVILCPGNSEGFVKTKYFLKSY 209 Nasonia vitripennis eukaryota>metazoa>hexapoda
328862875 199 5 SKTLSYLLRHG--AAK-EGLK--MRSD-GFVKIN--DL--LARPKLK------------GVELGDIERIVGKDS-KQRYAMIREpp------------------pdgssss-----------------------------------------------------------------------------------------------------------------------------------edIVYIRANQGHS--IQ---------VPELDL---VPII-----------------------DPEDIP----TVVHGTYMKFW-DTILLEG--LKPMKRTHIHFASGLid----------------------QPGVISGMRAS-REIDIYLDVTKCIS-A------------GILFHRSKNGVILSQGLPNGVILSQGLPDSNSIPSTYFQKV 193 Melampsora larici-populina 98AG31 eukaryota>fungi>basidiomycota
331216956 200 54 SKTLSYILRHG--ALK-ERLV--IRAD-GCIRLD--DL--LKRPKLK------------NYTIDDVRRVVAENE-KQRFALVDEqa------------------adgs---------------------------------------------------------------------------------------------------------------------------------------iVNYIRANQGHS--IK--------EVDQPDL---TPLI-----------------------DPIELP----TVVHGTYSKFW-DSIAQDG--LKPMSRTHIHFAKGLlg----------------------EEGVISGMRAS-CDTFIYLDVEKCLQ-A------------QIEFFLSSNGVILSEGLPAGVILSEGLPASKSIPAQYFKKV 231 Puccinia graminis f. sp. tritici CRL 75-36-700-3 eukaryota>fungi>basidiomycota
260781042 203 22 SKSLSYLLRHG--AAK-MGFQ--LDPG-GFLYVD--EV--LKHPQFK------------RYTADDVRQVVADND-KKRFALQEEeg------------------------------------------------------------------------------------------------------------------------------------------------------------tgRLQIRANQGHT--LE---------VEELDL---TPIT-----------------------DPAEAP----TVVHGTFLSCW-DKIRTQG--LSRMRRNHIHFAPGEpg----------------------EDGVISGMRRT-CQVLVFIDMEAAMR-D------------GLQFFRSANNVILSFRSANNVILSPGNEEGLIPPKYFQQVL 192 Branchiostoma floridae eukaryota>metazoa
72010085 204 6 SKLLSLVLRHR--AQQ-LGFN--IYPG-GYVLVK--DL--LAHKMFK------------RFTEADIRRVVASND-KQRFSFKTNee------------------------------------------------------------------------------------------------------------------------------------------------------------tgELMICANQGHS--FD---------VPEPEL---EPIT-----------------------DASRFR----TVVHGTYFRHW-DQIRRQG--LKRMNRTHIHFAQGVpg----------------------ADGVISGMRRS-CQVMIFIDLPAALR-G------------GVKFFLSKNGVVLSFLSKNGVVLSPGDKDGILRTRYFSSVM 174 Strongylocentrotus purpuratus eukaryota>metazoa>echinodermata
221487185 210 907 IKKLNFILRHGAPLFK---LP--MRED-GYVRIR--EL--LELDCMR------------SVSWEEIYLVVASNF-KRRYEICYDptepehvgetgdlcvldelrnpvsqetmppavpptddasdlsfsptshhdadrkaarreeatkntnitssrtedrlhspasssasfsssadsskaryesaafpedaslgekslfsslrgrqaregdasggsggsgfcdvpafpssaapelandrwllratQGHLRATQGHT--IR---------QVASDLLL-RSIC-----------------------DPGELP----VCVHGTFLKNW-MAIRSAG--LSRMHRNHIHFAPGLps----------------------ECGVVSGMRRS-SDVAIYVNVHLAMK-E------------GVRFYVSNNNVILTEGLNNNVILTEGLRGKLVPSSSKSTGM 1229 Toxoplasma gondii GT1 eukaryota>alveolata>apicomplexa
198415504 211 420 SKELVRIVRHG--KYN-QQIQ--MDAE-GYVFVN--DI--LTCKRFY--------dqFPGVNELYIEKIVESND-KKRFELKFEe-------------------------------------------------------------------------------------------------------------------------------------------------------------gvGWKIKAAQGHT--VK---------IENRSL---RPIT-----------------------NPAEFP----VVIHGTYWENW-EFIKVNG--LNRMGRNHIHFAPGLpn------------------------EVVSGMRKS-CEVAIYINMTQALK-D------------GFKFFQSSNQVILTEQSSNQVILTEGDEKGRIHPKYFLKVV 590 Ciona intestinalis eukaryota>metazoa
157042782 216 26 SKSLSYVLRHG--ASK-MGLQ--MNSD-GFVFVE--EL--LAHQQFR------------SFSVDDVERVVASND-KQRFKLCKHp------------------------------------------------------------------------------------------------------------------------------------------------------------eddRLQIRANQGHS--VQ---------VTDLEL---REISq----------------------DDQDYP---REAVHGSYMKHW-PSIRSQG--LSRMNRTHIHLAPGLpg----------------------EGRVISGMRQS-CDLAVYIDVTKAMS-D------------GIKFFWSENGVLLTFWSENGVLLTPGDAAGILAPCYFSRAQ 196 Danio rerio eukaryota>metazoa>vertebrata>actinopterygii
197246418 219 24 SKCLSYALRHG--AVN-LGLP--MGTD-GFVPVS--SL--LLLPQFR------------TFSQVDIERVVSCND-KQRFTLRYSy------------------------------------------------------------------------------------------------------------------------------------------------------------adgALEIRANQGHS--LQ---------V-EVELTPL----------------------------GEELP---NQAIHGTYFRHW-PSIQQRG--LSRMNRTHIHLCTELpge---------------------GQECISGMRRD-CEVAIFIDLPKAVA-D------------GLLFFWSSNRVLLTFWSSNRVLLTPGNADGLLLPKYFLRAL 191 Xenopus (Silurana) tropicalis eukaryota>metazoa>vertebrata
297267544 220 32 SKALSYALRHG--ALK-LGLP--MGAD-GFVPLG--AL--LQLPQFH------------GFSAEDVRRVVDTNR-KQRFALQHGd------------------------------------------------------------------------------------------------------------------------------------------------------------pstGLLIRANQGHS--LQgshcclfNQVPELELMPLE--------------------------TPQALP---PMLVHGTFWKHW-PSILLKG--LSCGGRTHIHLAPGLpg----------------------DPSVISGMRPH-CEIAVFIDGPLALAAD------------GISFFRSANGVILTFRSANGVILTPGNTDGFLLPKYFKEAL 211 Macaca mulatta eukaryota>metazoa>vertebrata
238550149 220 32 SKALSYALRHG--ALK-LGLP--MGAD-GFVPLG--TL--LQLPQFR------------GFSAEDVQRVVDTNR-KQRFALQLGd------------------------------------------------------------------------------------------------------------------------------------------------------------pstGLLIRANQGHS--LQv-------gVPKLELMPLE--------------------------TPQALP---PMLVHGTFWKHW-PSILLKG--LSCQGRTHIHLAPGLpg----------------------DPGIISGMRSH-CEIAVFIDGPLALA-D------------GIPFFRSANGVILTPGNTDGFLLPKYFKEALQLRPTRKPLS 230 Homo sapiens eukaryota>metazoa>vertebrata
327286590 221 99 SKALSYTLRHG--ADK-LGLA--MGAD-GFVDVA--EI--LRLPQFK------------AWSLEDVQRVVETNE-KQRFALRPHp------------------------------------------------------------------------------------------------------------------------------------------------------------sdaHLQIRANQGHS--LQ---------VSELELVPLL--------------------------NPSDFP---EIVAHGTYLHHW-PAIRKDG--LSRMGRSHIHLAPGLpg----------------------DAAVLSGMRNN-CEVAIVIDIAKALAAD------------GIPFFRSANGVILTFRSANGVILTPGDAQGLLLPCYFREAL 269 Anolis carolinensis eukaryota>metazoa>vertebrata
195016166 226 11 SKQLSWLLRHG--AQK-EGLT--IQPD-GFVSIN--EI--LKHSRFG-----------SQYTREKLRQIVSTDA-KQRYTLRSNp------------------------------------------------------------------------------------------------------------------------------------------------------------ltgAEEIRANQGHS--LK---------AVQSEVC-MERIG-----------------------SISELP---SAVVHGTYYSNW-ERIKIEG--LKRMQRNHVHFALFNgdgd--------------------NRAVLSGFRSD-CQVLIYLNVAKVLG-D------------QLPMFRSSNNVILCAGISNNVILCAGIDGCIDKRYFERAIE 188 Drosophila grimshawi eukaryota>metazoa>hexapoda
28575019 227 4 SKKLSWLLRHG--AKT-EGIT--IRAD-GFVSVP--DL--QKHPRYL------------CFTLEKLKEIAAADA-KQRYTLRWNp------------------------------------------------------------------------------------------------------------------------------------------------------------elgVHEIRANQGHS--LA---------VLEGEAGGLENIT-----------------------HVSQVP----LAVHGTYYRHW-GAIRSQG--LSRMNRNHVHFACSDe-----------------------TNSTLSGFRSD-CQILIYLNVEKVLA-D------------GIPIYRSSNNVLLCPGISNNVLLCPGIEGFIHSSYFQRVVD 185 Drosophila melanogaster eukaryota>metazoa>hexapoda
198471764 228 13 -KKLTWLLRHG--AVK-EGIA--IQPD-GFVNIS--DI--QSHPRYA------------VFSLPKLQEIVADDA-KQRYILRWNe------------------------------------------------------------------------------------------------------------------------------------------------------------dakFHEIRANQGHS--LA---------AVQGEAC-LERIS-----------------------NAKQVP----LAVHGTYYRCW-EAIKAQG--LGRMRRNYVHFAVSDv------------------------GETLSGFRSD-SQLLVYLDVAKVLA-D------------NLPLFRSSNNVILCAGVSNNVILCAGVDGFIDKTYFSRAVD 183 Drosophila pseudoobscura pseudoobscura eukaryota>metazoa>hexapoda
91080221 231 9 SKTLSWLLRHS--AAT-EGLS--LTPE-GFAPVS--EV--LNHRQLR-----------GKFTVEDIQRIVESNN-KQRFFLRQNg--------------------------------------------------------------------------------------------------------------------------------------------------------------aILEIRANQGHS--MQ---------VTELELAS----------------------------YLNDPN---VDVVHGTFFRNL-DAIKRIG--LSRMSRNHIHFTRDL---------------------------AL--IRKN-VQVLIYIDVAKALS-D------------GIKFYMSSNGVILSYMSSNGVILSPGNEKGILEPKYFWKIV 168 Tribolium castaneum eukaryota>metazoa>hexapoda
298711928 238 59 SKRLTYALRHG--AEK-LGLR--LRPD-GFVSLD--EL--LSKPSFR------------GVSREQVEQVVASDE-KGRMTIATFp------------------------------------------------vsggeaagsasacadpgaatn-----------------------------------------------------------------------------------------qAVFIRANQGHS--VKg--------VIDEEKLLTRVE------------------------DAADVP----VCVHGTDRKSW-SNIREEG--LRCMNRTHIHFAAGLpg----------------------ESGVISGMRKA-CKVLIYVDVAAAMS-D------------GVAFFRSTNDGVAFFRSTNNPARTAPWSQGTSPALTALLLP 244 Ectocarpus siliculosus eukaryota>stramenopiles
198425598 207 535 ---LSSVLRHN----K-YGFK--VDKE-GYVPVD--AI--LKHQHFK----------KLGLTREEMHRIVREND-KQRFTIQVNed-------------------------------------------------------------------------------------------------------------------------------------------------------------gMEIIKANQGHS--VE---------VSSLNL---MTIT-----------------------DACEFH----DVIHGTFWTAW-KSIRKQG--LHCRKRMHIHMTTAEpns---------------------DQQVISGMRYS-CNVFVHIDMGQAIK-D------------GIPFFLSENKVILSFLSENKVILSPGDKNGYLRPKYFRKVE 700 Ciona intestinalis eukaryota>metazoa
291231763 206 401 SKKLSNILRHN--ANK-FGFQ--LDKG-GFLNVE--DM--LHHQHFR------------GYTIEDVKRVVTNND-KQRFALRNHpd------------------------------------------------------------------------------------------------------------------------------------------------------------snLLQIRANQGHS--VK---------VQGLEL---KRIT-----------------------DASEYP----TVIYGTYSKHL-ERIKEKG--LSRMGRNHIHFAPGMpd----------------------EVGVISGMRWD-CDVIIVLDLEKAIK-D------------GIEFMISANNVILSSGDEHGYILSSGDEHGYISV------- 577 Saccoglossus kowalevskii eukaryota>metazoa>hemichordata
145602059 162 26 SRALSRLLRHQ--AAN-AGIQ--LDGE-GYAPLD--KV--LAWGPIK----------SLKATLPEIREAVSSSD-KQRFSMKPLs-------------------------------------------------------------------------------astspds---------------------------------------------------------------------tdpaDFLIRANQGHS--IK----------LESAEHLTAVTV-----------------------EAGNVP---EVVVHGTYYAFW-PAIVASG-GLRPMGRNHVHCSTGLpss---------------------EAQVVSGMRRD-AELLVYLDVERALR-Dg-----------EMKWWLSDNGVVLTEGGQG------GLVPVKYFQGGLVPVK 223 Magnaporthe oryzae 70-15 eukaryota>fungi>ascomycota
85109317 164 52 SRALSRLLRHQ--AAS-AGIT--LDAE-GYAPLD--KV--LAWGPIR----------SLKPTFPEILKAVKESD-KQRFAIKLApg----------------------------------------------------------------------------kekedgeks---------------------------------------------------------------------eepgDWLIRANQGHS--IK----------LESEGLLRRLVLgrgggggqqqqqqqgqetegedgGTIPIP---ETVVHGTYFAFW-DKIIQSG-GLKPMGRNHVHFSTGLpedt--------------------ERGVISGMRSD-AEVLVFVDVERSIR-DaeeaekedkegkGIKWWMSDNGVVLTEGDKD------GLVPLKYFKDGLVPLK 287 Neurospora crassa OR74A eukaryota>fungi>ascomycota
116192183 166 62 SRALSRLLRHR--AGD-AGVE--LDRE-GFADLG--RV--IQWGPIR----------ALAPTFSEILNAVHNND-KKRFTIKPNpa----------------------------------------------------------------------------tnpdldess---------------------------------------------------------------------tnpsEWLIRANQGHS--IK----------LDSEHLLKALALpadd----------kdgtaalpeGAVAIP---PAVIHGTYFAFW-PSIVASG-GLKPMGRNHVHFSTGLpeds--------------------EAGVVSGMRRD-AEVLIYVDVAASLK-Dg-----------GIKWWISENGVVLTEGDVN------GLVPLKYFVNGLVPLK 276 Chaetomium globosum CBS 148.51 eukaryota>fungi>ascomycota
312220715 174 15 SKKVSWLLRHG--AAS-EGLK--LGKG-GYVNVQ--DA--LNTKTLK----------SLSVTFPELREVVANND-KQRYSMILAs---------------------------------------------------------------------aldgtdtaqppqenpes---------------------------------------------------------------------dkpsDYLIRANQGHS--IK----------VDTDGLLTPITQ-----------------------EAGNIP---ETVIHGTDEPAW-NLILKSG-GLRRMGRNHIHFASGLpagfkplapstdsaedhke-----SAPVISGMRKN-SSILIYIDIEAALA-A------------GIKFFVSENGVILSEGNEQ------GLLPYEFFEQGLLPYE 245 Leptosphaeria maculans eukaryota>fungi>ascomycota
224002288 181 59 SKSLSWVLRHS--APS-LGLR--PSPD-GYFSVE--DM--LSLKHPRfcnkgsshngGRKYTVDDIRRVVESSD-KQRFRLEYKd-------------------------------------------nqylakmmkhekssdrgetaatsnakestnapakldgssdnes-----------------------------------------------------------------------nlVLCIRANQGHS--FS--------KHIESDKLHTPLTK----------------------eELSDPNL---TIVHGTTRKAWEDHIRIEG--LSRMKRTHIHFATGLpts---------------------DNKPISGMRAT-SQIYIYINGEKCAK-D------------GVPFFKSDNGVILTAGVNEF-----DGLPVKYF-------- 303 Thalassiosira pseudonana CCMP1335 eukaryota>stramenopiles
219121541 182 5 SHRLSYVLRHG--ALD-MGLE--MTAD-GYVPVD--SL--LILQHPKfi--------GNQWTLQDIRDVVSDSD-KQRFKLREKp--------------------------------------------------------------------------------------------------------------------------------------------------------------aSDYGQATQRHT--IS---------FIKPELLLVRLSA----------------------eELRRIP----TIVHGTYSALW-PAIQISG-GLSRMKRTHIHCASGLig----------------------ENGVISGMRRG-CDVYIYINAEACAD-A------------GVVFYRSDNGVLLTAGIKI------GGLPCKY--------- 199 Phaeodactylum tricornutum CCAP 1055/1 eukaryota>stramenopiles
226471272 209 101 SKKLACILRHA--AEN-VGMN--YEPG-GYLYVD--KI--LQLKPFQ------------GVRVEDILRVVNSND-KKRYEVSTNpe------------------------------------------------------------------------------------------------------------------------------------------------------------ngRLKIRAFQGHS--VP---------IDGLDI---TLIE-----------------------NPENYP----NVIHGTYFRNW-ESIRKEG--LKRMRRTHIHFAPGEig----------------------ESGVISGLRSS-AEILIYIDLAKAMK-D------------GYKFYISKNNVILCEGNAD------GCLPTKYFADGCLPTK 282 Schistosoma japonicum eukaryota>metazoa
225707394 217 31 SYSLSFTLRHG--ANK-LGLH--MNPD-GFLFVE--DL--LAHPQFR------------SYSLEDVERVVAAND-KKRFKLCRHp------------------------------------------------------------------------------------------------------------------------------------------------------------edgRLQIRANQGHS--LQ---------VPDLEL---RPVQa----------------------GSPNCP---VEAVHRSYLCHW-TSIRTQG--LSRMARTHIHLC--Lpg----------------------EEGVAGGSSDV-RDLAIYIDVPKALA-D------------GIQFFLSENGVLLTPGDTE------GKLPLKYFTEGKLPLK 212 Osmerus mordax eukaryota>metazoa>vertebrata>actinopterygii
320168635 233 31 SKLLSYILRHG--------VP--ISPE-GFVDVE--VL--LGFPDFR------------AYTVADVRRAVTSSD-KQRFALEERi---------------------------------------------------------------tddnpv-----------------------------------------------------------------------------------------aRLYIRANQGHT--IE---------VEALELSPIT--------------------------ASEDAP----IVVHGTYDAAW-DLIKSQG--LSRMKRNHIHFAVGLpg----------------------ASGVISGMRSD-VTVLIYLDVARALA-D------------GIPFFRSSNNVILSPGLEN------GSIPAKYLENGSIPAK 210 Capsaspora owczarzaki ATCC 30864 eukaryota
66358336 243 10 SKKLTWLLRHGD-PAK-TGLN--MRND-GYVEVN--EI--LKQT---------------CISLEKLHYIVENDP-KGRFRIIDEn--------------------------------------------------------------------------------------------------------------------------------------------------------------gKNLIRANQGHS--LS---------FIEDEKLLARFEI--------------------dnnSEFIQR----IIIHGTYLDKW-KNIKING--LSRMSRSHIHFVSATnf----------------------KLESIKQGSKI-SEDMCIDQIVREMC-Ny-----------KCTAGIRPNYKCTAGIRPNC-----EVLVFIDVVNCVTNSA 176 Cryptosporidium parvum Iowa II eukaryota>alveolata>apicomplexa
310831101 247 1 SKKLSYYLRHN------LDIFN-YSKD-GYVKIS--EL--REKNIIK-----------KNTTIDAIDKIVKNDS-KNRYDLKFEi-----------------------------------------------------------------nngy-----------------------------------------------------------------------------------------kEYYIRANQGHS--SG---------NLDYSLILEE--------------------------IKEPIP----NIFHGTFIKKI-DSIKNTC--LNKMTRHFIHFAAD-------------------------DIIHNHLKRSI-SQVKVYVDMKKAMD-D------------EIKFYYAKNKVILSNGKNND-----GIIPAKYNNDGIIPAK 184 Cafeteria roenbergensis virus BV-PW1 dsdna viruses, no rna stage
110645302 248 14 SRSMCYLLRHD------RNFI--TSSD-GFVSID--TL--AKKL---------------NISNQQITEIAHRDS-KNRYEINN------------------------------------------------------------------------------------------------------------------------------------------------------------------DMIRAVQGHS--NR---------HVDFKMDKV---------------------------AINYKG----IAVHGTFKKHL-NSIISHG--LKRMSRNHIHLATS----------------------------KNNARKN--ANVFIYINIRHCLK-D------------GMIFYFSSNGYILTMGFD-------GTIPSKYIVKYEFASK 174 Neodiprion abietis NPV dsdna viruses, no rna stage
302851356 255 501 SKEMSRLLRHKP-PPG------AMDAA-GWVSLP--VL--LRHMR-------------NHPSEEQVRRIVETCD-KKRFVIDDSv--------------------------------------------------------------------------------------------------------------------------------------------------------------nPPRIRAAQGHS--VE---------LTEAVLEPV--------------------------vDPSKVP----IAVHVTSVSSW-EAIRTSGQ-LMRMNRTHIHFATE---------------------------PHHMRKNKW-AEIYLRLDLAAALE-Q------------GRQFFLSSNGVLLCE----------GPVPVSLVEEGPVPVS 678 Volvox carteri f. nagariensis eukaryota>viridiplantae>chlorophyta
307104106 256 1 -----------------------MDAS-GFVPLP--VL--LQELR-------------SPGATEAVVRHVVASDLKGRYELDESs--------------------------------------------------------------------------------------------------------------------------------------------------------------vPPRIRAVQGHS--VH---------LAAPQLAPV--------------------------gSADEVP----LALHITSLEGW-KAIQDSGE-LRRMSRTHVHFGTE---------------------------PGHLRRNSW-ATVLLRLDLRQAMQ-D------------GHAFFLAANGVLLCE----------GPLPARYLEEGPLPAR 155 Chlorella variabilis eukaryota>viridiplantae>chlorophyta
157126123 259 57 ---FSWLLRH---SAA-VAEH--MDPD-AFVEFE---V--LQQI--------------SGASKDRMLELIAQDQ-KGRYEIRG------------------------------------------------------------------------------------------------------------------------------------------------------------------EEVRAVNGHS--VH---------FCDNYEVL----------------------------SGERRP---EFLYHATNDKAL-PLIMAGA--LKRMGRHYIHMYDGPpq------------------------KTSVRYR------ILRIRPL-----P------------GHTLYRTKNGYILCR----------EDIPAEFIEREDIPAE 210 Aedes aegypti eukaryota>metazoa>hexapoda
262195534 260 6 SRRISSLLRHR--AGD-AGLS--MDAA-GWVEID--AL--LAHL---------------GESRELLDAVVQTNN-KARFEVAG------------------------------------------------------------------------------------------------------------------------------------------------------------------TRIRASQGHS--LEnmpv-----TRDALEAS----------------------------WSRFDGE--DSLWHGTQPEVV-ESIARDG--LLHGARSHVHLAESR--------------------------DSSVGKRSN-VGVLLEISPSELRA-A------------GWELFKSPNGVILCR-----------HVPPECILCRHVPPE 176 Haliangium ochraceum DSM 14365 bacteria>proteobacteria>deltaproteobacteria
284033571 261 2 SKRLSWLLRHG--AGE-QGLA--MTAD-GWASIE--DV--CVLT---------------DISRPALDRAVERND-KNRLEVDG------------------------------------------------------------------------------------------------------------------------------------------------------------------DRIRACQGHS--LAgmpv-----TREALENS----------------------------WRRVHPA--DLLWHGTTRAAV-EAIRREG--LKPGRRTHVHLAPSR--------------------------DSHVGKRFA-AAVLLAVDPVDL------------------VVFEAPNGVLLTR-----------QVPPDAILTRQVPPD 170 Kribbella flavida DSM 17836 bacteria>actinobacteria
162450235 262 1 SKKLSWLLRHA--APS-QGVA--MDDA-GWVAVD--DV--LKAL---------------RISRPVLDEVVEKNT-KNRLEIRG------------------------------------------------------------------------------------------------------------------------------------------------------------------DRMRASQGHS--RDgmpv-----TLAGLEAS----------------------------WEEVHDD--ASIWHGTSVDAV-RGIARDG--IRPAARTHVHCTDAL--------------------------GSAVGKRAK-VDVMLEISPARLRA-R------------GVRVFRSQNGVILVR-----------EVPVQCLLVREVPVQ 177 Sorangium cellulosum 'So ce 56' bacteria>proteobacteria>deltaproteobacteria
20094870 313 39 SKLLSGILRHF--PEE-VKVK--LDDE-GFTDCDVHEL--AERIKKYw----knreyYRWLTGEHIIAVVETCP-KGRFEIDEH-----------------------------------------------------------------------------------------------------------------------------------------------------------------GRIRARYGHSRRLS----------VRPTL------------------------------PEAENV---KELYHGTARENL-ESILQHG--IKPMGRRAVHLTDDE------------------------REALITALRHTRNPVILVVDAERLRR-H------------GLVPRKAGKNVYVVEG----------TVPPDCITRVIRNPR 218 Methanopyrus kandleri AV19 archaea>euryarchaeota
118430933 314 40 SKTLAGILRHH--PGR-YGVR--LTRE-GWARVS--EV--VEGLRKA---------gWSWVEEWHIVGVALHDP-KGRYELRN------------------------------------------------------------------------------------------------------------------------------------------------------------------GEIRARYGHS--IP----------VNVEP------------------------------LPGEPP---PILYHGTTEEAL-PLIMERG--IMRGRRLKVHLTSSL------------------------EDAVSTGRRHGNLVAVLLVDVECLRR-R------------GLKVERMSKTVYTVD-----------WVPPECIAEVRRESL 208 Aeropyrum pernix K1 archaea>crenarchaeota
119871538 315 35 SKLLSLALRHS--PHV-LGIT--LDVE-GWADIN--AV--VEGLRRA----------GLPASPQVLKAVAQLDD-KGRFEIRD------------------------------------------------------------------------------------------------------------------------------------------------------------------GRVRARYGHT--IK----------VQIRY------------------------------EVDLDT---RLLYHGTALYVL-PSILSQG--ILPMRRLYVHLAVDV------------------------ETACLNARRRQ-NPAVVEVDADCVRK-S------------GNPIYKATEKIRLTP-----------YVPPTCVKKWAICPT 199 Pyrobaculum islandicum DSM 4184 archaea>crenarchaeota
18314222 316 35 SKLLSLALRHS--PSV-LGLS--LDKG-GWADVK--TA--LEGLRKA----------GIRADYEALYAVVALDE-KGRFELKD------------------------------------------------------------------------------------------------------------------------------------------------------------------GKIRARYGHT--ID----------VEVEY------------------------------EADSES---KVLYHGTSRHLL-PSIMAQG--LLPMRRRYVHLSPDF------------------------ATACQNARRRP-LPVVIEIDAECLRA-R------------GYVVYAASGKVRLAK-----------HVPPECLKKVVDCPT 203 Pyrobaculum aerophilum str. IM2 archaea>crenarchaeota
145591275 317 38 SKTLSLALRHS--PAV-LGLV--LDSR-GWGEVE--AV--LRGLDRA----------GLKISREALEAVVALDD-KGRFEMSN------------------------------------------------------------------------------------------------------------------------------------------------------------------GKIRARYGHS--ID----------VEVEY------------------------------EVDEDS---ASLYHGTSKDNL-PFIMAVG--ILPMKRKFVHLATDV------------------------DTACLNAARRP-SPIVIEVDAECLRR-S------------GVVIYIGSRKIRLAK-----------YVPQSCIKRVFQCLS 204 Pyrobaculum arsenaticum DSM 13514 archaea>crenarchaeota
126460155 320 34 SKLLSLALRHS--PSA-LGMS--LDEG-GWAPLD--AV--VAGLKKL----------GLPASAEAVEAVAQLDK-KGRFELSN------------------------------------------------------------------------------------------------------------------------------------------------------------------GRIRARYGHS--VS----------VKVDY------------------------------EVDTET---RRLYHGTTRRSL-EGIMKMG--ILPMNRLYVHLAVDF------------------------YTACETAARRQ-DPVVLEVDADCARA-A------------G-PIYKASPAIRLSK-----------YIPPTCITGVYPCEK 197 Pyrobaculum calidifontis JCM 11548 archaea>crenarchaeota
305663054 322 43 SKLMSFLLRHD--PES-IGLK--MDSS-GWVYID--DL--VDGIRNRw----rnshlYRWVEKEHVIAIAMLDP-KGRFEICG------------------------------------------------------------------------------------------------------------------------------------------------------------------DRIRARYGHSKNLD----------IEIDY------------------------------PRDIET---KILYHGTAREFI-DRISIEG--LKPMNRHYVHLTIDM------------------------VDACIVGERHSGNPVVLKIDADCVRS-H------------GIDIYIASKSIRLAK-----------HVPRKCILAKHVPRK 218 Ignisphaera aggregans DSM 17230 archaea>crenarchaeota
307595891 323 37 SHLMTYLLRHD--PSA-VNLS--MDSE-GWVSID--EL--VHALRDKw-----dpkaYSWLTKEHIMAVASLDP-KGRFEIRD------------------------------------------------------------------------------------------------------------------------------------------------------------------GMIRARYGHNKSLD----------VNIRY------------------------------EVDSEV---RTLYHGTTKRAL-VRIMREG--IKPMNRKYVHLVLDP------------------------RDAYEVALRHGNDVVILKINVDCLRR-N------------DQQILIATDRIRLTD-----------YVPPQCIETDYVPPQ 212 Vulcanisaeta distributa DSM 14429 archaea>crenarchaeota
126465464 326 49 --------RHY--PWE-AGLR--IDSE-GWVDID--EL--VEGIKTRw----rnneiYQWLSREHIIAVAKLDP-KGRFEIRN------------------------------------------------------------------------------------------------------------------------------------------------------------------NKIRARYGHS--IN----------VKIKY------------------------------ELEYPP---TQLYHGTSIDKL-AKIMIEG--LKPMKRQFVHLTTSL------------------------ENAVETGKRHGK-PVVLIIDTMCLKE-K------------RIPLYKATEKIYLAP-----------KIPPQCILAPKIPPQ 213 Staphylothermus marinus F1 archaea>crenarchaeota
124028223 327 28 SKLMTTLLRHL--PHE-AGLR--LDPQ-GWVGID--EL--VRGIRERw----rnrhlYQWVTRDHVIAVALLDP-KGRFQLDLA----------------------------------------------------------------------------------------------------------------------------------------------------------------RGRIRAAYGHT--VR----------VELGY---------------------------rplSMDELP---DKLYHGTVAENL-ASILSEG--LKPMRRLMVHMTTDY------------------------SSAVETGRRHGPNVVVLVIDPRCLAK-H------------GIPVYRASDTIYLAP-----------SVPPNCILAPSVPPN 215 Hyperthermus butylicus DSM 5456 archaea>crenarchaeota
315230724 330 35 SKLMTYILRHS--PWE-FDLN--PDDF-GFIELD--EF--IKALKSV----------YPWVKEEHVRAVAELDP-KGRFEIRE------------------------------------------------------------------------------------------------------------------------------------------------------------------DKIRARYGHS--YE----------VFLDH------------------------------EEDTES---RTLYHGTPRKNL-DSILKEG--LKPMKRRFVHLTKDK------------------------TEAYYTGLRHGKDVVILVIDAECLRR-K------------GYRIYKAGKNVRIVK-----------YVPPECIVLWEVPPE 211 Thermococcus barophilus MP archaea>euryarchaeota
156937278 331 2 SKKMTYLLRHK--E-G-F-VD--PE---GWASLD--SL--VRELRKF----------FPWVSKEHVLEVISKDD-KGRYELRG------------------------------------------------------------------------------------------------------------------------------------------------------------------DKVRARYGHT--VK----------YVRPT------------------------------LEESYE---TLLYHGTSCEAA-RAILKEG--IKPMKRNFVHLTTSL------------------------EEAIENARRKGKCIKVLIVDGECLRK-R------------GIKIYKAGKHVRVCS-----------YVPPECVVGEAVPPE 174 Ignicoccus hospitalis KIN4/I archaea>crenarchaeota
284163819 337 32 SKFVSGALRHF--PED-VGLE--LDAH-GWTDYE--AL--AGAVEAK----------YDWAEPCHVAAVIATDP-KGRFERTDA--------------------------------------------------------------------sgtddga--gn----------------------------------------------------------------------------------GLVRASYGHS--VD----------VDLGP------------------------------TDEPVP---DELYHGTAPATL-ASIREDG--LRPMSRQQVHLSGSR------------------------EAARRVGQRHANDPVVLVVDATAMLA-D------------DQRITKRGRETYTTD-----------AVAPEYIDFPAVAPE 221 Haloterrigena turkmenica DSM 5511 archaea>euryarchaeota
55379941 338 30 SKFVSGALRHF--PED-AGIE--VDKA-GWTGFD--AL--RVAVERQ----------YDWADAAALAGVIATDP-KGRFERTGV---------------------------------------------------------------------gneagittag----------------------------------------------------------------------------------GRVRAAYGHS--VD----------VTLDG------------------------------TDDPVP---ATLYHGTAPRNV-DSIREAG--LKPMSRQTVHLSESA------------------------AAAREVGRRHAADPVVFVVDATAMQS-D------------DRRIVKRGTETYTTD-----------RVSPVYLTTDRVSPV 217 Haloarcula marismortui ATCC 43049 archaea>euryarchaeota
11499148 341 25 SKFLSGLLRHF--GRD-FGVR--LDED-GWAELR--DV--LKILSER----------Y-GVGRKHVELIVKFDP-KGRFELKN------------------------------------------------------------------------------------------------------------------------------------------------------------------GRIRAKYGHS--VE----------VRTDW-----------------------------sEGGEIP---EKLYHATSPENL-NSILKTG--LLPMRRREVHMCSSP------------------------QEAIEVGKRHSSNPVLLEIDAKGLMQ-D------------GIEVRRKGK-VYTVD-----------FVPPKFITVDFVPPK 200 Archaeoglobus fulgidus DSM 4304 archaea>euryarchaeota
327400244 342 2 SRFLSGLLRHF--PHK-FGVK--VDSE-GWASLE--DV--ERVIKER----------Y-GAGMDIIRHIVNNDP-KGRFEIKD------------------------------------------------------------------------------------------------------------------------------------------------------------------GRIRARYGHS--IA----------INTRW-----------------------------sEDGSIP---PKLYHGTRPEVV-KSIMQHG--LLPMRRLEVHLSGSV------------------------EEAIDVGRRHCPKPVVLEIDAEGMMG-E------------GIEIRKKGS-VYTAD-----------FVPPKFITADFVPPK 174 Archaeoglobus veneficus SNP6 archaea>euryarchaeota
288932585 343 33 SKFLSGILRHF--PDS-FGIR--LDKN-GFADLD--EV--IRILRER----------Y-GVGKREVEAIVLFDK-KGRFEIKD------------------------------------------------------------------------------------------------------------------------------------------------------------------GKIRARYGHS--VK----------VDYRW-----------------------------sEEGKIP---EKLYHGTKPENV-KSILKLG--LLPMKRNEVHLSESI------------------------DDAIEVGKRYCKNPVVLEIDAKKMLE-D------------GFEIRKKGR-VYTTD-----------YVPSKYITTDYVPSK 199 Ferroglobus placidus DSM 10642 archaea>euryarchaeota
147919656 348 40 GKIISGALRHF--PAD-LGLD--MDEH-GWVSLR--DL--TRVIERK----------YEWARSYHVDAMFKTDD-KGRYERKG------------------------------------------------------------------------------------------------------------------------------------------------------------------DKVRARYGHS--LN----------IKPDY------------------------------PEFDGD----KLYYGTSEEEA-DRILEIG--LKPVNQHFVHLSKSI------------------------EEAVKVACIRTEHPVIIEVDAKKARE-T------------GIEILDAGP-VCLTA-----------QIPAEFLQIGQIPAE 208 uncultured methanogenic archaeon RC-I archaea>euryarchaeota
20093417 349 27 GRFVSGTLRHF--PAS-AGVK--MDEY-GWVDLN--AF--CDVMKKR----------YNWMRKEYLYALVESDE-KGRYQIRG------------------------------------------------------------------------------------------------------------------------------------------------------------------FMIRARYGHS--VN----------IELDY------------------------------EESDAP----YVYYGASPEEV-DVLLENG--IFPIKQRYVHLSTSY------------------------EKAAEVALIHTESPVILQVDAFRAQE-D------------GISLKLATDYIVLAE-----------KIPPEYLYVIEEPPE 202 Methanosarcina acetivorans C2A archaea>euryarchaeota
336475983 350 27 GRFISGVLRHF--PRE-VGLK--MDDE-GWVDFE--LL--CSLLKSR----------YKWATRERLISLVESDE-KQRYEIDD------------------------------------------------------------------------------------------------------------------------------------------------------------------SRIRARYGHS--VD----------VDLDY------------------------------PDNELP----SLYYGVSQEEV-DMLLENG--ISPIRQTYVHLSTSY------------------------GKAVEVAQIHTENPVILEIDAEKARR-D------------GMSIMDANEDIALME-----------YVPSDYVCIFDGRSD 202 Methanosalsum zhilinae DSM 4017 archaea>euryarchaeota
294494713 351 27 GRFVSGVLRHF--PDD-VGLD--MDAQ-GWIELD--AF--CEAMKKR----------YKWAGKMRLVSLVESDP-KQRYEIDN------------------------------------------------------------------------------------------------------------------------------------------------------------------SFIRARYGHS--ID----------VDLDY------------------------------PLYDSD----VLYYGVSQEEV-DMLLENG--IKPYRQTYIHLSNSS------------------------QRARQAASVHTDNPVILEIDAASAAK-D------------GYEFLCANEEIVLSK-----------EILPEYIEIADDLPE 203 Methanohalophilus mahii DSM 5219 archaea>euryarchaeota
288931212 354 29 GRFISGLLRHY--PDK-YRLE--MDEN-GWVDFG--KL--VRVVKRR----------FKWANQWLVKAIVYSDE-KGRYEISN------------------------------------------------------------------------------------------------------------------------------------------------------------------DKIRARYGHS--VD---------NVKLDL------------------------------PEAEEE----TLYYGTSEEEA-SRVMEVG--IKPVNRRYVHLSTTL------------------------EKGEEVARLRTDEPIVLVIDAKEAKK-D------------GIRFIKVNENIVLAE-----------EIPPKYIKDFEIPPK 208 Ferroglobus placidus DSM 10642 archaea>euryarchaeota
330508961 355 26 GRLVAGGLRHF--PLD-LGLE--MDSR-GWIDLS--KL--GEVVQKR----------HRWANKEMVIALAQSDP-KQRYEISN------------------------------------------------------------------------------------------------------------------------------------------------------------------QRIRARYGHS--MD----------IELDH------------------------------PECHLP----RLYYGASEEEA-DRILEIG--LKSASQRYVHLSTTP------------------------NKAWDVAGYRTGNPKVIQVDAAPARE-A------------GVKMMTVNDDIVISE-----------MIPARFLCILASKDI 201 Methanosaeta concilii GP6 archaea>euryarchaeota
116754706 356 37 GRLLAGALRHF--PDD-LGLA--MSPQ-GWVEIP--VL--VDAIRTR----------YRWANENLVMALVRSDP-KGRYEING------------------------------------------------------------------------------------------------------------------------------------------------------------------TRIRARYGHS--VG----------VDLDY------------------------------PENELP----TLYYGTAEEEA-ERLLEVG--LKSATQRYVHLSTTP------------------------DKAWEVGTFRTSNPKIIVVDAAGAQR-E------------GVRMMKVNESMVISD-----------PIPPRFLSMMPAKAQ 208 Methanosaeta thermophila PT archaea>euryarchaeota
167043400 361 28 ARRLALVLRHA--PEK-FDLE--MDIN-GWIDVK--DI--VKQFKGSne------rrYHWFRPHHIRAISETDP-KGRYEVRG------------------------------------------------------------------------------------------------------------------------------------------------------------------NVIRATYAHT--VE----------IELDL------------------------------PTDNIP---DALYYPCSPDEY-ENLIEVG--ISPSGRAHVHLSANI------------------------RSAAEAGHVHHAIPTLLEVDTARLVA-A------------GETVWHAGITVYLAE-----------FVPGKYLLAEFVPGK 208 uncultured marine microorganism HF4000_APKG1C9
10639263 362 1 SRTLAAILRHD--PER-YHIR--LDSH-GYARIA--GI--VTVLRKYk--------gMKWITFDHILSLAETDP-KGRYQVSG------------------------------------------------------------------------------------------------------------------------------------------------------------------VLIRAMYGHT--IP---------VDLSDL------------------------------PEDNIP---DVLYYQSSAAEA-PLVKEAG--IYPSDKTWVHLSGTY------------------------RRSYVSGLYHIDDPFILRIDARSMID-S------------GHDIYRSSDDIYLTR-----------EIPPEYILTREIPPE 180 Thermoplasma acidophilum archaea>euryarchaeota
254169141 363 29 SRMLAGILRHF--PER-FGVK--LDDS-GWADIY--QI--VKGIKRRh-------prFRWLKDKHIIAIVLTDD-KGRYQLDME----------------------------------------------------------------------------------------------------------------------------------------------------------------NKRVRATYGHS--IK---------VDLSDL------------------------------PTDNIP---EKLYYPTTEEEY-EYIKEIG--LQPGDRKWVHLSKTY------------------------RDAYIAGLHRVEEPIILEIDTKKAIE-N------------GHQIYRAAKTVFIAS-----------QIPPEFINISQIPPE 213 Aciduliprofundum boonei T469 archaea>euryarchaeota
29830778 369 902 SRSLSYHLRHG------RELT--QNPQ-GWVPID--SL--VRALDPK-----------LRVSADELISVARAVS-EERFEVRG------------------------------------------------------------------------------------------------------------------------------------------------------------------DLVRARYGHS--RP----------TAIEY------------------------------EIRAPE---GRLYHCTPTTAL-HNIFERGEGLRPMTRQWVHLTTDR------------------------AAALSAGRRHGPCTLLCVPDPSAL------------------ECRHAGGATWLVA-----------QVPPSALTVVPLHRL 1051 Streptomyces avermitilis MA-4680 bacteria>actinobacteria
228983067 370 4 GGFLCKILRHS--PSQ-FHVS--LDEY-GYAPID--EL--LNAISSNe-------kwVNLVTVEMILEVVKTDE-KQRYKLDST----------------------------------------------------------------------------------------------------------------------------------------------------------------GTKIKARYGHS--IA----------VKSDE-----------------------------eQNRVLP---DILYHGTGMEHL-DSIQKLG--LLPMKRVNVHLSETT------------------------FFANKSAKRNQ-FPVLLKVDTIMAKN-L------------GVTVEYAGDEVWLSS-----------PIPSDCLLSSPIPSD 185 Bacillus thuringiensis Bt407 bacteria>firmicutes
251794334 371 5 SKLMTKILRHT--PEQ-FGIS--LDPEDGSCGIH--VL--LEAIQAQp--------kWAGITIEDIEQVVRNSE-KQRFAIED------------------------------------------------------------------------------------------------------------------------------------------------------------------GRIRARYGHS--HD-----------RVQY------------------------------TAGEPP---AILYHGTNRKAL-PSILGEG--LHPMNRQYVHLSEGT------------------------HFATLAGSRRG-ELVILKIDTSRAKE-A------------GVVFFFAGNEVWLAD-----------RVPADVWLADRVPAD 180 Paenibacillus sp. JDR-2 bacteria>firmicutes
310641074 372 11 SKFMSEILRHT--PEQ-FGLE--LDHE-GYCDIQ--DL--LRGIRSEd--------rWSDVSESDIKQVVSHCP-KQRYEMVN------------------------------------------------------------------------------------------------------------------------------------------------------------------GYIRANYGHS--AG-----------KLNY------------------------------EEATPP---TILYHGTNTKVI-HNLFTEG--IKPMGRKYVHLSESL------------------------EFAILAGKRRG-ELVILEVDTAKALA-N------------QVKFYKANHGVWLAD-----------LVPPQYLLADLVPPQ 178 Paenibacillus polymyxa SC2 bacteria>firmicutes
334135982 373 11 SKLMSKMLRHS--PGD-FGLV--LDGE-GFCSLG--DF--LTALNRVs--------gFEDVRPEDIQRVVRECE-KQRFEIAE------------------------------------------------------------------------------------------------------------------------------------------------------------------DYIRARYGHS--HE-----------RITY------------------------------EAAEPP---SVLYHGTNRKAV-ALIMAEG--LLPMSRQYVHLSEGL------------------------HFAALAGKRRG-ELVILEVDTALAGH-K------------GVRFYYAGNEVWLAD-----------RIPAEVWLADRIPAE 176 Paenibacillus sp. HGF7 bacteria>firmicutes
116495334 267 1 SKTLSMLLRHH--PEK-LGLV--LDQY-GRTDWK--TL--VRRFNAH---------yQMHLDRQVLQAIMAQST-KKRFALEG------------------------------------------------------------------------------------------------------------------------------------------------------------------TTIRAVYGHS--VP-----------------VMPLT-----------------------PATEPP---QWLYHGTSHQAA-TVIAKEG--LLPMNRDFVHLSEDV------------------------ATARQVGARHDTHPVIYRIAARDAAK-N------------GILFYPTSSRVWLVS-----------ELPARFLLVSELPAR 178 Lactobacillus casei ATCC 334 bacteria>firmicutes
227508115 268 13 SKRLSFILRHH--PEK-IDIK--LDQY-GRTNLN--VL--IRHFNKH---------yGTPISQSIITAIIQQSD-KQRYAIEG------------------------------------------------------------------------------------------------------------------------------------------------------------------NTIRALYGHS--IP-----------------VKPLT-----------------------PPKMPP---EYLYHGTTHSAA-RLIETEG--LKKMDRDFVHLSANQ------------------------QMAIQVGRRRDPRPVVFRVAAKNAAK-N------------NVLFYPTKSGIWLVD-----------AMPAQFLEVDAMPAQ 189 Lactobacillus brevis subsp. gravesensis ATCC 27305 bacteria>firmicutes
338811714 270 5 SKTMSYALRHA--PWE-YELE--MDEG-GWVSII--QL--LHSLQEE--------qkWSDVKAENIYYVAKTSD-KGRFEIAD------------------------------------------------------------------------------------------------------------------------------------------------------------------SKIRALYGHS--IP-----------------LRIIK-----------------------APGEPP---QLLYHGTSRQEA-DAIMANG--LEPRGRQYVHMAVDP------------------------KMALQVGKRRDNKPVLLTIKAREARQ-D------------GVAFYKGNDLVWLAE-----------FVVAKYIDIEFVVAK 178 Acetonema longum DSM 6540 bacteria>firmicutes
303240380 271 7 SKAMSYALRHA--PWE-YELE--IDEH-GWVNIE--HL--LYSFHEE--------kkWSELEIKDIIYVVENCD-KKRFEVDD------------------------------------------------------------------------------------------------------------------------------------------------------------------KRIRALYGHS--VP-----------------QKIIK-----------------------EPMQPP---EILYHGTAKRFL-SMIKEKG--LIPKGRQYVHLAVDS------------------------DMALQVGKRRDDHPALLIINSRDAWN-E------------GIKFYKGNEKVWLAD-----------FIDSQYIEADFIDSQ 177 Acetivibrio cellulolyticus CD2 bacteria>firmicutes
256006093 273 2 SKEVAYALRHA--PWE-YGLE--LDAE-GWVDIN--QL--LSSLHEC--------ekWKKVSEHDLHVMIEKSD-KKRYEISN------------------------------------------------------------------------------------------------------------------------------------------------------------------GKIRALYGHS--IP-----------------QRIIK-----------------------EQKCPP---EVLYHGTARRFV-KSIKEKG--LQPQGRQYVHLSADV------------------------ETALQVGKRRDIKPVLLIVNALEAWS-E------------GIKFYLGNDKVWLAD-----------AIPSKYIRFDAIPSK 178 Clostridium thermocellum DSM 2360 bacteria>firmicutes
295093305 275 2 SKEVSYALRHA--PWE-YELE--MDEE-GWVSVE--QL--VDALNKD--------mkWIGTSEDDLLVMIDKSE-KKRHEISG------------------------------------------------------------------------------------------------------------------------------------------------------------------GKIRAFYGHS--IP-----------------MHIKK-----------------------EKMIPP---DILYHGTARRFL-SSIKING--LLPQGRQYVHLSQDI------------------------STAQSVGLRRDNKPCVLQIDAKRAWE-D------------GILFYFGNEKVWLAD-----------VIPSKYILADVIPSK 177 Coprococcus sp. ART55/1 bacteria>firmicutes
49477941 276 1 SKEVSYALRHA--QWK-YELE--LDEN-GWVSVE--QL--LHALHQS--------ieWRDVKIEDLKIMIEKSE-KKRHELKE------------------------------------------------------------------------------------------------------------------------------------------------------------------NKIRALYGHS--IP-----------------MKIVK-----------------------EEGVPP---EFLYHGTSPRFL-NSIESNG--LSPMSRQYVHLSEDI------------------------ITAELVGKRKDKHPIILEVNTGKARE-E------------GVKFYLGNEKVWLAD-----------EIPSEFILADEIPSE 180 Bacillus thuringiensis serovar konkukian str. 97-27 bacteria>firmicutes
304405428 278 1 SKEVSYALRHA--PWE-FELE--LDAE-GWVAVE--QL--LHSLRHQ--------aqWTSISEADLATMIDQSE-KKRHELAD------------------------------------------------------------------------------------------------------------------------------------------------------------------GKIRALYGHS--VP-----------------AKIIK-----------------------NIERPP---AVVYHGTARHLL-ETILAAG--LKPMGRQYVHLAVDQ------------------------ETAITVGKRKDSEPALLAVDAQKAWQ-D------------GIRFYRGNHSIWLAD-----------QVPPIYILADQVPPI 179 Paenibacillus curdlanolyticus YK9 bacteria>firmicutes
325108247 281 3 SRAMSHALRHE--PWV-YELE--LDEE-GWTSTE--RL--LSALRKQ-------kskWRNVTERDFVRLMESAT-KQRYEMAD------------------------------------------------------------------------------------------------------------------------------------------------------------------GRIRAFYGHS--VT-----------------GLLKK-----------------------TPAEPP---AVLYHGTSPEVV-EFILAEG--LRPMARQFVHLSTEI------------------------VTAKEVGRRKCKVPVILQIDSPLAVQ-Q------------GSCFYLGNEMVWLAD-----------KIPEMVWLADKIPGN 178 Planctomyces brasiliensis DSM 5305 bacteria>planctomycetes
339009751 282 1 SKEISYALRHA--PHE-YELE--LDEY-GWVQTE--QL--LHSLHEQ--------pvWRNVSEKDLQVMISQFD-KKRFEMEN------------------------------------------------------------------------------------------------------------------------------------------------------------------GKMRALYGHS--TA-----------------KRVLK-----------------------EESEPP---EFLYHGTPKRFV-SLILEQG--LLPKGRQYVHLSEEI------------------------QTAKQVGKRRDTHPTILKIEAKKAWA-N------------KVTFYHGNEMVWLAD-----------KIDRQYILADKIDRQ 176 Brevibacillus laterosporus LMG 15441 bacteria>firmicutes
319936601 285 1 GKEISYVLRHH--PEK-YNLD--IDNE-GWVDVG--DL--LNALESR----------FGLLKEEDIVALMQQSE-KERYELKN------------------------------------------------------------------------------------------------------------------------------------------------------------------HRIRAYYGHS--FS-----------------KKIMK-----------------------QRNIPP---KVLYHGTARRFV-SSILTTG--LQPMSRQYVHLSQDV------------------------ETAKQVGMRHDTQPVILMINAQSAFQ-D------------GVAFYLGNEKVWLSE-----------TIPPQYIEERKQPPQ 175 Coprobacillus sp. 29_1 bacteria>firmicutes
332361966 286 6 SREVSYILRHN--PDK-YGIK--LDSE-GWCSVD--DL--IHNLSET--------plWKGLTRDDLETMIELSD-KKRHEIKG------------------------------------------------------------------------------------------------------------------------------------------------------------------EKIRAFYGHS--IK-----------------DKLSK-----------------------TANKPP---KVLYHGTVQRFL-NQILQTG--LIPKERQYVHLSSDV------------------------STAKQVALRRDDRAIILEVAAQSAWE-N------------GVKFYIGNEDIWLSE-----------PIPSEYILSEPIPSE 177 Streptococcus sanguinis SK49 bacteria>firmicutes
125717421 287 3 SREISYILRHN--PLK-YNLT--LDKE-GWADIN--DL--LQKLNAR--------seWNGLSKKDLEKMIASSD-KKRHEIQS------------------------------------------------------------------------------------------------------------------------------------------------------------------DKIRAFYGHS--LK-----------------EKVQK-----------------------SPCQPP---NVLYHGTVEKFV-DSILEKG--LITKERQYVHLSTTP------------------------ETAIKVALRRDKKAIILKIDAQKAWD-S------------GIKFYLGNEDIWLSE-----------PIASKFISFEPIASK 179 Streptococcus sanguinis SK36 bacteria>firmicutes
227893699 291 14 SKKMSYCLRHN--PGK-YGLK--LDEY-GFVDLQ--EF--LNAMNRI-------hqhFPKLTEMKIREIMHNSD-KERFEIKN------------------------------------------------------------------------------------------------------------------------------------------------------------------GKICALYGHS--LP-----------------GIIKR-----------------------KKAIPP---KVLYHGTAHRFL-TSIEREG--LLPMGRQYVHLSTDI------------------------AMAESVGKRRDHHPAILLVNAEKAHK-D------------GIDFYIGNDEVWLCD-----------CVPSKYLLCDCVPSK 184 Lactobacillus ultunensis DSM 16047 bacteria>firmicutes
298245737 293 2 SKTMAYVLRHD--PQS-HGLT--LDAE-GWVSLK--DL--LAALRQQ-------rsyWATLKEADLLAVLEQSE-KQRFEVRN------------------------------------------------------------------------------------------------------------------------------------------------------------------GKIRAYYGHS--VP-----------------TKVEK-----------------------QPVTPP---EILYHGTTPQAA-NLIKGRG--LSPMKRQYVHLSADE------------------------ETAMVVARRRTNHPIILKVHARKAEA-N------------GVRFYLGNDMVWLAE-----------PIPSDYIQFEPIPSD 181 Ktedonobacter racemifer DSM 44963 bacteria>chloroflexi
226313333 296 6 RKRLLSILRQN--SEA-FQLY--YDTY-GYTPVE--PL--LEYLHTL--------kgCAYITRQDLHQVVEFDP-ERSIEWDGG-----------------------------------------------------------------------------------------------------------------------------------------------------------------SLIRVTYGF---LP------------------SIAKs--------------------rlMEIVPP---DVLYYGTHRKLL-KQVLTGG--LLPIASEYVQLADRP---------------------------EHIGEPTDTLR-LVTVNAKEAHE-A------------GICFYRVGEHYCLSD-----------AVPSSYLQLDAVPSS 180 Brevibacillus brevis NBRC 100599 bacteria>firmicutes
312142649 297 5 SKTLSYILRHH--PES-FDLK--LAAD-ASVETD--EL--LNSLKNK----------FKKITKDDLIKVVEADP-KGRFSFLDEq----------------------------------------------------------------------------------------------------------------------------------------------------------------KRIRANYGHS--IE------------------GVNP---------------------eyEAVKPP---EFLYHGTTPEAK-NKILAEG--IKPMGRNYVHLSVNI------------------------KEAKKVAQRRTNNELIFKIRALKAYQ-A------------GQEFYKTAENIYLTD-----------QIAAKYLFFDQIAAK 179 Halanaerobium hydrogeniformans bacteria>firmicutes
116748284 300 3 ARMLSYIGRHS--PGE-FGLY--WNPD-GTMPWK--EF--YWALQED--------eaLRFVRESHVREIALQGL-ELPFSLEN------------------------------------------------------------------------------------------------------------------------------------------------------------------NRLRLIGPAA--PP-------------------EYP-----------------------VSEFLP---GRLFYACRRAHL-EVIRLRG--LQASGRPYVLLCTER------------------------EQAVRIAKRREAEPIVIEIKAEEARA-A------------GTLFRKAGATVYLVE-----------CVAADHLVFPCVAAD 177 Syntrophobacter fumaroxidans MPOB bacteria>proteobacteria>deltaproteobacteria
328952864 303 12 ARLLRYILCHH--PDE-FGLV--LDKS-GRLAVK--EL--LRALGQE--------egWRFVRRSHLEEVVNLIN-PGDFELDQ------------------------------------------------------------------------------------------------------------------------------------------------------------------TYIRALHPQP--AE----------LRSQ-------------------------------EAAWPP---PLLYRAITANSH-HAVAERG--LQPPSGGELVLADNQ------------------------ELAKRLGQRRDPQAIMVIVQAQAAAK-R------------GVNFFSYGPKLYLSD-----------AIAPEYLQLPAIAPE 183 Desulfobacca acetoxidans DSM 11109 bacteria>proteobacteria>deltaproteobacteria
301058276 304 1 --MLTYVLAYR--PDE-FGLI--PSEE-GFVRYK--EL--LKALHEE--------egWRHVRQSHINEMLMGED-RALFETEG------------------------------------------------------------------------------------------------------------------------------------------------------------------DRIRSRKRHW--VM-----------DDQ-------------------------------SDHPLP---GLLYTSVRKRAH-PVAMEKG--LKAETGSHIALSPHR------------------------EMALRMGRRRDQHPVLLEIPAMLAEK-K------------G-MRIFSFGVLFLTP-----------EIPAHCISGPEIPAH 168 delta proteobacterium NaphS2 bacteria>proteobacteria>deltaproteobacteria
308270161 306 5 SKFVSYILERK--PDE-FGLV--PDEN-GYIKIK--SL--LLALNEE--------dgYKFVRRHHIDDILSSIP-DSQLEIND------------------------------------------------------------------------------------------------------------------------------------------------------------------DLIRSKYRDN--LP-----------KPT-------------------------------VSENPP---KLLYTCVRKKAY-SFALEKG--IFPVGNKKVVLSPAK------------------------EMAERMGKRFSPLPVVLTVNVQKALE-A------------GVIFHNSSE-LYTAD-----------AIPADCFTGPAIPAD 180 uncultured Desulfobacterium sp. bacteria>proteobacteria>deltaproteobacteria
158521555 307 3 ARVIAYMLGQA--PAE-FGLV--PDAS-GYVKIK--EL--IKALHEE--------egWRHVRASMLNTLVLTLD-DVPFEIQD------------------------------------------------------------------------------------------------------------------------------------------------------------------DKIRTKDQTP--GA-----------PAE-------------------------------PVSGLP---KLLYTCVRQRAH-GRVAQAG--ITPSFAEAVVLSPDR------------------------EMAQRIGKRRDPDPVVLVVETRAALE-N------------GVAFRQTEGDLFLAD-----------FIPVDLFLADFIPVG 175 Desulfococcus oleovorans Hxd3 bacteria>proteobacteria>deltaproteobacteria
302344076 301 6 ARMLRYILGVC--PAE-LALL--PDAE-GWVRQK--DL--LAALHGE--------dgWKHVRQTMLTDMADRLA-SDVFEADD------------------------------------------------------------------------------------------------------------------------------------------------------------------TRIRCRQRSY--AP-------------------------------------------pnPEAKPP---AHLYYGARRRAY-PVIRERG--LDADDGPGLIVCADS------------------------QRALAIGRRRDAEPVLVTIQARLAQE-N------------GIQARLAQENGAALAAWGEEGLFVA-QWIDAQFLMGPPLPD 160 Desulfarculus baarsii DSM 2075 bacteria>proteobacteria>deltaproteobacteria
218780694 305 11 NKFLAYALGRR--PDE-FGLF--PDED-GWVKVK--DL--VRALSEE--------dgWKHVNKAHIKEVAYTLE-DPAIEYEHEe----------------------------------------------------------------------------------------------------------------------------------------------------------------GIVRAVEWDP--SL----------YYTG-------------------------------VPEDLP---KLLYVGARNKTY-PEIDKKG--IFPVGAPFVILCRDE------------------------DMAFRIGKRRDGNPIVLTVNTAMAQE-L------------GVVFAMAQELGVVFEQAGEVLLTAE-FIPKGCFTGPPLPKV 163 Desulfatibacillum alkenivorans AK-01 bacteria>proteobacteria>deltaproteobacteria
consensus 100 % ........................................................................................................................................................................................................................................................p...............................................................................h...s..l.......l.h............................................h................................................................
consensus 95 % ...hs..LRH.........h........Ga.......h..h........................l..hh..s..K.Ra.h......................................................................................................................................................................lpA.bGHo............................................................hhaus....h...l...G..l....p..lHhs.................................u.b......hh.l........................h..s...l..s...........................
consensus 90 % .+.hs.hLRH...s.....l...hp...Gah.h....l..l....................p...l..hh..s..K.Ra.h.....................................................................................................................................................................bI+A.bGHo..h...................................................s.....hhHGT....h...I..pG..l....R..lHhs.s..............................su.R.....hhh.l....h................s..hb.s.p.lhLs...........................
consensus 85 % u+.hu.hLRH...s.....l...hp...Gah.l....l..l...................hs...l..ll.ps..K.Ra.h.....................................................................................................................................................................bIRA.bGHo..h...................................................s.....lhHGT..p.h...Ib.pG..l....RpalHhu.s..............................sG.R..s..hhl.lp...h................G..hh.u.s.lhLs...........................
consensus 80 % S+.lobhLRH...s....sl...hs...Gah.lp...l..l...................hsb..l..lV.pss.KpRa.hp....................................................................................................................................................................bIRA.bGHS..l............p......................................P.....lhHGT..p.h...Ib.pG..L....RpalHhu.s...........................s..sG.Rp.s..lll.lps..h................G..ha.u.s.VhLs...........................
consensus 75 % S+.lSblLRH...s.p.bslp..hc.p.Gah.lp..pl..l.....p.............hsb..lpplV.pss.KpRa.hp....................................................................................................................................................................bIRAsQGHS..l............p..h...................................P.....lhHGT..p.h...IbppG..L..bpRpalHhu.s...........................u..sG.Rp.sp.lll.lss..h...p............Gh.aabu.NsVhLsp............ls............
consensus 70 % SK.LShlLRH...s.p.hGlp..lc.p.Gahplp..pl..l...p.p.............hsbpplpplV.pss.KpRaphp....................................................................................................................................................................bIRAsQGHS..lp...........p..h.................................p.P.....lhHGT..p.h...IbppG..Lp.bpRpaVHhuss.........................p.u..sGbRp.spslllblcs.ph...s............Gh.FabupNsVhLsp............ls..hh........
PDB:1wfxA - - HHHHHHHHHH--------------------EEHH--HH--HHHHHHH--------------HHHHHHHHHHHH----EEEEE-------------------------------------------------------------------------------------------------------------------------------------------------------------------EEEEEE--------------------------------------------------------------EEEEE-------------------------EEEEEHH------------------------HHHHHHHH-----EEEEEEEHHHHHH-H---------------------EEEEE-----------------EEEEEEEE--
Back to Contents
ALIGN -------EE---EEEEE------EEEEE-------------------------------------------------EEEE---HHH-----H-HHHHHH--------HHHEEEEEEE-------------------------------------------------------------EEE-----HHHHHH----
HMM --EE-EEEE---EEEEEE---EEEEEEEH-----------------EEEEE--------------------------EEEEEEEEEE--------EEEEE-------EEEEEEEEEEEE----EEEEE---------------------------------------------------EEEEE----EEEEEEEE-
FREQ --------E---EEEE------HEEEEHH-------------------------------------------------EEE-----H----------------------EEEEEEEEE------------------------------------------------------------EEEEE----HHHHHHHH--
PSSM ------------EEEE--------HHHHH------------------------------------------------EEEE----E-----------EE--------EEEEEEEEEEE-----EEEE---------------------------------------------------EEEEE------EE------
FINAL --------E---EEEEE------HHHHHH------------------------------------------------EEEE---EEE----------EEE-------EEEEEEEEEEE------EEE---------------------------------------------------EEEEE-----EEEEEEEE-
NEURL4_Hsap_53829370 1408 EAGTLTKKW---HMAYHGSNVAAVRRVLD-RGELGAGTASILSCRPLKGEPGVGFEEPGENCAPPREE------QPPPVLLSPSLQYAGAETLASKVQFRDPKSQRTHQAQVAFQVCVR--PGSYTPGP-------------------------------PSAALGEPPDPHFSPAE-LEWVTKEKGATLLCALLVR 1560 9606 Homo sapiens eukaryota>metazoa>chordata>vertebrata
Neurl4_Mmus_29748106 178 EAGTLTKKW---HMAYHGSSVAVVRRVLD-RGELGAGTTSILSCRPLKGEPGVGFEEPGENCAPPREE------QPPPVLLSPSLQYAGAEMLASKVQFRDPKSQRTHQAQVAFQVCVR--PGSYTPGP-------------------------------PSAALRELPDQHFSPSE-LEWVTKEKGATLLYALLVR 330 10090 Mus musculus eukaryota>metazoa>chordata>vertebrata
GSTEN:00009647:G:001_Tnig_47211351 1132 EVSTALKKW---HIAYHGTGVGTLRRTLD-HSQLLPGTSSVFSVSPVKTEGPNDYGEPEENSAPGRE--------VPRVRLSPTMRYSGMETFAPKVKFQDPRSRRCHQAQVAFQVCIR--PGSYKVGA-------------------------------QSVGHSETLDPRFSNAE-IEWITKEQGGTLLYGLLIR 1282 99883 Tetraodon nigroviridis eukaryota>metazoa>chordata>vertebrata>actinopterygii
LOC581240_Spur_115948408 208 LNVF--ESW---HVAYHGTSVGSVRKILD-RGTLLPPGDTSL-GRLYQPET-LGSS-LNKPSLVPD---------LMQIFVSPTLKYAGCDIFSHRCKFIDSLTQKEHFARVAFQVRIR--PGCYTAGP-------------------------------QSIGANHTIDPYIENSR-IEWTTKETSSIVLCALLIH 351 7668 Strongylocentrotus purpuratus eukaryota>metazoa>echinodermata
BRAFLDRAFT_74056_Bflo_260810360 1003 SQRNVFTDW---HRGYHGTPAGTVKKILQSSSQLLLPGDVT-----PGGEKMGPGKGKGFD--------------SVQVFLSPSIKYSGRDLYAKPMRIKDNTDGKEYTARVAFQVCIR--PGCYGIMHETV----------------------------GASRKGETIDPLFSNKE-LEWFTKERGVHALYGLLVK 1146 7739 Branchiostoma floridae eukaryota>metazoa>chordata
EHI_155600_Ehis_67480865 253 GFGE--EEW-----AFHGSSIDSIQGIIK-EGFKLPD-DV---------DAVKLDS----------------GYFGHGIYLTYFSDYA--LFYSNS-----------RNSNQMVLCQIL--PGNVFKCKKRM----------------------------DGKKCQKGYDSHFSPKG-NEIVIFDPKHILPKYIIEF 371 294381 Entamoeba histolytica HM-1:IMSS eukaryota>amoebozoa>entamoebidae
BRAFLDRAFT_90934_Bflo_260831601 778 TALGVFQKW---HVAFHGTTVGALESILN-TGDLIKAGDKTMEGSRLSERDGHYKDSWKPE-----------GFDTKQVFVSPSIHYAGLPAYAKPSSFT--HRGTTYEAKVALQLYIK--PGSYKVA--------------------------------ASTVARKNVDKKFSDSE-IEWSTDRHGVIIVYGLLVK 922 7739 Branchiostoma floridae eukaryota>metazoa>chordata
cgd5_910_Cpar_66357730 115 EEEN-VKNW---DLSYHGTTHKAIKSILK-DKRLVIPNNKTVHIRKGHI------------------------PNQYFIFTSPSLLYASFGLYSAPFKIKE----SKKWWQIVVEIVQK--PNSYVKEWE------------------------------TSGLGNYEFDKYIGNYE-LEWKSDQEMGNLIKAVLVR 245 353152 Cryptosporidium parvum Iowa II eukaryota>alveolata>apicomplexa
BBOV_III011060_Bbov_156089639 70 TYHP-INYI---GIGLHNNKEDTVDNETD-SGASMEPPDNVFSIPVITNDAT---------------------YFKQHIFASPSCMYATLPEMASALDFE----GLNVGLRIVIEVLVK--PASYVTGPA------------------------------SVKNIKNGFDCCFDNQN-IEWFVKNLDHIVPHRLLFR 203 484906 Babesia bovis T2Bo eukaryota>alveolata>apicomplexa
Phum_PHUM397400_Phum_242016155 1565 TEKI--DTW---QVAFYGTRPDAIRRILD-HGELVLPCLLGMERTRVKAKEDETD--------------------SSHIVFSPSIKYAACDYFVTKFRFYDSRTKNKTEATLAFQILVQ--PGSYKVGPP------------------------------SVDVSKEIPDTRFERDA-TEWVTKERGATTLSALLIK 1702 121224 Pediculus humanus corporis eukaryota>metazoa>hexapoda
PTSG_01796_Ssp._326433251 405 THARATKLWETSHVCYHGTSIGALKPIIE-GGEILPPGEVNVTHTHIIPRDDEDNPREGRLPTVYTTPAHNLDRIHKSVFVSPSVAYASSSTYAERYYW----PGGRQFLVPVLQTRIR--PDTYDVR--------------------------------SSTLRDTPHDPCYSADE-MEWYTPRRGVIQIYGLLLK 561 946362 Salpingoeca sp. ATCC 50818 eukaryota>choanoflagellida
TP02_0033_Tpar_71029920 104 NHFS--DNF---SIKHFLVKIIRSPRLSD-DDFSQLRNHINGASDPQSSVTKQSD--------PSHPDPNISNTIGEGLMVTPSCMYATKQEISSILTFEE----LDVKLQILIQIKAK--PGSYTVSP-------------------------------NSIKLNDNFDSCFPNSE-IEWYVKNVDDIIAERLLFK 248 333668 Theileria parva strain Muguga eukaryota>alveolata>apicomplexa
TA12305_Tann_84995898 103 RHFT--DNF---SIKHFLLKIIRNPRLSD-DDFSKFRNYITGNSDLSSAVINNKD--------QPPADAATTDHKDEGLMITPSCMYATKPEISSILTFEE----LDVKLQILIQIKTK--PDSYTTSP-------------------------------NSITLNENFDSCFPNSE-IEWYVKNVDDIIAERLLFK 247 353154 Theileria annulata strain Ankara eukaryota>alveolata>apicomplexa
TRIADDRAFT_57456_Tadh_196007734 1231 NVNL--NEW---YIGYYPSTVGNVRQILD-NRILATGNEDDYDRDISVST--------------------------NICHIQEHVEI---SQF-RHEVF--------GLVSVAFEVYIK--PDATTIA----------------------------------------DIEGTGDQCSMLTFKHSPRNMILSALLIK 1341 10228 Trichoplax adhaerens eukaryota>metazoa>placozoa
SINV_00048_Sinv_322786335 1518 QSTT--DKW---HVAFYSIRLDAIRLILD-RGELMTK-EQLDVSNLTSGT-KSED-------------------QNPQVMFSPAVKYAASDEFTRKYPYIDMQLNKKLNASTAFQLLVR--PGSYTTFP------------------------------------KVFRDENERYCESVKWATKEAGATVIVALLVH 1649 13686 Solenopsis invicta eukaryota>metazoa>hexapoda
LOC100117587_Nvit_345484523 1620 QSTT--DKW---HVAFYGTRIGTVRWILD-RGELLTK-EQLDTDSLTTGT-STED-------------------QNPQVVFSPNIKCASSEEFTKQYSYIDTQLNKKVNASTAFQLLVR--PGSYTTS--------------------------------------SKKDGLDSQLECIEWATKETGATVIIALLIH 1749 7425 Nasonia vitripennis eukaryota>metazoa>hexapoda
EAI_14437_Hsal_307195422 1616 QSTT--DKW---HVAFYGIRLDAIRLILD-RGELMTK-EQLDMSNLAMSI-KSED-------------------QNPQVSFSPSIKYAVSDEFTRKYPYIDTQSNKKLNVSTAFQLLVR--PGSYTISP-------------------------------------GDKDSIDLHCESCKWATKEAGATVIVALLVK 1745 610380 Harpegnathos saltator eukaryota>metazoa>hexapoda
blue_Amel_328784754 1583 QNAI--DKW---HVAFYGIRLDAIRLILD-TGELIPK-EQLDLSNLTMNI-KMED-------------------QNPQVVFSPSIKYAASEEFTKKYPYIDTESNEKLNASTAFQLLVR--PGSYTINS-------------------------------------SSKDSDDSQFQSVKWATKEAGATVIMALLIR 1712 7460 Apis mellifera eukaryota>metazoa>hexapoda
blue_Tcas_270008234 1288 NTAT--DKW---HTAFYVCKVGAVRCILD-KGQPLTK-GQAQWCNLVAQ--KEDD---------------------VQVVFYPTLQNCKTSGYKTNN----------RVVHAAFQLLVK--PSAYSVSR-----------------------------------------------DPPEWSTKETGAIVLHSLLIQ 1395 7070 Tribolium castaneum eukaryota>metazoa>hexapoda
blue_Dmel_78214301 1604 VHFDLNGDW---LPFYYMTRVDKIRAILD-RGQPLPL-ETDPDEEPAAAA-LKDE-----------------PGTRLELYYSPNATVIEPVLPQHHFAS-EQ---GLHRISTSFEVYVR--RQSISGVTTGKAAAEAKRRSLGSTDHDHGGTGQGADGVGVTPSATLNESSVHLLND-LCWFTKEAGACIINALIIH 1769 7227 Drosophila melanogaster eukaryota>metazoa>hexapoda
AgaP_AGAP011965_Agam_158300710 1597 TADE--FVW---TTAYYNTRVDKIRSVLD-HGQPLPI-ETGQLLPE-SST-LNDN---------------FIPGTHILLRSVPDAAEPASNATSTSSHF--------FHIKTAFEVRVR--AQSLSAVDHSG-AGEGLNASTGGAGV--TGTGGCTSGVSTVPTA--GGVASGTDFTFRSWTTKEADACVLTALLIH 1754 180454 Anopheles gambiae str. PEST eukaryota>metazoa>hexapoda
DAPPUDRAFT_309455_Dpul_321459414 1336 PGIN--EKW---QTAYHQTRPCVVRRILD-EGHLLSP-DLNVWQRTKAAR-RSSK--------------GNDGESNGQLLFSPTLQ-PAS-LAPIAELY-DPILKKNQRGQVVLQVLVQ--PGSYKVRRATSPLNGPAPTVPTANTVGSVTCSPDPTHQQQLLNPPADTTAITDEDPAILWYTKERGAAIVQALLIS 1504 6669 Daphnia pulex eukaryota>metazoa>crustacea
NEMVEDRAFT_v1g131035_Nvec_156360568 144 SQVP--REW---PVAYHGTNFTNANSILQ-KGLKPGD----------------------------------RALYGKGVYTSPSLQMV--EKYYAQEFKYE-----GKSYKIVFQSRVN--PDQSNGHL-------------------------------KIIPASKTGVGADYWLSPKQNVRKGPHDVRPYGILIK 260 45351 Nematostella vectensis eukaryota>metazoa>cnidaria
TTHERM_00581840_Tthe_118371452 890 DTSD--KTW---IVLFHGNKKLSTQELIE-EGYKQGG-------------------LQQYQGHQCRFG---RGLIKQGIYFYEKIQDA--EKHADTFFIND------KQYNLLFQCRVN--PKTVKSP----------------------------------------------INKPSCYVANDPKDVRPYRILIK 1002 5911 Tetrahymena thermophila eukaryota>alveolata>ciliophora
TTHERM_00621420_Tthe_118369526 1032 YNSK--EQW---IVLYHGTSIQGVEGITK-EGFRLGQ-------------------HHKYAGAKCRITGKIIEKSSKCVYLTDDANVA--GRYSTPFEI------KGKAYQMVFQCRVN--PKVVRSP------------------------------------------KEKPDYYIIEESGQPQQNIRPYRILLK 1151 5911 Tetrahymena thermophila eukaryota>alveolata>ciliophora
ubqP_Ddis_66808359 209 CNGP--NEW---LVSYHGTKEESCNPIAM-EGYKLSS--------------------------------CSGFAFGVGIYSTPSIDIA--KTYGRTFKK-D-----NCHYVIVFQNRVN--PKTVIKI-----------------------------------------------DNIQYWISPNDADIRPYGVCIK 310 352472 Dictyostelium discoideum AX4 eukaryota>amoebozoa>mycetozoa>dictyosteliida
ubqK_Ddis_66813768 205 NNTD--GEW---PVSYHGTGKHESKSIAE-KGYDLSK--------------------------------GKRFLYGRGVYSTPSIKCA--EAYATSFIH-E-----GSTYRVVFQNRVN--PKTLIKIP------------------------------------------KSQTNFEEYWISPKDEDIRPYSICIK 311 352472 Dictyostelium discoideum AX4 eukaryota>amoebozoa>mycetozoa>dictyosteliida
ubqM_Ddis_66813772 165 NNVD--GEW---PVSYHGTGKHESKSIAE-KGYDLSK--------------------------------GKTFKFGYGIYSTPSIKCA--ETYANSFEY-E-----GCTYLVVLQNRVN--PKTLIKIP------------------------------------------KSQTNDEEYWVSPKDEDIRPYCICIK 271 352472 Dictyostelium discoideum AX4 eukaryota>amoebozoa>mycetozoa>dictyosteliida
GSPATT00016112001_Ptet_145525701 190 NGNQ--NEW---RIMYHGTKQHFVSSIVK-TNLKPGSNN------SYCDQLCFDE-------------FNNQVKVGNGIYFSDKIEVCF--GYTNYTQI------GNKQFAVIFMSRVN--PREIRQ--------------------------------------------SKEMIAQRFFVINNSEDVRPYRILLH 307 412030 Paramecium tetraurelia strain d4-2 eukaryota>alveolata>ciliophora
EDI_044520_Edis_167386548 202 SNVT--GEW---AVSFHGSNCSKFTEIVQ-WGDKLGVSN----------------------------------VGGMSVFCTPDFRVA--LQHSDVVT--DP--QTGKKYKVIFQNRVK--PSSIIRA-------------------------------------------SKVGGPNNFWYITNPSDVRAYSICLF 307 370354 Entamoeba dispar SAW760 eukaryota>amoebozoa>entamoebidae
EHI_013080_Ehis_67481957 201 SNRD--EEW---PVSFHGSNCSKFTEIVQ-WGDKLGVSG----------------------------------VGGMAVFCTPDFRIA--LQHSDVVT--DP--QTGRKYKVIFQNRVR--RSSIIRA-------------------------------------------SNVGGPDNFWYITNPSDVRAYSICLF 306 294381 Entamoeba histolytica HM-1:IMSS eukaryota>amoebozoa>entamoebidae
ubqP_Ppal_281212323 218 QSAP--GEW---IVSYHGTTTDEFGSMSN-DGYRISKSE--------------------------------KKDFNQGIYSTPSIKLA--ERFAQKFQF-D-----GAQYLVILQNRVN--PNTVEKL-----------------------------------------------GNGTYYLSPNENDVIPYGICIK 319 670386 Polysphondylium pallidum PN500 eukaryota>amoebozoa>mycetozoa>dictyosteliida
GSPATT00020219001_Ptet_145536409 315 DGNK--DEW---RILFHGTKNENVNDIIV-SSLKEGWRS------LYEDDLCKDE-------------FGNNVPVGKGIYFSDKFTVCVDKGYAKPIQV------NNKSFSAIFMTRVN--PKKIRQS--------------------------------------------DRMKQERYFLVNRSADVRQYRVLIY 434 412030 Paramecium tetraurelia strain d4-2 eukaryota>alveolata>ciliophora
LOC100206592_Hmag_221109790 223 TDVP--GEW---PVSYHGTGVNEAKSIAE-DGYNLTK--------------------------------GKRFAFGRGVYSTPNIKVA--EKYALNFMH------KNKQYAVVLQNRVN--PTTLLKIS------------------------------------------ADHTKIGEYWISPSDKDIRPYGVCIR 329 6085 Hydra magnipapillata eukaryota>metazoa>cnidaria
LOC100200953_Hmag_221109705 214 SNNP--GEW---PVSYHGTGVYQDKTFAM-NGYDLTK--------------------------------GKMFAFGRGVYSTPNIKVA--EKYAIKFLY------KNEHYAVILQNRVN--PTTLVKIS------------------------------------------ADRIGEGEYWISPSDKDIRPYGVCIR 320 6085 Hydra magnipapillata eukaryota>metazoa>cnidaria
DAPPUDRAFT_48503_Dpul_321472004 97 SSAE--DEW---PVSYHGTSYHNGLSIAS-EGFKLSK--------------------------------GTRFRHGKGIYSTPEIEVA----AQYAE---EATV-NGKTYKVVMQNRVN--PKNLEKV------------------------------------------DKAETGVGEYWISPSDEDIRPYGFCIR 203 6669 Daphnia pulex eukaryota>metazoa>crustacea
LOC100639670_Aque_340383127 195 ESSK--GEW---PVSYNGTTKEGTMTIAA-KGYGEDK--------------------------------LARENFGRGFYSTPSVEIA--ADFARRFDHTD-----GKRYEAIIQNRVNLNPGHSEIIP-----------------------------------------VEKTRHGAEYYLTYSSDDLRPYGICIR 305 400682 Amphimedon queenslandica eukaryota>metazoa
LOC100639047_Aque_340386726 249 ESSK--GEW---PVSYHGTGREEAKGIAV-EGYD-SKRW------------------------------REKCYHGKGHYSTPDIEVA--AKYYTK-PF-D---QNGKKYEVVMQNRVNLSPGHTIIIP-----------------------------------------KEKTRAGAEYYLTYSSDDLRPYGICIR 360 400682 Amphimedon queenslandica eukaryota>metazoa
Back to Contents
134103275 ------------------------------RARV-AH-PDRLRGVSDEEISALLTYTYDHGSCYALNKSMREG-TPDREEMEP-YRRLLTSALNK--IRAN----DEAMG----V-PATQLVERKISVSPESMAGFREKYGNSGATVREEAFMSGTEVE---SRH--VPDGHREGEDYLVTMQVWNGTNVNIASLSR---LP-GEGEVLRIGDGEFRVARYEENGLKVNV--VLEEVGQ-----
148546317 EKTVAAAPKKLMSLRDAVGKDMAERWIAEGRARADIRAPELSRLLSDDQIGALYGYSTNDV-YKAYNQALRE--GTATPGIKA-FAEHATEGLAR--LPRYL-GAETYRG-TD-L-PQHVLNRMQM-----------------GAVETDMAFFS---SS---ATT--PFSGN-------TQMVVRGVSGKDISFLTQ---I--PEAEVLYPPGTSFRVLNRIEQGPTTRL--LLEE--------
157371257 -----------------------------ARANAEKNNAQLSTLLTDDQIGAIYGYTTNEG-YTALNPALRGQ-TPLTPELEA-FTGHVTDGLNK--LPAYN-G-ETYRG-TT-L-PAHILEQNQI-----------------GGTVSDGGFMS---TS---AKT--PFDGD-------VSISVRGNSGKQIDFLSK---YK-NEAEVLYPPNTRFEVINRIEQNGTTHLL-------------
15893630 -----------------------------ANEWGSQYYDNWLKSLNDSERNAIRQYTGND--YKKINNYLRGV-NDSLDGIDPKIIEDIKSGLKKASVPHDM---KVYRG-TD-LNPLRNLIDVGK----DGSLDFSSLV---GKTFKDDGFMS-TALV---KES--SFDYM----N--VSWEINVPKGTEAAYVSKISYFP-DEAELLLNHGQEM-IIKEATVGSDGKLNIVLDLNLK-----
167033761 --------------------------------------------LTDDQIGALHGYTTNEG-YQWINPALRGQ-TPLSPQMEA-FVTHANEGLAK--LPSYTLG-DTFRG-TT-L-PEDVMSRMQV-----------------GLPTSDAAFLS---TS---ADRALAFNGN-------VKMTLQGVTGKDISFLSG---H--REAEVLFGPGTRFNVVDRVDNGS------------------
16802114 ------------------------------EKWGIDGFSVWRNSLSSREIQAIRDYTDIWH-YGNMNGYLRGSVEKLAPDNAE-RIKNLSSALEKAELPDNI---ILYRG----T-SSEILDNFLD----LKNLNYQNLV---GKTIEEKGFMS-TTTI---SNQ--TFSGN-------VTMKINAPKGSKGAYLAHFSETP-EEAEVLFNIGQKMLIKEVTELNGKIE--IIVDLL-------
221200352 --------------KEKWGSKDVEDALA-----AKRGNAVLDKLLTDNEYLAIRGYTSNL--YEEINPALRAG---NPGEWGR-LTAEASNGLTK--LADN--G-YAHVG--------DVVRNLRL-----SNEQVEQLFPV-GGVFQDKAFLS-TTSD---LDG--VFPGK-------VTMNITSRSGVSVSSLSE---YP-REAEVLFKPDTPFKVLDRTHDPAKGSWNITLEE--------
228992027 -----------------------------AHEWGSKHFDNWIESLTESERSAIRQYTGDD--YRKINNYLRGI-ADSLNDVESSVIDNIKSGLNKASVPYDI---QVYRG-TD-LKPFKNLYKIDD----EGKIVVDSLV---GKTVKDNGFVS-TAMV---KES--SFDHM----N--VSWEINVPKGANAAYVGKISYIP-TEAELLFNSGQEM-VIKSANVDSDGKIHLILDLI-------
229007965 -----------------------------------------------------------------------------------------------------M---QVYRG-TD-IKPFKDLIELGK----DGRSDFESLI---NKTIKDDGFVS-TAIL---KAS--SFDYM----E--VSWEINVPKGASAAYVGKISQFS-NEAELLLNASHEM-IIKSVNVERNGKLHVTLDLILKK----
255030176 ------------------------------EKWGIDGFSVWRNSLSSREIQAIRDYTDIWH-YGNMNGYLRGSVEKLAPDNAE-RIKNLSSALEKAELPDNI---ILYRG----T-SSEILDNFLD----LKNLNYQNLV---GKTIEEKGFMS-TTTI---SNQ--TFSGN-------VTMKINAPKGSKGAYLAHFSETP-EEAEVLFNIGQKMLIKEVTELNGKIE--IIVDLL-------
291007932 --------------------------------RARVAHPDRLRGVSDEEISALLTYTYDHGSCYALNKSMREG-TPDREEMEP-YRRLLTSALNK--IRAN----DEAMG----V-PATQLVERKISVSPESMAGFREKYGNSGATVREEAFMSGTEVE---SRH--VPDGHREGEDYLVTMQVWNGTNVNIASLSR---LP-GEGEVLRIGDGEFRVARYEENGLKVN--VVLEEVGQ-----
304399359 -------------------------------------------MLTDDQVGALYGYTTNEG-YTALNPALRGQ-TPLTPELEA-FAAHAKDGLSK--LPPNK-G-LSYRGINS-L-PEEILAKNQP-----------------GNIVSDGAFMS---TS---SNE--PFQGN-------ILIKVNGASGRDVAFLSE---YP-LEAEVLYPPDTQFKV--------------------------
313625682 ------------------------------EKWGIDGFSVWRNSLSSREIQAIRDYTDIWH-YGNMNGYLRGSVEKLAPDNAE-RIKNLSSALEKAELPDNI---ILYRG----T-SSEILDNFLD----LKNLNYQNLV---GKTIEEKGFMS-TTTI---SNQ--TFSGN-------VTMKINAPKGSKGAYLAHFSETP-EEAEVLFNIGQKMLIKEVTELNGKIE--IIVDLL-------
325518063 --------------KDKWGSKDVADALE-----AKRGNPVLDKLLTDNEYLAIRGYTSNL--YEEINPALRAG---NPGEWGR-LTTEASNGLTK--LADN--G-YAHVG--------DVVRNLRL-----TNEQVEQLFPV-GGVFQDKAFLS-TTSD---LDG--VFPGK-------VTMNISSRSGVSVSSLSE---YP-REAEVLFKPDTPFKVLDRTHDAANGSWNITLEEL-------
354724236 --------------AEAVGKQRAENWISRGRELADNRDPALSALLSDEQVGALYGYTTDPG-YQMVNPALRGM-KPMTKEMEA-FTQHINDGLDQ--LPVYN-G-ETFRG-MNSL-PSNILEGYTP-----------------GKTVIDPAFVS---TD---INQ--GFSGP-------IQMRIEGVSGRKIDFLSE---FNATETEVLFKPNTTFEVISRSD---------------------
358463913 -------------------------------------------SFTNAEAEGLRVYTSND--YTYINNYLRGFSDDLGPISTS-TISDIDSALSKMELPADL---TLYRG-TS---SAPFMNIVDK-NY-NGTLDWNSLV---GKTFEDRAFVS-TSVE---SKT--AFGGG-------VRWEINAPKGSKGGMVNTFSMFP-NENELLLPRNSKFLIKGIDKVDNNII--LKMDLI-------
359410883 ----------------------------------GSKIIKSVSDLDKSQIEALIKYTGDD--YVNINNSLRGF-ETLSADNAE-AVDIMKSTLSNASLPEDM---ILYRG-TS-I---EELGSLKN-------LPPDELI---GKTFTQPSFLS-TSTENSVATG--TFSGN-------MQIEIEASQGAHGLDVSSISEYGSDEAEVLFNAGQKMFITDA-----------------------
365970965 --------------------------------------KRLSSLLTDDEVGALYGYTTNEG-YPMVNNALRGQ-TELTPEIQA-FADHATNALDK--LPSYE-G-ITYRG-AT-L-PENVLMENQV-----------------GRVVSDPAFMS---TD---QKV--PFSGD-------TTIKINGKTGKPIDFLSE---YKGTETEVLFKPGTKFEVIERVDSGGKTAL--------------
Back to Contents
RES VIDKTVTLFRPVGQKEMELIRKSGYTSFPPRLPFQPIFYPVLSEEYAVQIARDWNTK-DAASGYIGYVTTFRVRANFLSLYPVQTVG---SSK-HQEY--WIPAEKLAEFNQNIIGLIEVIGKFR
FINAL ----EEEEEE---HHHHHHHHHH-------------------HHHHHHHHHHH------------EEEEEEEHHHHH-----EEEE---------EEE--E--HHHHHHHHHHH---EEEEEE--
ALIGN -----EEEE----HHHHHHHHH--------------------HHHHHHHHHHH------------EEEEEEEHHHHHH-----EE---------EEEE--E----HHHHH--HH--EEEEE----
HMM ----EEEEEE--HHHHHHHHHHH-------------EEEEEE-HHHHHHHHHHHE-E-------EEEEEEHHHHHHHH----EEEE---------EEE--EE-HHHHHHHHHH----EEEEEE--
FREQ ----EEEEE-----HHHHHHHH---------------------HHHHHHHHHHH-----------EEEEEEEHHHHH-----EEE---------EEEE----HHHHHHH--HHHH--EEEEEE--
PSSM -----EEEE----HHHHHHHHHH-------------------HHHHHHHH----------------EEEEE----H-------E----------------------HHHHHHH----HHHH----
300869632 VIDKTVTLFRPVGQKEMELIRKSGYTSFPPRLPFQPIFYPVLSEEYAVQIARDWNTK-DAASGYIGYVTTFRVRANFLSLYPVQTVG---SSK-HQEY--WIPAEKLAEFNQNIIGLIEVIGKFR
294817221 VQRATTTLWRPTGPAELELVRELDWRAWPPRLPEQPIFYPVLNEEYAVRIARDWNVR-HDG---AGFVTRFEVDTEFLRRYPVRQAG---GRT-ILEL--WVPADELDTFNAHIVGTIQVVREFH
289770606 TESGTTTLWRPTGPEELALVEASGWTAWPPRLPEQPIFYPVLNEDYAVRIARDWNVP-ASG---SGHVTRFEADTAFLARYPVRRAG---GET-ILEL--WVPAEELAEFNRHIVGRIEVVREFH
21222199 TESGTTTLWRPTGPEELALVEASGWTAWPPRLPEQPIFYPVLNEDYAVRIARDWNVP-ASG---SGHVTRFEADTAFLARYPVRRAG---GET-ILEL--WVPAEELTEFNRHIVGRIEVVREFH
325917965 TAAATVTMHRPLRPEQDALVRVPGFRRWPPRLPEQPGFPPATDRRYAGEIASRWNVK-DSG---VGDVAQFAALAAFVDQYAMQTVG---GAH-HTEW--WIPAEDFDKFNAAIVGSITIIARFD
297204161 TRSSTTTLWRPTGPKELDLVRELDWRAWPPRLPEQPIFYPVLDEDYAIKIARDWNVK-HDG---AGFVTRFEVESDFLSRYPVQQAG---GRT-ILEL--WVPAEELDEFNAHIVGPIEVVHEFR
311900362 TQRSTTTLWRPTGPEELDLVRELDWRAWPPRLPEQPIFYPVLNEDYAIRIARDWNVK-HSG---VGFVTRFEVETEFLSRYPVQQVG---GQT-ILEL--WVPAEELDEFNSHIIGRIQVVHEFR
315504426 SSDVTTVLWRPLGQQELDLVREAEGRRWPPLSPEQTHFFPMLDEDFAVRAAQNWNLF-----GPVRYVARFHVETGFLGRYSTRSFG---GSA-APML--WVAADELDEFNAHIVGSIEVIHEFR
304309800 SSATSVTLYRAVGPGQMRAIMERGFARFPARLPQQKFFYPMLTESFASFVATVWNVP-HSG---AGYVLRFRVAPEGIEGKRAFRVG---GPE-HREF--RIGREDFNRFNAAICGPIEVVAVFG
328886920 SQQTTTTLWRPTGPKELDLVRELNYRAWPPRLPEQPIFYPVLNEDYAIRIARDWNVK-HDG---AGFVTRFEVESEFLSRYPVQQAG---GQT-ILEL--WVPAEELDDFNAHIVGEIQVVHEFR
334120906 SDQETVTLFRAVGKKEMELIKESDFLAFPPRLSFQPTFYPVLHKAYAIQIARDWNTR-DAASGYFGYATRFRVAAEFLKNYPVQNVG---SSI-HQEY--WIPAEELAQFNQNIVGKIEIFAEYQ
29826642 SRHGTTTLWRPTGPKELDLVRELKWRAWPARLLGQPFFYPVLNEDYAVKIARDWNVK-HDG---AGFVTRFEVESQFLRRYPVRQAG---GQT-ILEL--WVPAAELDDFNAHMAGEIEVVHEFR
254383863 SRQATTILWRPTGPKELDLVRELNWRAWPPRLPEQPIFYPVLNEDYAIRIARDWNVK-HDG---AGFVTRFEVETEFLSRYPVQQAG---GQT-ILEL--WVPAEELDEFNAHIVGEIQVVHEFR
329935140 SQQATTTLWRPTGPRELDLVRDLNWRAWPPRLPGQPIFYPVLNEDYAIRIARDWNVK-HDG---AGFVTRFEVESEFLSRYPVQQAG---GQT-ILEL--WVPAEELDDFNAHIVGEIQVVHEFR
302869104 SSDVTTVLWRPLGQQELDLVREAGGRRWPLLSPEQTHFFPMLDEAFAVRAAQNWNLF-----GPVRYVARFHVETGFLGRYSTRSFG---GSA-APML--WVAADELDEFNAHIVGSIEVIHEFR
239992555 SRQTATPLWRPTGPKELELVRELNWRAWPPRLPEQPIFYPVLNEDYAVRIARDWNVK-HDG---AGFVTRFEVESEFLSRYPVQQAG---GRT-ILEL--WVPAEELDDFNAHIVGEIQVVHEFR
238061986 SDDGTTVLWRPTGPQELDLVRESGWCKWPPRLPDQPIFYPVLNEDYAVMIARDWNVP-ASG---VGYVTRFRVESEFLSRYPVRQAG---GKT-ILEL--WVPAEELDEFNAHIVGLIEVVHEFR
320333489 PVGETVTLYRPVGEQELTLIADTDFRAFPPRLPDQPIFYPVLNFPYAEEIARDWNAR-HNTPP-VGYVTAFEVDARVATGYAIQIVG---REDRHQEL--WVPAEELGAFNAAIRGPIRVLAHHV
160939744 PLGGKMILYRPVGSKELELIKKSNYRRFPPRLVEQPIFYPVLNEQYATEIASSWNVK-YN-EDHRGYVTKFEVDDQYCRQFEVHQVG---GPH-HKEL--WVPAEKLDEFNEHIIGEIHIISEFS
149173583 NGKQTVTLFRPVGQQELDLIQASGWKEFPPRLYWQPIFYPVLTEEYAIMIARDWNTK-DPNSGYVGYVLQFDVEFDYLSRYEPQEAG---GRD-LKEY--WIPSEDLQEFNQHIMGTIDVIHEFR
291301515 NPDGTTTLWRPTGPQELALVEQSGWRAWPPRLADQPIFYPVLNENYAVRIAREWNVP-ASG---SGFVTKFHIDTPYARTLPTQRAG---GNN-EREL--WVPAERLTEFNEHIVGTIEVTHRFS
223935744 MNNETITLFRPVGPKELGLVREGGFKGFPPRLPEQPIFYPVTNEEYAVQIAQRWNVP-DSG---SGYVTRFQVRKEFLSKYDVKNVG---ASK-HNEY--WIPAEDLNEFNRNIVGEIEVIAEFH
298246337 MQEETITLYRPTGPEELALIVESQCTAFPPRLFWQPIFYPVLFEEYAVQIARDWNAR-DGN---SGYVTRFRMRKAFLDRYEVQKVG---SAI-HQEY--WIPAEELDEFNRNIVGPIEVIAEYH
302526847 MDTATTELWRPTGPAELELVRQSGWREWPPRLPEQPIFYPVLNEDYAVKIARDWNVR-YDG---AGYVTRFRVETAFLDRYPVRQAG---GET-ILEL--WVPAEELAEFNAHLVGEIEVVHEFR
296446434 LGDDVMILWRPVGPRELELISASGMREFPPRLPEQPIFYPVTTEAYAIKIARDWNAP--RG---GGFVTRFQVRRSFISRYPIHIAG---GRE-NMEY--WIPAEDLVEFNGAIVGQIEIVAEFP
332671633 IETDVVTLWRPTGPDELALVEASGWRRWPPRLPDQPIFYPVLNEDYAVRIARDWNVK-ASG---AGYVTKFDVRRGHLEEYDVQQVG---GET-ILEY--WIPAERLEELNDNIVGTIEVVRTFR
186681810 GDRETITLFRPTGPKELALIKESGDSEFPPRLPEQPIFYPVLNEEYAAQIARNWNAA-STDTGYIGYVTRFQVRAEFLSRYSVKTVG---GSI-HQEY--WIPAEDLPEFNRNIVGLIEVIAEFR
218679791 EDIETVTLWRPVGPEELALMRDLDMRGFPPRLPDQPIFYPVLSEDYAVKIARDWNVP-RSG---SGFVTRFEVRKDYLNTYAVQEAG---GRA-HLEY--WIPAEEMDRFNAAIVGTIEVMQTFP
330469448 DDVNTTVLWRPTGPRERELVRASGWRAWPPRLPDQPIFYPVLNEDYAIKIARDWNVP-ASG---AGYVTRFHVETDFLSRYPVRQVG---GDT-ILEL--WVPAEELDEFNSHIVGQIEVVHEFG
302553253 DRRTTTTLWRPTGPKELDLVRELDWRAWPPRLPEQPIFYPVLNEDYAVRIARDWNVK-HDG---AGFVTRFEVDSDFLRRYPVQQAG---GET-ILEL--WVPAEELDEFNAHIVGRIELVHEFH
297192271 ATTPTTTLWRPTGPEELELVRKSGWRAWPPRLPEQPIFYPVLNEDYAIRIARDWNVK-HDG---AGFVTRFEVESEFVARYPVQQAG---GRT-ILEL--WVPAEELDEFNAHIVGEIQVVHEFR
171913882 APKPTVTLYRPVGPAELELISASAWKRFPPRLPDQPIFYPVLNEVYAAQIARDWNVA-ASG---SGHVLKFEIDAVYISRFDRQVVG---GSQ-HEEL--WVPAEELEEFNDHIVGTIEVVANYG
302866493 -MTETTTLWRPTGPRELDLVRASGWRAWPPRLPDQPIFYPVLNEQYAVMIARDWNVP-ASG---AGYVTRFHVERAFAARYPVRQVG---GRD-ILEL--WVPAEELDEFNRHLVGPIEVVHEFR
318058555 --MRTTTLWRPTGPAELALVRASGMRAWPPRLPEQPIFYPVLNEDYAIRIARDWNVK-HDG---AGYVTRFAVAADFLARYPVRQAG---GET-ILEL--WVPAEELPEFNVHLVGPIEVVREFH
145596643 -MAETMTLWRPTGPEELDLVRASGWKAWPPRLPDQSIFYPVLNEQYAIMIARDWNVP-ASG---VGYVTRFDADRD---SRPVTRSGRQAGAT-SLSCGCWPRIS--TKFNQHIVGQIEVVHEFR
159038599 -MAETTILWRPTGPEELELVRASGWKAWPPRLPDQPIFYPVLNEQYAIMIARDWNVS-ASG---VGYVTRFEVDREFASRYPIRQAG---GRD-ILEL--WVPAEELDEFNRYLVGLIEVVHEFR
182412866 -MTKTTTLYRPVGPKELALIEASGFRSFPPRLPDQPIFYPVTNEDYAIQIARDWNVP-ASG---SGFVTRFQVESDFLKQYPPRVVG---SKV-HEEL--WIPAEALDEFNRHIIGLIEVTHRFG
297561422 -MPATLTLWRPTGPAELALVGDSGWREWPPRLPEQPIFYPVLNEDYAVRIAREWNLP-RDG---EGHVTRFRVDADFASRYPVRQAG---GRT-ILEL--WVPAGELAAFNAHLVGPIELVRSFL
145595385 -MAETTILWRPTGPEELELVRASGWKAWPPRLPDQPIFYPVLNEQYAIMIARDWNVP-ASG---VGYVTRFEVDRAFASRYPVRQAG---GRD-ILEL--WVPAEELDEFNRHIVGLIEVVHEFR
239626468 -----MILYRPVGTKELELIKKSNYRSFPPRLPEQPIFYPVLNEQYATEIASGWNVK-YN-DDHKGYVTKFEVDDSYCGQFEVHQVG---GAH-HKEL--WVPAEKLEEFNEHIVGEIQIISEFS
163754443 ----MKTLYRPIGEKELILIAESNFTKFPPRLEWQPIFYPVLNEEYAVEIASKWNTK-DEFGNYLGFVTEFEITEEEFNKYKTENVG---SAH-HNEF--WVPAEKLEEFNNAIIGRIKVIKVFI
124007251 -----MKLYRPVGLKELELILAANAKAYPPRLQWQPIFYPVLNFEYARQIATRWNLD-DELSGYAGFVTAFDINDAYIAQFEVQNVG---AHL-HNEL--WIPAESLAEFNTHIHGYIQVLAAYY
284038124 ---MTTTLFRPVSKKELDLIEQSNWTKFPPRLHEQPIFYPVTNIEYARQITIEWNVP-AYG---NGYVTQFEVDSEYLKKYNVENVG---GSI-HNEL--WVPAEELDEFNSQIVGPIKVVESYE
159901068 -----MILYRPVGLEELTLIAQAGYRSFPAQLAEPPIAYPILNLEYASHVAESVKTK-DAEAGYAGFVAEFEISEQYARQFAVKSVG-I-RRR-HREL--LVPIEEFHNFNTRILGHIKVIASFY
256420608 --MNTTILYRPTGIKELALIAATDFKHFPPRLSWQPIFYPVLNQPYAEQIALEWNTN-DEASGYCGIVTRFAVDAAFLERYDIQNVG---DGS-HNEL--WVPAEELEMFNQHITGKIEVVKTFL
83649603 --MKTVTLFRPTGPNELALVEESGFKRWPPRLSEQPIFYPVCNEDYARQIARDWNVK-DSG---VGYVTRFAVDADYLSRFDVKVVG---GRE-HAEY--WIPAEQLEEFNDHIIGGIEVIATYR
296130683 --MSTRTLWRPTGPEELALVEASGRRAWPPRLPDQPIFYPVLNEDYATRIARDWNVK-ASG---VGYVTRFEVATEFLDRYDVQQAG---GET-ILEY--WIPAEDLDELNAHIVGTIEVVAEYR
225390142 -----MILYRPVGKRELELIEQSGYRAFPPRLPEQPIFYPVLNQRYAQEIAGRWNTR-DARSGYRGYVTRFEVEDRYISRFESHVVG---ASW-HEEF--WIPAGELEEFNRHILGRIEVVKTFG
256376037 --MDDVVLWRPTGQAELDLVAGSGWREWPPRLPEQPIFYPVVNREYATRIAREWNASGAEG---VGYVTRFAVEGEFLAKYPVQSAG---GSG-IDEH--WVPAEELEEFNRHVVGRIEVEAEYR
333985238 -----MILYRPVGHNELALIVESGLKGFPPRLPDQPIFYPVLNAGYAKQIALEWNTK--S-DTFSGYVTRFNIDNDYAQKFNREIVG---GKV-HEEL--WVPSEELSEFNQKIVGHIEIISAYF
338532263 -MSNPLTLYRPVGLKEAELILDSGCSAFPPRLPDQPIFYPVMNAEYARQIARDWNTP-DAGSGYAGFVTAFGVDADYASRFPVRTVG---NSL-HQEL--WVPAEDLATFNQHIQGPVRFTEAWY
303241812 -----MKLYRPVGISELELIKQSGMTKFPPRLPDQPIFYPVLNRKYACQIAREWNTK-SA-PGYAGFVTEFDVDDDYISKFEVKTVG---AFV-HTEL--WIPAEELDEFNRHIIGEIKVIESYY
269118724 -----MKLYRPVGLQELEKILNFGSEKFPDRQVWQPILYIVENYGYAEQISTMWNLK-DENSGFSGYILEFTISDDYMKNYDIKQVG---DKT-HLEY--WIPAEDTKKFNNSLTSKIKIINAFY
108763108 -MPNTRALYRSVGLKEAELFLVSGCSAFLAPTARPAHLLPGDERRVRTANCRDWNTP-DAGSGHAGFVTAFDVGADYASRFPVRTVG---NSR-HQEL--WVPAEELATFNQHIQGPVRFTEAWY
16126106 --MTSVTLYQPVGLEELQAIKASDWRAFPPHDIEQPVFRPVTSEAFAAQLARDWNAA-HTTYR-RGYVVQFAVSKTFLDAYENKVSG---TPG-HEEY--WIPSEDLSLLNAAIQGQIAVAGTFA
162453007 -----MILYRPVGLAELRLIAEAGYRAFPPRLSHQPIFYPVLTEEYARKIARDWNTA-DETSGFAGWVTRFEVEDDFARRYPVQIAG---GRS-HEEL--WVPAEELEEFNRHLVGTIEITEVYC
126740444 -----MKLFRPTGLKELVLVRDSGWASWPPRLPDQPIFYPVTTFGYAEKIARDWNSV-LPAPDNMGFVTEFTISEAAARRYPVEEAG---GRE-HREL--WVPAEELEWFNGELTSTIRIVSAYR
300774507 --MKTTTLYRPVGEKEMILIMESGFKSFPPRLEWQPIFYPVLNEEYASEIAEKWNTR-DEAGNYLGFVTQFEVLEEVADQYPTQNVG---ARN-HNEL--WVPSEELNSFNKAIIGDIKYR----
consensus/100% .......habs....b...h.......a.........h.......h....s..hp............h..F.h.......b.....G.............b........hN..h.u.l.h.....
consensus/95% .......LaRs.G..Eh.hl.......aPsb...Qs.hhPh.pb.aA.bhu..WN..........GaV..F.h....h..h..p.sG...s.....bh..Wls..ph..hN..l.G.Iph...a.
consensus/90% .......LaRPsG..Eh.Ll...shp.aPsRL..QPhFYPl.sb.YA.blAppWNs.........GaVspF.l...hh.pa..p.sG...s.....Eh..WlPu-ch.pFN..l.G.Ipl...a.
consensus/85% .......LaRPsG.pEL.Ll...shp.aPPRLs.QPIFYPV.sb.YA.bIApcWNs.........GaVspFplp..ah.pa.sp.sG...u.....Eh..WlPAEcL.pFN..lhG.Iplh..a.
consensus/80% ....s..LaRPsG.pEL.Llb..shp.aPPRLspQPIFYPVlscpYA.bIApcWNs...ss...sGaVTcFplp..ahppassppsG...up....Eh..WlPAE-L.cFN.pIlG.Icll.pa.
consensus/75% ....s..LaRPsG.pEL.Llb.ssac.aPPRLs-QPIFYPVLscpYA.bIAc-WNs...ss...sGaVTcFcVc..ahppYslppsG...up...bEh..WlPAE-LscFN.pIlG.IcVl.pa.
consensus/70% ....o.sLaRPsG.pEL.Llb.usa+.aPPRLP-QPIFYPVLNEpYA.bIAR-WNs...su...sGaVT+FcVcspahs+YslppsG...Gpp..bEh..WlPAE-Ls-FN.cIlG.IcVlppF.
#==== Truncated members
126740444 -----MKLFRPTGLKELVLVRDSGWASWPPRLPDQPIFYPVTTFGYAEKIARDWNSV-LPAPDNMGFVTEFTISEAAARRYPVEEAG---GRE-HREL--WVPAEELEWFNGELTSTIRIVSAYR
119477262 -----------MSPAQLAAVVASDWRQFLQEAPQQTIFYPKMYVGYAEQIAKQWNAR-QYS---AGYVVGFTMPGTFMDRYETQTIA---YEE-HRDY--KLPVAELDVFNSHIQGRIRVAAAFA
148256740 ------------------MIAASGMRAFPPRLPEQPIFYPVLTEAYAVKIARDWNVP-ASG---SGHVLRFEVLRTFVDRYEVREAG---GRD-HLEY--WIPSEHLAEFNAAIVGPIVLVKTFP
146341856 ------------------MIQATGMRAFPPRLPEQPIFYPVLTEDYAVKIARDWNVP-ASG---SGHVLRFQVRREFIDRYEVREAG---GRD-HREY--WIPSEDLAEFNAAIVGTIALVKSFP
330467180 -------------------MEASGWREWPPRLPDQPIFYPVLNRWYATKIAREWNVP-AGG---VGYVTRFEVQREYMDRYEVHQVG---GRD-VLEY--WIPAEELADFNAHLVGAITEEADYR
290960596 --------------MELDLVRESGWRAWPPRLPEQPIFYPVLDEAYAVQIARDWNVK-HDG---AGFVTRFEVDAGFLRRYPVRQAG---GRT-ILEL--WVPAEELEEFNAHIVGAIEVVHEFR
94971452 ----------------------------------------MLTIEYARQIARDWNTR-HERSGYAGYVLRFAVDTDFLSRYEIQRAG---SDA-HLEY--WIPAEEMEEFSVHIVGDIEVLEQYT
239626503 -----------------------------------------MNKQYAIEIASGWNVK-YN-EDHRGYVTKFEVDDQYCRQFEVHQVG---GAQ-HKEL--WVPAEKLDEFNEHIIGEIHIIKEFP
312888451 -----------------------------------------MNEEYAIQIARDWNVP-AWG---SGFVTRFAVSSSYLKKFEVQNVG---GVI-HNEL--WVPAEELEEFNDHIIGLIEVTKTFL
282864000 -------------------------------------------------------MK-HNG---VGYVTRFEVGSDFLVRHPLQQDD---GRT-IPEL--RVPAEEPDDLDAQSAGDIRVVHKSR
13470985 ------------------------------------------------------------------------MLKSFLDRYRVEHAG---SKA-HLEY--WIPAEDLDDFNKAIVGKIEVTATFG
158333527 -----------------------------------------------------------------------------MDNYDIQKVG---GAH-HTEW--WIPAEKLEELNDNIVGEIEVIGEYR
289663132 -------------------------------MPEQPIFYPVTNQRYAEEIASRWNVK-DSG---LGYVAQFEVSAAFVEHDAIQNVG---GAH-HTEW--WIPAEELDALNDTIAGLNDIIGQFD
13470984 EAQPTITLWRPIGPEELKLIEASNMRAFPPRLPEQPIFYPVLSEAYAVQIARDWNVP-ASG---AGFVTGLPC----------------------------------------------------
329184512 AMKDVVCLYRPVGEAELQLIAAAVFKAFPPRLPEQPIFYPVLNFEYAAQIARNWNTK-DKNSGRAPRRSV-------------------------------------------------------
310818708 --METVTLWRPVGPEELALIREADMRAFPPRLPEQPIFYPVTTRDYAVKIARDWNVP-ASG---SGFVTQFEVRKDFLDHYEVQEAG---GQA-HRE----------------------------
153873366 ME--TITLFRPIGQTEMDLIVQSDYLAFPPRLPFQPIFYPVLQEDYAVQIHEIGILMMRLRAMLAM-----------------------------------------------------------
315502903 TE--TTTLWRPTGPRELDLVRASGWRAWPPRLPDQPV----------------------------------------------------------------------------------------
Back to Contents
ALIGN --------------HHHHHE-E-----EEEEEE----HHHHHHHHH----------------EE----HHHHHHH----------HHHHHHHHHHH--HHHHHHHHH-------------------------------------------------------------HHHHHHH------EEEE-------------H----HHHHH-----HHHH-HHH--EE--EEEE---HHHHHH-HH-HHH--------------------------------------HH-HHH-------------
HMM ---------------EEEEE-EE----EEEEEEE---HHHHHHHHH------------E--EEEE--HHHHHHHHH---------HEEEEHHHHHHHHHHHHHHH--------------------------------------------------------------HHHHHHHH------EEEEE---H-------------EEEEEE---HHHHH-HHHHHHH--EHHHHHHHHHHHH-HH-HHH-------------------------EE----E----HHHH-HHH-------------
FREQ --------------HHHHHH-H-----EEEEEEH--HHHHHHHHHH----------------EE--HHHHHHHHH----------HHHHHHHHHHHHHHHHHHHHH-------------------------------------------------------------HHHHHHHH------EEE------------HHH----HHHHHH---HHHHH-HHH--EE--EEEE---HHHHHH-HH-HHH---HH------------------HH------------HHH-HHHHH-----------
PSSM ---------------EEEEE-EE-----EEEEE----H-HHHHHHH---------------EEEEE--HHHHHHH-----------EEEEEEEE-HHHHHHHHHH---------------------------------------------------------------HHHHHHH------EEEEE-----------------EEEEE----HHHHH-HH----E--EEE----HHHHHH-HH-HH--------------------------------------HHH-HH--------------
FINAL ---------------EEEEE-EE----EEEEEEE--HHHHHHHHHH---------------EEEE--HHHHHHHH-----------EEEEHHHHHHHHHHHHHHH--------------------------------------------------------------HHHHHHHH------EEEEE------------E----EEEEEE---HHHHH-HHH---E--EEEE---HHHHHH-HH-HHH------------------------------------HHHH-HHHH------------
294781860 M--------KYEEQERKIYA-KYDD-KTIRVYQAYNDKIADEAIKLGTF-GEH-FSLTR--MTWIKPSFLWMMYRCGW-AEK-ENQERVLAIDIKREAFDEIVKNSVISSYKPNLGI-------------------------------------------------TEDEWKEEVKNS--LVRCQWDPERDIHGKLIGR----RSIQLGIR-GEAVE-KYVNEWI--VKITDITDDVKRI-KK-VLIMELLK----------------------------------------------------
256422007 ------------MKEKTIRA-LYDE-ESITVYQAYNGLIAKRAVEAQTF-TTPPFRRDR--MTWIKPSFCWMMYRSGW-ATK-EDQEYILAIKIKRSGFEWALQNAVLSKFDHKIHS-------------------------------------------------TTNEWNRLLKAS--PVRVQWDPERDIYLQPTDQ----RALQIGIS-GTAVD-QYISEWI--IGIEDITAYSQHI-GQ-LVKVRKIE----------------EAMALLPQERPY-PLPV-------------------
300789763 MFE------EQRVPDRQVRA-AQTE-TTVRVYQACSPAVADAALEEQTF--------ERGGTVQLTPSFRLAAYGSEN-GRK-PGHERILAIDLTRDGFEQALTHS----------------------------------------------------------------------------HVEWEAERDLDHTALNF----QAIRIGLD-S-----APADEWI--TAITDVTPVVRDI-AG-LLATDQLH----------------LAVKLVPHEPPY-ELG--------------------
228473982 MK-------DITQEERKIYA-LYDN-NTIRVYQAYNAEIAEEALKLGTF-GSH-FSLTR--MTWIKPSFLWMMYRCGW-AEK-ENQERVLAIDIKREAFDEIVRKSVLSSYKADLGI-------------------------------------------------TEEQWKEDVKNS--LVRCQWDPERDIYGKPIGR----RSIQLGIR-GAFVE-KYVNDWI--VKITDITEEVKRI-KQ-HIDKGTFT------------------KDLLPKEQEY-IIP--------------------
257125945 ---------MKKGEERNIYA-VFDD-KTIRVYQAYNNEIADEALKLGKF-GSK-FSLTR--MTWIKPSFLWMMYRSGW-ASK-QGQERILAIDLKREGFDEIVKNSVLSSFREVSDL-------------------------------------------------SKEEWKNKLDNS--EVRCQWDPDRDIYGNPLGR----RAIQLGIK-GETVK-KYVNDWI--VNITDITDKVVEI-RN-SIQNGTFS------------------ESMLPKEIKY-I----------------------
254302431 M--------KYEEQERKIYA-KYDD-KTIRVYQAYNNVIAGEAIKLGTF-GEH-FSLTR--MTWIKPSFLWMMYRCGW-AEK-ENQERVLAIDIKREAFDEIVKNSVISSYKTNLGI-------------------------------------------------TEDEWKEEVKNS--LVRCQWDPERDIYGKPIGR----RSIQLGIR-GEAVV-KYINEWI--VKITDITDEVKRI-KQ-SIDNGTFK------------------ESFLPEEKEY-IVK--------------------
336250841 MEKHLP---KYSIPERQIRA-FFTK-DFIRVYQAYSDEIADSAIKNNTF-VSPPFSLTR--MTWIKPSFLWMMYRSGW-GKKDSNQTRILAIDLSHDAFQKILHLGVPSDYHSASTF------------------------------------------------QNKEEWQDKIKNS--DIIFQWDPERDIHLNKLNY----RTIQIGIR-NQAVI-NFCNEWI--VNLHDITHQVQEI-HN-LVSLGDFC----------------KAKTLIPTEKTY-HFQL-------------------
260889576 ---------MKKEEERNIYA-VFDD-KTIRVYQAYNNEIADEALKLGKF-GSK-FSLNR--MTWIKPSFLWMMYRSGW-ATK-QGQERILAIDLKREGFDEIVKNAVLSSFREVSDL-------------------------------------------------SKEEWKNKLENS--EVRCQWDPDRDIYGNPIGR----RAIQLGIK-GETVK-KYVNEWI--VNITDITDKVIEM-RE-KIENGSFL------------------DSNLPIEEKY--V---------------------
256374811 ------------MESRQIRA-DFDE-RTLVVYQAYSPEIAEPALAAGTF-VPP-FKPGR--MTWVKPSFLWMAYRCGW-ARK-AGQERVLAVRVLREPFDAAVLAAVPSREVVEGKP---------------------------------------------------------------EIRVQWDPERGLRHEALGH----RSLQLGLA-GGASR-RYVEEWI--TGLTDVTGLMTRV-GA-AVAAGELE----------------LARELLPVERAY-PLEV-------------------
226327538 MNDD-----RVDCPECEVRA-YYTN-DFVRVYQAYSNTIAQSAVANGTF-VSPPFSMTR--MTWVKPSFLWMMYRSGW-GRKDANQASILAVDITHEGFQEMLTQGVVSHFDPDRYV-------------------------------------------------SAEAWKAASETS--NIRIQWDPERDIYLNRLSY----RTIQIGLR-NQAVE-KYCQEWI--VNITDITDKARKI-DN-CIANGDLD----------------TAYSLLPVEKPY-HFGE-------------------
197286762 MNDD-----RVDCPECQVRA-YYTD-DFVRVYQAYSTTIAQSAVANGTF-VSPPFSMTR--MTWVKPSFLWMMYRSGW-GRKDPNQASILAVDITHEGFQQMLTQGVVSHFDPDHYV-------------------------------------------------SAKEWQEATETS--DIRIQWDPERDIYLNRLSY----RTIQIGLR-NQAVE-KYCNEWI--VNITDITDKVRKI-DT-CITNGDLD----------------TAYSLLPIEQPY-HFAK-------------------
262067268 M--------KYEEQERKIYA-KYDD-KTIRVYQAYNDKIADEAIKLGTF-GEH-FSLTR--MTWIKPSFLWMMYRCGW-AEK-ENQERVLAIDIKREAFDEIVKNSVISSYKPNLGI-------------------------------------------------TEDEWKEEVKNS--LVRCQWDPERDIHGKPIGR----RSIQLGIR-GEAVG-KYVNEWI--VKITDITDDVKRI-KK-SIDNGTFK------------------ENLLPEEKEY-IIK--------------------
340754465 M--------KYEEQERKIYA-KYDD-KTIRVYQAYNNVIADEAIKLGTF-GEH-FSLTR--MTWIKPSFLWMMYRCGW-AEK-ENQERVLAIDIKRAAFDEIVKNSVISSYKPNLGI-------------------------------------------------TEDEWKEEVKNS--LVRCQWDPERDIYGKPIGR----RSIQLGIR-GEAVE-KYVNEWI--VKITDITDEVKRI-KK-SIDNGTFK------------------ENLLPEEKEY-IIK--------------------
167588668 MKSHLKQT-PEAIPLRQIRA-MYDD-RTIRVYQAYSDAIADSALTHGTF-VSPPFKTER--MTWIKLSFLWMMYRSGW-GLKDSGQARILAIDISREGFEWALAHSCLSHPDESMHR---------------------------------------------------DEWQRMKEKA--PVRIQWDPERDLLLQPLAY----RAIQVGLS-KQAVD-LYVHEWI--QRITDVTPLAHSL-HA-LVGQGDFE----------------SAQALLPLEQPY-CIGA-------------------
191169136 -----------MADYFEIRA-DYNQ-HTITIYQAYNDAIADVAVRDGRF-GAP-FSFNR--MTWIKPSFMWMMERSNW-GLK-KDQQHILAIRIKRTFFDTLLEQAVLTTPEAHVYP-------------------------------------------------HAGIWETLFAQA--NVYVQWDPERSINGKKLEH----RSLQLGIS-RNLIS-QFNEDAI--VAIDDLTPLVRKC-HN-LLINGKTT----------------QAKSFLPPEKIY-PVSEAA-RKALG--MK-------
345368115 -----------MADYFEIRA-DYNQ-HTITVYQAYNDAIADVAVRNGRF-GAP-FSFNR--MTWIKPSFMWMMERSNW-GLK-KDQQRILAIRIKRTFFDTLLEQSVLTTPEAHVYP-------------------------------------------------HAGIWETLFAQA--NVYVQWDPERSINGKKLEH----RSLQLGIS-RNLIS-QFNEDAI--VAIDDLTPLVRKC-HN-LLINGKTT----------------QAKSFLPPEKIY-PVSAAA-RKALG--MK-------
193070962 -----------MADYFEIRA-DYNQ-HTITIYQAYNDAIADVAVRDGRF-GAP-FSFNR--MTWIKPSFMWMMERSNW-GLK-KDQQHILAIRIKRTFFDTLLEQAVLTTPEAHVYP-------------------------------------------------HAGIWETLFAQA--NVYVQWDPERSINGKKLEH----RSLQLGIS-RNLIS-QFNEDAI--VAIDDLTPLVRKC-HN-LLINGKTT----------------QAKSFLPPEKIY-PVSAAA-RKALG--MK-------
312199543 VDRRP----ADGAGMREVLA-SHTA-ATLTVYQAYSPAIAGPALRAGTF-VEP-FRVGR--MTWVKPSFLWMMYRCGW-ATK-PDQERVLAVEIGRDDLLWALARACLSSFEPGQHA-------------------------------------------------DPRSWRAALAAA--PVRVQWDPDRDLYLRPTGR----RAIQIGLG-PEASR-HYVSSWI--RSIRDVTPLAREI-HA-RVQADDLD----------------GARALLPEEHPLALPSEIA-RRLGA--SP-------
218547498 -----------MADYFEIRA-DYNQ-HTITVYQAYNDAIADVAVRDGRF-GAP-FSFNR--MTWIKPSFMWMMERSNW-GLK-KDQQRILAIRIKRTFFDTLLEQAVLTTPEAHVYP-------------------------------------------------HAGVWETLFAQA--NVYVQWDPERSINGKKLEH----RSLQLGIS-RNLIS-QFNEDAI--VAIDDLTPLVRKC-HN-LLINGKTT----------------QAKSFLPPEKIY-PVSAAA-RKALG--MK-------
170684105 -----------MADYFEIRA-DYNQ-HTITVYQAYNDAIADVAVRDGRF-GAP-FSFNR--MTWIKPSFMWMMERSNW-GLK-KDQQRILAIRIKRTFFDTLLEQAVLTTPEAHVYP-------------------------------------------------HAGVWETLFAQA--NVYVQWDPERSINGKKLEH----RSLQLGIS-RNLIS-QFNEDAI--VAIDDLTPLVRKC-HN-LLINGKTT----------------QAKSFLPPEKIY-PVSATA-RKAWG--MK-------
311896751 ---------MTETPKRQVRA-RYDE-ETVTVYQAFRPEIAEPAVAGGRF-PAA-FDPGR--MTWVKPSFRWLMHRSDW-ARS-EGQQRVLGVVLWRAGFDAALEAAVLSSYERGVHA-------------------------------------------------SRAEWQRELRRS--EGRAQWDPERDLELRPLAH----RSLQLGLS-GSLVE-RYLGEWL--VRIDDLTPLARAL-HA-TRDP-----------------------GLLPPERPY-PLPAGA-AVRLG--AS-------
255930929 ---------MTSTTYRAIRA-KQTP-TTVTVYQAYPPEIADPALEAHTF-VPP-FSRDR--MTWIKPSFLWMAYRSGW-ATK-PRQERVLAIEISREGFEWALRNCCLSHYSPSEET-------------------------------------------------SQEKWRKRLRAS--PVRVQWDPERDLSLRSLDY----RSIQIGLS-GEAVR-RYIDEWI--VSIADVTHTMKQI-DG-YLKDGDVD----------------AARSDLPEERPY-ILPEDL-QENLR--MK-------
163754444 ITQNN----EWPQNGHHIMA-QYDD-EKIIVYQSYRPAIGLFAAENQFF-GGP-FSLER--MTWIKPNFLWMMYRNGW-GTK-VGQEVVLAIHLKREAFQKYLENAVHSSFKPELYE-------------------------------------------------SQEMWKEAVKSS--NVRLQWDPDHDPYGAKLER----RAIQIGIR-NEFIR-SYAKEDI--LEIENISEFVAEQ-YE-FVKSNQLE------------------KLMIPAERPFLPEGDEL-RKKLQ--LQ-------
239987775 MNT------PPVPPRHEIRA-LHTA-TTVTVYQAYRPAIGLPAARDGRF-PAE-WKRDR--MTWIKPSFLWMMYRCGW-GTK-EGQEVVLAVEIDRSGLEWALANAELSHYVRDVHP-------------------------------------------------DQATWKRSLRTA--PARVQWDPERDLDLNPLPY----RSLQLGLS-GEASR-RYADEWT--VSVRDVTPLAREV-HA-AVRAGERE----------------RAAALLPVETPL-DLAAPR-PVQVDDLAA-------
291444753 MNT------PPVPPRHEIRA-LHTA-TTVTVYQAYRPAIGLPAARDGRF-PAE-WKRDR--MTWIKPSFLWMMYRCGW-GTK-EGQEVVLAVEIDRSGLEWALANAELSHYVRDVHP-------------------------------------------------DQATWKRSLRTA--PARVQWDPERDLDLNPLPY----RSLQLGLS-GEASR-RYADEWT--VSVRDVTPLAREV-HA-AVRAGERE----------------RAAALLPVETPL-DLAAPR-PVQVDDLAA-------
124002565 ---------MKQKNKYEIRA-LYTP-KHIALYAAFSSSIANVALKSQQL-LPP-FSYDR--MTWVKPSYLWMMYRSDW-AQK-DNMQRILRIWIKRIDWELALKEAILTTPEAHVYN-------------------------------------------------DAKKWRKQLDKA--RVRVQWDPERDIQNKHLSF----KSIQVGIM-PSLAE-TYAKKWI--AKIEDVTPLTQHI-RS-LVVAQQFE----------------QATQLLPKEQAY-PVEAEL-KRILG--IG-------
110639136 ------------MLEKQIRA-VYDQ-QTITVYQAYKNEIAIPAVKNQKF-VAP-FKIER--MTWIKPSFLWMMYRSGW-AAK-EGQEHVLAIKLKREGFEWALANCCLSHFDSTMFS-------------------------------------------------SLEAWKNKLEHT--QVRLQWDPEKDIHLQNLAY----RSIQIGLS-GVAVE-HYVNDWI--VSIDDITPVCKKI-HA-LVLDKKTE----------------EANSLLPAENIY-PVSETL-KHTIG--AD-------
344999740 MNV------QATPPRYEIRA-QHTA-ATVTVYQAYRPAIGLPAARDGRF-PAA-WKRDR--MTWVKPSFLWMMYRCGW-GAK-EGQEVVLAVEVERAGLAWALANAELSHYVRGVHP-------------------------------------------------DEAAWKQALRSA--PARVQWDPERDLNLNPLPY----RSLQLGLS-GEAAR-RYADEWT--VSIRDVTPLARDV-HA-LVRAGDRD----------------RAASLLPTETPL-HLPAPR-PL--------------
326779281 MNT------QALPPRYEIRA-RQSA-TTVTVYQAYRPAIGLPAARDGRF-PAA-WKRDR--MTWIKPSFLWMMYRCGW-GTK-EEQEVVLAVEIDRGGLEWALAHAELSHYAAEVHP-------------------------------------------------DQAFWKRSLRTA--PARVQWDPERDLDLNPLPY----RSLQLGLS-GEAAR-RYADEWT--VSVRDVTPLAREV-HA-AVRAGERE----------------RAAALLPVETPL-DLAAPR-PVRA---AS-------
124004042 KDYET----DLPQEGRHILG-QMTNAENLIVYQAFNPSIAKYAVTHQQF-GGSQYSFSR--MSWIKPNFLWMMYRAGW-ASK-PNQERILAIEISKQNFELILEEAIHSSYVAEVYG-------------------------------------------------SRADWQAKLKAS--NVVMQWDPDHAPNGDKLQR----RAVQLGLR-NELLK-NFGTHWA--VSIQDITDFVLEQ-GK-CLRGQKMD------------------ELLVMQEQVI-AIDNPE-VVKRLG-LA-------
336471510 FSNL-----PPKPPSRQIRALQEDDGTTITVYQAYPSTIATAAVIHQRLDASPEFRTTR--MTWIKPSWAWMLYRSGY-SYKDPGQERILAIKMKREDFLGLLGRGVLTHGTAPPRP----------------GPQQGQGITSDAQGRTSGER---GEEAAPKESTRESKRKDRLQSL--DVKIQWDPERTVRLHSLNY----RSIQIGIP-AGLIR-EWAQDMI--VNIEDVTDKARTL-KK-ILDERPDV-----------NDEELAELGLIPKETEF-EVPVEL-RSRLG-----------
169773039 MATNN----ANLQPFRAIRA-QSTQ-STITVYQAFSPEIAEPALRAQKF-VPP-FSRTR--MTWIKPSFLWMAYRCGW-ATK-PKQERVLAIEITREGFEWALRRSCLSHVPGSRDQ-------------------------------------------------DQEKWRQRLRES--PVRVQWDPERDLWHRPLGY----RSIQIGLS-GEAVE-RYVDEWI--VSITDVTGLMGDV-KR-ALDKADAE----------------GAEGLLPVESVY-PLSEEL-RDILD--AT-------
85068247 FSNL-----PPKPPSRQIRALQEEDGATITVYQAYPSTIATAAVTYQRLDASPEFRTTR--MTWIKPSWAWMLYRSGY-SYKDPGQERILAIKMKREDFLGLLGRGVLTHGTAPPRP----------------GPQQGQEMTSDAQGRTSGER---GEEAAPKESTRESKRRDRLQSL--DVKIQWDPERTVRLHSLNY----RSIQIGIP-AGLIK-EWAQDMI--VSIEDVTDKARAL-KK-ILDERPDV-----------IDEELAELGLIPKETEF-EVPVEL-RSRLG-----------
182438632 MNT------QALPPRYEIRA-RQSA-TTVTVYQAYRPAIGLPAARDGRF-PAA-WKRDR--MTWIKPSFLWMMYRCGW-GTK-EGQEVVLAVEIDRGGLEWALAHAELSHYAAEVHP-------------------------------------------------DQASWKRSLRTA--PARVQWDPERDLDLNPLPY----RSLQLGLS-GEAAR-RYADEWT--VSVRDVTPLAREV-HA-AVRAGERE----------------RAAALLPVETPL-DLAAPR-PVRA---AS-------
254387007 PDPA-----PVPVPNRAVRA-AHTA-RTVTVYQAYAPHLGLPAARDGRF-PHA-WKRER--MTWVKPSFLWMMYRCGW-ATK-ADQETVLAVEITREGFDHALRRACLSHYEPGTHA-------------------------------------------------DRASWQRALRGA--PARVQWDPERDLHLNPLPY----RSLQLGLS-GPASR-AYADEWT--LSIRDVTPLAREI-HG-LLRAGNAD----------------AARALLPGETPY-P-SPPL-PHLGA-----------
70988759 ---------MARHPYRQIRA-KYTS-TTITVYQAYSPSIADAAVDAQKF-VPP-FSRTR--MTWIKPSFLWMAYRSGW-ARK-PKQERVLAIDITREGFEWALQHSCLSHYPGHDVE-------------------------------------------------EKAKWQKRLQNS--PVRVQWDPERDLQFTPLDY----RSIQIGLS-ADAVD-KYVDDWI--VGITDVTEVMRQI-EK-CLAEDRME----------------DATRLVPAEEVY-PLSEEL-KGILE--AT-------
302535927 P--------APETPRHQIRA-AHTA-TTVTVYQAYAPHLGVPAARDGRF-PPA-WKRER--MTWIKPSFLWMMYRCGW-AAK-ADQETVLAVEISREGFDRALAQACLSHYVPGVHA-------------------------------------------------DREAWKASLAGS--PARVQWDPERDLHLNPLPH----RSLQLGLS-GPASR-AYADEWT--VSIRDVTPLAREI-HG-LVRAGDLD----------------AARALLPAETPY-PAGPLP--HLGA-----------
66813652 M--------SNKNYKRIIKA-VYND-ETIRVYQAYNKEIAEGAVKNQRF-VDP-WLTTR--TTWIKPSLCWMMYRAGY-GYKDKNQERILAIDIKREAFEWILDTYYDNNNENLNDL------------------------------------------------------KAYAKN---SLVIQWDPERSIKIGKLEN-GELRSIQIGIK-PNLTQ-KFNNEWI--AEINDITDIVHQI-KR-EIDDGNIE----------------KAISLLPIEKVYTPINVKF-----------------
66802638 M--------TDNNYKKIIRA-VFTD-DTVRVYQAFNSKIADDAILNQKFTLESGWSDNR--TTWIKPSFCWILYRSGY-ACK-HNQERILAIDIKREAFEYILENHIDAHETGKSAI------------------------------------------------------PSSKK----KIVVQWDPERNISISKLDGCGDIRSIQIGVK-KAKIK-EYNEQWI--QAITDVTPIAHQI-KK-ELDKGDLE----------------KAKSLLPDELVYTPKNVRF-----------------
124007793 -----------MNNTQEIRA-QYDA-DTITVYQAYGKAIALPATKVNQF-APP-FSFQR--MTWIKPSYLWLMERSNW-ATK-PQQEFILGIKIKRAYWEYALSLGVLTHPDLAIYT-------------------------------------------------DGLDWEQKFSQA--KVHIQWDPERTLRGAKLQV----RSIQVGIS-RHLIE-QYNNEWI--VAIDDLTPLTRKI-SQ-LKKQGKYK----------------EAKQLLPKEQVY-VLPDEL-QKRIG--VR-------
119497805 ---------MARHPSRQIRA-KYTS-TTITIYQAYSPSIADAAVDAQKF-VPP-FSRTR--MTWIKPSFLWMAYRSGW-ARK-PNQERVLAIEITRKGFEWALQHSCLSHCPGQDAE-------------------------------------------------EKAKWQKRLQNS--PVRVQWDPERDFQFRPLDY----RSIQIGLS-ADAAD-KYVDEWI--VGIADVTEAMRQI-EK-CLAEGRTE----------------DAARLMPAEEVY-PLSEEL-KDILE--AT-------
121719366 ----------MNPPYRQIRA-KYTP-TTITVYQAYNDTIATNALAAQTF-VAP-FSRTR--MTWIKPSFLWMAYRCGW-GKK-PRQERVLAIEITRDGFEWALRHSSLSHYGGRDPE-------------------------------------------------GKAAWQERLRAR--PVRVQWDPERDLEFKGLAY----RSIQVGLG-GEAVE-RYVDEWI--VGITEVTETMREI-EQ-CMEEGRME----------------EARALVPLEEEY-PLSEEL-REILE--AR-------
303240837 --------------MNRIFA-YFDD-EGVYVYQAFKPNIVKNAVEIGTF-GKG-FGLDR--ITWIKPSFGWILHRSSY-ATK-HRMEAIAKIKLSHKAWLEILSQSVPSQFDSSRYK-------------------------------------------------NETIWKADFEKS--DVIHQM---------KLNR----RAIQIGLR-NEAIK-KYVYEWI--IGVEDVTDLAKEI-SS-IIKSGKDP------------------SSLLPDISEY-PISDDL-KNIIG--YT-------
322708785 M--------ASTPPYRQIRA-TYTP-DTITVYQAYKRSIADAAVKHQKLNASPDFRPGR--MTWVKPSWSWMMYRAGY-SYKDPGQERILALRMKHEHFIALLDKGVLSAHTERIGG------------------------------------------------VGGGEQGPRDKTS--EVRIQWDPERDERLRVLPY----RSIQIGIP-GSLSK-KWAEEWI--AEIEDVTEKARGL-KA-ALDERADV-----------TREELLDMGYVPEERVF-EVGHDI-RERLG-----------
256376409 -----------MAPQRQIRA-DYDD-SHITVYQAYSSAIADPALAAGRF-VPP-FSFGR--MTWVKPSYLWLMHRSNW-ARK-PGQERVLAVRITRAGWERALAQAVLTGSPGLEGA---------------------------------------------------------------RVHVQWDPERSLRGAALNH----YSIQVGVG-RDVVR-ELVDEWT--TGVADLTGRTRRI-AA-LLQAGRAE----------------QARRLLPPERPY-PLPVAI-ATRLD--AG-------
322699163 M--------ASTPPYRQIRA-TYTP-DTITVYQAYKRSIADAAVEHQKLDASPDFRPGR--MTWVKPSWGWMMYRAGY-SYKDPGQERILALRMKHELFVALLEKGVLSAHTERIGG-------------------------------------------------GGGEQGPRDKPS--EVRIQWDPERDERLRALPY----RSIQIGIP-ASLSQ-KWAEEWI--TEIEDVTEKARGL-KA-VLDERGDV-----------TREELVDMGYVPEERVF-EVSQDI-RERLA-----------
346318305 SQA------TPTVPYRQIRA-LYDD-STITVYQAYSPSIADAAVAAQRLDASPDFRPGR--MTWIKPSWAWIMYRAGY-SYKDARQARILALRMTHAHFLGLLNRGVLSHGGNLAPD-------------------------------------------------------RLDKNA--EVRIQWDPERTPALHRLPY----RSIQIGIP-GSLSA-QWVADWI--ISIEDVTDTAREL-KR-TLDENPDV-----------ELQELVNRGLVPVEKFF-PVPESI-MAKLD-----------
162457230 -----------MPKLHEIRA-DYDA-ETIVMYQAYAPAIAEPALAAQRF-VAP-FSFGR--MTWIKPSFLWLMHRSNW-GRK-AGQERILAVRIRRTGWEHALSLAVLTSPEATVFR-------------------------------------------------SPDEWSKAFAEA--KVHIQWDTERNLRGGPLPC----YSIQVGVG-RDLIR-EYAESWV--VAIEDRTPLVRKM-YQ-QIQAGHAD----------------SAAKSLPRERPY-AVDEKI-ARRLL--ID-------
340521231 MSR------PSDIPHRQIRA-SHDK-DHIVVYQAYKPSIASAAVKAQKLNASEDFSPDR--MTWIKPSWCWMMYRSGY-SYKDPNQSNILAIKMKMEHFLELLRQGVLSNHPSEHAR----------------------------------------------VDKDSTNKTAHERPS--DVRIQWDPERNARLEALPY----RSIQIGIP-PNLGT-KWVDEWI--VGIEDVTERAREL-KR-VLEEEPHI-----------GEDELVKRGLVPEETPV-DVPDDI-MTRLD-----------
302529076 ------------VPRRDVRA-GYTD-QTITVYQAYSRHIADVAVESQTF-AAP-FKRER--MTWIKPSFLWMMYRSGW-ATK-PEQERILEIQLTREGFEWALAHAALSSYEPGAYA-------------------------------------------------GQQHWAERKRTS--PVRIQWDPDRSLTLAPLDR----RAIQIGLS-GEAVE-RYLDQWI--AKITDITPFAERI-HR-HVSSGRLE----------------AAREELPGERVY-PVPAPI-LGMIG--AS-------
262199521 ---------MSQTSTREIRA-DYNA-DSIVVYQAYRDDIADPALREQRF-VEP-FSFHR--MTWIKPSFLWLMHRSNW-GAK-KGQERTLRVRIGRAGWEEALAQGVLTSPDGPVFG-------------------------------------------------NAAKWQRAFAAA--KVHVQWDTERSLRGAALDH----LSIQVGLG-RHIIQ-RFVEEWI--VAIDDMTASVAKM-RR-LLQQGKVA----------------EAKRLLPSERVY-SVPDDI-ARRLW--FD-------
238490968 MATNN----ANLQPFRAIRA-QSTQ-STITVYQAFSPEIAEPALRAQKF-VPP-FSRTR--MTWIKPSFLWMAYRCGW-ATK-PKQERVLAIEITREGFEWALRRSCLSHVPGSRDQ-------------------------------------------------DQEKWRQRLRES--PVRVQWDPERDLWHRPLGY----RSIQIGLS-GEAVE-RYVDEWI--VSITDVTGLMGDV-KR-ALDKADVE----------------GAEGLLPVESVY-PLSEEL-RDILH--AT-------
115387213 MEGSHASTVHHAHGYRVIRA-KYTP-TTITVYQAYSPEIADAAIRAQRF-VSP-FRRQR--MTWIKPSFLWMAYRCGW-ASK-PNQERVLAVEITREGFEWALRHSCLSHAAAT----------------------------------------------------KQEEWQQKLQSR--PVRVQWDPERDLSFRPLGY----RAIQVGLG-RESVD-RYIDDWI--VSITDVTQTMKQV-AQ-YVADGMVE----------------EAKACLPEERVY-PLSDEL-REILD--AT-------
290963088 -----------MAPPYQIRA-DYDA-DTIVVYQAYAPAMADAALRAGRF-VAP-FSFRR--MTWIKPSFPWLMHRSNW-ARK-PGQQRVLAVRMSRHGWEEALSRAVLTTEDPAAVA-----------------------------------------------------------RA--AVHVQWDPERSSRGAALNH----YSIQVGIG-RDLIR-TFTDEWI--VSLTDLTPQVRKA-AT-LTQTGHAA----------------QAQRLFPAERVY-PLPPHL-ERLL---TS-------
168699093 -----------MGAAREIRA-DYDR-DTIAIYQAYPPAIADAALAAGRF-VPP-FSFHR--MTWIKPSFLWLMHRSNW-AQK-RGQERVLCVRVRRSGWEAALAQAVLTSFEPTVFT-------------------------------------------------DPDTWAEQFATA--RVHLQWDPERSLRGAGLPY----DSIQVGLS-RHVIR-EYADDWV--ARIEDYTPVVRKV-YT-LLQSGRAD----------------KARRFLPPERVY-PVGGEL-GRRLS--LR-------
328866607 MSS------EFISKEFQIRA-VYNK-ETIRVYQAYNNEIADYAVKHQTFTGCPHWSTER--TTWIKPSFLWMMYRSGW-AQKDKNQNRILAIDIHIKDFEYAIQNNYKSSTKQKYQI------------------------EGQELPPPSKEHS------------QPPVSKVDKSNY--DIVVQWDPERSIKLGKLGSN--IKSIQIGIK-KRIAE-QYSSNWI--TQITDITNQCLEI-KQ-LLDNGHLD----------------QAQSLLPIEKVY-IPSFIK-----------------
288940281 ------------MPENSVRA-IFDD-KTIRVYQAYRADIALPALAAGRF-VPP-FKMDR--MTWIKPSFGWMMYRSGY-ASK-PGQEFVLGIDITRDGFEWALAHATLSSFKPSVHP-------------------------------------------------SYEVWKADIESK--PVRVQWDPERDWKLQPIRGV---RAVQIGLS-REAIK-YYARDWI--VKIEDVTPLVKKASQA-IIMPPDLP----------------SA-----LERPY-PLPADL-AYIC---CD-------
320095331 ------------QPLRQIRA-LYDA-TTITVYQAYSPAIADAALRAGAF-VPP-FKEER--MTWIKPSFLWMMYRSGW-GTK-PGQERTLAVRITREGFEAALADACLSHFDPDVHS-------------------------------------------------TRQAWSAAVAAC--PNRIQWDPERNASGDPLAH----RSIQIGIG-PARVG-AYAHEWV--VGISDVSDLVEAL-RL-AP-ARLGE--------------------LGPRERPY-PLPAGL-AQRIG--AS-------
256395290 MGN------ENNLPLHQVRA-DYDR-ETIVVYQAYRAQIAEPAVRAQRF-VEP-FSLQR--MTWIKPSFLWMMGRSNW-ARK-PGQEHVLAVRITREGWENALSQAVLTGYKRGVHA-------------------------------------------------DHADWEQQMKHA--RVHVQWDPERTLSGAVLDA----RSIQVGLS-RHVVA-DYVNAWT--TEIRDITPTVRKM-AD-LLKEGRKD----------------RAAQHLPKERPY-ELPPHIA-RRLR--GE-------
238061717 ------------VPVRQIRA-RYSA-ATITVYQAYPPQIALPAVSAGRF-VAP-FKRDR--MTWIKPSFLWMMYRCGW-ATK-PGQERVLSIDITRDGFEWALARACLSHYDRDVHG-------------------------------------------------DKATWSRQLKTS--PVRVQWDPERSLHLNALPY----RSLQVGLS-GEAVD-RYVDDWI--VAVTDITPTVERA-RD-LLRRGDDQ----------------AAAAQLPVEYVY-PLPDRIA-VGLH--AS-------
162457272 AAQSA----RWPTAGRHILA-QFDA-ETIVVYQAYRPSIARHAALHQRL-GGPEFSFGR--MSWIKPNFLWMMFRSGW-GTK-PDQEAVLAIRIQRAGFDAILAAAVPSGFVPDLHP-------------------------------------------------SEEAWKSDLQRS--DVRLQWDPDHHPSGAPVAR----RAIQLGLR-GATLR-RFAEEWT--VGVEDISALVAEQ-RE-VLRGRGVG------------------ELEIPREEVY-WPTAAEAARRVG--IE-------
159037621 ------------VPVRQIRA-RYSA-DTITVYQAYPPQIALPAVAASRF-VAP-FKRDR--MTWIKPSFLWMMYRCGW-ATK-PGQERVLSIDITREGFEWALARACLSHYDRDLHG-------------------------------------------------DKATWLRQLKIS--PVRVQWDPERSLQLKALPY----RSLQVGLS-GEAVD-RYVDDWA--VAITDITPTVHLV-RD-LLRSGDGQ----------------AAAALLPVEQVY-PLPDQIA-VGLN--AS-------
124002814 -------------MQKQIYA-AYDD-EGLFVYQAFKPKVVATAAAKGTF-GTG-FNTNR--LTWIKPSFAWVLQRTKY-ATK-HRMNAIARIKLSHEGWLHLLRQAVPTQYDAQRYT-------------------------------------------------NEEDWQQALDKA--VVIHQWDPERDLLGKKLDR----AAIQVGVR-SEELSLRYVNEWI--LGIEDVTELAHAI-GS-LQKRRNPP------------------LPETPEERLY-PVSEEMA-LALG--CF-------
333374005 MEQME----RWPAEGRHILA-QYDP-SSIVVYQAYKPKIGRFAVDHGYF-GGE-FRFNR--MSWIKPNFLWMMFRSGW-GTK-PDQETILAIHIERSGFDSLLEQAVHSTWNQSLHP-------------------------------------------------DREAWQKDLRKS--EVRLQWDPDHDPFGQPVKR----RAVQLGLR-GETLI-RYARDWI--VEIEDITNFVKKQ-KA-YVDQGKLD------------------RLETPQETVY-PPASVQGRV--------------
168703011 PEQVK----VWPKDGRHILA-QFDH-DSVVVYQAYSPAIGRYAIEHGRF-GGA-FSFER--MSWIKPNFLWMMYRSGW-GTK-ENQEVTLALRLRRAFFESLLAEAVPSTWDRDLFA-------------------------------------------------TFEEWSRAVGRS--AVRLQWDPDHHPSGAKLDR----RAIQLGLR-GRVLE-AFGTTEL--LEVIDLSEFVAQQ-RE-LLAARGTS----------------AL--ITPRERVY-SPTDPAIAAQLR--LA-------
298250918 EDQLK----VWPQQGKHILA-QYDE-TSVVVYQAYRPAIGHFAARRGYF-GGG-FSLER--MSWVKPNFLWMMYRSGW-AQK-EHQEVVLAVRLKRAAFDEILAQAVHSTYKEALYG-------------------------------------------------SHEAWKQALETS--HVRLQWDPDHDPRGVKLER----RVIQLGLR-GPVLA-QYAREWI--LDIEDISQFVYEQ-YH-YVESGAFD------------------QLIMPAERVY-PIVNTHIAARLG--II-------
300854685 -------------MEKKICA-SYTE-NSIRVYQAYNNKVAEECLKLGTF-GES-FKMER--MTWIKPSFLWMMYRCGW-GKK-ENQERVLAIDISRNGFEEMLSNVVLSTYSEKVYK-------------------------------------------------SHENWKFQLKTS--NVRCQWDPERDIYGNKLDR----RSIQIGLQ-GEMVY-KYVNNLI--LNIEDMTNKVSKW-SK-DIRDKKLD------------------FKELPVENEY-YV-DNLI-KEKLGMSI-------
296121824 AEQAE----QWPHEGRHILA-QFDQ-DTIIVYQAYQPAIGHYTAMHRTF-GGG-FSYSR--MSWIKPNFLWMMYRSGW-GTK-ANQEITLALRIRREFFDALLAEAVPSSWDPTEFV-------------------------------------------------TEDEWSQAVSKS--SVRLQWDPDHHPTGAKLER----RAIQLGLR-GDVLK-AFGQQEL--IDVIDISDFVSAQ-RE-RLLSRGTS------------------ALVTPLERVY-SPADPEIALRLK--LA-------
340377247 IEQQTG---VWPKDGKHILA-QYDD-EDIIVYQAYSRGIGSYAIEHQKF-GGPLFSYSR--MSWIKTNFLWMMYRSGW-GSK-ENQEMVLAVRISRNGFDTILSHALTGHDEKLLGK----------------------------------------------------------GQS--PVRLQWDPDHHPDGSALSR----RAIQLGLR-NDILA-RYGDEWT--TDITDISDFVHDQ-YQANVISRQWD------------------KLLVPRERVY-HVTNEEIAKQIK--LI-------
281203630 ------------MKERIIRA-IYDD-TTITLYQAFNSVIGRYAVKNQSFIGCPGFKIDR--MTWVKPSFLWMMYRSGW-ATK-HNQECILAIRIKREGFEWALQNSSLSQHLSISAE-------------------------------------------------QREEHREQLLSQ--PVRIQWDPEKDIDLKALPY----RSIQIGLS-GVAVT-KYLNEWI--VSIEDITPKCKTI-YQ-LLATHQRE----------------EALRQLPQESIY-NIDNHHIEIHIN--LS-------
290974944 M--------ITQQVTGSIIT-IDDE-ECIVFYQAYNSGIADWVVKNQTFDECPNFDKKR--MSWIKPNYLWMMYRSEY-ATA-KNQTNILALFITRKSFEEELLKHAVCAMYYPELE----------------------GYYKSQKEWKVNCSQMKEKVAQLMNKNDTDTI-MTDNVC--FARVQWDPYHTPAFGNING-GLTRAIQIGVK-GSFLR-SMCKSGA-CKKIEDITKYVHEQ-HA-----EYLK----------------TKDLLIPVERYI-HINDKDIKGRLA--IT-------
290974534 -EARN----EWPDDGNHIIA-SYTE-DAVLVYQAFNDEIADYAVKHQKFDGCPSYNDTR--MTWVKSNWLWMMYRSNY-ATK-QNQTRILGLWLKKSAYDDILKKARLKGAGAGL------------------------------------------------------------------TRAQWDPDYSPELEPIKRR---RDLQLGIK-KRETF-RNGEDF---VEIVDCTELAHIS-KK--T-------------------------KTIPHERVYTPDNEVCI--NLQ--VS-------
83647694 LEQTS----LWPASGRHILA-HQDQ-DTLIVYQAYRPEIGEYAIKHGRF-GGA-YSYSR--MSWIKPNFLWMMYRCGW-GMK-EGQEVVLGLRIRRQFFEDILSQAVPSSYNPEEFA-------------------------------------------------TQETWKEAVQNS--NVRLQWDPDHTPNGAKCER----RAIQLGLR-GDMLA-RYGKEEI--LEVIDFREFIAEQ-RA-QATPDRYA----------------EL--LTPQEQVF-IPSDDAIGARLR--LD-------
294669065 ------------MNQNTIRA-VYGE-HTIRVYQAYSDPIADAALAHGTF-VSPPFKMER--MTWIKPSFLWMMYRAGW-GLKDEGQKRILAIDISREGFEWALRHACLSHPPAGMGK---------------------------------------------------DDWQRLKAQS--PVRIQWDPERDLQLKALPY----RSIQIGLS-GEAVN-YYVNDWI--QDITEITPLARQI-RE-LVEQNRLD----------------EAQILLPPEQPY-PAVYVPI----------------
21223327 ----------MQQPQREVRA-VHTA-STVTVYQAYSPEIGLPAIREGRF-PAA-WKRDR--MTWIKPSFLWMMYRCGW-AAK-AGQETVLAVEIGREGFEWALRHACLSSYQPGVHP-------------------------------------------------DRATWQREVKRS--PTRVQWDPERDLRLQPLPY----RSLQLGLA-GEAAR-RYADEWT--VAIRDVTPLAHEI-HG-LVRDGDLD----------------AARRLLPREQPY-PAAEELL-SNLRP----------
297561069 ----------MDVPRHQIRA-LHTD-STVTVYQAYAPSLGLAAAREGRF-PSA-WKRDR--MTWIKPSFMWAMYRSGW-GLK-RDQETVLAVEITRAGFAWALRNACLSHHAPAVHP-------------------------------------------------DRETWRARLREA--PARVQWDPERDLYLSPLEH----RSLQLGLA-GEAAR-RYADEWI--VSITDVTPLARRV-HT-LVQEGDTA----------------AAARLLPAERPY-PVAQGEL-DHLRPARE-------
333027909 -----------PVPRHEIRA-LHTA-DTLTVYQAYRPSLGVPAARDGRF-PEA-WGRGR--MTWVKPSFLWMMYRCGW-GTK-EGQETVLAVEIAREGFLWALRNATLSHFERGVHG-------------------------------------------------DRAEWQRSLRRA--PARVQWDPERDLHARPLEH----RSLQLGLS-GEASR-RYADEWI--VGIRDVTPLAREA-HG-LVRDGELD----------------GARALLPVERPY-EVPVDAL-AGLLP-VP-------
295839520 PPPAAS---PPEIPRHQVRA-LHTA-DTLTVYQAYRPSLGLPAARDGRF-PPE-WGRER--MTWIKPSFLWMMYRCGW-GTK-EGQETVLAVEITRAGFLWALRHAALSHYEAATHG-------------------------------------------------SREAWRRALRGA--PARVQWDPERDPRGRALAH----RSLQLGLS-GEASR-RYADEWT--VGIRDVTPLAREA-HA-RVREGRPE----------------AARALLPVERPY-EVPADAL-AGLLP-AP-------
297202026 --------------MG------------------------ALRRRTEPWNPPRERVCEHA-LTWIKPSFLWMMYRCGW-GAK-AGQETVLAVEISRDGFEWALRHACLSSHVRGAHP-------------------------------------------------DRAAWQRQLKRA--PARVQWDPERDLHLRPLPY----RSLQLGLS-GEAVR-RYADEWT--VAIRDVTPLAHEI-HA-LVRGGDMA----------------SATGLLPQERPY-PAEAESL-AHLLA----------
312886331 KQSLT----LLPQNGQHILA-HQTG-NDMVVYQAYKPGIAKFAVDNQFL-GGPDFSFTR--MSWIKPNFLWMMYRCGW-AEK-ENQERVLAIWIAQKDFEEILRQAVFSSFNPQYYR-------------------------------------------------DHDHWKNELSLK--EVRLQWDPDHDPYGNKVER----RAIQLGLK-GEMLR-FFSSK-I--KSIEDITDFVNQQ-KN-LLDHHGLD------------------ELEVPVETIF-KTSDPIL-NKQIG-IT-------
297194315 ---------MTDEPRHRVRA-RYTD-DTVTVYQAYSPAIGVPAARDGRF-PAA-WKRER--MTWIKPSFLWMMYRCGW-ATK-ADQETVLAVEIRRDGFEWALRNACLSHYQEGVHE-------------------------------------------------SREAWKRELRQA--PARVQWDPERDLRLNPLPY----RSLQLGLG-GDAAG-RYADEWT--TGITDVTPLARQM-RR-LVLEGDLA----------------GAGRLLPEERPY-PADTGLL-GHLVPSAG-------
297162424 M--------AMQEPRHQIRA-LHTE-STVTVYQAYAPHLGLPAARDGRF-PTA-WKRDR--MTWIKPSFLWMMYRCGW-GAK-EGQETVLAVEITREGFEWALGRSCLSHYERGLHP-------------------------------------------------DQAAWKRALKAA--PARVQWDPERDLRLRPLPY----RSLQLGLS-GGAAR-RYADEWT--VAITDVTPLAHEV-HA-LVRRDELD----------------AAVRLLPEERPY-PAGDELL-SHLRAPVA-------
328884339 MEETRT---ADDEPKYRIRA-LHTD-RTVTVYQAYRPEIGLAAAREGRF-PAI-WKRDR--MTWIKPSFLWMMYRSGW-GTK-EGQETVLAVEITREGFEWALRNACLSHHVRGFHP-------------------------------------------------DQATWKARLRTA--PARVQWDPERDQRLRALPY----RSLQLGLS-GEASR-RYADEWT--VSVTDVTPLAHRV-RD-LVRAGDLE----------------AAGRLLPREEPY-PESAGLL-EHLRVPQA-------
297202028 ----------MEEPLHRIRA-LHTA-STITVYQAYRPEIGGPAARKGRF-PAA-WKPDR--MTWIKPSFMWMMYRSGW-GMK-ESQETVLAFEITREGFDWALRHACLSHYVRGLHP-------------------------------------------------DRDTWQRDLKRA--PARVQWDPERDLHLHPLPY----RSLQLGLS-GEASS-RYADEWI--VSISDVTPLAHEI-HA-LVRDGELD----------------SAARLLPQEQEY-PANAELL-AHLCP----------
291438820 --------------MA----------RRPRRCSLHRDDGSLPALTQAGW--AHEKVCERG-STWIKPSFLWMMYRCGW-GTK-EGQGTVLAVEITREGFEWALEHACLSHYEQGLHG-------------------------------------------------DRATWKRRLERA--PARVQWDPERDLRLQPLPH----RSLQLGLA-GEAAR-LYADEWI--VSITDVTPLAHAV-HA-QVRSGDLD----------------IARQLLPRERPY-PMNDELL-AHLHQ----------
329935335 ----------MAPPQREVRA-AHTD-ATVTVYQAYAPEIGVPAAEAGRF-PAA-WKRDR--MTWIKPSFLWMMYRCGW-GTK-QGQETVLAVEISREGFEWALRHACLSSYAPGVHP-------------------------------------------------DRTTWQRELKRA--PTRVQWDPERDLYLRPLPY----RSLQLGLA-GEAAR-RYADEWT--VSLTDVTSLAHEI-HA-LVRDGDTD----------------SAARLLPRESPY-PGQDELL-ARLRG----------
345013407 ----------VAEPKYQIRA-LHTE-STVTVYQAYAPEIGLPAAREGRY-PAV-WQRDR--MTWIKPSFLWMMYRCGW-GTK-EGQETVLAAEISREGFEWALEHACLSHYEHGLHA-------------------------------------------------DRATWKRQLKRA--PARVQWDPERDLHLQPLAH----RSLQLGLT-GEAAR-LYADEWT--VSITDITSLAHTI-HA-HVQGGDLD----------------AARQLLPRERPY-PVNEGDL-AHLYQ----------
302548144 ----------MEDQNHQIRA-RHNP-ATVTVYQAYAPHIGLPAARDGRF-PSA-WKRDR--MTWIKPSFLWMMYRCGW-GLK-EGQETVLAVEITHEGFAWALRNACLSHYVRGLHP-------------------------------------------------DQAAWKRQLHRS--PTRVQWDPERDLQLRPLPY----RSLQLGLA-GEAAR-RYADEWT--VSITDVTPLAREV-HA-LVRAGDLD----------------AAAARLPEERPY-PAADDLL-SHLRVPRP-------
330801102 ----------MSGYKRIINA-VYDD-ETVRVYQAYKATIADDAIKNQRFTEASGWKQDR--MTWIKPSFCWMLYRSGY-ATK-HNQERILAIDIKRSAFEWILENHIDSTETAKSSI------------------------------------------------------PSEKK----KIVVQWDPERNFKIGKIDGCGDVRSIQIGIK-AVKTK-EYNEDWI--VRIQDVTDLAHQI-KE-LVELKDFE----------------KANALLPNERIYKPKNVRFN----------------
291453417 TNPT-----ALPHPTHQIRA-RQTP-TTVTVYQAYPPSIALPAARDQRF-PAA-WKRDR--MTWIKPSFLWMMYRSGW-SRK-EGQERVLAVEISRAGFDWALGHACLSAYHPDVHA-------------------------------------------------GRDGWREALRGA--PARVQWDPERDWRLRPLPW----RALQLGLS-GEAVR-RYAEEWL--VSVVDVTGLAHAV-QE-RVRAGDEA----------------GARELLPEERVY-VPEGGLP--ASLVG---------
29829850 ----------MEETQRRIRA-VHTT-STITVYQAYSPEIGLPAVREGRF-PTA-WKRDR--MTWIKPSFLWMMYRCGW-GAK-AGQETVLAVEITRDGFEWALRHACLSSYVRGVHP-------------------------------------------------DRATWQRQLKHA--PTRIQWDPERDLHLQALPY----RSLQLGLA-GEAAR-RYADEWT--VSISDVTPLAREI-RT-LVGNGDLD----------------SAARLLPQELPY-LPADELP--AHLRP---------
332668288 -------------MCTNIIG-YQTE-EEIVVYQAYKPEIAKFAVENQKL-GGASFGFQR--MSWIKPNFLWMMYRCGW-AEK-ENQEHVLAIWIKKQDFELILEQAVLSSFQKEIYH-------------------------------------------------TEEDWKLQLSQS--EVRLQWDPDHDPKGNKLER----KAIQIGMK-GEMLH-LFANKYI--QHIEDITTFVRKQ-KL-YVDRRELE------------------KLLIPKESIF-TSLSAQR-KTHTL-AT-------
260802161 VSQIDH---HWPPTGKHILA-QYDD-NSVVVYQAFRPEIAEYAVKNQRF-GGSHYSWER--MSWIKPNFLWMMYRCGW-ASK-KGQERVLAVRITRTGFDEILANAYTPKTQAEAGL-------------------------------------------------PKDQL---------KVRLQWDPDHDPSGTSVQR----RAIQLGLK-GEILS-HFAQDWI--VSITDVTDFVHEQ-HN-VLQTSGTE------------------QLQVAAERVY-QVTDPKT-KALIG-VE-------
260782199 VSQVQQ---HWPQTGKHILA-QYDD-NSVVVYQAFRPEIAEYAVKNQRF-GGPHYKWER--MSWIKPNFLWMMYRCGW-ASK-KAQERVLAVRITRNGFDEILANAYTPKTQAEAGL-------------------------------------------------PKDQL---------KVRLQWDPDHDPSGTSLQR----RAIQLGLK-GEILN-HYAQDWI--VSITDVTDFVHEQ-YN-VLQTSGTE------------------QLQVAAERVY-QVTDPKT-KALIG-VE-------
158335219 LHQKD----RWPQQGRVILA-QYDT-DSIVVYQAYRPAIGNFAAQHGYF-GGE-FKLSR--MTWIKPNFLWMMYRSGW-GAK-PGQEVVLAIRLQRSAFDSILAQAVHSSFQSGLYD-------------------------------------------------SQESWQKAVQTS--DVRLQWDPDHNPAGHKLER----RAIQLGLR-GDAIR-KYAQEWI--LDIEDISDFVADQ-RQ-HVVSGNYE------------------ALLTPAEAPY-PVSDLKT-AHRLQ-VP-------
72006229 CDQNNV---CWPIAGKHILA-QFDE-HSVVVYQAFCPAIAKYAVDHQRF-GGDKFSFSR--MSWIKTNFLWMMYRCGW-ASK-PNQERVLAVRITREGFDEILSKAYTPQTQATAGL-------------------------------------------------GKEEI---------EVRLQWDPDHAPNGDKMDR----RAIQMGLK-GETLR-KYATEWI--VSIRDVTDFVKEQ-SK-NTDRKRLN------------------LLDVAQERVY-PVSNPKT-AQLIG-LG-------
300867123 LTQVS----RWPKAGRHILA-QFDE-NSIVVYQAYRPAIGDFAALHGYF-GGE-FKLSR--MSWIKPNFLWMMYRSGW-GTK-EGQEVILAVRLKRSAFDEVLTAAVHSTFVSEVYA-------------------------------------------------SEKEWKQAAKNS--SVRLQWDPDHHPNGSQEER----RAIQLGLR-GEILV-HYAQDWI--INIEDISEFVQEQ-HQ-NLKEG-MA------------------NLLTPSEEVY-PITNSDT-AKRLQ-IS-------
291237935 MEIMK----LWPKNGNHVLA-QYDD-HNIVVYQAFCPEIANYAVKNQRF-GGPHYSFDR--MSWIKPNFLWMMYRCGW-ATK-SKQERVLAVRITREGFDSILSKAYSAQAQKAAGL--------------------------------------------------------NKNDI--QVRLQWDPDHKPSGAPTLR----RAIQLGLK-GEILR-KYATEWI--VSIEDVTPFVQEE-MV-KLTPENID------------------KLVVPIEKVY-HVTDKKT-ANLIN-VE-------
307105263 VRQEAE---FWPAVGRHVLA-QATE-DTVVVYQAYTPSIGVLAAGQGDFRGIPGFSETR--MTWVKTNFLWMAFRCGW-ASK-PNQETVLAITLKRPFFERMLAASLSTSAGTTAKG----------------------------------------------------------PCIGADVVLQWDPDHLPDGSKHPGR---RAVQLGLR-GGVRD-EYISGRH-TVCIEDITPFVREM-GA-IAAGGEPR----------------WVGLLVPSERVL-RLRD-EV-RSHIA-AD-------
149922143 LEQRE----RWPQTGRHVLA-HYDD-EAVVVYQAYNPAIAAWAVKHQRF-GGP-WSFER--MSWIKPNFLWMMFRCGW-ATK-RDQERVLAVHLERAGFDAILGQAVHSSFVAERYA-------------------------------------------------DRATWQARGRRS--DVRLQWDPDHGPRGGKLER----RAIQLGLR-RATLR-AFAEGWC--RGIEDITPFVHAQ-RT-FVDSRQLG------------------RLQTPLERVY-PVLDAEV-AAHLG-VT-------
299472429 S--------APTATGRCLLA-QFTD-REVIVYQAYKPELGNFAVENQYF-GGDGFNFKR--TSWVKPNFTWMMHRCGW-ASK-QNQEVVLALALRRDFWDDVLSQAVMSNYESYRST-------MSAEVPR---------------------------------GDAQRRWKASLQAS--DVVMQWDPDHMPFTGHKTNH---RAIQLGLR-GDALA-AFRGPAFGETGIQDVSAFAKAT-EE-IHRPRAADGGGGGGHPDAPAATPPPPALLLPIEETY-PVVDASV-AQRLG-ID-------
170940179 TM-------STPTPYKQIRA-LHTP-RSITLYQAYNHPIASAAVSAQSLTASPLFKTTR--MTWIKPSWAWMLYRSGY-SFKDANQSRILALTMSHEDFLWLLSQGVVSHRSPEEKG-----------------------------------------------------DQGGKKLG--GVRIQWDPERDVKMERMGY----RSIQIGIPGGEVCE-RWVG-MV--KKIEDVTDKAREL-KR-VIDERPEV-----------TVGVLKEMGLVPEEKVF-EIEDEEV-RRRLG----------
87310926 -----------MFHFREIRA-SFDR-DTIVVYQAYNDAIANAALTVGKF-VPP-FSFQR--MTWIKPSFLWLMERSGW-GTK-ANQTRILAVRIARSGWDAAIGQGVLTSYHSDIHR-------------------------------------------------SQDDWRTQFENA--MVHVQWDPERSLRGKKLEY----RSIQVGVG-RRLIT-EFAEQWT--QEIVDLTPLTAKL-RQ-FRQAGDHD----------------KAKRLLPRESIY-RVNNAT--ASRLG-IE-------
238020853 ---------MT-TPPKQIRA-VYTD-TTIRVYQAYSDAIADTALAAGRF-VSPPFKMER--MTWIKPSFLWMMYRAGW-GGKDDNQKRILAIDISRSGFEWALHHACLSHPPAGMDS---------------------------------------------------ATWQQTKAAH--PVRIQWDPERSLKLEPLPH----RSIQIGLT-GEAVP-RYVNEWI--QNISEITDVVQEI-HA-LIAQDNLA----------------AAQALLPPERVY-PFDWET--DFQAA----------
239815282 MK-------TDVIPHNQIRA-MYDA-DTIRVYQAYSDAIADSALAQGRL-VSPPFKLER--MTWIKPSFLWMMYRAGW-GLKDEGQKRILAIDITREGFEWALAHSCPSHSPEGMSG---------------------------------------------------EEYAALKQRC--PVRVQWDPERDLHLQPLAH----RAIQIGLS-KEAVR-LYVNEWT--CKITEMTALAHEV-QA-LVQQGQLQ----------------KAASKLPMERAY-PGQQAT-----------------
254392683 -----------MVALRQIRA-QYDD-RTIVVYQAYSSAIAEPALRAGTF-VPP-FSFGR--MTWIKPSFLWLMHRSNW-ARK-PGQERILAVRITREGWEEALSQAVLTTSHPDRVA-----------------------------------------------------------QA--PVHVQWDPERSLRGAALNH----YSIQVGVG-RGLIE-RYAKEWV--VGITEVTSQARKA-AE-LAQGGRAE----------------KAKRLLPPERPY-PVPRAT--AQRLD-ID-------
295658070 MDQP-----NVAPTKYAIRA-QYTS-KTITVYQAYSPAIANAALSAGKF-VAP-FKRVR--MTWIKPSFLWMAYRCGW-ATK-KDQERVLAIEITREGFEWALAHACLSHPTPRLYA-------------------------------------------------DHAAWEHRKNES--SVRVQWDPERDFEFRPLEY----RSLQVGLK-EEAVD-RYVDEWT--VGIRDVTWLMQEI-GQ-LVREGKIE----------------EARRKMPVEEVY-VLPTDV--ATVVG-AD-------
302504024 M--------TDNNPYRAIRA-KFTE-NTITVYQAYSNEIADAALGAGTF-VAP-FKRGR--MTWIKPSFLWVAYRSGW-ATK-PNQERVLAIEITRSGFEWALRNACLSHVDNSLYK-------------------------------------------------DKSAWESRMQAS--CVRVQWDPERDFHFNPLGY----RSIQIGLK-GEAVD-QYVDEWI--VSITDITEQIRKV-SG-LVSSGQLG----------------EAKKQMPEECLY-DLPGDV--GEMIG-AS-------
239606461 MESQQPL--KAGPSNYAIRA-QHTP-TTITIYQAYSPSIANAAVAAGKF-VAP-FKR----MTWIKPSFLWMAYRCGW-ATK-KDQKRVLALEVTREGFHWALAHACLSHPSPHLYA-------------------------------------------------DQATWEKRKEES--PVRVQWDPERDFEFRALEY----RSLQVGLK-GEAVD-RYVDEWI--VGIRDVTGLMREV-GR-LAGEGRLD----------------EAREMMPVEEEY-VLPADV--ARVIG-AD-------
303312351 M--------SREQGYRAVRA-KFTA-ETITVYQAYSAEIASPALRAGKF-VPP-FKRTR--MTWIKPSFLWMAYRSGW-ASK-PNQERVLAIEISREGFEWALFNSFVNSHDKSLYP-------------------------------------------------DKHAFEHRKQNT--CVRVQWDPERDFGFTPLSY----RSIQIGLS-GEAVD-RYVDEWI--VSIQDVTDRMVKM-GQ-LVAAGKIE----------------EAQKLMPIEEPY-PLPKQV--GAAVG-AS-------
302657470 M--------TDSNPYRAIRA-KFTE-NTITIYQAYSNEIADAALGAGTF-VAP-FKRGR--MTWIKPSFLWVAYRSGW-ATK-PNQERVLAIEITRSGFEWALRNACLSHVDNSLYK-------------------------------------------------DKSAWESRMQAS--CVRVQWDPERDFHFNPLGY----RSIQIGLK-GDAVD-RYVDEWI--VSITDITEQIRKV-SG-LVSSGQLG----------------EAKKQMPEECLY-DLPDDV--GEMIG-AS-------
326470706 M--------TDNNPYRAIRA-RFTE-NTITVYQAYSNEIADAALGTGTF-VAP-FKRGR--MTWIKPSFLWVAYRSGW-ATK-PNQERVLAIEITRSGFEWALRNACLSHVDNSLYK-------------------------------------------------DRSAWVLRMQAS--CVRVQWDPERDFHFNPLGY----RSIQIGLK-GEAVD-RYVDEWI--VSITDITEQVRKV-SG-LVSSGQLD----------------EAKKQMPEECLY-DLPGDV--GEMI-----------
302411952 DH-------SSPTPPRQIRA-DFDD-TTITLYQAYSAAIAEPAVAAQKLTAAPSFKPTR--MTWVKPSWAWMLYRAGY-SFKDAGQERILALKMRHADFLALLRRGVLASQATTAEG---------------------------------------------------------------EVRVQWDPERTVRLDKLPH----RSIQIGIP-RGLSQ-QWADEWV--VGIEDVTDRARKL-KD-VLDVRPGV-----------SNAELLEMGLVPAERVY-QVPEDV--IRRLC----------
336117044 ------------PPFRQVRA-VHDE-DTITVYQAYSPAIASAAVAAGGF-VPP-FRRER--MTWIKPSFLWMMYRCGW-ATK-PGQERVLAIRMLRSGFEEALSMASLSHFDPAVYA-------------------------------------------------DQEVWQQRKAAS--PVRVQWDPERDVRLEPLAW----RSLQVGLG-GVAVE-RYVDDWV--VGIEDITAMVEEL-RE-RAPDDRRS--------------------SLPIELPY-PLPPEV--AAVVG-AT-------
119193120 M--------SREQGYRAVRA-KFTA-ETITVYQAYSAEIASPALRAGKF-VPP-FKRTR--MTWIKPSFLWMAYRSGW-ASK-PNQERVLAIEISREGFEWALFNSFVNSHDKSLYP-------------------------------------------------DKHAFEHRKQNT--CVRVQWDPERDFGFSPLSY----RSIQIGLS-GEAVD-RYVDEWI--VSIQDVTDRMVKM-EQ-LVAAGKIE----------------EAQKLMPIEEPY-PLPKQV--GAAVG-AS-------
240272965 MEQP-----KTSPSKYAIRA-QYTP-TTITVYQAYSPAIANAAVAAGKF-VPP-FRRGR--MTWIKPSFLWMAYRCGW-ASK-KNQERVLAVEITREGFHWVLAHACLSHPSPRLYV-------------------------------------------------DQATWEKRKDAS--PVRVQWDPERDFEFRPLEY----RSLQVGLK-GEAVD-RYIDEWI--VGIKDVTGLMQDV-GR-LVSEGQLE----------------EAKRRMPVEEEY-VLPEDV--ARIIG-AD-------
225559493 MEQP-----KTSPSKYAIRA-QYTP-TTITVYQAYSPAIANAAVAAGKF-VPP-FRRGR--MTWIKPSFLWMAYRCGW-ASK-KNQERVLAVEITREGFHWALAHACLSHPSPRLYV-------------------------------------------------DQATWEKQKDSS--PVRVQWDPERDFEFRPLEY----RSLQVGLK-GEAVD-RYIDEWI--VGIKDVTGLMQDV-GR-LVSEGQLE----------------EAKRRMPVEEEY-VLPEDV--ARVIG-AD-------
342875667 MPTA-----PSTAPYRQVRA-CYND-TTIIVYQAYKESIAKAAVDAQKLNASPDFKSGR--MTWIKPSWAWMMYRAGY-SYKDPGQSRILALRMKHEYFITLLERGVLSSHAHKLNP-----------------------------------------------------GEKRETTV--DVRIQWDPERTAKLEVLPY----RSIQIGIP-GALSK-QWANEWI--VEIEDVTDKAREL-KR-VIDERPGI-----------TDEELLNMGLIFEERPF-EVPEAV--HTKLE----------
327352957 MESQQPL--KAGPSNYAIRA-QHTP-TTITIYQAYSPSIANAAVAAGKF-VAP-FKRGR--MTWIKPSFLWMAYRCGW-ATK-KDQKRVLALEVTREGFHWALAHACLSHPSPHLYA-------------------------------------------------DQATWEKRKEES--PVRVQWDPERDFEFRALEY----RSLQVGLK-GEAVD-RYVDEWI--VGIRDVTGLMREV-GR-LAGEGRLD----------------EAREMMPVEEEY-VLPADV--ARVIG-AD-------
296821722 ---------MTDNLYRAIRA-KFTD-DTITVYQAYSDEIADAALGANTF-VSP-FKRGR--MTWIKPSFLWVAYRSGW-ATK-PNQERVLAIEITRSGFEWALRNACLSHVDESLYR-------------------------------------------------DKSAWEARMQAS--CVRVQWDPERDFNFTPLNY----RSIQIGLK-GEAVD-RYVDEWI--VSIADATEQIRTV-SR-LVSSGRLS----------------EAGKELPEEKLY-DIPEDV--AKIIG-AS-------
302922871 TSTSP----DTSIPYHQIRA-HYDG-KTITVYQAYKESIARDAVAAQKLNASPDFKPGR--MTWVKPSWAWMMYRAGY-SYKDSRQSHILAIRMKHEHFIGLLERGVLSKHAKKAPE---------------------------------------------------DSTVKREKTS--DVRIQWDPERTPKLGVLPY----RSIQIGIP-GALST-QWADEWI--FEIEDVTDKAREL-KR-VIDERPDI-----------TEEELLELGLIFEERPF-EVPESV--GERLE----------
315054759 ---------MADNPYRAIRA-KFTE-NTITVYQAYSNEIADAAMRARTF-VSP-FKRGR--MTWIKPSFLWVAYRSGW-ATK-PDQERILAIEITRSGFEWALRNACLSHVDNSLYR-------------------------------------------------DKSAWESRMQSS--CVRVQWDPERDFYFNALSY----RSIQIGLK-GEAVD-RYVDEWI--VSITDVTEQIRKV-SE-LVSSGELG----------------GARKEMPEERLY-GIPEDV--GAMIG-AS-------
226293790 MDQP-----NVAPTKYSIRA-QYTS-KTITVYQAYPPAIANAALYAGKF-VAP-FKRRR--MTWIKPSFLWMAYRCGW-ATK-KDQERVLAIEIAREGFEWALAHACLSHPTPRLYA-------------------------------------------------DHAAWELRKNES--PVRVQWDPERDFEFRPLEY----RSLQVGLK-EEAVD-RYVDEWT--VGIRDVTGLMQEI-GQ-LVGEGKIE----------------EARRKMPVEEVY-VLPTDV--ATVVG-AD-------
327308048 M--------TDNNPYRAIRA-KFTE-NTITIYQAYSNEIADAALGAGAF-VAP-FKRGR--MTWIKPSFLWVAYRSGW-ATK-PNQERVLAIEITRSGFEWALRNACLSHVDNSLYK-------------------------------------------------DKSPWESRMQAS--CVRVQWDPERDFHFNPLGY----RSIQIGLK-GEAVD-RYVDEWI--VSITDITEQIRKV-SD-LVSSGQLG----------------EAKKQMPEKCLY-DLPGNV--GEMIG-AS-------
225684169 MDQP-----NVAPTKYSIRA-QYTS-KTITVYQAYPPAIANAALYAGKF-VAP-FKRRR--MTWIKPSFLWMAYRCGW-ATK-KDQERVLAIEIAREGFEWALAHACLSHPTPRLYA-------------------------------------------------DHAAWERRKNES--PVRVQWDPERDFEFRPLEY----RSLQVGLK-EEAVD-RYVDEWT--VGIRDVTGLMQEI-GQ-LVGEGKIE----------------EARRKMPVEEAY-VLPTDV--ATVVG-AD-------
315506327 ------------VPRHQIRA-AYTG-TAVTVYQAYPPEIADAALRAGRF-VPP-FKRER--MTWIKPSFRWMMYRCGW-ALK-PCQERVLAVDISRAGFEWALRHACLSSYDPRLHP-------------------------------------------------DRDAWRHSLRVS--PVRVQWDPERSLRLAPLPY----RSLQVGLT-GDAVR-RYVDEWV--VGLTDVTGLARSV-HG-RLTDGDEA----------------GAAALLPVERLY-PLPAEVA--RVVD-AG-------
302867267 ------------VPRHQIRA-AYTG-TAVTVYQAYPPEIADAALRAGRF-VPP-FKRER--MTWIKPSFRWMMYRCGW-ALK-PCQERVLAVDISRAGFEWALRHACLSSYDPRLHP-------------------------------------------------DRDAWRHSLRVS--PVRVQWDPERSLRLAPLPY----RSLQVGLT-GDAVR-RYVDEWV--VGLTDVTGLARSV-HG-RLTDGDEA----------------GAAALLPVERPY-PLPAEVA--RVVD-AG-------
258574383 M--------STSHPYRAIRA-KFTP-DTITVYQAYSAEIALPAVRAGKF-VAP-FKRTR--MTWIKPSFLWMAYRSGW-ASK-PNQERILAIEISRAGFEWALLNSFVNTHDPAFYG-------------------------------------------------DHRALEERKRNT--CVRVQWDPERDFGFEPLPY----RSIQVGLS-GEAVE-RYVDEWI--VAIEDVTELMVGM-GR-LVAEGKIE----------------EARELMPVEKAY-PLPEEVA--KVVG-AS-------
310796940 GH-------RPPTPFRQIRA-RFDE-ESITVYQAYNSAIAAAAVEAQRLDASPGFKVTR--MTWIKPSWAWMMYRAGY-SFKDPGRERILALKMRHGDFVDLLRKGVVARRGNESRD-----------------------------------------------------------GR--GVRIQWDPERDVRLGRLQR----RSIQIGTP-----------------------PRYLEL-KR-VLEERPGV-----------GDGELIDLGLLPAEKEF-EVPKDVE--ELLE-MN-------
269121733 --------------MRKINA-LYDD-DTVRVYQAYRNEIADEALELGTF-GSH-FKRTR--MTWIKPSFLWMMYRAGW-AEK-EGQERILAIDITKDGFLTILKNSVLSHYDRKVYE-------------------------------------------------KAEEWELDKRNF--SGRCQWDPERNIFGSPLEF----RAIQLGLK-DEIVE-SYIKKWI--VNIEDITPMVRKI-KK-MRDEGKDI------------------KEYLPVEKELRIEDSEVI--KRLR-ID-------
290961991 PTEDL----APTEPKFRIRA-RHTT-DTITVYQAYRPEIGGPAARDGRF-PAA-WKRDR--MTWIKPSFLWMMYRCGW-GMK-EGQETVLAVEIGREGFEWALRHACLSHFVPELHT-------------------------------------------------DQAEWKRRLRRA--PARVQWDPERSLRLGPLPY----RSLQLGLV-GEAAA-RYADEWI--VGIEDVTPLAREV-HG-HVRAGALD----------------RAAALLPQEPPY-PVAEDVL--AHLR----------
294628199 MNDHH----AEAEPRFRIRA-RHTD-TTVTVYQAYRPQIGGPAARTGRF-PAD-WKRDR--MTWIKPSFLWMMYRCGW-GTK-EGQETVLAVEIRRDGFEWALRNACLSHHVPALHG-------------------------------------------------DQASWRRRLREA--PARVQWDPERDLHHNPLPY----RSLQLGLA-GPAAA-RYADEWI--TGIEDVTPLAAEI-HA-LVRTGELE----------------RATALLPKERPY-PVADEVL--AHLR-A--------
302549980 MN-------DRNEPRFRVRA-RHTE-STITVYQAYRPEIGGPAARDGRF-PAA-WKRDR--MTWIKPSFLWMMYRCGW-GTK-EGQETVLAVEISRDGFLWALRNACLSHHVPALHG-------------------------------------------------EQADWKRQLRRA--PARVQWDPERDLRLAPLPY----RSLQLGLA-GEAAA-RYADEWI--VGIEDVTPLATEV-HA-LVRAGELD----------------AAAGLLPEERPF-HVDDEVL--ARLG-AR-------
300774505 KEQLL----EWPQQGYHIMA-QYDD-EKIIVYQSYRKEIGEFAVKNQFF-GGG-FSLER--MTWIKPNFLWMMYRNGW-GKK-EGQECVLAIHLKKEAFKNYLENAVYSSYNKKLGI-------------------------------------------------SREEWQDQIKES--SVRLQWDPDHDPFGNKLER----RAIQIGLR-NEFTR-SFAKDDI--ILIKNISDFVKEQ-YQ-FVLNDDLD------------------NLIVPEEKPL-LFD-EVL-NKKLN-LR-------
320010749 MND------RTGPPRHEIRA-RHTD-STVTVYQAYRPAIGLAAARDGRF-PSE-WKRDR--MTWIKPSFLWMMYRCGW-GAK-EGQETVLAVEISREGFGWALENAELSHYVRGVHA-------------------------------------------------DRATWQRDLRRR--PTRVQWDPERDLHLNALPH----RSLQLGLS-GEAAR-RYADEWL--VSVTDVTPLAHEI-HA-LVRAGETD----------------RASALLPVEEPLTGLQAPVP-ADR------------
298248426 LTQRE----NWPDEGRHILA-QYDE-QSVVVYQAFKPTIGRFAAMHGFF-GGG-FRLDR--TSWVKTNFLWMMYRSQW-GTV-PQQEIVLAVFLKRDAFDWLLSQAVHSLYHADLYP-------------------------------------------------SDTAWYAQLRRS--PVVLQWDPDHAPTGHRLSR----SAIQLGLR-GEALA-KYAREWI--VAIEDISDFVAQQ-RL-FVQTKAFE------------------QLQVPYETVY-PVADPVV-AARLL-LA-------
299472531 LFSEAKA--HWAAPYRQVFC-QHDK-DTVVLFRACCEHLGPHATATQCFRGSPCYEKDRTRMMWFDSSFLVSMRKSEW-GTK-KGREVVLAIWVKRSFIEDCFGMAVCSNTFGPSCGGGGGGNGSSGGRKGSGGIGRRSSFAVTPFPTSDSGGDDGRSPPTSGFPTPVNSVAGSPPASPVSGQQHQRREQEATASESE---GGRASG-----GDGAR-DDARRAA--AAAATSTALLSKG-QA-SLAQGNEN---------------DEDDDNIPRGRAVTGDPSTRY---YFG-GSAGDPLG-
271967482 ----------MNMPHRQIRA-AYTE-KSITVYQAYDPAVAEPAVAAQRF-VAP-FKRER--MTWIKPSFLWMMYRCGY-ATK-PGQTRVLAIDLTRAGFEWALAHSCLSHPGRDGDQ---------------------------------------------------ETWKERLRHS--PVRVQWDPERDPHHNALPH----RSIQIGLS-GQAVD-RYLDDWT--VSITDITDRVRDV-HT-ALRDGR------------------DVTALLPPERPY-PVPVELA--RTIG-ATAGGDAG-
consensus/90% .................lbA...s..psl.lYQAa.s.lu..Ah....hs....ap..R..MoWlKPsahWhhaRssa.u.K...Qp.lLAlclp+..a..hL.puh.sp.......................................................................s.hQWDP-+s.....l......RulQlGl.........a.pph.....lpDlo..h........h..........................bhP.Ep.h........................
consensus/85% .................lbA..as..psl.VYQAY.s.Iu..Ah...pFs.s..ap..R..MoWlKPsFhWhhaRssa.u.K..sQp.lLAlclp+.sa..hL.puh.op............................................................b..........s+lQWDP-+s.....l......RulQlGl....h...paspch.....lpDlT.bhpp......l..........................bhP.Ep.a........................
consensus/80% ................pIbA..as..pol.VYQAYps.Iu..Ah...pFs.ss.apbpR..MTWIKPSFhWMhYRsGW.u.K..sQcplLAlclpRpsFc.hL.puh.op............................................................hp.....s...s+lQWDP-+s.....L......RulQlGl..sphhp.pasp-W...h.IpDlTsbhpph.....l..........................bhP.Ep.a..hs....................
consensus/75% .............s.ppIbA..as..pol.VYQAYps.Iu..Ah...pFs.ss.apbpR..MTWIKPSFLWMhYRsGW.u.K..sQEplLAlclpRpuF-.hL.puhlSp........................................................s...Wp..bp.u..slRlQWDPERshp.p.L......RulQlGlp.sphhp.pasp-Wh..lsIpDlTsbhpch.p..hl..sp......................hlP.Ep.Y..hs....................
consensus/70% h............s.+pI+A..as..pTlsVYQAYps.IupsAlp..pFs.ss.FpbsR..MTWIKPSFLWMMYRsGW.upK..sQEplLAlcIpRpuF-bhL.puhlSp....h...................................................sp..Wpp.bppu..sVRlQWDPERshp.psLsb....RolQlGlp.uphhc.cYsp-Wl..lsIpDlTsbhcch.p..hlppsp.p....................hlP.EpsY..ls.......h............
consensus/100% ......................................................................................................h.................................................................................pb..................s...G...............................................................................................
consensus/95% .................lbu...s....l.lYQAa...lu..Ah....hs....a...R...oWlKssa.Whh.Rssa.u.K...Qp.lLul.h.+..h..hl..s..s..........................................................................hQWDP-+......h......bulQlGl.........a.pp......l.-ho..h.....................................s.E..h........................
Back to Contents
This domain is found close to a PARP gene in our operons and may be associated with NAD or ADP-ribose processing.
ALIGN -----------H-HHHHHHHHHHHHHH--------------HHHHHH-HHHHHHHHH---------------------------------------------------------------------------H-HHH---HHHHHHHHHH---EEEE-------HHEEEEEE-------------EEEE-----H--------HHHHHHHHHHHH---
HMM ---------HHHHHHHHHHHHHHHHHH---------------HHHHH-HHHHHHHHHHHHHHH------------------------------------------------------EEEE-----------HHHHH---HHHHHHHHHH---EEEEE-----EEEEEEEEEE------E----EEEEEEEHHHH--------HHHHHHHHHHH----
FREQ ------------HHHHHHHHHHHHHH---------------HHHHHH-HHHHHHHHHHHHH----------------------------------------------------------------------HHHHHH---HHHHH--------EEEEE----HHHHHHHHEHH-----------EEEEEE-H-----------HHHHHHHHHHHHH--
PSSM -----------HHHHHHHHHHHHHHHHH---------------HHHH-HHHHHHHHHHHHHHH------------------------------H--------------------------------------HHHHH---HHHHHH-------EEEEE-------EEEEEEEE-----------EEEEEEE-HHH--------HHHHHHHHHHH----
FINAL -----------HHHHHHHHHHHHHHHH---------------HHHHH-HHHHHHHHHHHHHHH--------------------------------------------------------------------HHHHHH---HHHHHH-------EEEEE-----EEEEEEEEEE-----------EEEEEEEHHHH--------HHHHHHHHHHHH---
167753772 -----MEYKNIFEIEFIQRTQEIVNGYQ-----------IPFENTLF-INACVGLLIIPQQSL------------------------------FNHLPTEVVS--------AD---KWGIADTDISCIKEPNKSVKN---VARHIRNAIAHDGIRFGSDNGKDITHIKITDWKDERHKTE----TFKAVIEVTKF--------KTFVWAFAQFALTQQ
206575484 -----MGNYSDFETEFVQRTLALIDQYNEMIKELGKPFREQYNYTLT-LNCLLGLIVMPKERA------------------------------LSFLPAERLT--------QQLKTSMGLQESQLP---GPEMTLRA---LILKMRNSVAHFSVQVVSVSDERL--VDLIAFRDDPEDEN----AY-ATFSAPEL--------LPFLKYYASLLLNNM
209544855 -----MGIPSDPLLDIMRRSLINLDFIEANYQDHGL-----YEVTQL-VNTFLGAFIHPFEKSAKGKEF------------------------ISYFRARPPP--------VPFAAKT-----------AEDFNYLE---FIYFVRHALAHGDLHYNANKIKQI--ESITLWNSKYGEKA----IR-ITLSIRDM--------RVLLLDFKNILEKMF
209921977 -----MGNYSDFETDFIERTLALIDQYNNMIE--GKPFPEQYNYTLT-LNCLLGLIVMPRERA------------------------------VSYLPSDRLT--------PELKAEIGLNESQLP---GEEMNLRE---LIHKMRNSVAHFCVQVESISDARL--VDQIIFKETHGAGR----AY-AIFSAPEL--------LPFLKYYAALLIANM
217979676 -----MGMPTEPLLVIMRRSMANLAFVETHAGPAGP-----YEVTQL-INTFLGALAHPFEAM------------------------------RDDLMALPLA--------DAAVLGWPTINKERPSD-REPASLGD---LIRLMRNGMAHGNLDYLSDGKGQI--HALRVWNTHPRTGAR---TWGTVVPIADV--------RRFLGLFVDLIERRH
225181269 -----MER-QVVEKDFVARTMHILENYD------GP-----YGVTLL-INCLLGLIVLPRERGFNR---------------------------VCHQEGIGFS--------DLGIDPQEICWGRIA---EQEQTASR---FLQCMRNSVAHIKIESISEQGE-I---ESLRFKDQSGFE--------VVMKIEKV--------KELATKLAQYVQ---
228923828 -NISLLWIQECFKPDNQDRKLKDVLSEFITIND-NIN--LYNNPGMLLMASYL-FFVYAKE---------------------------------KDFIGRDYS--------FADTSKFEVLECEKE---KRDSNY-----ICRRIRNALAHSRVHIGE--NGLI------TFEDFKPEGTKRLDYFKCTISYTDF--------GNFISAFYHGVKDRY
229175166 -NISLLWIQECLKPENQNKKVNELLREFLNKNE-NIN---LLNPSVLLMASYL-LFVYTKE---------------------------------KDFNDGDYS--------FVDISKFNVIASRKR---RPDGNY-----ICRRVRNALAHSRVHIDE--SLQI------TFEDSKPDGT---DYFKCVISCVDF--------GNFINNFMFTLKDSY
238916184 SENVTQNEIEKYKKQLEKSLLELREDKNAKISFK-----IGFVYLYA-MNFALRTEDDDYEELK-----------------------------YQELNVSKFK--------YQKENWIQYSQRNKT---QNCLFPRY---IVERMRNSLMHGNIEILLNNKGKI----EFIFRDKYNKRD----EV-ISIILEDL--------EEFLSQKCLYTGIPK
239908249 -------MYTHLHHDFAAKTRANLEFIEKACME-GIP--GTYNATQL-INSLLGMVVFLNEGKL-----------------------------VPAIPFSQLC--------SCEEIQVHLDDN------QDCSKADK---FIQQFRNAIAHCRFQAFG-SKDNI--QSFTMYDQRPKEPI----DWKIDITTQGI--------RDIAFRLVAYVIKNS
256367844 -----MGNYSDFETDFVQRTLALIDQYNEMIEVLGKPFREQYNYTLT-LNCLLGLIVLPKERA------------------------------LSFLPADRLT--------RQLKAEMGLHESQLP---GPEMNLRE---LIHKMRNSVAHFCVQVESASDAHL--VDWIVFRESQEDGE----VY-ASFSAPEL--------LPFLKYYATLLLDNM
270293299 -IEDVSPEKTQNQIKEINKSIRELKEDEDKIV--------GFNFMFP-VLRLLDISLRLEDDD------------------------------LKKISPLSVNIDGFTYEEDNLQKYYQNNSSTINK--RSETKYYY---ILERIRNAIAHGHITTYLDSNSNI----VYKLEDIWNNR--------TEKVEIDY--------DSMINFLEQPIFTER
283783211 RIIDYKIAIDSKKAKMIDRILKSIDELKEDSDSWIE-FRWFFKIIYI-INFSLRLEDTDLESIK-----------------------------YSVLNVDDFEYDSSQ---MALFVKKKISDGTIR---SRDEKFGNTIYILHKIRNAIAHGRIKLEVIDDKVY-----YVFEDCYYKRT----EL-IKIAVENM--------NQFINNVNALIK---
291288929 -----MGNYSDFETDFVQRTLALIDQYNEMIEELGKPFSEQYNYTLT-LNCLLGLIVLPKERA------------------------------LSFLPADRLT--------RQLKAEMGLHESQLP---GPEMNLRQ---LIHKMRNSVAHFCVQVESVSDAHL--VDWIVFRESQGDGD----VY-ASFSAPEL--------LPFLKYYATLLLDNI
313682815 -MGHYPEEKSEFIREFFKRTLHNLHIYLEDQQ--NSKFRYPYDVTQT-INSFLGLIVFLQDSDI-----------------------------VFTQELEDFVE-------AHLPIQWTCFDGNNG---LEEHNFRN---YLKRLRNAVSHRKIKSIPDQNNEI---MALEFRDGKNGG-----CFCAKLSVESV--------NLLITLLSRNILGAQ
329996741 -----MGNYSDFETDFVQRTLALIDQYNEMIEVQGKPFREQYNYTLT-LNCLLGLIVLPKERA------------------------------LSFLPADRLT--------LQLKAEMGLHESQLP---GPEMTLRT---LILKMRNSVAHFSVQVISVSDEHL--VDLIAFRDDPEDEN----AY-ATFSAPEL--------LPFLKYYAAQLLGNM
333378220 -------SIQYFDISFIERTLENLKKYEGK-----------YDFTML-LNSLLGLLVVPNEYNIAKKRRFKYPFLNEKISKFSSIKEIFKNKSYSFLDKDKKEI-------NQYKFRWLDDNKNVLT--INNITLES---FLRRIRNGIAHFGITPVKEDSLWIG-IIIRNYKNREMNME-------VYFEEDEL--------RTFALFIAEKYLETV
58383293 -----MGNYSDFETDFVQRTLALIDQYNEMIEVLGKPFREQYNYTLT-LNCLLGLIVLPKERA------------------------------LSFLLADRLT--------RQLKAEMGLHESQLP---GPEMNLRE---LIHKMRNSVAHFCVQVESASDAHL--VDWIVFRESQKDGE----VY-ASFSAPEL--------LPFLKYYATLLLDNM
78223734 -----QEYFRDFMVE-LNHAFLHLTEINQFDWHDQLDTSDNYELTRFIDQNIHPTYLRLIEAVYSPMLRI-----------------------PAYFSRLKRGKG------TEKLDVFNIVEELKT---SDLNELTVH--YRHVVRNGIAHGGIKFF---DNSI------SYKDKQRNED----VL-SDRTMVNVCDNIIDTCNAIVLAFSVFVIANQ
91203343 ------MDYKQIVRDFAQRTKILINEYKGD-----------YEVTLL-VNCCLGLLVVPKEID------------------------------FKKIPVEVIPE-------KDTLWGLSRESVSVKCK-ECSYVLRD---VIKKIRNGICHFDITSIPDENNQI---EFLVIKDRGGFE--------AKLSVAQL--------KELAISLTDHVYKP-
consensus/100% .........p........p.........................................p...................................b...........................................h...hRpuh.H..hp........h.......hpp....................h..........hh...........
consensus/95% .........p....p...+.b..l.................h...b..h..hl.......-...................................b.....................................h.....hh..hRNulsH..lp........l.......hpp...............b...ph..........hh..h...hb...
consensus/90% .........p....p..p+.b..l..b..............ap..b..hs.hL.hbh..b-...................................h....................b.............p.ph.....hh..hRNuluH..lp........l.......acp...............h...ph..........hh..h...hb...
consensus/85% ........bpp.b.cbhp+ph..lp.bp.............aphsb..hsshL.hhl..bE.................................p.h....hs..............h...p.p.......p.ph.....hhpbhRNulAH.plp.....p..l.......acpp............h.h.h.ph..........hh..h...lb...
consensus/80% ........bpphb.chhp+sh..lpbhp.............aphob..lNshLshhl.sbE................................hp.h.s..hs..............h...p.p.......p.ph.....hlpbhRNulAH.plp....ps.pl.......ac-p..p.........h.hsh.ph..........hl..hs..lb...
consensus/75% .....b..bpphb.-hhpRoh..lpbhp.............aphTh..lNshLshhl.sbE................................hp.h.spphs...........b.bh.h.pspb......p.sh.....hlc+hRNulAH.plph...ps.pl.......ac-p..p.......h.h.hsh.ch..........hl..hs.blb...
consensus/70% .....b..bpphc.-hhpRol..lcbhp.............YshTh..lNshLGlhlhsbE................................hs.lsspphs.........pbb.bh.h.pspb......p.shpp...llc+hRNulAH.plphbs.ps.pl.....b.ac-p..p.......h.hshsh.cl........bshl..hs.blb.pb
Back to Contents
Eukaryotic branches are colored blue, archaeal branches are red, and bacterial branches are green.
Supplementary table S1: organism identifiers used in this work.
| Organism Code | Scientific Name |
|---|---|
| Aaeg | Aedes aegypti |
| Abau | Acinetobacter baumannii |
| Aben | Arthroderma benhamiae |
| Abip | Asticcacaulis biprosthecum |
| Aboo | Aciduliprofundum boonei |
| Acal | Acinetobacter calcoaceticus |
| Acap | Ajellomyces capsulatus |
| Acar | Anolis carolinensis |
| Acel | Acetivibrio cellulolyticus |
| Acit | Acidovorax citrulli |
| Acla | Aspergillus clavatus |
| Acol | Anaerotruncus colihominis |
| Ader | Ajellomyces dermatitidis |
| Afla | Aspergillus flavus |
| Afum | Aspergillus fumigatus |
| Agos | Ashbya gossypii |
| Agyp | Arthroderma gypseum |
| Alai | Albugo laibachii |
| Alon | Acetonema longum |
| Aman | Aurantimonas manganoxydans |
| Amar | Acaryochloris marina |
| Amax | Arthrospira maxima |
| Amed | Amycolatopsis mediterranei |
| Amir | Actinosynnema mirum |
| Aory | Aspergillus oryzae |
| Aota | Arthroderma otae |
| Aput | Alistipes putredinis |
| Aque | Amphimedon queenslandica |
| Asp. | Actinomyces sp. |
| Ater | Aspergillus terreus |
| Aven | Archaeoglobus veneficus |
| Avin | Allochromatium vinosum |
| BP0305phi8-36 | Bacillus phage 0305phi8-36 |
| BP1 | Roseovarius sp. 217 phage 1 |
| BPSP18 | Shigella phage SP18 |
| BPphiAS5 | Aeromonas phage phiAS5 |
| BPphiEF24C | Enterococcus phage phiEF24C |
| Bado | Bifidobacterium adolescentis |
| Bamb | Burkholderia ambifaria |
| Bbre | Brevibacillus brevis |
| Bcel | Bacillus cellulosilyticus |
| Bcen | Burkholderia cenocepacia |
| Bfra | Bacteroides fragilis |
| Bfuc | Botryotinia fuckeliana |
| Bgla | Burkholderia gladioli |
| Bhyo | Brachyspira hyodysenteriae |
| Blat | Brevibacillus laterosporus |
| Bmar | Bacteriovorax marinus |
| Bmar | Bermanella marisrubri |
| Bmar | Blastopirellula marina |
| Bmur | Brachyspira murdochii |
| Bpar | Bordetella parapertussis |
| Bpse | Burkholderia pseudomallei |
| Bsp. | Bacillus sp. |
| Bsub | Brevundimonas subvibrioides |
| Bthu | Bacillus thuringiensis |
| Bubo | Burkholderia ubonensis |
| Bvie | Burkholderia vietnamiensis |
| Bxyl | Bacteroides xylanisolvens |
| CAcc | Candidatus Accumulibacter |
| CKor | Candidatus Koribacter |
| CKue | Candidatus Kuenenia |
| CPor | Candidatus Poribacteria |
| Caci | Catenulispora acidiphila |
| Casp | Clostridium asparagiforme |
| Cbac | Clostridiales bacterium |
| Cbei | Clostridium beijerinckii |
| Cbes | Caldicellulosiruptor bescii |
| Cbol | Clostridium bolteae |
| Ccon | Campylobacter concisus |
| Cdif | Clostridium difficile |
| Cdub | Candida dubliniensis |
| Ceut | Coprococcus eutactus |
| Cfim | Cellulomonas fimi |
| Cfla | Cellulomonas flavigena |
| Cfla | Chthoniobacter flavus |
| Cgin | Capnocytophaga gingivalis |
| Cgla | Candida glabrata |
| Cgle | Chryseobacterium gleum |
| Cglo | Chaetomium globosum |
| Cgra | Campylobacter gracilis |
| Chir | Clostridium hiranonis |
| Chom | Cardiobacterium hominis |
| Cimm | Coccidioides immitis |
| Clju | Clostridium ljungdahlii |
| Clus | Clavispora lusitaniae |
| Cmat | Corynebacterium matruchotii |
| Cmil | Cordyceps militaris |
| Cmit | Catenibacterium mitsuokai |
| Coch | Capnocytophaga ochracea |
| Cowc | Capsaspora owczarzaki |
| Cpin | Chitinophaga pinensis |
| Cpos | Coccidioides posadasii |
| CrVB | Cafeteria roenbergensis virus BV-PW1 |
| Cram | Clostridium ramosum |
| Crem | Caenorhabditis remanei |
| Csp. | Capnocytophaga sp. |
| Csp. | Carnobacterium sp. |
| Csp. | Coprobacillus sp. |
| Csp. | Coprococcus sp. |
| Csp. | Cyanothece sp. |
| Cspu | Capnocytophaga sputigena |
| Ctes | Comamonas testosteroni |
| Cvar | Chlorella variabilis |
| Cvio | Chromobacterium violaceum |
| Cyou | Citrobacter youngae |
| Dace | Desulfobacca acetoxidans |
| Daci | Delftia acidovorans |
| Dalk | Desulfatibacillum alkenivorans |
| Dalk | Dethiobacter alkaliphilus |
| Dbaa | Desulfarculus baarsii |
| Ddes | Deinococcus deserti |
| Dfas | Dictyostelium fasciculatum |
| Dfor | Dorea formicigenerans |
| Dgad | Dysgonomonas gadei |
| Dgri | Drosophila grimshawi |
| Dhan | Debaryomyces hansenii |
| Dmag | Desulfovibrio magneticus |
| Dmar | Deinococcus maricopensis |
| Dmos | Dysgonomonas mossii |
| Dole | Desulfococcus oleovorans |
| Dpro | Deinococcus proteolyticus |
| Dpro | delta proteobacterium |
| Drer | Danio rerio |
| Dsp. | Delftia sp. |
| Dsp. | Dermacoccus sp. |
| Dsp. | Desmospora sp. |
| Dzea | Dickeya zeae |
| Eaer | Enhydrobacter aerosaccus |
| Eaer | Enterobacter aerogenes |
| Ecor | Eikenella corrodens |
| Edis | Entamoeba dispar |
| Eeli | Eubacterium eligens |
| Efer | Escherichia fergusonii |
| Eict | Edwardsiella ictaluri |
| Esab | Eubacterium saburreum |
| Esir | Eubacterium siraeum |
| Esp. | Erythrobacter sp. |
| Esp. | Escherichia sp. |
| Etar | Edwardsiella tarda |
| Faln | Frankia alni |
| Fjoh | Flavobacterium johnsoniae |
| Foxy | Fusarium oxysporum |
| Fper | Fusobacterium periodonticum |
| Fpla | Ferroglobus placidus |
| Fpra | Faecalibacterium prausnitzii |
| Fpsy | Flavobacterium psychrophilum |
| Fsp. | Frankia sp. |
| Fsp. | Fusobacterium sp. |
| Fsuc | Fibrobacter succinogenes |
| Gbem | Geobacter bemidjiensis |
| Gdia | Gluconacetobacter diazotrophicus |
| Ggra | Glomerella graminicola |
| Ghan | Gluconacetobacter hansenii |
| Glov | Geobacter lovleyi |
| Gmax | Glycine max |
| Gobs | Gemmata obscuriglobus |
| Gobs | Geodermatophilus obscurus |
| Gpro | gamma proteobacterium |
| Gvag | Gardnerella vaginalis |
| Haur | Herpetosiphon aurantiacus |
| Hbut | Hyperthermus butylicus |
| Hche | Hahella chejuensis |
| Hfil | Holdemania filiformis |
| Hhyd | Halanaerobium hydrogeniformans |
| Hhyd | Haliscomenobacter hydrossis |
| Hmar | Haloarcula marismortui |
| Hoch | Haliangium ochraceum |
| Htur | Haloterrigena turkmenica |
| Hwin | Helicobacter winghamensis |
| Iagg | Ignisphaera aggregans |
| Ihos | Ignicoccus hospitalis |
| IiV6 | Invertebrate iridescent virus 6 |
| Ipol | Ilyobacter polytropus |
| Jsp. | Jannaschia sp. |
| Kalg | Kordia algicida |
| Kfla | Kribbella flavida |
| Klac | Kluyveromyces lactis |
| Kora | Kingella oralis |
| Kpas | Komagataella pastoris |
| Kpne | Klebsiella pneumoniae |
| Krac | Ktedonobacter racemifer |
| Kset | Kitasatospora setae |
| Ksp. | Klebsiella sp. |
| LV | Lausannevirus |
| Lagg | Labrenzia aggregata |
| Lbac | Lachnospiraceae bacterium |
| Lbic | Laccaria bicolor |
| Lbra | Leishmania braziliensis |
| Lbre | Lactobacillus brevis |
| Lbuc | Leptotrichia buccalis |
| Lelo | Lodderomyces elongisporus |
| Lgoo | Leptotrichia goodfellowii |
| Lhof | Leptotrichia hofstadii |
| Linf | Leishmania infantum |
| Lmac | Leptosphaeria maculans |
| Lsp. | Lyngbya sp. |
| Lthe | Lachancea thermotolerans |
| Lult | Lactobacillus ultunensis |
| MV | Marseillevirus |
| Macr | Metarhizium acridum |
| Mact | marine actinobacterium |
| Madh | Marinobacter adhaerens |
| Mani | Metarhizium anisopliae |
| Maur | Micromonospora aurantiaca |
| Mcht | Microcoleus chthonoplastes |
| Mcon | Methanosaeta concilii |
| Mext | Methylobacterium extorquens |
| Mful | Myxococcus fulvus |
| Mgam | marine gamma |
| Mglo | Malassezia globosa |
| Mgui | Meyerozyma guilliermondii |
| Mkan | Methanopyrus kandleri |
| Mlar | Melampsora larici-populina |
| Mmah | Methanohalophilus mahii |
| Mmar | Microscilla marina |
| Mmet | Methylomonas methanica |
| Mmul | Macaca mulatta |
| Mory | Magnaporthe oryzae |
| Mpal | Mucilaginibacter paludis |
| Mpet | Methylibium petroleiphilum |
| Mpho | Microlunatus phosphovorus |
| Mrum | Methanobrevibacter ruminantium |
| Msil | Methylocella silvestris |
| Msp. | Marinobacter sp. |
| Msp. | Micromonas sp. |
| Msp. | Micromonospora sp. |
| Msp. | Moritella sp. |
| Msta | Methanosphaera stadtmanae |
| Mthe | Methanosaeta thermophila |
| Mtri | Methylosinus trichosporium |
| Mtun | Methylobacter tundripaludum |
| Mvag | Microcoleus vaginatus |
| Mzhi | Methanosalsum zhilinae |
| Nabi | Neodiprion abietis |
| Nbac | Nocardioidaceae bacterium |
| Ndas | Nocardiopsis dassonvillei |
| Nelo | Neisseria elongata |
| Nfis | Neosartorya fischeri |
| Nfla | Neisseria flavescens |
| Nhae | Nectria haematococca |
| Nhal | Nitrosococcus halophilus |
| Nmar | Nitrosopumilus maritimus |
| Nmul | Nakamurella multipartita |
| Nspu | Nodularia spumigena |
| Nsub | Neisseria subflava |
| Ntet | Neurospora tetrasperma |
| Nvit | Nasonia vitripennis |
| Oant | Octadecabacter antarcticus |
| Obat | Oceanicola batsensis |
| Oluc | Ostreococcus lucimarinus |
| Omor | Osmerus mordax |
| Osp. | Oribacterium sp. |
| Osp. | Oscillatoria sp. |
| Oter | Opitutus terrae |
| Otri | Oscillochloris trichoides |
| Pans | Podospora anserina |
| Parc | Psychrobacter arcticus |
| Pars | Pyrobaculum arsenaticum |
| Pbra | Paracoccidioides brasiliensis |
| Pbra | Planctomyces brasiliensis |
| Pcal | Pyrobaculum calidifontis |
| Pcap | Pseudoflavonifractor capillosus |
| Pcar | Pectobacterium carotovorum |
| Pchr | Penicillium chrysogenum |
| Pcry | Psychrobacter cryohalolentis |
| Pcur | Paenibacillus curdlanolyticus |
| Pent | Pseudomonas entomophila |
| Pgra | Puccinia graminis |
| Pisl | Pyrobaculum islandicum |
| Plav | Parvibaculum lavamentivorans |
| Plim | Planctomyces limnophilus |
| Pmar | Penicillium marneffei |
| Pmar | Perkinsus marinus |
| Pmar | Planctomyces maris |
| Pmen | Pseudomonas mendocina |
| Pmir | Proteus mirabilis |
| Pori | Prevotella oris |
| Ppac | Plesiocystis pacifica |
| Ppal | Polysphondylium pallidum |
| Ppar | Pedosphaera parvula |
| Ppen | Proteus penneri |
| Ppol | Paenibacillus polymyxa |
| Prum | Prevotella ruminicola |
| Prus | Providencia rustigianii |
| Psit | Picea sitchensis |
| Psp. | Paenibacillus sp. |
| Psp. | Psychrobacter sp. |
| Psp. | Pusillimonas sp. |
| Psuc | Phascolarctobacterium succinatutens |
| Psyr | Pseudomonas syringae |
| Ptim | Prevotella timonensis |
| Ptor | Psychroflexus torquis |
| Ptri | Pyrenophora tritici-repentis |
| Pver | Prevotella veroralis |
| Ralb | Ruminococcus albus |
| Rbal | Rhodopirellula baltica |
| Rbro | Raphidiopsis brookii |
| Rcas | Roseiflexus castenholzii |
| Rden | Rothia dentocariosa |
| Retl | Rhizobium etli |
| Rfla | Ruminococcus flavefaciens |
| Rgna | Ruminococcus gnavus |
| Rint | Roseburia intestinalis |
| Rleg | Rhizobium leguminosarum |
| Rpic | Ralstonia pickettii |
| Rsli | Runella slithyformis |
| Rsp. | Rahnella sp. |
| Rsp. | Roseibium sp. |
| Rsp. | Roseiflexus sp. |
| Rsp. | Roseobacter sp. |
| Rsp. | Ruegeria sp. |
| Salb | Streptomyces albus |
| Sare | Salinispora arenicola |
| Saur | Stigmatella aurantiaca |
| Sbin | Streptomyces bingchenggensis |
| Scar | Staphylococcus carnosus |
| Scel | Sorangium cellulosum |
| Scla | Streptomyces clavuligerus |
| Scom | Schizophyllum commune |
| Sdeg | Saccharophagus degradans |
| Sfla | Streptomyces flavogriseus |
| Sfum | Syntrophobacter fumaroxidans |
| Sgha | Streptomyces ghanaensis |
| Sgri | Streptomyces griseoaurantiacus |
| Sgri | Streptomyces griseoflavus |
| Sgri | Streptomyces griseus |
| Shel | Slackia heliotrinireducens |
| Shim | Streptomyces himastatinicus |
| Sinv | Solenopsis invicta |
| Sjap | Schistosoma japonicum |
| Sjap | Schizosaccharomyces japonicus |
| Skow | Saccoglossus kowalevskii |
| Skuj | Sulfuricurvum kujiense |
| Slac | Serpula lacrymans |
| Slin | Spirosoma linguale |
| Slip | Syntrophothermus lipocalidus |
| Sliv | Streptomyces lividans |
| Smar | Staphylothermus marinus |
| Snas | Stackebrandtia nassauensis |
| Spar | Streptococcus parasanguinis |
| Spri | Streptomyces pristinaespiralis |
| Sput | Shewanella putrefaciens |
| Sros | Streptomyces roseosporus |
| Sros | Streptosporangium roseum |
| Ssan | Streptococcus sanguinis |
| Ssat | Shuttleworthia satelles |
| Ssca | Streptomyces scabiei |
| Sscl | Sclerotinia sclerotiorum |
| Ssp. | Salpingoeca sp. |
| Ssp. | Sphingomonas sp. |
| Ssp. | Streptococcus sp. |
| Ssp. | Streptomyces sp. |
| Ssti | Scheffersomyces stipitis |
| Ssvi | Streptomyces sviceus |
| Ster | Sebaldella termitidis |
| Stro | Salinispora tropica |
| Sven | Streptomyces venezuelae |
| Svio | Streptomyces violaceusniger |
| Svir | Streptomyces viridochromogenes |
| Taqu | Thermus aquaticus |
| Tbac | Thermotogales bacterium |
| Tbar | Thermococcus barophilus |
| Tbru | Trypanosoma brucei |
| Tcas | Tribolium castaneum |
| Tcur | Thermomonospora curvata |
| Tden | Thiobacillus denitrificans |
| Tmel | Tuber melanosporum |
| Tree | Trichoderma reesei |
| Trub | Trichophyton rubrum |
| Tsp. | Thauera sp. |
| Tsti | Talaromyces stipitatus |
| Tsul | Thioalkalivibrio sulfidophilus |
| Tthe | Tetrahymena thermophila |
| Tton | Trichophyton tonsurans |
| Ttur | Teredinibacter turnerae |
| Tvag | Trichomonas vaginalis |
| Tver | Trichophyton verrucosum |
| UDes | uncultured Desulfobacterium |
| Umet | uncultured methanogenic |
| Uree | Uncinocarpus reesii |
| Valb | Verticillium albo-atrum |
| Vbac | Vibrionales bacterium |
| Vdis | Vulcanisaeta distributa |
| Vhar | Vibrio harveyi |
| Vmar | Verrucosispora maris |
| Vpar | Variovorax paradoxus |
| Vpol | Vanderwaltozyma polyspora |
| Vspi | Verrucomicrobium spinosum |
| Vspl | Vibrio splendidus |
| X(Si | Xenopus (Silurana) |
| Xfus | Xanthomonas fuscans |
| Xnem | Xenorhabdus nematophila |
| Xper | Xanthomonas perforans |
| Xves | Xanthomonas vesicatoria |
| Ylip | Yarrowia lipolytica |
| Zmob | Zymomonas mobilis |
| Zrou | Zygosaccharomyces rouxii |
Supplementary table S2: sequence accession numbers.
| gi | accession | identifier |
|---|---|---|
| 153817467 | ZP_01970134 | A5C_A0388_Vcho_153817467 |
| 169634335 | YP_001708071 | ABSDF2913_Abau_169634335 |
| 184156423 | YP_001844762 | ACICU_00103_Abau_184156423 |
| 158335874 | YP_001517048 | AM1_2731_Amar_158335874 |
| 158336844 | YP_001518018 | AM1_3712_Amar_158336844 |
| 300783556 | YP_003763847 | AMED_1633_Amed_300783556 |
| 167769817 | ZP_02441870 | ANACOL_01151_Acol_167769817 |
| 303238852 | ZP_07325383 | AceceDRAFT_0731_Acel_303238852 |
| 303240378 | ZP_07326896 | AceceDRAFT_2244_Acel_303240378 |
| 256377585 | YP_003101245 | Amir_3505_Amir_256377585 |
| 226314127 | YP_002774023 | BBR47_45420_Bbre_226314127 |
| 30022569 | NP_834200 | BC4488_Bcer_30022569 |
| 206563730 | YP_002234493 | BCAM1881_Bcen_206563730 |
| 225619532 | YP_002720789 | BHWA1_00589_Bhyo_225619532 |
| 301167374 | CBW26956 | BMS_2150_Bmar_301167374 |
| 295087466 | CBK68989 | BXY_40670_Bxyl_295087466 |
| 134288349 | YP_001110512 | Bcep1808_6822_Bvie_134288349 |
| 255010211 | ZP_05282337 | Bfra3_010100013815_Bfra_255010211 |
| 296125416 | YP_003632668 | Bmur_0365_Bmur_296125416 |
| 302383816 | YP_003819639 | Bresu_2709_Bsub_302383816 |
| 212646224 | NP_507592 | C08E8.4_Cele_212646224 |
| 257460202 | ZP_05625306 | CAMGR0001_0616_Cgra_257460202 |
| 257093308 | YP_003166949 | CAP2UW1_1710_CAcc_257093308 |
| 239627871 | ZP_04670902 | CBFG_01593_Cbac_239627871 |
| 157165319 | YP_001467147 | CCC13826_2022_Ccon_157165319 |
| 295094771 | CBK83862 | CCU_25310_Csp._295094771 |
| 283836396 | ZP_06356137 | CIT292_10857_Cyou_283836396 |
| 225020576 | ZP_03709768 | CORMATOL_00583_Cmat_225020576 |
| 110802054 | YP_697488 | CPR_0151_Cper_110802054 |
| 282897552 | ZP_06305552 | CRD_01664_Rbro_282897552 |
| 256392113 | YP_003113677 | Caci_2927_Caci_256392113 |
| 256393748 | YP_003115312 | Caci_4610_Caci_256393748 |
| 256395008 | YP_003116572 | Caci_5873_Caci_256395008 |
| 150018370 | YP_001310624 | Cbei_3546_Cbei_150018370 |
| 256419128 | YP_003119781 | Cpin_0074_Cpin_256419128 |
| 220905714 | YP_002481025 | Cyan7425_0270_Csp._220905714 |
| 307153746 | YP_003889130 | Cyan7822_3925_Csp._307153746 |
| 66812724 | XP_640541 | DDB_G0281625_Ddis_66812724 |
| 66810169 | XP_638808 | DDB_G0283925_Ddis_66810169 |
| 330798615 | XP_003287347 | DICPUDRAFT_22458_Dpur_330798615 |
| 330802814 | XP_003289408 | DICPUDRAFT_35661_Dpur_330802814 |
| 330843562 | XP_003293720 | DICPUDRAFT_42446_Dpur_330843562 |
| 330846708 | XP_003295151 | DICPUDRAFT_85573_Dpur_330846708 |
| 166032191 | ZP_02235020 | DORFOR_01894_Dfor_166032191 |
| 15806282 | NP_294987 | DR_1263_Drad_15806282 |
| 160901192 | YP_001566774 | Daci_5761_Daci_160901192 |
| 320334379 | YP_004171090 | Deima_1776_Dmar_320334379 |
| 325284428 | YP_004256968 | Deipr_2488_Dpro_325284428 |
| 149186578 | ZP_01864890 | ED21_31874_Esp._149186578 |
| 158079465 | YP_001504278 | EFP_gp169_BPphiEF24C_158079465 |
| 67472915 | XP_652245 | EHI_017590_Ehis_67472915 |
| 170684265 | YP_001745340 | EcSMS35_3361_Ecol_170684265 |
| 298707265 | CBJ25892 | Esi_0017_0056_Esil_298707265 |
| 298714411 | CBJ27468 | Esi_0071_0113_Esil_298714411 |
| 298711392 | CBJ32535 | Esi_0345_0025_Esil_298711392 |
| 32565136 | NP_498956 | F44E2.8_Cele_32565136 |
| 46111757 | XP_382936 | FG02760.1_Gzea_46111757 |
| 150026339 | YP_001297165 | FP2309_Fpsy_150026339 |
| 295103146 | CBL00690 | FPR_02440_Fpra_295103146 |
| 111221771 | YP_712565 | FRAAL2340_Faln_111221771 |
| 237744336 | ZP_04574817 | FSDG_00336_Fsp._237744336 |
| 261415758 | YP_003249441 | Fisuc_1361_Fsuc_261415758 |
| 146298513 | YP_001193104 | Fjoh_0750_Fjoh_146298513 |
| 288920206 | ZP_06414521 | FrEUN1fDRAFT_4219_Fsp._288920206 |
| 312200713 | YP_004020774 | FraEuI1c_6936_Fsp._312200713 |
| 237813318 | YP_002897769 | GBP346_A3087_Bpse_237813318 |
| 291459520 | ZP_06598910 | GCWU000341_01684_Osp._291459520 |
| 229828516 | ZP_04454585 | GCWU000342_00580_Ssat_229828516 |
| 119476904 | ZP_01617185 | GP2143_10137_Mgam_119476904 |
| 254482777 | ZP_05096014 | GPB2148_1261_Mgam_254482777 |
| 296414614 | XP_002836993 | GSTUM_00003347001_Tmel_296414614 |
| 296424705 | XP_002841887 | GSTUM_00011304001_Tmel_296424705 |
| 261410041 | YP_003246282 | GYMC10_6272_Psp._261410041 |
| 197117872 | YP_002138299 | Gbem_1485_Gbem_197117872 |
| 189425639 | YP_001952816 | Glov_2583_Glov_189425639 |
| 168698168 | ZP_02730445 | GobsU_010100001512_Gobs_168698168 |
| 168699662 | ZP_02731939 | GobsU_010100009074_Gobs_168699662 |
| 168700969 | ZP_02733246 | GobsU_010100015693_Gobs_168700969 |
| 168704676 | ZP_02736953 | GobsU_010100034385_Gobs_168704676 |
| 154278399 | XP_001540013 | HCAG_05480_Acap_154278399 |
| 83646809 | YP_435244 | HCH_04109_Hche_83646809 |
| 83647036 | YP_435471 | HCH_04340_Hche_83647036 |
| 83649602 | YP_438037 | HCH_06997_Hche_83649602 |
| 262281016 | ZP_06058799 | HMPREF0012_02967_Acal_262281016 |
| 258545510 | ZP_05705744 | HMPREF0198_1779_Chom_258545510 |
| 300774513 | ZP_07084376 | HMPREF0204_10236_Cgle_300774513 |
| 299141967 | ZP_07035101 | HMPREF0665_01551_Pori_299141967 |
| 315224011 | ZP_07865852 | HMPREF1977_0666_Coch_315224011 |
| 326335654 | ZP_08201841 | HMPREF9071_1307_Csp._326335654 |
| 325690155 | EGD32159 | HMPREF9382_1113_Ssan_325690155 |
| 325694076 | EGD35994 | HMPREF9383_1770_Ssan_325694076 |
| 319937960 | ZP_08012360 | HMPREF9488_03196_Csp._319937960 |
| 223985602 | ZP_03635653 | HOLDEFILI_02959_Hfil_223985602 |
| 311695670 | ADP98543 | HP15_2779_Madh_311695670 |
| 237752248 | ZP_04582728 | HWAG_01373_Hwin_237752248 |
| 159896886 | YP_001543133 | Haur_0354_Haur_159896886 |
| 15078868 | NP_149618 | IIV6gp151_IiV6_15078868 |
| 310778851 | YP_003967184 | Ilyop_1055_Ipol_310778851 |
| 89055288 | YP_510739 | Jann_2797_Jsp._89055288 |
| 163754439 | ZP_02161561 | KAOT1_16128_Kalg_163754439 |
| 311894452 | BAJ26860 | KSE_10250_Kset_311894452 |
| 311895942 | BAJ28350 | KSE_25370_Kset_311895942 |
| 284029681 | YP_003379612 | Kfla_1718_Kfla_284029681 |
| 48696395 | YP_024435 | KgORF4_BPK_48696395 |
| 119486659 | ZP_01620709 | L8106_12950_Lsp._119486659 |
| 170107053 | XP_001884737 | LACBIDRAFT_252516_Lbic_170107053 |
| 170117768 | XP_001890069 | LACBIDRAFT_316770_Lbic_170117768 |
| 170095960 | XP_001879200 | LACBIDRAFT_318005_Lbic_170095960 |
| 327409634 | YP_004347054 | LAU_0089_LV_327409634 |
| 217965001 | YP_002350679 | LMHCC_1724_Lmon_217965001 |
| 217965272 | YP_002350950 | LMHCC_1997_Lmon_217965272 |
| 72168255 | XP_793312 | LOC588539_Spur_72168255 |
| 154331017 | XP_001561948 | LbrM06_V2.0110_Lbra_154331017 |
| 146070759 | XP_001463095 | LINJ_06_0130_Linf_146070759 |
| 124010457 | ZP_01695096 | M23134_00353_Mmar_124010457 |
| 124004845 | ZP_01689688 | M23134_02260_Mmar_124004845 |
| 124004851 | ZP_01689694 | M23134_02266_Mmar_124004851 |
| 124009340 | ZP_01694019 | M23134_07250_Mmar_124009340 |
| 284504143 | YP_003406858 | MAR_ORF111_MV_284504143 |
| 254412559 | ZP_05026333 | MC7420_6514_Mcht_254412559 |
| 254413191 | ZP_05026962 | MC7420_678_Mcht_254413191 |
| 238062132 | ZP_04606841 | MCAG_03098_Msp._238062132 |
| 330502141 | YP_004379010 | MDS_1227_Pmen_330502141 |
| 164657874 | XP_001730063 | MGL_3049_Mglo_164657874 |
| 315054313 | XP_003176531 | MGYG_00619_Agyp_315054313 |
| 108762267 | YP_633480 | MXAN_5330_Mxan_108762267 |
| 240141986 | YP_002966496 | MexAM1_META2p0262_Mext_240141986 |
| 302868047 | YP_003836684 | Micau_3582_Maur_302868047 |
| 117924481 | YP_865098 | Mmc1_1181_Masp_117924481 |
| 124262828 | YP_001023298 | Mpe_B0288_Mpet_124262828 |
| 84489297 | YP_447529 | Msp_0486_Msta_84489297 |
| 119509756 | ZP_01628901 | N9414_00365_Nspu_119509756 |
| 290996214 | XP_002680677 | NAEGRDRAFT_31151_Ngru_290996214 |
| 290996009 | XP_002680575 | NAEGRDRAFT_31328_Ngru_290996009 |
| 290990814 | XP_002678031 | NAEGRDRAFT_36485_Ngru_290990814 |
| 290997341 | XP_002681240 | NAEGRDRAFT_46602_Ngru_290997341 |
| 326330475 | ZP_08196783 | NBCG_01909_Nbac_326330475 |
| 302884348 | XP_003041070 | NECHADRAFT_29138_Nhae_302884348 |
| 261381097 | ZP_05985670 | NEISUBOT_05210_Nsub_261381097 |
| 301059840 | ZP_07200732 | NPH_6632_Dpro_301059840 |
| 258651665 | YP_003200821 | Namu_1431_Nmul_258651665 |
| 297563442 | YP_003682416 | Ndas_4523_Ndas_297563442 |
| 254453984 | ZP_05067421 | OA238_4610_Oant_254453984 |
| 156564215 | YP_001429725 | ORF234_BP0305phi8-36_156564215 |
| 300866977 | ZP_07111648 | OSCI_3190004_Osp._300866977 |
| 309791192 | ZP_07685724 | OSCT_1675_Otri_309791192 |
| 145348536 | XP_001418703 | OSTLU_35648_Oluc_145348536 |
| 149908726 | ZP_01897387 | PE36_21039_Msp._149908726 |
| 70733106 | YP_262879 | PFL_5821_Pflu_70733106 |
| 149175186 | ZP_01853808 | PM8797T_20343_Pmar_149175186 |
| 149176205 | ZP_01854821 | PM8797T_29763_Pmar_149176205 |
| 212541268 | XP_002150789 | PMAA_059590_Pmar_212541268 |
| 308069201 | YP_003870806 | PPE_02438_Ppol_308069201 |
| 281209628 | EFA83796 | PPL_02864_Ppal_281209628 |
| 226326967 | ZP_03802485 | PROPEN_00827_Ppen_226326967 |
| 294673111 | YP_003573727 | PRU_0345_Prum_294673111 |
| 294673143 | YP_003573759 | PRU_0382_Prum_294673143 |
| 152987782 | YP_001348410 | PSPA7_3050_Paer_152987782 |
| 152985284 | YP_001350552 | PSPA7_5219_Paer_152985284 |
| 330874307 | EGH08456 | PSYMP_06728_Psyr_330874307 |
| 332285914 | YP_004417825 | PT7_2661_Psp._332285914 |
| 189204778 | XP_001938724 | PTRG_08392_Ptri_189204778 |
| 326434983 | EGD80553 | PTSG_01145_Ssp._326434983 |
| 304407843 | ZP_07389494 | PaecuDRAFT_4172_Pcur_304407843 |
| 255940726 | XP_002561132 | Pc16g08100_Pchr_255940726 |
| 93005719 | YP_580156 | Pcryo_0891_Pcry_93005719 |
| 325107565 | YP_004268633 | Plabr_0990_Pbra_325107565 |
| 296122446 | YP_003630224 | Plim_2199_Plim_296122446 |
| 294875527 | XP_002767363 | Pmar_PMAR024558_Pmar_294875527 |
| 148652988 | YP_001280081 | PsycPRwf_1182_Psp._148652988 |
| 71064897 | YP_263624 | Psyc_0321_Parc_71064897 |
| 71065404 | YP_264131 | Psyc_0844_Parc_71065404 |
| 311978014 | YP_003987134 | R617_APMV_311978014 |
| 94501287 | ZP_01307808 | RED65_02704_Bmar_94501287 |
| 291535823 | CBL08935 | ROI_18700_Rint_291535823 |
| 240146453 | ZP_04745054 | ROSINTL182_08410_Rint_240146453 |
| 240147581 | ZP_04746182 | ROSINTL182_09631_Rint_240147581 |
| 154503599 | ZP_02040659 | RUMGNA_01423_Rgna_154503599 |
| 268609453 | ZP_06143180 | RflaF_010100008155_Rfla_268609453 |
| 241589866 | YP_002979891 | Rpic12D_5003_Rpic_241589866 |
| 317056301 | YP_004104768 | Rumal_1634_Ralb_317056301 |
| 259416444 | ZP_05740364 | SCH4B_1850_Sisp_259416444 |
| 302674848 | XP_003027108 | SCHCODRAFT_258659_Scom_302674848 |
| 302674850 | XP_003027109 | SCHCODRAFT_258660_Scom_302674850 |
| 302693411 | XP_003036384 | SCHCODRAFT_36431_Scom_302693411 |
| 302783817 | XP_002973681 | SELMODRAFT_413953_Smoe_302783817 |
| 329936685 | ZP_08286392 | SGM_1884_Sgri_329936685 |
| 156053544 | XP_001592698 | SS1G_05618_Sscl_156053544 |
| 125718681 | YP_001035814 | SSA_1883_Ssan_125718681 |
| 291448123 | ZP_06587513 | SSGG_05341_Sros_291448123 |
| 302558106 | ZP_07310448 | SSRG_01621_Sgri_302558106 |
| 170078553 | YP_001735191 | SYNPCC7002_A1948_Syn_170078553 |
| 224477787 | YP_002635393 | Sca_2305_Scar_224477787 |
| 90020054 | YP_525881 | Sde_0405_Sdeg_90020054 |
| 284036735 | YP_003386665 | Slin_1821_Slin_284036735 |
| 239939813 | ZP_04691750 | SrosN15_010100002350_Sros_239939813 |
| 271963927 | YP_003338123 | Sros_2401_Sros_271963927 |
| 269121732 | YP_003309909 | Sterm_3136_Ster_269121732 |
| 17564644 | NP_503984 | T24A6.7_Cele_17564644 |
| 254787804 | YP_003075233 | TERTU_3943_Ttur_254787804 |
| 99081738 | YP_613892 | TM1040_1897_Rsp._99081738 |
| 242799239 | XP_002483337 | TSTA_012120_Tsti_242799239 |
| 118370894 | XP_001018647 | TTHERM_00289300_Tthe_118370894 |
| 118401008 | XP_001032825 | TTHERM_00486130_Tthe_118401008 |
| 118397133 | XP_001030901 | TTHERM_00998900_Tthe_118397133 |
| 123462122 | XP_001316875 | TVAG_227690_Tvag_123462122 |
| 72391614 | XP_846101 | Tb927.7.4780_Tbru_72391614 |
| 71654521 | XP_815878 | Tc00.1047053507521.60_Tcru_71654521 |
| 269124625 | YP_003297995 | Tcur_0355_Tcur_269124625 |
| 113476072 | YP_722133 | Tery_2448_Tery_113476072 |
| 220934941 | YP_002513840 | Tgr7_1771_Tsul_220934941 |
| 84392320 | ZP_00991747 | V12B01_14190_Vspl_84392320 |
| 330468357 | YP_004406100 | VAB18032_22000_Vmar_330468357 |
| 269960099 | ZP_06174476 | VME_08600_Vhar_269960099 |
| 28899861 | NP_799516 | VPA0006_Vpar_28899861 |
| 148975384 | ZP_01812308 | VSWAT3_18363_Vbac_148975384 |
| 171913880 | ZP_02929350 | VspiD_010100021915_Vspi_171913880 |
| 294664143 | ZP_06729532 | XAUC_02590_Xfus_294664143 |
| 300723771 | YP_003713078 | XNC1_2895_Xnem_300723771 |
| 82407990 | 2b3wA | _Ecol_82407990 |
| 308516893 | CBW46998 | _BP1_308516893 |
| 154487137 | ZP_02028544 | _Bado_154487137 |
| 33601359 | NP_888919 | _Bbro_33601359 |
| 33595978 | NP_883621 | _Bpar_33595978 |
| 221067792 | ZP_03543897 | _Ctes_221067792 |
| 160945657 | ZP_02092883 | _Fpra_160945657 |
| 160945914 | ZP_02093140 | _Fpra_160945914 |
| 238022350 | ZP_04602776 | _Kora_238022350 |
| 298249651 | ZP_06973455 | _Krac_298249651 |
| 298250178 | ZP_06973982 | _Krac_298250178 |
| 32471506 | NP_864499 | _Rbal_32471506 |
| 17232521 | NP_489069 | all5029_Ana_17232521 |
| 229129773 | ZP_04258740 | bcere0015_42140_Bcer_229129773 |
| 330822167 | YP_004350995 | bgla_2p0770_Bgla_330822167 |
| 330818849 | YP_004351066 | bgla_3p0420_Bgla_330818849 |
| 330814539 | YP_004362714 | bgla_4p0890_Bgla_330814539 |
| 228982721 | ZP_04142980 | bthur0002_58540_Bthu_228982721 |
| 308814565 | YP_003934839 | gp30.3_BPSP18_308814565 |
| 288561223 | YP_003424709 | mru_1967_Mrum_288561223 |
| 325680741 | ZP_08160279 | nadE_Ralb_325680741 |
| 60461911 | YP_209629 | pIL105p2_Llac_60461911 |
| 310722519 | YP_003969342 | phiAS5_ORF0053_BPphiAS5_310722519 |
| 162451636 | YP_001614003 | sce3364_Scel_162451636 |
| 22300007 | NP_683254 | tlr2465_Telo_22300007 |
| 300869472 | ZP_07114055 | ybiA_Osp._300869472 |
| 311112847 | YP_003984069 | ybiA_Rden_311112847 |
| 296876279 | ZP_06900331 | ybiA_Spar_296876279 |
| 325693558 | EGD35477 | ybiA_Ssan_325693558 |
| 104779561 | YP_606059 | PSEEN0279_Pent_104779561 |
| 104779562 | YP_606060 | PSEEN0280_Pent_104779562 |
| 10639263 | CAC11265 | Ta0118_Taci_10639263 |
| 107099046 | ZP_01362964 | PaerPA_01000055_Paer_107099046 |
| 108763108 | YP_634797 | MXAN_6680_Mxan_108763108 |
| 110638931 | YP_679140 | kptA_Chut_110638931 |
| 110639136 | YP_679345 | CHU_2753_Chut_110639136 |
| 110645302 | YP_667941 | NANV_gp93_Nabi_110645302 |
| 110800227 | YP_694609 | kptA_Cper_110800227 |
| 113473935 | YP_718198 | ORF258_Ssp._113473935 |
| 11499148 | NP_070382 | AF1553_Aful_11499148 |
| 115387213 | XP_001211112 | ATEG_01934_Ater_115387213 |
| 116192183 | XP_001221904 | CHGG_05809_Cglo_116192183 |
| 116252353 | YP_768191 | kptA_Rleg_116252353 |
| 116495334 | YP_807068 | LSEI_1867_Lcas_116495334 |
| 116748284 | YP_844971 | Sfum_0839_Sfum_116748284 |
| 116754706 | YP_843824 | Mthe_1409_Mthe_116754706 |
| 118362535 | XP_001014494 | TTHERM_00854280_Tthe_118362535 |
| 118430933 | NP_147045 | kptA_Aper_118430933 |
| 118591032 | ZP_01548432 | SIAM614_20266_Lagg_118591032 |
| 119193120 | XP_001247166 | CIMG_00937_Cimm_119193120 |
| 119477262 | ZP_01617498 | GP2143_03029_Mgam_119477262 |
| 119483244 | ZP_01618658 | L8106_04306_Lsp._119483244 |
| 119497805 | XP_001265660 | NFIA_033290_Nfis_119497805 |
| 119498195 | XP_001265855 | NFIA_035260_Nfis_119498195 |
| 119871538 | YP_929545 | Pisl_0018_Pisl_119871538 |
| 120608868 | YP_968546 | Aave_0160_Acit_120608868 |
| 121719366 | XP_001276382 | ACLA_003690_Acla_121719366 |
| 124002565 | ZP_01687418 | M23134_05268_Mmar_124002565 |
| 124002814 | ZP_01687666 | M23134_04262_Mmar_124002814 |
| 124003655 | ZP_01688504 | M23134_03314_Mmar_124003655 |
| 124004042 | ZP_01688889 | M23134_05434_Mmar_124004042 |
| 124007251 | ZP_01691959 | M23134_04698_Mmar_124007251 |
| 124007793 | ZP_01692495 | M23134_01690_Mmar_124007793 |
| 124028223 | YP_001013543 | Hbut_1373_Hbut_124028223 |
| 125717421 | YP_001034554 | SSA_0561_Ssan_125717421 |
| 125718682 | YP_001035815 | SSA_1884_Ssan_125718682 |
| 126131670 | XP_001382360 | PICST_56016_Ssti_126131670 |
| 126460155 | YP_001056433 | Pcal_1549_Pcal_126460155 |
| 126465464 | YP_001040573 | Smar_0558_Smar_126465464 |
| 126652604 | ZP_01724768 | BB14905_19555_Bsp._126652604 |
| 126667035 | ZP_01738010 | MELB17_05794_Msp._126667035 |
| 126740444 | ZP_01756132 | RSK20926_16597_Rsp._126740444 |
| 13470984 | NP_102553 | msr0834_Mlot_13470984 |
| 13470985 | NP_102554 | msr0835_Mlot_13470985 |
| 145493555 | XP_001432773 | GSPATT00034855001_Ptet_145493555 |
| 145591275 | YP_001153277 | Pars_1047_Pars_145591275 |
| 145595385 | YP_001159682 | Strop_2864_Stro_145595385 |
| 145596643 | YP_001160940 | Strop_4133_Stro_145596643 |
| 145602059 | XP_001403403 | MGG_12911_Mory_145602059 |
| 146294612 | YP_001185036 | Sputcn32_3528_Sput_146294612 |
| 146298511 | YP_001193102 | Fjoh_0748_Fjoh_146298511 |
| 146305602 | YP_001186067 | Pmen_0565_Pmen_146305602 |
| 146341856 | YP_001206904 | BRADO4987_Brad_146341856 |
| 146417847 | XP_001484891 | PGUG_02620_Mgui_146417847 |
| 147919656 | YP_686600 | kptA_Umet_147919656 |
| 148256740 | YP_001241325 | BBta_5454_Brad_148256740 |
| 148654473 | YP_001274678 | RoseRS_0296_Rsp._148654473 |
| 148821249 | YP_001286003 | TBFG_10058_Mtub_148821249 |
| 148907021 | ABR16654 | _Psit_148907021 |
| 149173583 | ZP_01852213 | PM8797T_22603_Pmar_149173583 |
| 149175185 | ZP_01853807 | PM8797T_20338_Pmar_149175185 |
| 149186577 | ZP_01864889 | ED21_31869_Esp._149186577 |
| 149246000 | XP_001527470 | LELG_02299_Lelo_149246000 |
| 149919906 | ZP_01908381 | PPSIR1_29218_Ppac_149919906 |
| 149922143 | ZP_01910582 | PPSIR1_00892_Ppac_149922143 |
| 150018230 | YP_001310484 | Cbei_3402_Cbei_150018230 |
| 151945531 | EDN63772 | TPT1_Scer_151945531 |
| 153817479 | ZP_01970146 | A5C_A0387_Vcho_153817479 |
| 153872688 | ZP_02001506 | BGP_2335_Begg_153872688 |
| 153873366 | ZP_02001971 | BGP_1609_Begg_153873366 |
| 154253368 | YP_001414192 | Plav_2928_Plav_154253368 |
| 154295249 | XP_001548061 | BC1G_13438_Bfuc_154295249 |
| 154496777 | ZP_02035473 | BACCAP_01070_Pcap_154496777 |
| 154497918 | ZP_02036296 | BACCAP_01896_Pcap_154497918 |
| 15607201 | NP_214573 | _Mtub_15607201 |
| 156543836 | XP_001606670 | LOC100123064_Nvit_156543836 |
| 156740099 | YP_001430228 | Rcas_0073_Rcas_156740099 |
| 156845856 | XP_001645817 | Kpol_1054p4_Vpol_156845856 |
| 156937278 | YP_001435074 | Igni_0484_Ihos_156937278 |
| 157042782 | NP_001013309 | zgc:113138_Drer_157042782 |
| 157126123 | XP_001654547 | AaeL_AAEL010417_Aaeg_157126123 |
| 158333527 | YP_001514699 | AM1_0325_Amar_158333527 |
| 158335219 | YP_001516391 | AM1_2062_Amar_158335219 |
| 158337724 | YP_001518900 | AM1_4608_Amar_158337724 |
| 158521555 | YP_001529425 | Dole_1544_Dole_158521555 |
| 15891357 | NP_357029 | Atu3583_Atum_15891357 |
| 159037621 | YP_001536874 | Sare_2007_Sare_159037621 |
| 159038434 | YP_001537687 | Sare_2868_Sare_159038434 |
| 159038599 | YP_001537852 | Sare_3040_Sare_159038599 |
| 159901068 | YP_001547315 | Haur_4556_Haur_159901068 |
| 159901400 | YP_001547647 | Haur_4889_Haur_159901400 |
| 160939744 | ZP_02087091 | CLOBOL_04635_Cbol_160939744 |
| 16126106 | NP_420670 | CC_1863_Ccre_16126106 |
| 161528666 | YP_001582492 | Nmar_1158_Nmar_161528666 |
| 162450235 | YP_001612602 | kptA_Scel_162450235 |
| 162453007 | YP_001615374 | sce4731_Scel_162453007 |
| 162457230 | YP_001619597 | sce8945_Scel_162457230 |
| 162457272 | YP_001619639 | sce8987_Scel_162457272 |
| 163754443 | ZP_02161565 | KAOT1_16148_Kalg_163754443 |
| 163754444 | ZP_02161566 | KAOT1_16153_Kalg_163754444 |
| 163754445 | ZP_02161567 | KAOT1_16158_Kalg_163754445 |
| 163814521 | ZP_02205910 | COPEUT_00672_Ceut_163814521 |
| 163847525 | YP_001635569 | Caur_1965_Caur_163847525 |
| 163849264 | YP_001637308 | Caur_3741_Caur_163849264 |
| 167043400 | ABZ08102 | ALOHA_HF4000APKG1C9ctg2g5__167043400 |
| 167377905 | XP_001734581 | EDI_237770_Edis_167377905 |
| 167518371 | XP_001743526 | MONBRDRAFT_23195_Mbre_167518371 |
| 167588668 | ZP_02381056 | BuboB_010100025264_Bubo_167588668 |
| 167749542 | ZP_02421669 | EUBSIR_00500_Esir_167749542 |
| 167753772 | ZP_02425899 | _Aput_167753772 |
| 167757534 | ZP_02429661 | CLORAM_03084_Cram_167757534 |
| 167769835 | ZP_02441888 | ANACOL_01169_Acol_167769835 |
| 168049051 | XP_001776978 | PHYPADRAFT_194205_Ppat_168049051 |
| 168698114 | ZP_02730391 | GobsU_010100001232_Gobs_168698114 |
| 168699093 | ZP_02731370 | GobsU_010100006203_Gobs_168699093 |
| 168703011 | ZP_02735288 | GobsU_010100026009_Gobs_168703011 |
| 169773039 | XP_001820988 | AOR_1_740144_Aory_169773039 |
| 170105752 | XP_001884088 | LACBIDRAFT_153942_Lbic_170105752 |
| 170683612 | YP_001746786 | kptA_Ecol_170683612 |
| 170684105 | YP_001742169 | EcSMS35_0052_Ecol_170684105 |
| 170940179 | CAP65406 | _Pans_170940179 |
| 171913881 | ZP_02929351 | VspiD_010100021920_Vspi_171913881 |
| 171913882 | ZP_02929352 | VspiD_010100021925_Vspi_171913882 |
| 172064765 | YP_001812415 | BamMC406_6764_Bamb_172064765 |
| 182412866 | YP_001817932 | Oter_1044_Oter_182412866 |
| 182437433 | YP_001825152 | SGR_3640_Sgri_182437433 |
| 182438632 | YP_001826351 | SGR_4839_Sgri_182438632 |
| 18314222 | NP_560889 | PAE3647_Pyae_18314222 |
| 186681810 | YP_001865006 | Npun_R1352_Npun_186681810 |
| 189425258 | YP_001952435 | Glov_2199_Glov_189425258 |
| 189425638 | YP_001952815 | Glov_2582_Glov_189425638 |
| 19115427 | NP_594515 | SPAC2C4.12c_Spom_19115427 |
| 191169136 | ZP_03030895 | EcB7A_0638_Ecol_191169136 |
| 192290492 | YP_001991097 | Rpal_2100_Rpal_192290492 |
| 193070962 | ZP_03051891 | EcE110019_5086_Ecol_193070962 |
| 195016166 | XP_001984354 | Dgri\GH16409_Dgri_195016166 |
| 196229950 | ZP_03128814 | CfE428DRAFT_1979_Cfla_196229950 |
| 197246418 | AAI68833 | _X(Si_197246418 |
| 197286762 | YP_002152634 | PMI2933_Pmir_197286762 |
| 198415504 | XP_002120125 | LOC100186294_Cint_198415504 |
| 198425598 | XP_002120031 | LOC100175594_Cint_198425598 |
| 198471764 | XP_002133835 | Dpse\GA22571_Dpse_198471764 |
| 20093417 | NP_619492 | MA4638_Mace_20093417 |
| 20094870 | NP_614717 | KptA_Mkan_20094870 |
| 206563731 | YP_002234494 | BCAM1882_Bcen_206563731 |
| 206575484 | YP_002235807 | KPK_A0162_Kpne_206575484 |
| 206579710 | YP_002240751 | KPK_4974_Kpne_206579710 |
| 209527878 | ZP_03276367 | AmaxDRAFT_5193_Amax_209527878 |
| 209527890 | ZP_03276379 | AmaxDRAFT_5205_Amax_209527890 |
| 209544855 | YP_002277084 | Gdia_2732_Gdia_209544855 |
| 209921977 | YP_002296050 | ECSE_P1-0025_Ecol_209921977 |
| 210621794 | ZP_03292823 | CLOHIR_00768_Chir_210621794 |
| 21222199 | NP_627978 | _Scoe_21222199 |
| 21223327 | NP_629106 | _Scoe_21223327 |
| 213408531 | XP_002175036 | SJAG_03913_Sjap_213408531 |
| 213962768 | ZP_03391028 | CAPSP0001_0556_Cspu_213962768 |
| 213966822 | ZP_03394973 | kptA_Psyr_213966822 |
| 215486216 | YP_002328647 | E2348C_1093_Ecol_215486216 |
| 217979676 | YP_002363823 | Msil_3572_Msil_217979676 |
| 217979677 | YP_002363824 | Msil_3573_Msil_217979677 |
| 218295754 | ZP_03496550 | TaqDRAFT_4249_Taqu_218295754 |
| 218547498 | YP_002381289 | EFER_0059_Efer_218547498 |
| 218679791 | ZP_03527688 | RetlC8_010100013251_Retl_218679791 |
| 218779300 | YP_002430618 | Dalk_1450_Dalk_218779300 |
| 218780694 | YP_002432012 | Dalk_2854_Dalk_218780694 |
| 219121541 | XP_002181123 | PHATRDRAFT_21228_Ptri_219121541 |
| 221067794 | ZP_03543899 | _Ctes_221067794 |
| 221487185 | EEE25431 | TGGT1_013520_Tgon_221487185 |
| 222529646 | YP_002573528 | Athe_1661_Cbes_222529646 |
| 223935744 | ZP_03627660 | Cflav_PD6472_Ppar_223935744 |
| 223939130 | ZP_03631013 | Cflav_PD1558_Ppar_223939130 |
| 224002288 | XP_002290816 | THAPSDRAFT_22854_Tpse_224002288 |
| 224477788 | YP_002635394 | Sca_2306_Scar_224477788 |
| 224542154 | ZP_03682693 | CATMIT_01329_Cmit_224542154 |
| 225023628 | ZP_03712820 | EIKCOROL_00488_Ecor_225023628 |
| 225075180 | ZP_03718379 | NEIFLAOT_00180_Nfla_225075180 |
| 225181269 | ZP_03734714 | DealDRAFT_2303_Dalk_225181269 |
| 225388916 | ZP_03758640 | CLOSTASPAR_02657_Casp_225388916 |
| 225390142 | ZP_03759866 | CLOSTASPAR_03892_Casp_225390142 |
| 225559493 | EEH07776 | HCBG_04655_Acap_225559493 |
| 225620034 | YP_002721291 | BHWA1_01104_Bhyo_225620034 |
| 225620246 | YP_002721503 | BHWA1_01320_Bhyo_225620246 |
| 225682414 | EEH20698 | PABG_02929_Pbra_225682414 |
| 225684169 | EEH22453 | PABG_04664_Pbra_225684169 |
| 225707394 | ACO09543 | KPTA_Omor_225707394 |
| 226293790 | EEH49210 | PADG_05289_Pbra_226293790 |
| 226313333 | YP_002773227 | BBR47_37460_Bbre_226313333 |
| 226327538 | ZP_03803056 | PROPEN_01409_Ppen_226327538 |
| 226330224 | ZP_03805742 | _Ppen_226330224 |
| 226355053 | YP_002784793 | Deide_02300_Ddes_226355053 |
| 226471272 | CAX70717 | _Sjap_226471272 |
| 227508115 | ZP_03938164 | HMPREF0496_0278_Lbre_227508115 |
| 227893699 | ZP_04011504 | HMPREF0548_1222_Lult_227893699 |
| 228473982 | ZP_04058723 | CAPGI0001_2523_Cgin_228473982 |
| 228911570 | ZP_04075359 | bthur0013_57000_Bthu_228911570 |
| 228923828 | ZP_04087106 | bthur0011_48030_Bthu_228923828 |
| 228983067 | ZP_04143326 | bthur0002_62010_Bthu_228983067 |
| 229129771 | ZP_04258738 | bcere0015_42120_Bcer_229129771 |
| 229175166 | ZP_04302682 | bcere0006_42470_Bcer_229175166 |
| 237654251 | YP_002890565 | Tmz1t_3595_Tsp._237654251 |
| 237742025 | ZP_04572506 | FSCG_00598_Fsp._237742025 |
| 237800583 | ZP_04589044 | POR16_17293_Psyr_237800583 |
| 237813317 | YP_002897768 | GBP346_A3086_Bpse_237813317 |
| 238020853 | ZP_04601279 | _Kora_238020853 |
| 238061717 | ZP_04606426 | MCAG_02683_Msp._238061717 |
| 238061986 | ZP_04606695 | MCAG_02952_Msp._238061986 |
| 238490968 | XP_002376721 | AFLA_108510_Afla_238490968 |
| 238496189 | XP_002379330 | AFLA_133160_Afla_238496189 |
| 238550149 | NP_001153861 | TRPT1_Hsap_238550149 |
| 238916184 | YP_002929701 | EUBELI_00218_Eeli_238916184 |
| 238921299 | YP_002934814 | NT01EI_3442_Eict_238921299 |
| 239606461 | EEQ83448 | BDCG_00253_Ader_239606461 |
| 239626468 | ZP_04669499 | CBFG_00190_Cbac_239626468 |
| 239626503 | ZP_04669534 | CBFG_00225_Cbac_239626503 |
| 239627870 | ZP_04670901 | CBFG_01592_Cbac_239627870 |
| 239815282 | YP_002944192 | Vapar_2298_Vpar_239815282 |
| 239908249 | YP_002954990 | DMR_36130_Dmag_239908249 |
| 239987775 | ZP_04708439 | SrosN1_010100010753_Sros_239987775 |
| 239992555 | ZP_04713219 | SrosN1_010100035003_Sros_239992555 |
| 240272965 | EER36489 | HCDG_09373_Acap_240272965 |
| 241952517 | XP_002418980 | CD36_80320_Cdub_241952517 |
| 242218580 | XP_002475079 | POSPLDRAFT_41997_Ppla_242218580 |
| 242785264 | XP_002480559 | TSTA_033670_Tsti_242785264 |
| 251788569 | YP_003003290 | Dd1591_0935_Dzea_251788569 |
| 251794334 | YP_003009065 | Pjdr2_0298_Psp._251794334 |
| 253687260 | YP_003016450 | PC1_0863_Pcar_253687260 |
| 254169141 | ZP_04875977 | ABOONEI_1429_Aboo_254169141 |
| 254245305 | ZP_04938626 | BCPG_00001_Bcen_254245305 |
| 254302431 | ZP_04969789 | FNP_0054_Fnuc_254302431 |
| 254383863 | ZP_04999210 | SSAG_03610_Ssp._254383863 |
| 254387007 | ZP_05002286 | SSAG_06599_Ssp._254387007 |
| 254392683 | ZP_05007857 | SSCG_05109_Scla_254392683 |
| 254410814 | ZP_05024592 | MC7420_292_Mcht_254410814 |
| 254573246 | XP_002493732 | PAS_chr4_0312_Kpas_254573246 |
| 254578506 | XP_002495239 | ZYRO0B06600g_Zrou_254578506 |
| 255010210 | ZP_05282336 | Bfra3_010100013810_Bfra_255010210 |
| 255086119 | XP_002509026 | MICPUN_76559_Msp._255086119 |
| 255103268 | ZP_05332245 | CdifQCD-6_020200020820_Cdif_255103268 |
| 255638634 | ACU19622 | _Gmax_255638634 |
| 255712699 | XP_002552632 | KLTH0C09460g_Lthe_255712699 |
| 255930929 | XP_002557021 | Pc12g01220_Pchr_255930929 |
| 256006093 | ZP_05431024 | ClothDRAFT_2885_Cthe_256006093 |
| 256023435 | ZP_05437300 | E4_010100008678_Esp._256023435 |
| 256367844 | YP_003108401 | pEK499_p136_Ecol_256367844 |
| 256374811 | YP_003098471 | Amir_0662_Amir_256374811 |
| 256376037 | YP_003099697 | Amir_1903_Amir_256376037 |
| 256376409 | YP_003100069 | Amir_2283_Amir_256376409 |
| 256379719 | YP_003103379 | Amir_5718_Amir_256379719 |
| 256394652 | YP_003116216 | Caci_5516_Caci_256394652 |
| 256395290 | YP_003116854 | Caci_6159_Caci_256395290 |
| 256419129 | YP_003119782 | Cpin_0075_Cpin_256419129 |
| 256420608 | YP_003121261 | Cpin_1564_Cpin_256420608 |
| 256422007 | YP_003122660 | Cpin_2983_Cpin_256422007 |
| 257063188 | YP_003142860 | Shel_04510_Shel_257063188 |
| 257093309 | YP_003166950 | CAP2UW1_1711_CAcc_257093309 |
| 257095819 | YP_003169460 | CAP2UW1_4295_CAcc_257095819 |
| 257125945 | YP_003164059 | Lebu_1175_Lbuc_257125945 |
| 257455836 | ZP_05621061 | ENHAE0001_1187_Eaer_257455836 |
| 258545015 | ZP_05705249 | kptA_Chom_258545015 |
| 258545511 | ZP_05705745 | HMPREF0198_1780_Chom_258545511 |
| 258574383 | XP_002541373 | UREG_00888_Uree_258574383 |
| 260554979 | ZP_05827200 | HMPREF0010_00583_Abau_260554979 |
| 260557664 | ZP_05829878 | HMPREF0010_03261_Abau_260557664 |
| 260590817 | ZP_05856275 | HMPREF0973_00239_Pver_260590817 |
| 260781042 | XP_002585636 | BRAFLDRAFT_274539_Bflo_260781042 |
| 260782199 | XP_002586178 | BRAFLDRAFT_132446_Bflo_260782199 |
| 260802161 | XP_002595961 | BRAFLDRAFT_128074_Bflo_260802161 |
| 260889106 | ZP_05900369 | GCWU000323_00265_Lhof_260889106 |
| 260889576 | ZP_05900839 | GCWU000323_00737_Lhof_260889576 |
| 260945038 | XP_002616817 | CLUG_04058_Clus_260945038 |
| 261334507 | CBH17501 | TbgDal_XI6190_Tbru_261334507 |
| 261344446 | ZP_05972090 | PROVRUST_05684_Prus_261344446 |
| 262039223 | ZP_06012541 | HMPREF0554_2331_Lgoo_262039223 |
| 262067268 | ZP_06026880 | FUSPEROL_01544_Fper_262067268 |
| 262195534 | YP_003266743 | Hoch_2307_Hoch_262195534 |
| 262199521 | YP_003270730 | Hoch_6367_Hoch_262199521 |
| 262383473 | ZP_06076609 | HMPREF0103_2522_Bact_262383473 |
| 268609383 | ZP_06143110 | RflaF_010100007781_Rfla_268609383 |
| 268610712 | ZP_06144439 | RflaF_010100014602_Rfla_268610712 |
| 269118724 | YP_003306901 | Sterm_0085_Ster_269118724 |
| 269121733 | YP_003309910 | Sterm_3137_Ster_269121733 |
| 269140414 | YP_003297115 | ETAE_3071_Etar_269140414 |
| 269140415 | YP_003297116 | ETAE_3072_Etar_269140415 |
| 270293299 | ZP_06199508 | HMPREF0850_01400_Ssp._270293299 |
| 271967482 | YP_003341678 | Sros_6206_Sros_271967482 |
| 281203630 | EFA77827 | PPL_09325_Ppal_281203630 |
| 281203700 | EFA77897 | PPL_09397_Ppal_281203700 |
| 281416943 | ZP_06247963 | _Cthe_281416943 |
| 282864000 | ZP_06273057 | SACTEDRAFT_3602_Ssp._282864000 |
| 282881570 | ZP_06290239 | HMPREF9019_0398_Ptim_282881570 |
| 283783211 | YP_003373965 | HMPREF0424_0738_Gvag_283783211 |
| 284033571 | YP_003383502 | Kfla_5697_Kfla_284033571 |
| 284038124 | YP_003388054 | Slin_3244_Slin_284038124 |
| 284038905 | YP_003388835 | Slin_4048_Slin_284038905 |
| 284119730 | ZP_06386788 | POR_1392_CPor_284119730 |
| 284163819 | YP_003402098 | Htur_0527_Htur_284163819 |
| 284988800 | YP_003407354 | Gobs_0177_Gobs_284988800 |
| 28575019 | NP_788477 | CG33057_Dmel_28575019 |
| 288457846 | YP_003422714 | ZZM4_0145_Zmob_288457846 |
| 288931212 | YP_003435272 | Ferp_0829_Fpla_288931212 |
| 288932585 | YP_003436645 | Ferp_2246_Fpla_288932585 |
| 288940281 | YP_003442521 | Alvin_0536_Avin_288940281 |
| 289663132 | ZP_06484713 | XcampvN_010100008602_Xcam_289663132 |
| 289770606 | ZP_06529984 | SSPG_03874_Sliv_289770606 |
| 290960596 | YP_003491778 | SCAB_62181_Ssca_290960596 |
| 290961991 | YP_003493173 | SCAB_76641_Ssca_290961991 |
| 290963088 | YP_003494270 | SCAB_88101_Ssca_290963088 |
| 290974534 | XP_002670000 | NAEGRDRAFT_59792_Ngru_290974534 |
| 290974944 | XP_002670204 | NAEGRDRAFT_74830_Ngru_290974944 |
| 290988948 | XP_002677132 | NAEGRDRAFT_49152_Ngru_290988948 |
| 291231763 | XP_002735833 | LOC100372879_Skow_291231763 |
| 291237935 | XP_002738885 | LOC100367844_Skow_291237935 |
| 291288929 | YP_003517432 | pKF94_017_Kpne_291288929 |
| 291300690 | YP_003511968 | Snas_3205_Snas_291300690 |
| 291301515 | YP_003512793 | Snas_4048_Snas_291301515 |
| 291438820 | ZP_06578210 | SSFG_03915_Sgha_291438820 |
| 291444753 | ZP_06584143 | SSGG_01970_Sros_291444753 |
| 291453417 | ZP_06592807 | SSHG_03710_Salb_291453417 |
| 292493384 | YP_003528823 | Nhal_3405_Nhal_292493384 |
| 294494713 | YP_003541206 | Mmah_0023_Mmah_294494713 |
| 294628199 | ZP_06706759 | SSTG_00199_Ssp._294628199 |
| 294657248 | XP_459547 | DEHA2E05236g_Dhan_294657248 |
| 294664142 | ZP_06729531 | XAUC_02580_Xfus_294664142 |
| 294669065 | ZP_06734151 | NEIELOOT_00979_Nelo_294669065 |
| 294781860 | ZP_06747192 | HMPREF0400_02088_Fsp._294781860 |
| 294817221 | ZP_06775863 | SCLAV_p0684_Scla_294817221 |
| 295087467 | CBK68990 | BXY_40680_Bxyl_295087467 |
| 295093305 | CBK82396 | CCU_05780_Csp._295093305 |
| 295658070 | XP_002789598 | PAAG_08523_Pbra_295658070 |
| 295839520 | ZP_06826453 | SSBG_06269_Ssp._295839520 |
| 296114887 | ZP_06833535 | GXY_03898_Ghan_296114887 |
| 296121824 | YP_003629602 | Plim_1570_Plim_296121824 |
| 296130288 | YP_003637538 | Cfla_2451_Cfla_296130288 |
| 296130683 | YP_003637933 | Cfla_2850_Cfla_296130683 |
| 296416279 | XP_002837808 | GSTUM_00005659001_Tmel_296416279 |
| 296446434 | ZP_06888378 | MettrDRAFT_2094_Mtri_296446434 |
| 296821722 | XP_002850170 | MCYG_00274_Aota_296821722 |
| 296825168 | XP_002850772 | MCYG_00876_Aota_296825168 |
| 297162424 | ADI12136 | SBI_09018_Sbin_297162424 |
| 297192271 | ZP_06909669 | SSDG_01873_Spri_297192271 |
| 297194315 | ZP_06911713 | SSDG_06844_Spri_297194315 |
| 297202026 | ZP_06919423 | SSEG_09591_Ssvi_297202026 |
| 297202028 | ZP_06919425 | SSEG_04858_Ssvi_297202028 |
| 297204161 | ZP_06921558 | SSEG_04772_Ssvi_297204161 |
| 297267544 | XP_001115358 | LOC717911_Mmul_297267544 |
| 297561069 | YP_003680043 | Ndas_2112_Ndas_297561069 |
| 297561422 | YP_003680396 | Ndas_2470_Ndas_297561422 |
| 297564265 | YP_003683238 | Ndas_5352_Ndas_297564265 |
| 297618118 | YP_003703277 | Slip_1960_Slip_297618118 |
| 298245737 | ZP_06969543 | _Krac_298245737 |
| 298246337 | ZP_06970143 | _Krac_298246337 |
| 298248426 | ZP_06972231 | _Krac_298248426 |
| 298250918 | ZP_06974722 | _Krac_298250918 |
| 29826642 | NP_821276 | SAV_102_Save_29826642 |
| 29829850 | NP_824484 | SAV_3308_Save_29829850 |
| 29830778 | NP_825412 | SAV_4235_Save_29830778 |
| 298711928 | CBJ48615 | Esi_0039_0083_Esil_298711928 |
| 299141966 | ZP_07035100 | HMPREF0665_01550_Pori_299141966 |
| 299472429 | CBN77617 | Esi_0004_0276_Esil_299472429 |
| 299472531 | CBN77316 | Esi_0044_0118_Esil_299472531 |
| 30022567 | NP_834198 | BC4486_Bcer_30022567 |
| 300774500 | ZP_07084363 | kptA_Cgle_300774500 |
| 300774505 | ZP_07084368 | HMPREF0204_10228_Cgle_300774505 |
| 300774507 | ZP_07084370 | HMPREF0204_10230_Cgle_300774507 |
| 300784169 | YP_003764460 | kptA_Amed_300784169 |
| 300789763 | YP_003770054 | AMED_7947_Amed_300789763 |
| 300854685 | YP_003779669 | CLJU_c15030_Clju_300854685 |
| 300867123 | ZP_07111789 | OSCI_3240019_Osp._300867123 |
| 300868768 | ZP_07113379 | OSCI_3800101_Osp._300868768 |
| 300868996 | ZP_07113599 | kptA_Osp._300868996 |
| 300869632 | ZP_07114212 | OSCI_4130042_Osp._300869632 |
| 301058276 | ZP_07199316 | NPH_6498_Dpro_301058276 |
| 302344076 | YP_003808605 | Deba_2657_Dbaa_302344076 |
| 302411952 | XP_003003809 | VDBG_06251_Valb_302411952 |
| 30249340 | NP_841410 | NE1363_Neur_30249340 |
| 302504024 | XP_003013971 | ARB_07691_Aben_302504024 |
| 302525419 | ZP_07277761 | SSMG_01801_Ssp._302525419 |
| 302526847 | ZP_07279189 | SSMG_03229_Ssp._302526847 |
| 302529076 | ZP_07281418 | SSMG_05458_Ssp._302529076 |
| 302535927 | ZP_07288269 | SSNG_03890_Ssp._302535927 |
| 302548144 | ZP_07300486 | SSOG_08569_Shim_302548144 |
| 302549980 | ZP_07302322 | SSQG_01209_Svir_302549980 |
| 302553253 | ZP_07305595 | SSQG_04482_Svir_302553253 |
| 302657470 | XP_003020456 | TRV_05457_Tver_302657470 |
| 302686072 | XP_003032716 | SCHCODRAFT_40957_Scom_302686072 |
| 302756333 | XP_002961590 | SELMODRAFT_35951_Smoe_302756333 |
| 302757341 | XP_002962094 | SELMODRAFT_77175_Smoe_302757341 |
| 302766619 | XP_002966730 | SELMODRAFT_85925_Smoe_302766619 |
| 302782377 | XP_002972962 | SELMODRAFT_98231_Smoe_302782377 |
| 302796097 | XP_002979811 | SELMODRAFT_111206_Smoe_302796097 |
| 302851356 | XP_002957202 | VOLCADRAFT_119630_Vcar_302851356 |
| 302864537 | YP_003833174 | Micau_0029_Maur_302864537 |
| 302866493 | YP_003835130 | Micau_2007_Maur_302866493 |
| 302867267 | YP_003835904 | Micau_2794_Maur_302867267 |
| 302868056 | YP_003836693 | Micau_3591_Maur_302868056 |
| 302869104 | YP_003837741 | Micau_4654_Maur_302869104 |
| 302916847 | XP_003052234 | NECHADRAFT_79207_Nhae_302916847 |
| 302922871 | XP_003053556 | NECHADRAFT_74824_Nhae_302922871 |
| 303240380 | ZP_07326898 | AceceDRAFT_2246_Acel_303240380 |
| 303240837 | ZP_07327349 | AceceDRAFT_2697_Acel_303240837 |
| 303241812 | ZP_07328308 | AceceDRAFT_3656_Acel_303241812 |
| 303284891 | XP_003061736 | MICPUCDRAFT_48280_Mpus_303284891 |
| 303312351 | XP_003066187 | CPC735_054120_Cpos_303312351 |
| 304309800 | YP_003809398 | HDN1F_01480_Gpro_304309800 |
| 304405428 | ZP_07387087 | PaecuDRAFT_1748_Pcur_304405428 |
| 304560215 | ADM42879 | ETAF_2777_Etar_304560215 |
| 305663054 | YP_003859342 | Igag_0628_Iagg_305663054 |
| 307104106 | EFN52361 | CHLNCDRAFT_138778_Cvar_307104106 |
| 307105263 | EFN53513 | CHLNCDRAFT_59736_Cvar_307105263 |
| 307150228 | YP_003885612 | Cyan7822_0291_Csp._307150228 |
| 307154521 | YP_003889905 | Cyan7822_4726_Csp._307154521 |
| 307299774 | ZP_07579566 | ThebaDRAFT_2537_Tbac_307299774 |
| 307595891 | YP_003902208 | Vdis_1783_Vdis_307595891 |
| 307823107 | ZP_07653337 | MettuDRAFT_1182_Mtun_307823107 |
| 307823108 | ZP_07653338 | MettuDRAFT_1183_Mtun_307823108 |
| 307946056 | ZP_07661391 | TRICHSKD4_4759_Rsp._307946056 |
| 308270161 | CBX26773 | N47_A08020_UDes_308270161 |
| 308446799 | XP_003087265 | CRE_02794_Crem_308446799 |
| 309811906 | ZP_07705678 | HMPREF0321_1867_Dsp._309811906 |
| 310641074 | YP_003945832 | PPSC2_c1614_Ppol_310641074 |
| 310778852 | YP_003967185 | Ilyop_1056_Ipol_310778852 |
| 310792989 | EFQ28450 | GLRG_03594_Ggra_310792989 |
| 310796940 | EFQ32401 | GLRG_07671_Ggra_310796940 |
| 310818319 | YP_003950677 | STAUR_1046_Saur_310818319 |
| 310818708 | YP_003951066 | STAUR_1435_Saur_310818708 |
| 310831101 | YP_003969744 | crov112_CrVB_310831101 |
| 311896751 | BAJ29159 | KSE_33500_Kset_311896751 |
| 311899069 | BAJ31477 | kptA_Kset_311899069 |
| 311900362 | BAJ32770 | KSE_70120_Kset_311900362 |
| 312142649 | YP_003994095 | Halsa_0262_Hhyd_312142649 |
| 312199543 | YP_004019604 | FraEuI1c_5750_Fsp._312199543 |
| 312220715 | CBY00656 | LEMA_P017860.1_Lmac_312220715 |
| 312886331 | ZP_07745943 | MucpaDRAFT_5912_Mpal_312886331 |
| 312888255 | ZP_07747832 | MucpaDRAFT_5105_Mpal_312888255 |
| 312888451 | ZP_07748025 | MucpaDRAFT_5539_Mpal_312888451 |
| 313682815 | YP_004060553 | Sulku_1692_Skuj_313682815 |
| 315054759 | XP_003176754 | MGYG_00842_Agyp_315054759 |
| 315230724 | YP_004071160 | TERMP_00961_Tbar_315230724 |
| 315502903 | YP_004081790 | ML5_2113_Msp._315502903 |
| 315504426 | YP_004083313 | ML5_3650_Msp._315504426 |
| 315506327 | YP_004085214 | ML5_5602_Msp._315506327 |
| 315652379 | ZP_07905368 | HMPREF0381_2362_Esab_315652379 |
| 317056274 | YP_004104741 | Rumal_1607_Ralb_317056274 |
| 317126949 | YP_004093231 | Bcell_0212_Bcel_317126949 |
| 318058555 | ZP_07977278 | SSA3_010100011465_Ssp._318058555 |
| 319936601 | ZP_08011014 | HMPREF9488_01847_Csp._319936601 |
| 320010749 | ADW05599 | Sfla_4190_Sfla_320010749 |
| 320095331 | ZP_08027020 | HMPREF9005_1632_Asp._320095331 |
| 320168635 | EFW45534 | CAOG_03518_Cowc_320168635 |
| 320333489 | YP_004170200 | Deima_0881_Dmar_320333489 |
| 320333790 | YP_004170501 | Deima_1184_Dmar_320333790 |
| 322505025 | CAM42259 | LBRM_24_0830_Lbra_322505025 |
| 322699163 | EFY90927 | MAC_03043_Macr_322699163 |
| 322707126 | EFY98705 | MAA_05844_Mani_322707126 |
| 322708785 | EFZ00362 | MAA_04139_Mani_322708785 |
| 322802863 | EFZ23054 | SINV_01220_Sinv_322802863 |
| 322815443 | EFZ24097 | TCSYLVIO_9776_Tcru_322815443 |
| 322832748 | YP_004212775 | Rahaq_2033_Rsp._322832748 |
| 323140426 | ZP_08075355 | HMPREF9443_00109_Psuc_323140426 |
| 32476856 | NP_869850 | _Rbal_32476856 |
| 325108247 | YP_004269315 | Plabr_1682_Pbra_325108247 |
| 325189229 | CCA23752 | AlNc14C205G8800_Alai_325189229 |
| 325283812 | YP_004256353 | Deipr_1598_Dpro_325283812 |
| 325690156 | EGD32160 | HMPREF9382_1114_Ssan_325690156 |
| 325917965 | ZP_08180134 | XVE_4155_Xves_325917965 |
| 325928686 | ZP_08189859 | XPE_3947_Xper_325928686 |
| 326431934 | EGD77504 | PTSG_08602_Ssp._326431934 |
| 326470706 | EGD94715 | TESG_02225_Tton_326470706 |
| 326779281 | ZP_08238546 | SACT1_5140_Sgri_326779281 |
| 326943719 | AEA19612 | CT43_P281274_Bthu_326943719 |
| 327286590 | XP_003228013 | LOC100564547_Acar_327286590 |
| 327308048 | XP_003238715 | TERG_00702_Trub_327308048 |
| 327352957 | EGE81814 | BDDG_04757_Ader_327352957 |
| 327400244 | YP_004341083 | Arcve_0335_Aven_327400244 |
| 328769603 | EGF79646 | BATDEDRAFT_4585_Bden_328769603 |
| 328862875 | EGG11975 | MELLADRAFT_101818_Mlar_328862875 |
| 328866607 | EGG14990 | DFA_09810_Dfas_328866607 |
| 328867666 | EGG16048 | DFA_09720_Dfas_328867666 |
| 328871094 | EGG19465 | DFA_00042_Dfas_328871094 |
| 328884339 | CCA57578 | SVEN_4292_Sven_328884339 |
| 328886920 | CCA60159 | SVEN_6873_Sven_328886920 |
| 328952864 | YP_004370198 | Desac_1154_Dace_328952864 |
| 328958126 | YP_004375512 | CAR_c18390_Csp._328958126 |
| 329184512 | AEB80270 | Dalk_0002_AVC_Dalk_329184512 |
| 329847506 | ZP_08262534 | ABI_05710_Abip_329847506 |
| 329935140 | ZP_08285131 | SGM_6648_Sgri_329935140 |
| 329935335 | ZP_08285301 | SGM_6818_Sgri_329935335 |
| 329996741 | ZP_08302538 | HMPREF9538_00174_Ksp._329996741 |
| 330467180 | YP_004404923 | VAB18032_16085_Vmar_330467180 |
| 330469061 | YP_004406804 | VAB18032_25530_Vmar_330469061 |
| 330469448 | YP_004407191 | VAB18032_27591_Vmar_330469448 |
| 330508961 | YP_004385389 | MCON_3311_Mcon_330508961 |
| 330795375 | XP_003285749 | DICPUDRAFT_46322_Dpur_330795375 |
| 330801102 | XP_003288569 | DICPUDRAFT_34288_Dpur_330801102 |
| 330977809 | EGH77712 | PSYAP_13685_Psyr_330977809 |
| 330983843 | EGH81946 | PLA107_02335_Psyr_330983843 |
| 331216956 | XP_003321157 | PGTG_02199_Pgra_331216956 |
| 332361966 | EGJ39768 | kptA_Ssan_332361966 |
| 332668288 | YP_004451076 | Halhy_6384_Hhyd_332668288 |
| 332671633 | YP_004454641 | Celf_3140_Cfim_332671633 |
| 333027909 | ZP_08455973 | STTU_5412_Ssp._333027909 |
| 333374005 | ZP_08465898 | HMPREF9374_3644_Dsp._333374005 |
| 333378220 | ZP_08469951 | HMPREF9456_01546_Dmos_333378220 |
| 333381571 | ZP_08473251 | HMPREF9455_01417_Dgad_333381571 |
| 333912499 | YP_004486231 | DelCs14_0840_Dsp._333912499 |
| 333985238 | YP_004514448 | Metme_3585_Mmet_333985238 |
| 334120906 | ZP_08494983 | MicvaDRAFT_0510_Mvag_334120906 |
| 334135982 | ZP_08509461 | HMPREF9413_4358_Psp._334135982 |
| 336117044 | YP_004571811 | MLP_13940_Mpho_336117044 |
| 336250841 | YP_004594551 | EAE_21855_Eaer_336250841 |
| 336366767 | EGN95113 | SERLA73DRAFT_143184_Slac_336366767 |
| 336428119 | ZP_08608104 | HMPREF0994_04110_Lbac_336428119 |
| 336471510 | EGO59671 | NEUTE1DRAFT_109155_Ntet_336471510 |
| 336475983 | YP_004615124 | Mzhil_0024_Mzhi_336475983 |
| 338211687 | YP_004655740 | Runsl_2196_Rsli_338211687 |
| 338532263 | YP_004665597 | LILAB_13060_Mful_338532263 |
| 338811714 | ZP_08623919 | ALO_06468_Alon_338811714 |
| 339009751 | ZP_08642322 | BRLA_c35710_Blat_339009751 |
| 340377247 | XP_003387141 | LOC100640582_Aque_340377247 |
| 340521231 | EGR51466 | TRIREDRAFT_75394_Tree_340521231 |
| 340754465 | ZP_08691218 | FSAG_02029_Fsp._340754465 |
| 342875667 | EGU77385 | FOXB_12108_Foxy_342875667 |
| 34497880 | NP_902095 | CV_2425_Cvio_34497880 |
| 344999740 | YP_004802594 | SACTE_2158_Ssp._344999740 |
| 345013407 | YP_004815761 | Strvi_5976_Svio_345013407 |
| 345368115 | EGX00122 | ECSTECMHI813_4950_Ecol_345368115 |
| 346318305 | EGX87909 | CCM_09532_Cmil_346318305 |
| 38505777 | NP_942396 | sll8002_Ssp_38505777 |
| 45198857 | NP_985886 | AGOS_AFR339W_Agos_45198857 |
| 46309426 | YP_006316 | ORF28_AsGV_46309426 |
| 49477941 | YP_037101 | kptA_Bthu_49477941 |
| 50290283 | XP_447573 | CAGL0I07469g_Cgla_50290283 |
| 50305581 | XP_452751 | KLLA0C12397g_Klac_50305581 |
| 50547707 | XP_501323 | YALI0C01287g_Ylip_50547707 |
| 53718401 | YP_107387 | BPSL0762_Bpse_53718401 |
| 55379941 | YP_137791 | kptA_Hmar_55379941 |
| 58383293 | YP_194865 | pU302L_059_Sent_58383293 |
| 60461910 | YP_209628 | pIL105p1_Llac_60461910 |
| 66358336 | XP_626346 | cgd2_1210_Cpar_66358336 |
| 66802638 | XP_635191 | DDB_G0291408_Ddis_66802638 |
| 66807493 | XP_637469 | DDB_G0286929_Ddis_66807493 |
| 66813652 | XP_641005 | DDB_G0280835_Ddis_66813652 |
| 67921554 | ZP_00515072 | CwatDRAFT_5127_Cwat_67921554 |
| 70733133 | YP_262906 | PFL_5848_Pflu_70733133 |
| 70988759 | XP_749234 | AFUA_2G00980_Afum_70988759 |
| 71064898 | YP_263625 | Psyc_0322_Parc_71064898 |
| 72006229 | XP_780840 | LOC575340_Spur_72006229 |
| 72010085 | XP_786744 | LOC581663_Spur_72010085 |
| 74317508 | YP_315248 | Tbd_1490_Tden_74317508 |
| 78223734 | YP_385481 | Gmet_2535_Gmet_78223734 |
| 83643039 | YP_431474 | HCH_00129_Hche_83643039 |
| 83647694 | YP_436129 | HCH_05019_Hche_83647694 |
| 83649603 | YP_438038 | HCH_06998_Hche_83649603 |
| 84392321 | ZP_00991748 | V12B01_14195_Vspl_84392321 |
| 84499284 | ZP_00997572 | OB2597_05135_Obat_84499284 |
| 84499293 | ZP_00997581 | OB2597_05180_Obat_84499293 |
| 84501233 | ZP_00999438 | OB2597_12748_Obat_84501233 |
| 85068247 | XP_962139 | NCU07285_Ncra_85068247 |
| 85109317 | XP_962858 | NCU06254_Ncra_85109317 |
| 87310926 | ZP_01093052 | DSM3645_18471_Bmar_87310926 |
| 87311897 | ZP_01094009 | DSM3645_04855_Bmar_87311897 |
| 88856595 | ZP_01131252 | A20C1_02579_Mact_88856595 |
| 90419305 | ZP_01227215 | SI859A1_01336_Aman_90419305 |
| 91080221 | XP_972212 | LOC660925_Tcas_91080221 |
| 91203343 | CAJ72982 | kustd2237_CKue_91203343 |
| 91215317 | ZP_01252289 | P700755_13507_Ptor_91215317 |
| 94971452 | YP_593500 | Acid345_4426_CKor_94971452 |