; SAM: prettyalign v3.1b (February 24, 1999) compiled 04/18/00_11:44:15 ; (c) 1992-1999 Regents of the University of California, Santa Cruz ; ; Sequence Alignment and Modeling Software System ; http://www.cse.ucsc.edu/research/compbio/sam.html ; ; ------ Citations (HMMs, SAM) ------ ; A. Krogh et al., Hidden Markov models in computational biology: ; ------------- Citations (SAM, SAM-T99, HMMs) ----------------- ; R. Hughey, A. Krogh, Hidden Markov models for sequence analysis: ; Extension and analysis of the basic method, CABIOS 12:95-107, 1996. ; K. Karplus, C. Barrett, R. Hughey, Hidden Markov models for detecting ; remote protein homologies, Bioinformatics 14(10):846-856, 1999. ; A. Krogh et al., Hidden Markov models in computational biology: ; Applications to protein modeling, JMB 235:1501-1531, Feb 1994. ; -------------------------------------------------------------- ; Sequence numbers correspond to the following labels: ; 1 T0103 ; 2 gi|1172505|sp|P42790|PICP_PSESR_216:587 ; 3 gi|5729770|ref|NP_000382.3|_249:556 ; 4 gi|6175068|sp|O14773|TPP1_HUMAN_249:556 ; 5 gi|4583351|gb|AAD25043.1|AF114167_1_249:556 ; 6 gi|6753448|ref|NP_034036.1|_249:555 ; 7 gi|6094507|sp|O89023|TPP1_MOUSE_220:527 ; 8 gi|881428|gb|AAA70103.1|_165:560 ; 9 gi|323087|pir||A44869_33:350 ; 10 gi|1086249|pir||S52769_202:603 ; 11 gi|2145514|pir||JC4900_235:625 ; 12 gi|1332716|gb|AAB36054.1|_1:369 ; 13 gi|5002192|gb|AAD37352.1|AF142415_1_256:482 ; 14 gi|5002190|gb|AAD37351.1|_5:357 ; 15 gi|7435650|pir||JW0075_165:381 ; 16 gi|5726590|gb|AAD48483.1|AF170567_1_165:381 ; 17 gi|494645|pdb|1THM|_59:269 ; 18 gi|135738|sp|P04072|THET_THEVU_59:269 ; 19 gi|1890101|gb|AAB49694.1|_176:387 ; 20 gi|6573500|pdb|1DBI|A_60:270 ; 21 gi|2118106|pir||I39974_181:391 ; 22 gi|2921857|gb|AAC04871.1|_204:571 ; 23 gi|732988|emb|CAA82213.1|_181:534 ; 24 gi|7473893|pir||A75474_217:583 ; 25 gi|6624962|emb|CAB63913.1|_212:450 ; 26 gi|6624950|emb|CAB63907.1|_212:450 ; 27 gi|628051|pir||JC2142_163:372 ; 28 gi|742825|prf||2011184A_163:372 ; 29 gi|4761119|gb|AAD29255.1|AF104385_1_163:372 ; 30 gi|6624958|emb|CAB63911.1|_172:383 ; 31 gi|117631|sp|P29138|CUDP_METAN_172:383 ; 32 gi|460032|gb|AAA91584.1|_148:358 ; 33 gi|6634475|emb|CAB64346.1|_171:368 ; 34 gi|131088|sp|P20015|PRTT_TRIAL_75:261 ; 35 gi|7473901|pir||D75286_10:170 ; 36 gi|4835715|gb|AAD30204.1|AF064522_1_163:264 ; 37 gi|545060|gb|AAC60459.1|_181:392 ; 38 gi|470731|gb|AAA67705.1|_185:379 ; 39 gi|384177|prf||1905286A_184:372 ; 40 gi|129234|sp|P28296|ORYZ_ASPFU_184:372 ; 41 gi|3549630|emb|CAA75805.1|_123:310 ; 42 gi|113482|sp|P09230|AEP_YARLI_225:431 ; 43 gi|2239272|gb|AAB62277.1|_225:438 ; 44 gi|7435653|pir||H72784_186:432 ; 45 gi|7481387|pir||T10926_89:322 ; 46 gi|7481372|pir||T36842_94:323 ; 47 gi|7473895|pir||A75589_239:445 ; 48 gi|7414560|emb|CAB86111.1|_251:481 ; 49 gi|135023|sp|P29141|SUBV_BACSU_211:572 ; 50 gi|7542318|gb|AAF63395.1|AF083618_2_199:466 ; 51 gi|130965|sp|P23314|PROA_XANCP_230:465 ; 52 gi|1168687|sp|P42779|BPRV_BACNO_221:466 ; 53 gi|576815|gb|AAA80562.1|_221:466 ; 54 gi|7473898|pir||D75393_205:429 ; 55 gi|2293484|gb|AAB65414.1|_1:200 ; 56 gi|5918763|gb|AAD56147.1|AF154675_7_173:429 ; 57 gi|7473900|pir||F75625_232:478 ; 58 gi|2731626|gb|AAB93489.1|_180:430 ; 59 gi|5302815|emb|CAB46075.1|_177:427 ; 60 gi|282432|pir||S25835_170:415 ; 61 gi|135018|sp|P28842|SUBT_BACS9_168:416 ; 62 gi|2127379|pir||JC6032_274:682 ; 63 gi|7595970|gb|AAF64521.1|AF253471_1_129:445 ; 64 gi|4115628|dbj|BAA36466.1|_113:359 ; 65 gi|3646417|emb|CAA07702.1|_113:359 ; 66 gi|3334242|sp|O13359|KEX2_CANAL_247:491 ; 67 gi|125348|sp|P09231|KEX1_KLULA_198:444 ; 68 gi|283589|pir||S27270_223:473 ; 69 gi|453663|gb|AAA27769.1|_223:474 ; 70 gi|542504|pir||S40449_223:474 ; 71 gi|480411|pir||S36823_223:474 ; 72 gi|7484206|pir||S73083_240:593 10 20 30 40 | | | | 1 AAGTAKGHNPTEFPT...IYDASSAPTAA......NTTVGIITIGGVSQTLQDLQQF........ 2 AAGTAKGHNPTEFPT...IYDASSAPTAA......NTTVGIITIGGVSQTLQDLQQF........ 3 ------------GNF...AHQASVARVVGqqg...RGRAGIE-------ASLDVQYL........ 4 ------------GNF...AHQASVARVVGqqg...RGRAGIE-------ASLDVQYL........ 5 ------------GNF...AHQASVARVVGqqg...RGRAGIE-------ASLDVEYL........ 6 -------------SF...THQASVAKVVGkqg...RGRAGIE-------ASLDVEYL........ 7 -------------SF...THQASVAKVVGkqg...RGRAGIE-------ASLDVEYL........ 8 WATAIQQYNPIPKIA...SISYGWAEVEQceitnsCSTLGIDSVVYVARSNVELQKVglr10fvs 9 PAVTTQPFNPTVDVLplyGIDTSDSNRGA......GQVIGIIDAYGASTAESDLAAF........ 10 --NATFSMNSARDTL...GHGTHTASTAA......GNYVNGA-------SYFGYGKG........ 11 AAAAVAAHHPQDFAA...IYGGSSLPAAT......NTAVGIITWGSITQTVTDLNSF........ 12 AAGTAKGHNPTEFPT...IYDASSAPTAA......NTTVGIITIGGVSQTLQDLQQF........ 13 ---------------...-----------......----------------------........ 14 ---------------...-------PVTG......NSSVGVIEFEDQNFAPSDLSDF........ 15 --DYVDNDNTSDDGN...GHGTHCAGITGalt...NNSVGIA---------------........ 16 --DYVDNDNTSDDGN...GHGTHCAGITGalt...NNSVGIA---------------........ 17 ----VDNDSTPQNGN...GHGTHCAGIAAavt...NNSTGIA---------------........ 18 ----VDNDSTPQNGN...GHGTHCAGIAAavt...NNSTGIA---------------........ 19 ---FIDRDNNPMDLN...GHGTHVAGTVAadt...NNGIGVA---------------........ 20 ----VDNDYDPMDLN...NHGTHVAGIAAaet...NNATGIA---------------........ 21 ----VDNDYDPMDLN...NHGTHVAGIAAaet...NNATGIA---------------........ 22 ------------NNN...AHGTHVAGTIAai....ANNEGVV---------------........ 23 -------------NN...AHGTHVAGTIAai....ANNEGVK---------------........ 24 --------YQLNDVS...HHGTHVAGTVFaqy...GAGTGASGL----QSGMDA--N........ 25 WGKTIPAGDADEDGN...GHGTHCSGTIA......GKKYGVA---------------........ 26 WGKTIPAGDADEDGN...GHGTHCSGTIA......GKKYGVA---------------........ 27 ---------TARDGN...GHGTHCSGTIG......SKTYGVA---------------........ 28 ---------TARDGN...GHGTHCSGTIG......SKTYGVA---------------........ 29 ---------GTTDGH...GHGTHCAGTIG......SKTYGVA---------------........ 30 ---------QNRDGH...GHGTHCAGTIG......SRSYGVA---------------........ 31 ---------QNTDGH...GHGTHCAGTIG......SKTYGVA---------------........ 32 ---------QNTDGN...GHGTHCAGTIG......SKTYGVA---------------........ 33 -----------SDRN...GHGTHVAGTIG......SKKYGVA---------------........ 34 --------GQDTDGN...GHGTHVAGTVG......GTTYGVA---------------........ 35 ---------------...-----------......----------------------........ 36 ---------------...-----------......----------------------........ 37 ---FVDNDNDATDCN...GHGTHVAGTIG......GGEYGVA---------------........ 38 ---------QHVDSV...GHGTHVAGTIG......GETYGVS---------------........ 39 -------GGSHVDSI...GHGTHVAGTIG......GKTTGVA---------------........ 40 -------GGSHVDSI...GHGTHVAGTIG......GKTYGVA---------------........ 41 -------GGSHVDSI...GHGTHVAGTIG......GKTYGVA---------------........ 42 ----------NADLL...GHGTHVAGTVG......GKTYGVD---------------........ 43 ---------SNVDDN...GHGTHVAGTIG......SRTYGVA---------------........ 44 --------SNYQDRN...GHGTHVTGTVAai....DNDIGVI---------------........ 45 -----QPGDERTDHE...GHGTGMAALIAgtgkh.GSKSGAY---------------........ 46 -----------RSWA...RHGTAMAGIIAghghgsGDAEGVM---------------........ 47 ------------GGV...GHGTAVAGIAT......----------------------........ 48 --------EEVADRH...GHGTHVTSTVG......GSGAASD--------------G........ 49 --FVDNDYDPKETPT...GDPRGEATDHG......THVAGTVAANGTIK--------........ 50 --GECGIFSAARDSS...WHGTHVAGTIAeat...GNAIGGA---------------........ 51 ---------PAASSS...WHGTHVAGTVAavt...NNTTGVA---------------........ 52 CGGYPDPRREKKFST...WHGSHVAGTIAavt...NNGVGVA---------------........ 53 CGGYPDPRREKRFST...WHGSHVAGTIAavt...NNGVGVA---------------........ 54 -----------HDTT...DHGTHTAGLLV......GSKVGVA---------------........ 55 ---------------...-HGTHVAGIAE......ANMPGWK---------------........ 56 ----TGSINDIDDKK...GHGTAVAGQIAan....----------GQIF--------........ 57 -------DNQVDENI...EHGTAVTSTIAaa....RDGRGVV---------------........ 58 -GATTPINNSCTDRN...GHGTHVAGTALadgg..SDQAGIY---------------........ 59 -GATTPINNSCTDRN...GHGTHVAGTALadgg..SDQAGIY---------------........ 60 -----FTDNSCTDRQ...GHGTHVAGSALang...GTGSGVY---------------........ 61 --GTTYTNNSCTDRQ...GHGTHVAGSALadg...GTGNGVY---------------........ 62 ------------NDQ...IVDNGCGEMHG......QHVAGIAGANGQVK--------........ 63 ------DPTPTDPDT...GHGTSVSGIIAav....DNAIGTK---------------........ 64 ------------NND...SHGTHVTGTMGaa....RDGVGMH---------------........ 65 ------------NND...SHGTHVTGTMGaa....RDGVGMH---------------........ 66 ------------FDD...YHGTRCAGEIAavk...NDVCGI----------------........ 67 ------------KDD...YHGTRCAGEIAafr...NDICGV----------------........ 68 -----------TWFN...SHGTRCAGEVSa.....AKDNGVC---------------........ 69 -----------TWFN...SHGTRCAGEVSa.....AKDNGVC---------------........ 70 -----------TWFN...SHGTRCAGEVSa.....AKDNGVC---------------........ 71 -----------TWFN...SHGTRCAGEVSa.....AKDNGVC---------------........ 72 ------------FNF...TLAYERGYTGG......GSNIAIEGVPESFVNVSDIYSF........ 50 60 70 80 90 100 | | | | | | 1 TSANGLAS..VNTQT......IQTGSSNGD.YSDDQQG..QGEWDLDSQSIVGSAGGAV..QQLL 2 TSANGLAS..VNTQT......IQTGSSNGD.YSDDQQG..QGEWDLDSQSIVGSAGGAV..QQLL 3 MSAGANIS..TW---......--VYSSPGR.HE-----..--------------GQEPF..LQWL 4 MSAGANIS..TW---......--VYSSPGR.HE-----..--------------GQEPF..LQWL 5 MSAGANIS..TW---......--VYSSPGR.HE-----..--------------SQEPF..LQWL 6 MSAGANIS..TW---......--VYSSPGR.HE-----..--------------AQEPF..LQWL 7 MSAGANIS..TW---......--VYSSPGR.HE-----..--------------AQEPF..LQWL 8 SGDDGAPS..FG-AA......SGNCPIDGT.KQYCPLG..GCNHKSSQCPMITIMESNG..TQCF 9 SRANGLPA..ANFQK......VDQNGGTNY.PKDDPDDasGDGWGVETALDLQIAHAVApaAKLI 10 TARGIAPR..ARVAV......YKVTWPEGR.YT-----..-------------------..---- 11 TSGAGLAT..VNSTI......TKVGS--GT.FANDPDS..NGEWSLDSQDIVGIAGGVK..QLIF 12 TSANGLAS..VNTQT......IQTGSSNGD.YSDDQQG..QGEWDLDSQSIVGSAGGAV..QQLL 13 --------..-----......---------.-------..-------------------..---- 14 ATSFSVPI..TPLTD......NHIIGSNDP.TS----P..QIEATLDIQYILG------..VLLV 15 ---GVAPQ..TSIYA......VRVLDNQGS.GT-----..-------------------..---- 16 ---GVAPQ..TSIYA......VRVLDNQGS.GT-----..-------------------..---- 17 ---GTAPK..ASILA......VRVLDNSGS.GT-----..-------------------..---- 18 ---GTAPK..ASILA......VRVLDNSGS.GT-----..-------------------..---- 19 ---GMAPD..TKILA......VRVLDANGS.GS-----..-------------------..---- 20 ---GMAPN..TRILA......VRALDRNGS.GT-----..-------------------..---- 21 ---GMAPN..TRILA......VRALDRNGS.GT-----..-------------------..---- 22 ---GVMPNqnANIHV......INVFNEAGW.GY-----..-------------------..---- 23 ---GLLPNqnVNLHI......VKVFNESGW.GY-----..-------------------..---- 24 GVGGVASG..VNLYM......ARVLGDDGS.GS-----..-------------------..---- 25 ------KK..ANVYA......VKVLRSNGS.GT-----..----MADVVKGVEFAATSH..VEQV 26 ------KK..ANVYA......VKVLRSNGS.GT-----..----MADVVKGVEFAATSH..VEQV 27 ------KK..VSIFG......VKVLDDNGS.GS-----..-------------------..---- 28 ------KK..VSIFG......VKVLDDNGS.GS-----..-------------------..---- 29 ------KK..ASILG......VKVLEDSGS.GS-----..-------------------..---- 30 ------KN..AKLFA......VKVLDDQGS.GS-----..-------------------..---- 31 ------KK..AKLYG......VKVLDNQGS.GS-----..-------------------..---- 32 ------KK..TKIYG......VKVLDNSGS.GS-----..-------------------..---- 33 ------KK..TKILG......IKVLSDQGS.GD-----..-------------------..---- 34 ------KK..TSLFA......VKVLDANGQ.GS-----..-------------------..---- 35 --------..-----......---------.-------..-------------------..---- 36 --------..-----......---------.-------..-------------------..---- 37 ------KN..VNIVG......VRVLGCNGS.GS-----..-------------------..---- 38 ------KK..ANLLS......VKVFQGESS.STSIILD..GFNWAANDIVSKGR-----..---- 39 ------KK..TNLLS......VKVFQGESS.STSIILD..GFNWAVNDIVSKGRTKKA-..---- 40 ------KK..TNLLS......VKVFQGESS.STSIILD..GFNWAVNDIVSKGRTKKA-..---- 41 ------KK..TNLLS......VKVFQGESS.STSIILD..GFNWAVNDIVSKGRTKKA-..---- 42 ------AN..TKLVA......VKVFAGRSA.ALSVINQ..GFTWALNDYISKR------..---- 43 ------KR..VTIFG......VKVLPARGT.SP-----..-------------------..---- 44 ---GVAHS..VEIYA......VKALGNGGY.GS-----..----WSDLIIAIDLAVKGP..DGVI 45 ---GLAPG..VEILP......IRMPEKIEG.-------..-------------------..---- 46 ---GIAPE..AKILP......VRVILEDGD.PS-----..-------------------..---- 47 ---QVAPM..VQIMP......VRALGTDGS.GD-----..-------------------..---- 48 KEKGVAPG..ATLAV......GKVLDDEGF.GS-----..-------------------..---- 49 ---GVAPD..ATLLA......YRVLGPGGS.GT-----..-------------------..---- 50 ---GVAYK..AKVLP......VRVLGHCGG.SFSDITD..AIVWASGGHVEGVPDN---..---- 51 ---GTAYG..AKVVP......VRVLGKCGG.SLSDIAD..AIVWASGGTVSGIPA----..---- 52 ---GVAYG..AKVIP......VRVLGKCGG.YDSDITD..GMYWSAGGHIDGVPDN---..---- 53 ---GVAYG..AKVIP......VRVLGKCGG.YDSDITD..GMYWSAGGHIDGVPDN---..---- 54 ------PG..AKVIS......ALVLPNNEG.TF-----..-------------------..---- 55 -MQGAAPG..AKIVS......AKACVYAGG.CT-----..-------------------..---- 56 ---GVSPG..TNLLV......YRVFGKSKS.KE-----..-------------------..---- 57 ---GVAPD..AKYLT......AAMFQPGSV.GS-----..-------------------..---- 58 ---GVAPD..ADLWA......YKVLLDSGSgYSDDIAA..AIRHAADQATATGT-----..---- 59 ---GVAPD..ADLWA......YKVLLDSGSgYSDDIAA..AIRHAADQATATGT-----..---- 60 ---GVAPE..ADLWA......YKVLGDDGSgYADDIAE..AIRHAGDQATALN------..---- 61 ---GVAPD..ADLWA......YKVLGDDGSgYADDIAA..AIRHAGDQATAL-------..---- 62 ---GVAPD..AQLLA......MKVFSNNAK.NSGAYDD..DIISAIEDSVKLG------..---- 63 ---GIAPR..AQLQG......FNLLDDNSQ.QL-----..------------------Q..KDWL 64 ---GVAYN..AQIYV......GNTNANDSF.LFGP---..-------------------..---- 65 ---GVAYN..AQLYV......GNTNANDSF.LFG----..-------------------..---- 66 ---GVAWK..SQVSG......IRILSGPIT.SS-DEAE..AMVYGLD------------..---- 67 ---GVAYN..SKVSG......IRILSGQIT.AE-----..-------------------..---- 68 -GVGVAYG..SKVAG......LRMLDQPFM.TD-----..-------------------..---- 69 -GVGVAFG..SKVAG......LRMLDQPFM.TD-----..-------------------..---- 70 -GVGVAFG..SKVAG......LRMLDQPFM.TD-----..-------------------..---- 71 -GVGVAFG..SKVAG......LRMLDQPFM.TD-----..-------------------..---- 72 WQLYGIPR..TGHLNviyfgnVTTGGQSGE.NELDAEW..SGAFAPAANVTIVFSNGYV..---- 110 120 130 140 | | | | 1 FYMA.....DQSASGNTGLTQAFNQAVSDN........VAKVINVSLGW........CEADANAD 2 FYMA.....DQSASGNTGLTQAFNQAVSDN........VAKVINVSLGW........CEADANAD 3 MLLS.....NESALPH--------------........---VHTVSYGD........DEDSL-SS 4 MLLS.....NESALPH--------------........---VHTVSYGD........DEDSL-SS 5 LLLS.....NESALPH--------------........---VHTVSYGD........DEDSL-SS 6 LLLS.....NESSLPH--------------........---VHTVSYGD........DEDSL-SS 7 LLLS.....NESSLPH--------------........---VHTVSYGD........DEDSL-SS 8 FPMGsesntCQSMLQNQNIVNGINEFVSSN........SKCQVAL----........-EQDTQQN 9 LCTA.....KSASDTNLN---ACIKTLTNL........HVNHISMSYGG........SEGDT--- 10 ----.....--------SDVLAGIDQAIAD........GVDVISISLGY........DGVPLYED 11 YTSAngds.SSSGITDAGITASYNRAVTDN........IAKLINVSLGE........DETAAQQS 12 FYMA.....DQSASGNTGLTQAFNQAVSDN........VAKVINVSLGW........CEADANAD 13 ----.....---------------------........-----------........----YLGS 14 QLDG.....SGLKVIVYRLYGFHHLFATKD........VPLVNSISYGW........NEEDQCEN 15 ----.....-------LDAVAQGIREAADS........GAKVISLSLGA........PNGGT--- 16 ----.....-------LDAVAQGIREAADS........GAKVISLSLGA........PNGGT--- 17 ----.....-------WTAVANGITYAADQ........GAKVISLSLGG........TVGNS--- 18 ----.....-------WTAVANGITYAADQ........GAKVISLSLGG........TVGNS--- 19 ----.....-------LDSIASGIRYAADQ........GAKVLNLSLGC........ECNST--- 20 ----.....-------LSDIADAIIYAADS........GAEVINLSLGC........DCHTT--- 21 ----.....-------LSDIADAIIYAADS........GAEVINLSLGC........DCHTT--- 22 ----.....------SSSLVAAIDTCVTSG........GANVVTMSLGG........SGSTT--- 23 ----.....-------SSTLVRAIQTCADN........GAKIVNMSLGG........SQSSR--- 24 ----.....-------SSGIINGVNWCAAQlksqggteSKVVISLSLGG........GRASQ--- 25 LRAK.....DGKRKGFKGS-----------........---VANMSLGG........-------- 26 LRAK.....DGKRKGFKGS-----------........---VANMSLGG........-------- 27 ----.....-------LSNVIAGMDFVASDyrsrncp.RGVVASMSLGG........-------- 28 ----.....-------LSNVIAGMDFVASDyrsrncp.RGVVASMSLGG........-------- 29 ----.....-------LSGVIAGMDFVATDrksrpcs.KGTVASMSLGG........-------- 30 ----.....-------YSGIISGMDFVAQDsksrncp.NGHIASMSLGG........-------- 31 ----.....-------YSGIISGMDYVAQDsktrgcp.NGAIASMSLGG........-------- 32 ----.....-------YSGIISGMDFAVQDsksrscp.KGVVANMSLGG........-------- 33 ----.....-------YSGILAGMDFAIQDsrtrgcp.KGVVANMSLGG........-------- 34 ----.....-------NSGVIAGMDFVTKDassqncp.KGVVVNMSLGG........PSSSA--- 35 ----.....------------SSINWAVGNkgs.....AAAVANMSLGG........-------- 36 ----.....---------------------........-----------........-------- 37 ----.....-------YSGVISGIDWVKNNas......GPSVANMSLGG........-------- 38 ----.....--------------------T........GKSAINMSLGG........-------- 39 ----.....---------------------........---AINMSLGG........-------- 40 ----.....---------------------........---AINMSLGG........-------- 41 ----.....---------------------........---AINMSLGG........-------- 42 ----.....---------------------dtl.....PRGVLNFSGGG........-------- 43 ----.....NSVIIKGMDFVHAMPSGVNAP........TDVVVNMSLGG........-------- 44 DADG.....DGVVAGDPD----------DD........APEVISMSLGG........SSPPP--- 45 --LD.....FTSGHNAARDFSKAIRFAADS........DAKVINISMGQ........AESGTKGG 46 ---R.....AKARKTRGNALAEGIRWAADH........GADIINLSLGD........DSASA--- 47 ----.....-------ISAVVQAIVWAVDH........GANIINLSLGS........NEASE--- 48 ----.....-------ESEIIAGMEWAARDv.......DADIVSMSLGS........TEPSDGTD 49 ----.....-------TENVIAGVERAVQD........GADVMNLSLGNsl......NNPDW--- 50 ----.....---------------------re......PAEIINISLGG........FGPCD--- 51 ----.....------------------NAN........PAEVINMSLGG........GGSCS--- 52 ----.....-------------------QN........PAQVVNMSLGG........GG------ 53 ----.....-------------------QN........PAQVINMSLGG........DGDCS--- 54 ----.....AQVIAGMQYVLDPDNNADTDD........GADVVNMSLGI........PGTWN--- 55 ----.....------SVALTEGMIELVGNQ........RVDIVNMSIGG........--LPALND 56 ----.....--------CWILKAIIDATNN........GANVINLSLGQyiki....PNGDIWES 57 ----.....--------AGVAKAILWMVDN........GAKVLNNSWGG........AGFDP--- 58 ----.....---------------------........-KTIISMSLGS........SANNS--- 59 ----.....---------------------........-KTIISMSLGS........SANNS--- 60 ----.....---------------------........TKVVINMSLGS........SGESS--- 61 ----.....--------------------N........TKVVINMSLGS........SGESS--- 62 ----.....---------------------........-ADVINMSLGS........VSSDV--- 63 YALG.....DSNASRDNRVFNHSYRMSVVD........PRSANSL----........DQSQL--- 64 ----.....----TPDPQYFKAVYSALVDS........GVRAINNSWGSqpk12lgdLHAAYAQH 65 ----.....---PTPDPKYFKAVYTALVDS........GVRAINNSWGSqpp12lagLHAAYAQH 66 ----.....---------------------........TNDIYSCSWGPt.......DNGKVLSE 67 ----.....DEAASLIYGL----------D........VNDIYSCSWGP........SDDGKTMQ 68 ----.....---------LIEANAMGHMPN........VIDIYSASWGP........TDDGKTVD 69 ----.....---------LIERNAMGHMPN........VIDIYSASWGP........TDDGKTVD 70 ----.....---------LIEANAMGHMPN........VIDIYSASWGP........TDDGKTVD 71 ----.....---------LIEANAMGHMPN........VIDIYSASWGP........TDDGKTVD 72 --GG.....PQLVGNLLNYYYEYYYMVNYL........NPNVISISVTV........PESFLAAY 150 160 170 180 | | | | 1 G........TLQAEDRIFATAAAQGQTFSVSSGDEGVYECNNRGY........PD.GST.....Y 2 G........TLQAEDRIFATAAAQGQTFSVSSGDEGVYECNNRGY........PD.GST.....Y 3 A........YIQRVNTELMKAAARGLTLLFASGDSGAGCWSVSGR........H-.--Q.....F 4 A........YIQRVNTELMKAAARGLTLLFASGDSGAGCWSVSGR........H-.--Q.....F 5 A........YIQRVNTEFMKAAARGLTLLFASGDSGAGCWSVSRR........H-.--Q.....F 6 I........YIQRVNTEFMKAAARGLTLLFASGDTGAGCWSVSGR........H-.--K.....F 7 I........YIQRVNTEFMKAAARGLTLLFASGDTGAGCWSVSGR........H-.--K.....F 8 Y........HIYSSCTCDK-------LKPYSDSDAGFKIVGYSYD........QDaGTL.....F 9 -........---SSDSYFQQAQEAGISLFASAGDSGAE-------........--.---.....- 10 P........IAIASFAAM----EKGVVVSTSAGNAGPFFGNMH--........--.---.....- 11 G........TQAADDAIFQQAVAQGQTFSIASGDAGVYQWSTDPTsgs15tvkID.LTH.....Y 12 G........TLQAEDRIFATAAAQGQTFSVSSGDEGVYECNNRGY........PD.GST.....Y 13 G........YLRRSDVEFQKLALMGITIIIADGDNGAGDLGAPPMlt......PD.CSTr....L 14 Gigg15saqYVARVNTEFQKIGLRGITLFAASGDSGAN-GRTDPD........CS.ESN.....L 15 -........---ALQQAVQYAWNKGSVIVAAAGNAGNT-------........--.---.....- 16 -........---ALQQAVQYAWNKGSVIVAAAGNAGNT-------........--.---.....- 17 -........---GLQQAVNYAWNKGSVVVAAAGNAGNT-------........--.---.....- 18 -........---GLQQAVNYAWNKGSVVVAAAGNAGNT-------........--.---.....- 19 -........---TLKSAVDYAWNKGAVVVAAAGNDNVS-------........--.---.....- 20 -........---TLENAVNYAWNKGSVVVAAAGNNGSS-------........--.---.....- 21 -........---TLENAVNYAWNKGSVVVAAAGNNGSS-------........--.---.....- 22 -........---TERNALNTHYNGGVLLIAAAGNAGDS-------........--.---.....- 23 -........---TEQNAMDALYERGVLMIAAAGNSGNT-------........--.---.....- 24 -........---TEQRAYTSVYNKGVLTVAATGNDGAA-------........--.---.....- 25 G........KTQALDAAVNAAVKAGIHFAVAAGNDNADACNYS--........--.---.....- 26 G........KTQALDAAVNAAVKAGIHFAVAAGNDNADACNYS--........--.---.....- 27 G........YSATVNQAAARLQSSGVFVAVAAGNDNRDAANTS--........--.---.....- 28 G........YSATVNQAAARLQSSGVFVAVAAGNDNRDAANTS--........--.---.....- 29 G........YSATVNQAAARLQASGVFVAVAAGNDNRDAAQTS--........--.---.....- 30 G........YSASVNQGAAALVRSGVFLAVAAGNDNRDAQNTS--........--.---.....- 31 G........YSASVNQGAAALVNSGVFLAVAAGNDNRDAQNTS--........--.---.....- 32 G........KAQSVNDGAAAMIRAGVFLAVAAGNDNANAANYS--........--.---.....- 33 G........YSAAINQAAAKMIQSNVFLAVAAGNDAKDASQTS--........--.---.....- 34 -........----VNRAAAEITSAGLFLAVAAGNEATDASSSS--........--.---.....- 35 G........ASQAVDDAVNNAASKNLVMAVAAGNENQNACNVS--........--.---.....- 36 -........------------------------------------........--.---.....- 37 G........VSQAVDDAVNNAVASGVSFVVAAGNDNSNACNYS--........--.---.....- 38 G........YSYAFNQAVEDAYDEGVLSVVAAGNDNIDASDSS--........--.---.....- 39 G........YSYAFNNAVENAFDEGVLSVVAAGNENSDASNTS--........--.---.....- 40 G........YSYAFNNAVENAFDEGVLSVVAAGNENSDASNTS--........--.---.....- 41 G........YSYAFNNAVENAFDEGVLSVVAAGNENSDASNTS--........--.---.....- 42 P........KSASQDALWSRATQEGLLVAIAAGNDAVDACNDS--........--.---.....- 43 G........YSKATNQAAARLVRAKYFVAVASGNNNRDARNYS--........--.---.....- 44 -........---ELHDVIKAAYNLGITIVAAAGNDGAD-------........--.---.....- 45 V........DTSELDAAVKYAVDKGKLIFAAAGNEGDG-------........--.--A.....N 46 H........PEPGEDEAIQYALKKGVVVVASAGNGGEL-------........--.--G.....D 47 -........---ALQSAVRYADEKGVAVVAAAGNAGNN-------........--.ELT.....Y 48 P........MAEAVNTLSR---ETGALFVIAAGNTGAP-------........--.---.....S 49 -........---ATSTALDWAMSEGVVAVTSNGNSGPN-------........--.--G.....W 50 -........--SAMQAAINGAVSRGTTVVVAAGNGGSD-------........--.---.....V 51 -........--TTMQNAINGAVSRGTTVVVAAGNDASN-------........--.---.....V 52 G........CSQNSQRMIDKTTNLGALIVIAAGNENQD-------........--.---.....A 53 -........--QSSQRIIDKTTNLGALIVIAAGNENQD-------........--.---.....A 54 -........---EFIVPVNNMLKAGVVPVFAIGNFGPA-------........--.--A.....G 55 G........NNTRSALYNRIIDEYGVQIFISAANSGAG-------........--.--T.....N 56 A........EALRYKFAIDYATRHNVIVVAATGNDGLSDDNGEVKtyy11gqdMS.QND.....T 57 -........---LIKAAMDYALERNVTVVVSAGNESRE-------........--.---.....- 58 -........---LISSAVNYAYSKGVLIVAAAGNSGYA-------........--.--Q.....G 59 -........---LISSAVNYAYSKGVLIVAAAGNSGYS-------........--.--Q.....G 60 -........---LITNAVDYAYDKGVLIIAAAGNSGPK-------........--.--P.....G 61 -........---LITNAVNYSYNKGVLIIAAAGNSGPY-------........--.--Q.....G 62 G........PSDPQQQAVAKASEAGVINVISAGNSGVAGSTADGN........PV.NNTgtselS 63 -........---DRLFEQQTLKAQGAAYIKAAGN-GFNKIAAGGYvln10gpkLP.FEN.....S 64 Y........NQNTWLDAAADVAKAGVINVFSAGNSGYANASVR--........--.-SA.....L 65 Y........NQGTWLDAAADVAKAGVINVFSAGNSGYANASVR--........--.-SA.....L 66 Pdviv....KKAMIKGIQEGRDKKGAIYVFASGNGGRF-------........--.GDS.....C 67 Apdtlv...KKAIIKGVTEGRDAKGALYVFASGNGGMF-------........--.GDS.....C 68 Gprnlt...MRAIVNGVNNGRNGLGNVYVWASGDGGPN-------........--.-DD.....C 69 Gprnlt...MRAIVNGVNNGRNGLGNVYVWASGDGGPN-------........--.-DD.....C 70 Gprnlt...MRAIVNGVNNGRNGLGNVYVWASGDGGPN-------........--.-DD.....C 71 Gprnlt...MRAIVNGVNNGRNGLGNVYVWASGDGGPN-------........--.-DD.....C 72 Ypa......MLDMIHNIMLQAAAQGISVLAASGDWGYESDHPPPN........FHiGTY.....N 190 200 210 220 230 | | | | | 1 SVSWPASSPNVIAVGGTTLYTTSA.GAY.....SNE........TVWNEGL........DSNGKL 2 SVSWPASSPNVIAVGGTTLYTTSA.GAY.....SNE........TVWNEGL........DSNGKL 3 RPTFPASSPYVTTVGGTSFQEPF-.---.....---........-----LI........TNEIVD 4 RPTFPASSPYVTTVGGTSFQEPF-.---.....---........-----LI........TNEIVD 5 RPSFPASSPYVTTVGGTSFQNPFR.---.....---........------V........TTEIVD 6 RPSFPASSPYVTTVGGTSFKNPF-.---.....---........-----LI........TDEVVD 7 RPSFPASSPYVTTVGGTSFKNPF-.---.....---........-----LI........TDEVVD 8 QPDYPASSPFITSVGATQITDVTK.PEI.....VCS........-------........VATGAI 9 -AEYPAASQYVVAVGGTTLHTNSD.GSF.....NSE........-------........---TAW 10 -----NGIPWVLTVAAGNIDRSFA.GTL.....TLGndq64rsnVAGAILI........SNHTKL 11 SVSEPASSPYVIQVGGTTLSTS-G.TTW.....SGE........TVWNEGLsaiapsqgDNNQRL 12 SVSWPASSPNVIAVGGTTLYTTSA.GAY.....SNE........TVWNEGL........DSNGKL 13 NPDWP--SQRLTSRLGLYIHHTLA.EPI.....CYT........DIDCRLDnpe9vgvsLDNGLF 14 NPAYPAASPYITSVGATQISQSSG.VAK.....LPNppp27pilHQVEDFL........WLPQHC 15 KANYPAYYSEVIAVASTDQSDRKS.SFS.....TYG........-------........------ 16 KANYPAYYSEVIAVASTDQSDRKS.SFS.....TYG........-------........------ 17 APNYPAYYSNAIAVASTDQNDNKS.SFS.....TYG........-------........------ 18 APNYPAYYSNAIAVASTDQNDNKS.SFS.....TYG........-------........------ 19 RTFQPASYPNAIAVGAIDSNDRKA.SFS.....NYG........-------........------ 20 TTFEPASYENVIAVGAVDQYDRLA.SFS.....NYG........-------........------ 21 TTFEPASYENVIAVGAVDQYDRLA.SFS.....NYG........-------........------ 22 TYTYPPSYDIVMSVAAVDSNLDHA.AFS.....QYTdq108ktaGAKGIIV........YSNTAL 23 AHSYPASYDSVMSVAAVDSNYDHA.SFS.....QATnq109nnaGALAAMV........YSNQQ- 24 -VSYPAAYTNVVGVGAIDSAEARA.SFS.....NFG........-------........---SQV 25 ----PAAAELPVTVGASAFDDSRA.YFS.....NYG........-------........------ 26 ----PAAAELPVTVGASAFDDSRA.YFS.....NYG........-------........------ 27 ----PASEPSVCTVGATDSSDRRS.SFS.....NYG........-------........------ 28 ----PASEPSVCTVGATDSSDRRS.SFS.....NYG........-------........------ 29 ----PASEPSVCTVGATDSSDRRS.TFS.....NFG........-------........------ 30 ----PASEPTACTVGATASDDSRS.TFS.....NYG........-------........------ 31 ----PASEPSACTVGASAENDSRS.SFS.....NYG........-------........------ 32 ----PASEPTVCTVGATTSSDARS.SFS.....NYG........-------........------ 33 ----PASEPSVCTVGATDSSDRLS.SFS.....NYG........-------........------ 34 ----PASEESACTVGATDKTDTLA.EYS.....NFG........-------........------ 35 ----PARAVNAITVGATTKTDSRDtGYS.....NYG........-------........------ 36 -----GNGYTAITRGLTTNTDARW.SFS.....NYG........-------........------ 37 ----PARAANAITVGSTTSSDARS.SFS.....NYG........-------........------ 38 ----PASAPNALTVAASTKSNTRA.SFS.....NYG........-------........------ 39 ----PASAPNALTVAAINKSNARA.SFS.....NYG........-------........------ 40 ----PASAPNALTVAAINKSNARA.SFS.....NYG........-------........------ 41 ----PASAPNALTVAAINKSNARA.SFS.....NYG........-------........------ 42 PGNIGGSTSGIITVGSIDSSDKIS.VWSggqgsNYG........-------........------ 43 ----PASEPSVCTVGGTDKFDSV-.YMS.....NWG........-------........---PAV 44 SPSYPAAYPEVIAVGAIDENGNVP.SWS.....NRN........-------........------ 45 RPRFPASTPGVVAVGSINEKVKRS.SFS.....EWG........-------........------ 46 HISYPAAYPGVIAATAVDRYGTRA.AFS.....TRR........-------........------ 47 PAAYARTSAGLLSVGSVSDSDVKS.GFS.....NYA........-------........------ 48 SIGSPGAADAALTVGAVDSADQAA.WFT.....SAG........-------........------ 49 TVGSPGTSREAISVGATQLPLNE-.YAV.....TFGsy117tfkLTVSKAL........GEQVAD 50 SSAVPANCANVVSVAATRLTGGLA.YYS.....NFG........-------........-SLIDL 51 SGSLPANCANVIAVAATTSAGAKA.SYS.....NFG........-------........------ 52 SRTWPSSCNNVLSVGATTPKGKRA.PFS.....NYG........-------........------ 53 SRTWPSSCNNVLSVGATTPKGKRA.PFS.....NYG........-------........------ 54 STGSPGNLPQAIGVGAVDSNGQVA.SFS.....SRG........-------........------ 55 TIADPSVATDAVSVAAGASKETW-.-LA.....NYG........AKAKEEYwaqn....YSSRGP 56 VEDYPSVLPNAIAVGSSDNNNQRS.SFS.....NYY........-----NQ........YQDNFI 57 YYQRPALFAGVIPSAALAVNNTKA.SFS.....SFG........-------........---RHI 58 TIGYPGALPNAIAVAALENVQQNG.TYR.....VAD........-------........YSSRGY 59 TIGYPGALPNAIAVAALENVQQNG.TYR.....VAD........-------........YSSRGY 60 SIGYPGALVNAVAVAALENTIQNG.TYR.....VAD........-------........FSSRGH 61 SIGYPGALVNAVAVAALENKVENG.TYR.....VAD........-------........FSSRGY 62 TVGTPGVTPDALTVASAENSKVTT.DTV.....KDElg116kfwLKQQKKV........RASRLK 63 NLDPSNSNFWNLVVSALNADGVRS.SYS.....SVG........-------........-SNIFL 64 PYFQPGLEGHWLAVSGLDKANNQK.---.....---........-------........------ 65 PYFQPELEGHWLAVSGLDKTNNQK.---.....---........-------........------ 66 NFDGYTNSIYSITVGAIDYKGLHP.QYS.....EAC........-------........------ 67 NFDGYTNSIFSITVGAIDWKGLHP.PYS.....ESC........-------........------ 68 NCDGYAASMWTISINSARNDGQTA.GYD.....ESC........-------........-SSTLA 69 NCDGYAASMWTVSINSATNDGQTA.GYD.....ESC........-------........------ 70 NCDGYAASMWTVSINSATNDGQTA.GYD.....ESC........-------........------ 71 NCDGYAASMWTVSINSATNDGQTA.GYD.....ESC........-------........------ 72 TIWYPESDPYVTSVGGIFLNASSN.GSI.....VEI........-------........--SGWD 240 250 260 270 | | | | 1 WATGGGYSVYESKPSWQSVVSGT.....PG........RRLLPDISFDAAQG.......TGALIY 2 WATGGGYSVYESKPSWQSVVSGT.....PG........RRLLPDISFDAAQG.......TGALIY 3 YISGGGFSNVFPRPSYQEEAVTK.....FLsss15nasGRAYPDVAALSDGY.......WVVSNR 4 YISGGGFSNVFPRPSYQEEAVTK.....FLsss15nasGRAYPDVAALSDGY.......WVVSNR 5 YISGGGFSNVFPQPSYQEEAVVQ.....FLsss15nasGRAYPDVAALSDGY.......WVVSNS 6 YISGGGFSNVFPRPPYQEEAVAQ.....FLkss15nasGRAYPDVAALSDGY.......WVVSNM 7 YISGGGFSNVFPRPPYQEEAVAQ.....FLkss15nasGRAYPDVAALSDGY.......WVVSNM 8 ITGGGGVAITQAQPSYQADAVAT.....YIks......GTLPPSYSYMPPID.......SIQILL 9 SGSGGGCSKYTKVIPEQNADPGYaslgcKG........KKALPDLAALADPN.......SGITII 10 FELGGGVSCPCLVISPKDAAALI.....KYakt39sypGILKPDVM--APGS.......LVLASW 11 WATGGGVSLYEAAPSWQSSVSSS.....T-........KRVGPDLAFDAASS.......SGALIV 12 WATGGGYSVYESKPSWQSVVSGT.....PG........RRLLPDISFDAAQG.......TGALIY 13 WTTGGGFADYPPRPQYQEAIISQ.....YLqsn15nsgGRAYPDIS---TVG.......HNLMTV 14 LSEGSHCSILQVRCNLASKLLLQ.....CC........CKRISDVS---ALG.......SAILIE 15 -----------------------.....--........----SWVDVAAPGS.......NIYSTY 16 -----------------------.....--........----SWVDVAAPGS.......NIYSTY 17 -----------------------.....--........----SWVDVAAPGS.......SIYSTY 18 -----------------------.....--........----SVVDVAAPGS.......WIYSTY 19 -----------------------.....--........----TWVDVTAPGV.......NIASTV 20 -----------------------.....--........----TWVDVVAPGV.......DIVSTI 21 -----------------------.....--........----TWVDVVAPGV.......DIVSTI 22 PRLQNPFVVDAD--SEILIPSMS.....VD........RTTGLALKAKLGQS.......TTVSNQ 23 -RPGLQNPFVLDQFNTYPLLSVS.....VN........RNVGQELAALVGQD.......ITVSTR 24 DLVGPGVSVLSSIPLGQGTRASAs....GG........GVTFTDVS--AADK.......SGKATF 25 -----------------------.....--........----KCTDIFAPGL.......NILSTW 26 -----------------------.....--........----KCTDIFAPGL.......NILSTW 27 -----------------------.....--........----RALDIFAPGT.......DITSTW 28 -----------------------.....--........----RALDIFAPGT.......DITSTW 29 -----------------------.....--........----KAVDIFAPGT.......GILSTW 30 -----------------------.....--........----RIVDIFAPGT.......GILSTW 31 -----------------------.....--........----RVVDIFAPGS.......NVLSTW 32 -----------------------.....--........----NLVDIFAPGS.......NILSTW 33 -----------------------.....--........----AAVDILAPGS.......DILSTW 34 -----------------------.....--........----SVVDLLAPGT.......DIKSTW 35 -----------------------.....--........----SCLDIFAPGT.......NITSTW 36 -----------------------.....--........----SCLDIFAPGS.......SITSAW 37 -----------------------.....--........----NCLDIYAPGS.......SITSAW 38 -----------------------.....--........----SVVDIFAPGQ.......DILSAW 39 -----------------------.....--........----SVVDIFAPGQ.......DILSAW 40 -----------------------.....--........----SVVDIFAPGQ.......DILSAW 41 -----------------------.....--........----SVVDIFAPGQ.......DILSAW 42 -----------------------.....--........----TCVDVFAPGS.......DIISAS 43 DINGPGVDVLSTLPNRRTVCFF-.....--........----FLIKIPAWRA.......EELTCM 44 -----------------------.....--........----PEVA--APGV.......NILSTY 45 -----------------------.....--........----PEIDVTAPGE.......DLVHAC 46 -----------------------.....--........--WYATVS--APGV.......DVIIAD 47 -----------------------.....--........----ASLEVLAPGE.......RIATYA 48 --------------------PRY.....GD........NALKPDLS--APGV.......GILAAR 49 FSSRGPVMDTWM-----------.....--........--IKPDIS--APGV.......NIVSTI 50 AAPGGGARDLETDTLYDGPIG--.....--........----SWIW--QTGY.......TGATTP 51 -----------------------.....--........----TGIDVSAPGS.......SILSTL 52 -----------------------.....--........----ARVHLAAPGT.......NILSTI 53 -----------------------.....--........----ARVHLAAPGT.......NILSTI 54 ------------PVAWQGEISGV.....F-........--TKPDIA--APGV.......NITSTV 55 REDGGFKPNIMAPGSAISAVPMF.....MD........PEDIPQVSYKLPV-.......------ 56 LAPGGGTPLLDQ--YGQEEWYNQ.....KL........----------FMKE.......QVLSTS 57 SVAAPGTDILMASPLFINDDGTR.....KL........GATPPDGS------.......------ 58 ISTAGDYVIQE------------.....--........----GDIEISAPGS.......SVYSTW 59 ISTAGDYVIQE------------.....--........----GDIEISAPGS.......SVYSTW 60 KRTAGDYVIQK------------.....--........----GDVEISAPGA.......AVYSTW 61 SWTDGDYAIQK------------.....--........----GDVEISAPGA.......AIYSTW 62 FGTALIDNSRAGKMSDFTSWGPT.....PE........LDFKPEIT--APGG.......KIYSLA 63 SATGGEYGTDTP-----------.....--........----AMVTTDLPGC.......DMGYNR 64 --------------------YNQ.....CG........IAKYWCIS--TPGA.......LINSTI 65 --------------------YNK.....CG........IAKYWCIS--TPGA.......LINSTV 66 ---------------------SA.....VM........VVTYSSGS----GE.......HIHTTD 67 ---------------------SA.....VM........VVTYSSGS----GN.......YIKTTD 68 STFSNGKSN--------------.....--........----------SRDA.......GVATTD 69 ---------------------SS.....TL........ASTFSNGKSSSRDA.......GVATTD 70 ---------------------SS.....TL........ASTFSNGKSSSRDA.......GVATTD 71 ---------------------SS.....TL........ASTFSNGKSSSRDA.......GVATTD 72 YSTGGNSVVYPAQIYEITSLIPFtp...VI........VRTYPDIAFVSAGGynipefgFGLPLV 280 290 300 310 | | | | 1 ........NYGQ........LQQIG....GTSLASPIFVGLWARLQSANS......NSLGFPAAS 2 ........NYGQ........LQQIG....GTSLASPIFVGLWARLQSANS......NSLGFPAAS 3 ........V--P........IPWVS....GTSASTPVFGGILSLINEHRIlsgr..PPLGFLNPR 4 ........V--P........IPWVS....GTSASTPVFGGILSLINEHRIlsgr..PPLGFLNPR 5 ........V--P........IPWVS....GTSASTPVFGGILSLINEHRLlsgl..PPLGFLNPR 6 ........V--P........IPWVS....GTSASTPVFGGILSLINEHRIlngr..PPLGFLNPR 7 ........V--P........IPWVS....GTSASTPVFGGILSLINEHRIlngr..PPLGFLNPR 8 llv17sntCPCA........LESVD....GTSCSSPTLAGMISLINDKLIgagk..PTLGFLNPL 9 ........FHGQe.......LEGIG....GTSLAAPLTAGRAAIRGDQVT......--------- 10 ........IPNEata14sshYNMVS....GTSMACPHASGVAALLKAAHP......---EWSPAA 11 ........VNGS........TEQVG....GTSLASPLFVGAFARIESAAN......NAIGFPASK 12 ........NYGQ........LQQIG....GTSLASPIFVGLWARLQSANS......NSLGFPAAS 13 ........ISGS........MTPVD....GTSPSATIFAGIVSLLTDARLragk..PALGFLNPL 14 ........TGGN........IQTVG....GTSASSPIFAGVVGLLNDYVNsktg..KPLGFVSPL 15 ........KGST........YQSLS....GTSMATPHVAGVAVLLANQ--......---GYSNTQ 16 ........KGST........YQSLS....GTSMATPHVAGVAALLANQ--......---GYSNTQ 17 ........PTST........YASLS....GTSMATPHVAGVAGLLASQ--......---GRSASN 18 ........PTST........YASLS....GTSMATPHVAGVAGLLASQ--......---GRSASN 19 ........PNNG........YSYMS....GTSMASPHVAGLAALLASQ--......---GKNNVQ 20 ........TGNR........YAYMS....GTSMASPHVAGLAALLASQ--......---GRNNIE 21 ........TGNR........YAYMS....GTSMASPHVAGLAALLASQ--......---GRNNIE 22 ........GNRD........YEYYN....GTSMATPHVSGVATLVWSYHP......---ECSASQ 23 ........TGED........YQYYN....GTSMATPHVSGVAGLVWSYHP......---QCSAKQ 24 sg103vavTGAD........YDFFD....GTSMATPHVSAAAAVVWAAKP......---TLTNTQ 25 ........IGSPta......VNTIS....GTSMASPHICGLLAYYLSLQPagdsefSVASITPKQ 26 ........IGSPta......VNTIS....GTSMASPHICGLLAYYLSLQPagdsefSVASITPKQ 27 ........IGGR........TNTIS....GTSMATPHIAGLGAYLLALE-......---GGSAST 28 ........IGGR........TNTIS....GTSMATPHIAGLGAYLLALE-......---GGSAST 29 ........NNGG........TNTIS....GTSMATPHIAGLGAYLLALG-......---KGTAGN 30 ........INGR........TNTIS....GTSMATPHIAGLAAYFSALSG......---KTSPAA 31 ........IVGR........TNSIS....GTSMATPHIAGLAAYLSALQG......---KTTPAA 32 ........IGGT........TNTIS....GTSMATPHIVGLGAYLAGLE-......---GFPGAQ 33 ........IGGI........TKSIS....GTSMATPHIVGLGAYLSSLEGf.....PGAQALCER 34 ........NDGR........TKIIS....GTSMASPHVAGLGAYFLGLGQ......KVQGL---- 35 ........IGSTsa......TNTIS....GTSMATPHVTGAVALLIAEG-......---NTTTSA 36 ........YTSSta......TNTIS....GTSMASPHVAGAAALYLALNP......---SATPAQ 37 ........YNSDts......TNTIS....GTSMAAPHVAGAVALYLDENP......---SLSPSQ 38 ........IGSTta......TNTIS....GTSMATPHVVGLSLYLIALEG......---LSSASA 39 ........IGSTta......TNTIS....GTSMATPHIVGLSVYLMGLENl.....----SGPA- 40 ........IGSTta......TNTIS....GTSMATPHIVGLSVYLMGLENl.....----SGPA- 41 ........IGSTta......TNTIS....GTSMATPHIVGLSVYLMGLEN......---LSGP-- 42 ........YQSDsg......TLVYS....GTSMACPHVAGLASYYLSIND......--EVLTPAQ 43 ........MQGR........LT---....GTSMATPHIAGLGAYLAAKNG......---RRAGPG 44 ........PDDT........YEELS....GTSMATPHVSGTVALIQAARL......-AAGLPLLP 45 ........IGGTg.......VCRTS....GTSDATAIASASAALVWSKHP......---TWTNNQ 46 ........PDHR........YYEGW....GTSAASAFVSGAAALVKAAHP......---DLTPAQ 47 ........PNNK........LALWT....GTSMSAPVVAGLLALMQGERQ......-AAGGENAV 48 srlae...GSGD........YTSMD....GTSMATPHIAGVAALLAEEHP......---DWSGAR 49 ........PTHDpdhpyg..YGSKQ....GTSMASPHIAGAVAVIKQAKP......---KWSVEQ 50 ........TSGQ........FTYIGpgfaGTSMASPHVAGTAALVQSALIad....GKAPLTPAA 51 ........NSGTttpgsas.YASYN....GTSMASPHVAGVVALVQSVAP......--TALTPAA 52 ........DVGQagpvrss.YGMKA....GTSMAAPHVSGVAALVISAANs.....IGKTLTPSE 53 ........DVGQagpvrss.YGMKA....GTSMAAPHVSGVAALVISAANs.....IGKTLTPSE 54 ........RNGG........YQAMS....GSSQASPITAGAVAVLLSAKP......---GASVDA 55 ........---G........LSMFN....GTSMARP--------------......--------- 56 ........NNGN........YDYAD....GTSISTGKVSGELAEIISNYH......--LQGDSSK 57 ........---G........YVLMS....GTSFSGPYTAATAALILGAHP......---ELDPYQ 58 ........YNGG........YNTIS....GTSMATPHVSGLAAKIWAENP......---SLSNTQ 59 ........YNGG........YNTIS....GTSMATPHVSGLAAKIWAENP......---SLSNTQ 60 ........FDGG........YATIS....GTSMASPHAAGLAAKIWAQSP......---AASNVD 61 ........FDGG........YATIS....GTSMASPHAAGLAAKIWAQYP......---SASNVD 62 ........NDNK........YQQMS....GTSMASPFVAGSEALILQGIKk.....QGLNLSGEE 63 ........TDDPstn17cdyNGVMN....GTSSATPSTSGAMALLMSAYP......---DLSVRD 64 ........PEGG........YGVKS....GTSMSAPHATGALALVMERYP......---YLNNEQ 65 ........PGGG........YGVKS....GTSMSAPHATGALALVMERYP......---YMTNEQ 66 ........IKKKc.......SATHG....GTSAAAPLASGIYSLILSANP......-NLTWRDVQ 67 ........LDEKc.......SNTHG....GTSAAAPLAAGIYTLVLEANP......-NLTWRDVQ 68 ........LYNNc.......TASHS....GTSAAAPEAAGVFALALEANR......-NLTWRDMQ 69 ........LYNNc.......TASHS....GTSAAAPEAAGVFALALEANK......-NLTWRDMQ 70 ........LYNNc.......TASHS....GTSAAAPEAAGVFALALEANK......-NLTWRDMQ 71 ........LYNNc.......TASHS....GTSAAAPEAAGVFALALEANK......-NLTWRDMQ 72 ........FQGQ........LFVWY....GTSGAAPMTAAMVALAGTR--......--LGALNFA 320 330 340 350 360 | | | | | 1 FYSAIS...STPS........LVHDVKSGNNG.......YGGYGYNAGTGWDYPTGWGSLDIAKL 2 FYSAIS...STPS........LVHDVKSGNNG.......YGGYGYNAGTGWDYPTGWGSLDIAKL 3 LYQQHG...AGL-........--FDVTRGCHEscldee.VEGQGFCSGPGWDPVTGWGTPNFPAL 4 LYQQHG...AGL-........--FDVTRGCHEscldee.VEGQGFCSGPGWDPVTGWGTPNFPAL 5 LYQQRG...AGL-........--FDVTRGCHEsclnee.VQGQGFCSGPGWDPVTGWGTPNFPAL 6 LYQQHG...TGL-........--FDVTHGCHEsclnee.VEGQGFCSGPGWDPVTGWGTPNFPAL 7 LYQQHG...TGL-........--FDVTHGCHEsclnee.VEGQGFCSGPGWDPVTGWGTPNFPAL 8 LYQAAK...EQPN........VFNDITTGANNcnray..CCQYGYTATTGYDAASGLGSINFKNF 9 -PAYVY...TGGI........QFRDITQGSNG.......H-----SAKAGLDLVTGEG------- 10 IRSAMM...TTA-........--NPLDNTLNP.......IHENGKKFHLASPLAMGAGHIDPN-- 11 FYQAFP...TQTS........LLHDVTSGNNG.......YQSHGYTAATGFDEATGFGSFDIGKL 12 FYSAIS...STPS........LVHDVKSGNNG.......YGGYGYNAGTGWDYPTGWGSLDIAKL 13 LYQIAA...EA--........LMHSVCSG---.......------------------GRKQMQKL 14 LYKMAA...ERPA........AFFDVIKGDNI.......CTEDGCSS------------------ 15 IRQIIE...STT-........---DKISGTGT.......YWKN--------------GRVNA--- 16 IRQIIE...STT-........---DKISGTGT.......YWKN--------------GRVNA--- 17 IRAAIE...NTA-........---DKISGTGT.......YWAKG--------------------- 18 IRAAIE...NTA-........---DKISGTGT.......YWAKG--------------------- 19 IRQAIE...QTA-........---DKISGTGT.......NFKYG--------------------- 20 IRQAIE...QTA-........---DKISGTGT.......YFKYG--------------------- 21 IRQAIE...QTA-........---DKISGTGT.......YFKYG--------------------- 22 VRAALN...ATAD........DL---------.......-------SVAGRDNQTGYGMVNATTA 23 IRQALT...QTA-........-----------.......--------------------LDLDVL 24 LLNLLT...STAK........DL---------.......-------GAAGKDNDFGSGLVN---- 25 LKDTLIei.STQG........VLTDIPNDTPN.......-------------------------- 26 LKDTLIei.STQG........VLTDIPNDTPN.......-------------------------- 27 ICARIQtl.STKN........AISGVPSGTVN.......Y------------------------- 28 ICARIQtl.STKN........AISGVPSGTVN.......Y------------------------- 29 LCQTIQtl.STKN........VLTGVPSGTVN.......Y------------------------- 30 LCQKIQdt.STKN........VIRNVPAGTVN.......FL------------------------ 31 LCKKIQ...DTATkn......VLTGVPSGTVN.......YL------------------------ 32 ALCKRIqtlSTKN........VLTGIPSGTVN.......Y------------------------- 33 IRSLAI...RNT-........-----------.......-------------------------- 34 ------...----........-----------.......-------------------------- 35 VTSALL...NN--........-----------.......-------ATTGKLSSIGTGSPN---- 36 VTTAIIna.STPN........KVTGAQTGSPN.......-------------------------- 37 IDSLLS...QRSSkg......KVSNPQSGSP-.......-------------------------- 38 VVSRIK...E---........-----------.......-------------------------- 39 ------...----........-----------.......-------------------------- 40 ------...----........-----------.......-------------------------- 41 ------...----........-----------.......-------------------------- 42 VEALIT...ESN-........-----------.......-------------------------- 43 LCRTIK...----........-----------.......-------------------------- 44 PGSESD...TTPD........TVRGVLHTTAT.......D-----AGDPGYDSLYGYGIIDAYD- 45 VLRVLI...NTM-........------KGNEE.......EWTHNESFGYG--------------- 46 VKSVLE...DTA-........--RNAPAG---.......----------GRDDSRGFGFVDPA-- 47 TAHAHD...ISGI........ALNQPFTG---.......--------------GLGYGRIDAA-- 48 LKDALM...STSK........-ELDVS-----.......------------AYQLGAGRVS---- 49 IKAAIM...NTAV........TLKD-------.......-------------------------- 50 LERLLK...RSAR........AF---------.......------PVQIPLATPAGSGIVDAGA- 51 VETLLK...NTAR........ALPGACSG---.......--------------GCGAGIVNADAA 52 LSDILV...RTTS........RFNG-------.......----------RLDRGLGSGIVDANA- 53 LSDILV...RTTS........RFNG-------.......----------RLDRGLGSGIVDANA- 54 IKNALF...TSA-........-----------.......------SNASAKNNNVGFGQISI--- 55 ------...----........-----------.......-------------------------- 56 ARSILL...NQVN........-----------.......-------------------------- 57 VRRLME...ETA-........---DGSVGENP.......N---------GFDRGTGYGRIQLGEL 58 LRSNLQ...ERA-........KSVDIKGG---.......-----YGAAIGDDYASGFGF------ 59 LRSNLQ...ERA-........KSVDIKGG---.......-----YGAAIGDDYASGFGF------ 60 VRGELQ...TRA-........SVNDILSGN--.......------SAGSGDDIASGFGF------ 61 VRGELQ...YRA-........YENDILSG---.......-----YYAGYGDDFASGFGF------ 62 LVQFAK...NSA-........-----MNTSHP.......VYDTEHTKEIISPRRQGSGEIN---- 63 LRDLLA...RSATrvdakhqpVMVSYTSSTGKvrdvkglEGWERNAAGMWFSPTYGFGLIDVNK- 64 ALQVLL...TTAT........QLNGAVTDAPT.......T-------------QVGWGVPDLG-- 65 ALQVLL...TTAT........QLDG-------.......------SITQAPNTVVGWGVPDLG-- 66 YISVLS...ATPI........NEEDGNYQTT-.......------ALNRKYSHKYGYGKTDAYKM 67 YLSILS...SEEI........NPHDGKWQDTA.......M-------GKRYSHTYGFGKLDAYNI 68 HLTVLT...SKR-........--NSLYDSNGI.......HHWKLNGAHLLFNHLFGYGVLDAAS- 69 HLTVLT...SKR-........--NSLYDSNGI.......HHWKLNGAHLLFNHLFGYGVLDAASM 70 HLTVLT...SKR-........--NSLYDSNGI.......HHWKLNGAHLLFNHLFGYGVLDAASM 71 HLTVLT...SKR-........--NSLYDSNGI.......HHWKLNGAHLLFNHLFGYGVLDAASM 72 LYHISY...QGIIesp11gkvAWIPITSGNNP.......L-----PAHYGWNYVTGPGTYNAYAM 370 | 1 SAYIRSNGFGH 2 SAYIRSNGFGH 3 ----------- 4 ----------- 5 ----------- 6 ----------- 7 L---------- 8 EQYVL------ 9 ----------- 10 ----------- 11 NTYAQAN---- 12 SAYIRSNG--- 13 SIH-------- 14 ----------- 15 ----------- 16 ----------- 17 ----------- 18 ----------- 19 ----------- 20 ----------- 21 ----------- 22 KAYL------- 23 ARYIVLD---- 24 ----------- 25 ----------- 26 ----------- 27 ----------- 28 ----------- 29 ----------- 30 ----------- 31 ----------- 32 ----------- 33 ----------- 34 ----------- 35 ----------- 36 ----------- 37 ----------- 38 ----------- 39 ----------- 40 ----------- 41 ----------- 42 ----------- 43 ----------- 44 ----------- 45 ----------- 46 ----------- 47 ----------- 48 ----------- 49 ----------- 50 ----------- 51 V---------- 52 ----------- 53 ----------- 54 ----------- 55 ----------- 56 ----------- 57 AQRLQSGPMP- 58 ----------- 59 ----------- 60 ----------- 61 ----------- 62 ----------- 63 ----------- 64 ----------- 65 ----------- 66 VHF-------- 67 VHMAK------ 68 ----------- 69 ----------- 70 ----------- 71 ----------- 72 -----------