Last active
June 20, 2018 14:25
-
-
Save ozagordi/b5ae59c27458d7288ca11d50f5b16c26 to your computer and use it in GitHub Desktop.
Make a table from a multiple sequence alignment
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| #!/usr/bin/env python | |
| """Create a CSV table with the counts of amino acids (and gaps) in each column of an aligned FASTA file, | |
| and add the most frequent symbol of each column as a final row of the table. | |
| """ | |
| import sys | |
| import pandas as pd | |
| from collections import Counter | |
| from Bio import AlignIO | |
# Symbols tallied for every alignment column: the 20 standard amino acids
# plus the gap character. Any other symbol (e.g. 'X') gets no row of its
# own, although it can still be reported as a column's consensus.
AMINO_ACIDS = 'ACDEFGHIKLMNPQRSTVWY-'


def count_columns(columns, alphabet=AMINO_ACIDS):
    """Tally the symbols of each alignment column.

    Args:
        columns: iterable of alignment columns, each an iterable of
            one-character symbols (e.g. what ``msa[:, j]`` yields).
        alphabet: symbols to report, in output-row order.

    Returns:
        A ``(counts, consensus)`` tuple. ``counts`` maps the 1-based column
        number (as a string) to a list of counts, one per symbol of
        ``alphabet``. ``consensus`` holds the most frequent symbol of each
        column, or ``''`` for a column that contains no symbol at all.
    """
    counts = {}
    consensus = []
    for position, column in enumerate(columns, start=1):
        tally = Counter(column)
        counts[str(position)] = [tally.get(symbol, 0) for symbol in alphabet]
        # most_common() considers every symbol seen, including those that
        # are not part of ``alphabet``; an empty column has no winner.
        consensus.append(tally.most_common(1)[0][0] if tally else '')
    return counts, consensus


def build_table(counts, alphabet=AMINO_ACIDS):
    """Arrange per-column counts as a DataFrame.

    Args:
        counts: mapping of column label to a list of counts, as returned by
            ``count_columns``.
        alphabet: symbols that label the rows; must be the alphabet the
            counts were computed with.

    Returns:
        A ``pandas.DataFrame`` whose first column ``'aa'`` lists the symbols
        and whose remaining columns follow the order of ``counts``.
    """
    data = {'aa': list(alphabet)}
    data.update(counts)
    # Spell out the column order instead of relying on dict ordering.
    return pd.DataFrame(data, columns=['aa'] + list(counts))


def write_table(table, consensus, path='table.csv'):
    """Write ``table`` as CSV to ``path`` and append the consensus row.

    Args:
        table: DataFrame produced by ``build_table``.
        consensus: most frequent symbol of each column, in column order.
        path: destination file; an existing file is overwritten.
    """
    table.to_csv(path, index=False)
    with open(path, 'a') as handle:
        # The consensus row is text while the table body is numeric, so it
        # is appended by hand. It is newline-terminated so that the file
        # does not end in the middle of a line.
        handle.write(','.join(['cons'] + list(consensus)) + '\n')


def main(argv=None):
    """Command-line entry point.

    Args:
        argv: argument list without the program name; defaults to
            ``sys.argv[1:]``. The first item is the aligned FASTA file, the
            optional second item is the output path (default ``table.csv``).
    """
    args = sys.argv[1:] if argv is None else list(argv)
    if not args:
        # Exit with a readable message instead of an IndexError traceback.
        sys.exit('usage: {} ALIGNMENT.fasta [OUTPUT.csv]'.format(sys.argv[0]))
    out_path = args[1] if len(args) > 1 else 'table.csv'

    msa = AlignIO.read(args[0], 'fasta')
    n = msa.get_alignment_length()  # columns, number of positions
    counts, consensus = count_columns(msa[:, j] for j in range(n))
    write_table(build_table(counts), consensus, out_path)


if __name__ == '__main__':
    main()
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| >B.FR.83.HXB2_LAI_IIIB_BRU.K03455 | |
| MRVKEKYQHLWRWGWRWGT-MLLGMLMICSA----TEKLWVTVYYGVPVWKEATTTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQS | |
| LKPCVKLTPLCVSLKCTD-----------LKNDTNTNSSSGRMIMEKGEIKNCSFNISTS | |
| IRGKVQKEYAFFYKLDIIPIDNDTTS----------------YKLTSCNTSVITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEE | |
| EVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRI-QRGPGRAFVTIGKI-GNM | |
| RQAHCNISRAKWNNTLKQIASKLREQFGNNK-TIIFKQSS-GGDPEIVTHSFNCGGEFFY | |
| CNSTQLFNSTW---FNSTWS-T-EGS-NNTEGSDT-------ITLPCRIKQIINMWQKVG | |
| KAMYAPPISGQIRCSSNITGLLLTRDGG----NSNNES-EIFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTKAKRRVVQREKRAV--G-IGAL-FLGFLGAAGSTMGAASMTLTVQAR | |
| QLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKL | |
| ICTTAVPWNASWS-NKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELL | |
| ELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHL | |
| PTPRGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRI | |
| VELLG-------RRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQ | |
| GACRAIRHIPRRIRQGLERILL- | |
| >A.NG.09.09NG010499.KX389622 | |
| MRVRGMQRSWQNL-GRWGI-LFLGILIICRA----TDNLWVTVYYGVPVWKDAETTLFCA | |
| SDAKAHHTEAHNVWATHACVPTDPDPQEINLENVTEKFNMWKNKMVDQMHEDIISIWDQS | |
| LKPCVKLTPLCVTLECSK----VTINNSTTHNTAPNNNN-----TIEKEMRNCTYNMTTE | |
| VIDKKKKVHSLFYRLDIVPITNETTN-------------GSQYRLINCNTSAITQACPKV | |
| NFEPIPIHYCAPAGFAILKCKDKNFNGTGTCRNVSTVQCTHGIKPVVSTQLLLNGSLAEE | |
| NIRISSENLTDNAKIIIVQLNESVPINCIRPSNNTRESIRI---GPGQAFYAAGEIIGDI | |
| RQAHCNVSRTEWNNTLQKVAGELKRLF--NTTTIVFQNSS-GGDLEITTHSFNCGGEFFY | |
| CNTSDLFNSNW---TNGNWT-N---GIGSTETNDT-------ITLPCRIKQIIRMWQRVG | |
| QAMYAPPIKGVIECKSNITGIILVRDGG----KNNTDK-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTRAKRRVVEREKRAV--G-IGAV-FLGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAIERYLKDQQLLGIWGCSGKL | |
| ICTTTVPWNSSWS-NKSYDDIWNNMTWMEWDREVSNYTNIIYSLIEESQNQQEKNEQDLL | |
| XLDKWASLWNWFDISHWLWYIRIFIMIVGGLIGLRIIFAVLSVVNRVRQGYSPLSLQTLI | |
| PSPRGPDRPEGIEEGGGEQDKDRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIAARI | |
| VETLGHR-------GRQILKYLWSLAQYWGQELKNSAISLLNTTAIAVAEWTDRVIEIAQ | |
| SIGRAFINIPRRIRQGLERALL- | |
| >A1.CM.97.97CM_MP812.AM279344 | |
| MRVTETQKIYSLV-WRWGT-MILGLIIICSA----TGNLWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPNPREINLENVTENFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVQLTPLCVTLDCVT---V----------------------NGSEEIRNCSYNMTTE | |
| VNDKKHKVHSLFYKLDVVPLNESNSN--SSNNNGS-----REYRLISCNTSTITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDKEFNGTGPCKNVSTVQCTHGIMPVVSTQLLLNGSLAEG | |
| KTMIRSKNFTNNAKIIIVQFNQSVEINCTRPYKNIRRRIHI---GPGRAFYATSGIEGGI | |
| RQAYCNVNATAWNKTLHMVAEQLKTQF--NK-TIIFDNSS-GGDIEITTHSFNCRGEFFY | |
| CNTSGLFNKTW----RANNA-S------QLGENGT-------ITLPCRIKQIVRMWQRVG | |
| QAMYAPPIPGVINCISXITGLLLTRDGG----ENNRTN-ETFRPEGGNIRDNWRSELYKY | |
| KVVKIEPLGVAPTEARRRVVEREKRAV--G-IGAV-LFGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLKAIEAQQQLLKLTVWGIKQLQARLLAVERYLKDQQLLGLWGCSGKL | |
| ICTTTVPWNSSWS-NKTQQEIWGNMTWLQWDKEISNYTGIIYDLLEQSQTQQEKNERDLL | |
| ALDKWTNLWNWFDISNWLWYIRIFIMIVGGLIGLRIIFAVLSIVNRVRQGYSPLSFQTPT | |
| PVLQGLDRPGXIEEEGGEKGRDRSIRLVSGFLALAWDDLRSLCLFSYHHLRDFILIAART | |
| LN-------KGLRRGWESLKYLGNLLLYWGRELKISAISLLDATAITVAGWTDRIIDIIQ | |
| RFCRAILHIPTRIRQGAERAWL- | |
| >A1.CM.99.99CM_MP1433.AM279348 | |
| MRVMGTQRNYPPL-WKLGI-MVLGMIIICCNA---ADNLWATVYYGVPVWKDAETTLFCA | |
| SDAKAYKTEMHNVWATHACVPTDPNPQEIKLDNVTEEFNMWKNNMVEQMHADIISLWDQS | |
| LKPCVQLTPLCVTLNCSDVKVNTTKNNGTNSSNVLVINGTE---NGQEELKNCSYNVTTE | |
| LRDKKQRVYSLFYRLDIVPINEDNKS----SDNSS-----GEYRLINCNTSAITQACPKV | |
| SFEPIPIHFCAPAGFAILKCRDKNYNGTGLCKNVSTVQCTHGIKPVVSTQLLLNGSLAEG | |
| EIKVRSENFTNNAKTIIVQLDQPVIINCTRPNNNTRRSVRI---GPGQAYYATGEIIGDI | |
| RKAYCTVNKTAWNETKHKVMEKLRGIY--HR-PIKFNSSS-GGDLEITTHMFNCGGEFFY | |
| CNTSGLFAQEL----------K-----NDTNDNNT-------IILLCKIKQIINMWQRVG | |
| QAMYAPPRAGVIRCVSNITGLLLTRDGG--KNDNGTNGTEIFRPGGGDMRDNWRSELYKY | |
| KVVRIEPVGVAPTRAKRRVVEREKRAV--G-LGAV-FLGFLGAAGSTMGAASLTLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLRLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKL | |
| ICTTNVPWNSSWS-NKSYEDIWDNMTWLQWDKEISNYTALIYDLIEESQNQQEKNEKDLL | |
| ELDKWASLWNWFSISQWLWYIKIFIMVVGGLIGLRIIFAVLSLVNRVRQGYSPLSFQTHP | |
| PAPVGLDRPGGIEEEGGERGRDRSIRLVSGFLALAWDDLRNLCLFCYHRLRDFILIAART | |
| VELLGRNSLKGLRLGWEGLKYLWNLLAYWGRELKISAINLLDTIAIAVGGWTDSLIELTQ | |
| RIGRAILHIPRRIRQGFERALL- | |
| >A1.CM.97.97CM_MP640.AM279366 | |
| MRLRGMQMNWQNL-WRWGT-MMLGMLIISRA----TDNLWVTVYYGAPVWKDAETTLFCA | |
| SDAEAYETEKHNVWVTHACVPTDPNPQEIRXXNVTETFNMWKNNMVEQMHEDIISLWDQS | |
| LKPCVQLTPLCVTLXCTD-----------AKNTTANSTIES---EMNGEIKNCSFNMTTE | |
| LRDKSKKVYSLFYRLDVVPIKESNES--TNSVSNTSESKNRPYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILRCNDEEFSGTGQCNDVSSVQCTHGIRPVVSTQLLLNGSLAKG | |
| KVKIRXESLTNNAKTIIVQFNETVRINCTRPNNNTRTSVHM---GPGKAFYATGDIIGDI | |
| RKAHCNVSRAKWKDTLQEVARQLSEHF--NKTEITFKNSS-GGDLEITTHSFNCGGEFFY | |
| CNTTDLFKGTW----NGTWV-NENXTWGNDSISDN-------MTIPCRIKQIINMWRRTG | |
| QAMYXPPIKGVIRCESXXXGLLSTGDGG-NKNNSQSQN-ETFRPEGGNMRDNWRSELYKY | |
| KVVQIEPLGVAPTKARRRVVQRAKRAV--G-MGAL-FIGFLGAAGSTMGAASIALTGQAR | |
| HLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKL | |
| ICTTNVPWNSSWS-NKSMDDIWENMTWLEWDKEISNYTDIIYSLIGESQIQQEKNEQDLL | |
| ALDKWSNLWNWFDITSWLWYIRIFIMIVGGLIGLRIVFAVLSVINRVRQGYSPLSFQTLY | |
| PSPGGPDRPGRIEEEGGEQGRDRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYLWNLLLYWGRELKISAISLLDTXAIAVAGWTDRVIEIGQ | |
| RICRAIINIPRRIRQGAERALL- | |
| >A.ZA.04.04ZASK162B1.DQ396400 | |
| MRVMETQRNYPRW-WIWGI-MILGMIIIGRS-----DNLWVTVYYGVPVWKDADTTLFCA | |
| SDAKAYSKEVHNVWATHACVPTDPNPQEMNLENVTEKFNMWKNGMVEQMHTDIISLWDQS | |
| LTPCVKLTPLCVTLNCTNS--NFTRNSNLTDDTDNNPNNTI---NMENEIKNCSFNVTTE | |
| IRDKRQKAYALFYKLDVVQIDNNSSE----------------YILINCNTSAITQACPKV | |
| TFDPIPIHYCAPAGFAILKCNDKQFNGSGICKNVSTVQCTHGIKPVVSTQLSLNGSLAEE | |
| DIMIRSENITDNTKNIIVQFNESVSINCTRPGNNTRKSIRI---GPGQTFFATGDIIGDI | |
| RQAHCNVSK-EWMKVLQQVVRKLRKEFE-NK-TIVFDNPS-GGDLEITMHSFNCKGEFFY | |
| CNTSGLFNRTW---NDTAWN-E--TTWNNINSNGS-------ITLQCRIKQILNMWQRVG | |
| QAMYAPPIPGEIRCESNITGLILTRDGG---LELNNTNNETFRPGGGDMRDNWRSELYKY | |
| KVIKIEPLGVAPTRAKRRVVEREKRAV--G-LGAV-FLGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKI | |
| ICTTTVPWNSSWS-NKSYDDIWDNMTWMQWEKEIGNYTELIYSLLEESQVQQEKNEQELL | |
| ALDKWASLWNWFDISRWLWYIKIFIMIVGGLIGLRIIFAVLSMLNRVRQGYSPLSFQTHI | |
| PNPEGLDRPGRIEEEGGEQGRDRSIRLVSGFLALAWDDLRNLCLFSYHRLRDFILIVART | |
| VEL-------GLRLGWKGIQYLWNLLLYWSQELRNSAISLLDTIAITVAGWTGRVIEIGQ | |
| RIVRAILHIPRRIRQGLERALQ- | |
| >A1.ES.05.X1608_8.FJ670519 | |
| MRVKGIQMNSQRL-LRWGT-MILGMIIICSA----AENLWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYDTEKHNVWATHACVPTDPNPQEIRLDNVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVELTPLCVTLNCTE----------AYNDTDVNRTIAQ---GMEKEIQNCSFNMTTE | |
| LTDRQQKVHSLFYSLDLAQMGNSSYKGQIQTSNNNLSVTYHTYRLIHCNTSTIRQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDTEFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAIG | |
| KVRIRSENITNNAKNIIVQFNSTVYINCTRPNNNTKRGLRI---GPGRTLYAADKIIGNI | |
| RQAHCNVSRTQWNKTMQEVGEQLETYF--NK-TIVFNSSS-GGDLEITTHSFNCGGEFFY | |
| CNTTGLFDGTW----NGTKS-N-ITW---ESINDT-------ITLPCKIKQVVRMWQRVG | |
| QAVYAPPITGAISCNSTITGLILTRDGG---DNSSGRESETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTRAKRRVVEREKRAV--GMIGAV-FLGFLGAAGSTMGAAALTLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLRLTVWGVKQLQARVLALERYLRDQQLLGIWGCSGKI | |
| VCTTNVPWNSSWS-NKTHXQIWENMTWLQWDREISNYTEIIYNLLEXSQNQQEXNEKDLL | |
| ALDKWANLWNWFDISKWLWYIKIFIMIVGGLIGLRIVFTVFSIINRVRQGYSPLSFQTLI | |
| PSAGDPDRPRGIEEGGGEQDRGRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIATRT | |
| VELLGHNSLKGLRLGWEGLKYLWNLLVYWGRELKLSAVNLYDTIAIAVAGWTDRVIEIGQ | |
| RLCRAILNIPRRIRQGLERALL- | |
| >A1.CY.05.CY064.FJ388909 | |
| MRVMGTQRTCPCL-WRWGM-IILGMIIICSV----TGNLWVTVYYGVPVWKDADTTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPNPQEINLENVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVQLTPLCVTLNCRD---DDDINVANSTDTTNEVKNGS---ANITDEKNCSFTMTTD | |
| LIDKLIEVFSVFYRLDVVHIDKNSNN--------------SGYRLIN-NTTTVTQAGPKV | |
| SFDPIPIHYWAPAGFAILKCIEKDFNGTGTCKNVSSIHCTHGIKPVVSTQLLLNGSLAEG | |
| EVKIRSENLTNNAKTIIVQFVEPVHITCIRPYNNTRKGIHI---GPGQAFYAMSNIIGDI | |
| RQAHCNVSKTKWNATLSQVAKQLGNKFN-NR-TIIFNSSS-GGDIELTRHSFNCGGEFFY | |
| CNTSGLFNSTW---NNDTWNGNDTQESNETSSNGT-------IIPPCKIKQIVNMWQRVQ | |
| QAMYPPLVEGVIRCESIITGLLSTRDGG----INSRTN-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTTAKRRVVEREKRAA--G-LGVM-FLGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLKAIEAQQHLLRLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICTTTVPWNSSWS-NRSQEEIWNNMTWLQWEKEIGNYTGIIYRLLEESQNQQEKNEQDLL | |
| ALDKWASLWNWFSISNWLWYIKIFIMIVGGLIGLRIVFTVLSIINRVRQGYSPLSFQTHP | |
| PVQGDLDRPGRIEEEGGEQGRDRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYLGNLLIYWGKEIKNSAVNLVDTIAIAVAGWTDRVIEIGQ | |
| RVGRAILNIPRRIRQGLERALL- | |
| >A1.CY.06.CY154.FJ388943 | |
| MRVMGIQRNCQRL-WRWGT-MLFWVIIICNA----TEKLWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPNPQEINLGNVTEDFNMWKNPMVEQMQTDIISLWEQS | |
| LKPCVQLTPLCVTLDCSY---NITINKTDISNITYDLKRTDIG-NITDDLRNCSYNITTE | |
| LRDRRQNKYSLFYKLDVVQINNNDSR---------------HYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGYAILKCNDKEFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEK | |
| KIMIRTENITNNAKIIIVQLVKPVQIKCTRPGNNTRQSVRI---GPGQSFYATGDIIGDI | |
| RKAHCTVNATEWNNTLNNVTKQLQEIW--NK-TIAFDNPS-GGDLEITTHSFNCGGEFFY | |
| CNTSKLFKKDN----ETNKN-N-ETNNANITIQTT-------KIIPCRIKQIINMWQRVG | |
| QAMYAPPIKGVINCVSNITGLLLTRDGGNTGNSTTNKT-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGIAPTKAKRRVVEREKRAI--G-MGAAFFIGFLGTAGSTMGAASMTLTAQAR | |
| QLLSGIVQQQNNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNSSWS-NKSQSEIWENMTWLQWDKEISNYTYLIYTLIEESQHQQEKNEQELL | |
| ALDKWANLWNWFDISNWLWYIKIFIMIVGGLIGLRIVFAVLSVINRVRQGYSPLSFQTLT | |
| PNPRELDRPGRIEEEGGEQDRDRSIRLVSGFLALAWEDLRNLCLFSYHRLRDFILIAART | |
| VELLGRNSLKGLSLGWEGLKYLWNLLSYWGRELKTSAISLLDTIAVAVAEWTDRVIELGQ | |
| RAGRALLHIPRRIRQGLERALL- | |
| >A1.CD.02.LA01AlPr.KU168256 | |
| MRVMGTQKSYQNL-WRWGI-VIFGLVIICNA-----GQLWVTVYYGVPAWKDAVTTLFCA | |
| SDAKAYDKEVHNVWATHACVPTDPNPQEIKLVNVTEEFNMWKNPMVEQMHTDIIGLWDQS | |
| LKPCVQLTPLCVTLDCHD---NITSDNITNNGNTTNSPNITN--EMGGEIKNCSFNMTTE | |
| LRDKRKKVHSLFYRLDIVEIGNSSSS------NNH-----GQYRLINCNTSAITQACPKV | |
| TFEPIPIHYCAPAGFAILKCTEKRFNGTGPCRNVSTVQCTHGIKPVVSTQLLLNGSLAEE | |
| NVTIRSENITDNAKTLIVQLVKPVNITCIRPNNNTRKGIGI---GPGQTFYAADAIIGNI | |
| RHAYCVVNKTEWNKTLQQVVHKLREHW--NK-TIIFAPSS-GGDIEITTHSFNCGGEFFY | |
| CNTSGLFNSTW----HVNNT-S-----SLVNSTGN-------ITLPCRIKQIINMWQRVG | |
| QAMYAPPIPGIIKCESNITGLLLIRDGG---INNNSMN-ETFRPGGGDMRDNWRSELYKY | |
| KVVQIEPLGVAPTKAKRRVVEREKRAV--G-FGAV-FLGFLGAAGSTMGAASITLTAQAR | |
| QLLFGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKL | |
| ICTTAVPWNSSWS-NKSQEQIWENMTWQQWEKEISNYTSIIYDLLEDSQNQQEKNEQELL | |
| ALDKWTNLWNWFDISKWLWYIKIFIMIVGGLIGLRIVFAVLAILNRVRQGYSPLSFQTHI | |
| PNPEGLDRPRGIEEEGGEQGKIRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFVLIAART | |
| VELLGHSSLKGLRLGWEGLKYLGNLLLYWGRELKISAINLLDTIAVAVAGWTDRVIEIGQ | |
| RACRALLNIPRRIRQGFERALL- | |
| >A1.CH.03.HIV_CH_BID_V3538_2003.JQ403028 | |
| MRVMGMQRNYPHW-WKWGI-VLFWLLIICNA----TEKLWVTVYYGVPVWKDAVTTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPNPHEIPLANVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLAPLCVTLECND-------------ANRTNINIT----EEEFKVKNCSFNMTTI | |
| LRDKKQKMHALFYRTDVVQIGSNSSE--------R-----YKYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDKEFNGTGPCMNVSTVQCTHGIKPVASTQLLLNGSLAEG | |
| KIMIRSENLTDNAKIIIVQLNESVSINCTRPNNNTRKSWHI---GPGQAFYAMDDILGDI | |
| RKAQCNVNRTAWENTLQKIATQLRIMY--NK-TIEFKNSS-GGDLEITTHSFNCGGEFFY | |
| CNTTELFNSTW------NDT-S-NTS-QGTNNNST-------ITLPCRIKQFVNMWQRVG | |
| QAMYAPPIKGKIQCISNITGLLLTRDGG---KGKSNIT-EIFRPEGGNMKDNWRSELYKY | |
| KVVKIEPLGVAPTKAKRRVVEREKRAV--G-LGAV-FLGFLGAAGSTMGAASITLTAQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKL | |
| ICTTNVPWNSSWS-NKSQEDIWGNMTWLQWEKEISNYTSIIYELLEESQNQQEKNEQDLL | |
| ALDKWASLWNWFNISNWLWYIKIFIMIVGGLIGLRIVFTVLSIINRVRQGYSPLSFQTHT | |
| PNPEGLDRPGRIEEEGGEQGRGRSIRLVSGFLALAWDDLRSLLLFSYHRLRDFALIAART | |
| VELLGHNSLKGLRLGWEGLKYLGNLLLYWGRELRVSAITLLDATAITVAGWTDRVIEIGQ | |
| RFCRAILHIPRRIRQGLERALI- | |
| >A1.CY.08.CY230.JF683779 | |
| MRAREMQMNSHCW-LKWGTMMILGMIIICSA----ENNLWVTVYYGVPVWKEADTTLFCA | |
| SDAKAYKTEVHNVWATHACVPTDPNPQEINMANVTEKFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLNCNN-----------VNNTSNTNNTTNVTAEMREEIKNCSFNATTI | |
| LRDKTQRIHSLFYRLDIVPINSNNSN--------N-----SENRLKNCNTSSITRDCSNV | |
| SFDRLPVPYGAPAGFASLQCDVKDLNGTGIGNNVTRIHCTDGIRPVVSTQLLLNGSLAEN | |
| RTMIRSENITNNAKNIIVQFNTTVNITCIRPNNNTRTSVRI---GPGQAFYATGDIIGDI | |
| RQAHCNVSGEQWNKALQKVVKELRIHF--NK-TIIFTKSS-GGDPEITTHSFNCGGEFFY | |
| CNTSGLFNSTW----YTNNS-M------QPNYTKT-------ITLPCRIKQVINMWQRVG | |
| QAMYAPPIPGIIQCVSNITGLILTRDGG----HNNSAN-ETFRPGGGDMRDNWRSELYKY | |
| KVVKVEPLGVAPTRARRRVVEREKRAV--G-IGAV-FLGFLGAAGSTMGAASVTLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLKLTVWGIKQLQARVLALERYLQDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKNLTQIWDNMTWQQWDKEIDNYTQVIYNLLEESQNQQEMNEKDLL | |
| ELDKWANLWNWFSITNWLWYIRLFIMIVGGLIGLRIVFAVLSVINRVRQGYSPLSFQTHT | |
| PSPRELDRPREIEEEGGEQGRDRSIRFVSGFLAIAWDDLRSLCLFSYHRLRDFISIATRT | |
| VELLGHSSLKGLRLGWEGLKYLGNLLIYWIQELKSSAISLVDTIAVVVAGWTDRVIEIGQ | |
| RIGRAIFNIPRRIRQGLERALL- | |
| >A1.CY.08.CY218.JF683767 | |
| MRARGIQRNYQHL-LTWGT-IILGLIIICSA----AQNLWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYETEKHNVWATHACVPTDPNPQEIPLENVTENFNMWKNNMVEQMHTDIISLWDQS | |
| LQPCVKLTPLCVTLNCTNVR-NVTGNSTGSSFTGGPEELKT---GGPEELKNCSFNMTTV | |
| LRDKKQKVYSLFYRLDIVQIDKDNNS---SGNNSY-----NEYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCRNNSFDGTGPCNNVSTDQCTHGIKPVVSTQLLLNGSLAEE | |
| KIMIRSENITNNAKTIIVQLVKPVTINCTRPNNNTRKIVRIGPGGPGQAFY-TNDIIGDI | |
| RRAYCTVNASEWNETLEQVVEQLRVHFG-NK-TINFTKPS-GGDLEITTHSFNCGGEFFY | |
| CNTSGLFNSSW----NINGS-R---S-NSTRSNGN-------ITLPCRIKQIINMWQRTG | |
| QAMYAPPIQGVIRCVSNITGLLLTRDGG---GNNTNET-EIFRPGGGDMRGNWRSELYKY | |
| KVVKIDPPGVAPNTARRRVVGREKRAA--GIIGAV-FLGFLGAAGSTMGAASVTLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICPTNVPWNSSWS-NKSMEDIWDNMTWLQWEKEISNYTDIIYNLIEESQNQQEKNEQDLL | |
| ALDKWANLWNWFEISKWLWYIKIFIMIVGGLIGLRIVFAVLSIINRVRQGYSPLSFQTLT | |
| PNPRELDRLGRIEEEGGEQDRGRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFTLIAART | |
| VEILGHSSLKVLRLGWEGLKYLWNLLVYWGQELKTSATNLFDTIAIAIAGWTDRIIEIGQ | |
| RIVRAFLNIPRRIRQGFERALL- | |
| >A1.BE.94.VI1383_20.FM165645 | |
| MRVMGIQMNCQNL-WRWGT-MILGMIIICSA----TTNLWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYDTEVHNTWATHACVPTDPNPQEIQLENVTEKFNMWKNNMVEQMHEDIISLWDQS | |
| LKPCVKLTPLCVTLECHN-----------YKGNGTNNTYINGTDAMQGEIKNCSYNMTTE | |
| LRDKKQKVYSLFYRLDIVPISEKNSN--SNSNNSS-----SKYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDIDFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEK | |
| EVRIRSENITNNAKTIIVQLDQPVNITCMRPNNNTRKSVHI---GPGQAFYATGDIIGNI | |
| REAHCNVSREDWNNTLQKVATQLRKHFG-NK-TIIFAKSS-GGDLEITTHSFNCEGEFFY | |
| CNTSGLFNSSW---ENDTGS-T-QES-NRTKSNDT-------ITLPCRIKQIINMWQRAG | |
| QAIYAPPIPGVIQCQSNITGLLLTRDGG----NNNTTN-ETFRPGGGNMRDNWRSELYKY | |
| KVVKIEPLGVAPTTARRRVVEREKRAV--G-LGAL-FIGFLGAAGSTMGAASVTLTVQAR | |
| QLLSGIVQQQNNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLHDQQLLGIWGCSGKL | |
| ICTTNVPWNDSRS-NKSLNDIWNNMTWMQWDEEISNYTQIIYNLLEKSQNQQEKNEQELL | |
| ALDKWASLWNWFNISNWLWYIRIFIIIVGGLIGLRIVFAVLSIINRVRQGYSPLSFQTHT | |
| PNPRDLDRPGRTEEEGGEQGRDRSIRLVNGFLALAWEDLRSLCLWSYHLLRDFILVAART | |
| VELLGRSSLKGLRLGWEGLKYLGNILLYWARELKISATSLLDTIAIVVAGWTDRAIEITQ | |
| NICRGILHIPRRIRQGFERALL- | |
| >A1.BE.97.PIC771_15.FM165628 | |
| MRVMGTQMNCQNL-WRWGT-MILGMIIICSA----TTNLWVTVYYGVPVWRDAETTLFCA | |
| SDAKAYDTEVHNIWATHACVPTDPDPQEIILKNVTEEFNMWKNNMVEQMHADIISLWDQS | |
| LKPCVQLTPPCVTLECND-----------YNSTKSNNTAPT---ETPEEVKNCTFNTTTE | |
| LRGKKKKEYSLFYRLDIVQINEDNSS------------DSRKYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDIEFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEQ | |
| DIRIRSENISQNHKTIIVQFNQPVAINCTRLRNNTRRSIHI---GPGQAFYATGAIIGDI | |
| RSAHCNTSSKAWNKTLHRVATQLRKHF--NG-TIIFTNAS-GGDLEITTHSFNCGGEFFY | |
| CNTSRLFNSSW----EPLGQ-Y-----DDSQSNDT------NITLPCRIKQIIRMWQRTG | |
| QAIYAPPIQGEITCRSNITGLLLTRDGG---NKTNETS-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTKAKRRVVEREKRAV--G-LGAV-LIGFLGTAGSTMGAASVTLTVQAR | |
| QLLSGIVQQQNNLLRAIEAQQHLLKLTVWGIKQLQARVLAMERYLHDQQLLGIWGCSGRL | |
| ICTTNVPWNASWS-NRSQNEIWNNMTWLQWDKEVGNYTDIIYDLLEKSQNQQEKNEQDLL | |
| ALDKWASLWNWFNISKWLWYIKIFIMIVGGLIGLRIVFAMLSIINRVRQGYSPLSFQIHT | |
| PNPRDLDRPGRIEEEGGEQGRDRSIRLVQGFLALAWDDLRNLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYLGNVLLYWGRELKFSATSLLDTIAIVVAGRTDRVIEITQ | |
| SLCRAILNIPRRIRQGLERALL- | |
| >A1.BE.x.VI2809.EU191615 | |
| MRVMGTQMDCQNL-WRWGT-MILGMIIICSA----TTNLWVTVYYGVPVWRDAETTLFCA | |
| SDAKAYATEVHNVWATHACVPTDPDPQEVIMENVTEEFNMWKNNMVEQMHADIISLWDQS | |
| LKPCVQLTPLCVTLECAN---YTGTAYNCTACKNGTSTMVPPIVETPGEIQNCSFNITTE | |
| LRDKKKKVHSLFYRVDIVQIDNSSSN------SNT-----SKYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDIEFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEK | |
| EIRIRFENITDNAKAIIVQFNQSVEINCTRPNNNTRTSVHI---GPGQAFYATGDIIGDI | |
| RNAHCNVSRKNWTEALYRVATQLRKHF--NR-TINFTSAS-GGDLELTTHTFNCGGEFFY | |
| CNTSTLFNSSWPLNQSNSWS--------NGGNDTN-------ITLPCRIKQIIRMWQRTG | |
| QAIYAPPIEGVIMCRSNITGLLLTRDGGNEANKTNETA-EIFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTRAKRRVVEREKRAV--G-LGAV-LIGFLGTAGSTMGAASVTLTVQAR | |
| QLLSGIVQQQNNLLRAIEAQQHLLKLTVWGIKQLQARVLAMERYLHDQQLLGIWGCSGRL | |
| ICTTNVPWNTSWS-NKSQDEIWNNMTWLQWDKEVGNYTDIIYDLLEKSQNQQEKNEQELL | |
| ALDKWASLWNWFNISNWLWYIKIFIMIVGGLIGLRIVFAVLAIINRVRQGYSPLSFQIHT | |
| PNPRDLDRPGRIEEEGGEQGRDRSIRLVQGFLALAWDDLRNLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYLGNVLLYWGRELKISATSLLDTIAIAVAGWTDRVIEITQ | |
| NLCRAILNIPRRIRQGLERALL- | |
| >A1.CM.07.46_10.KP718918 | |
| MRVMGTQMNYQNW-WRWGT-IILGMIIICSV----AENLWVTVYYGVPVWRDAETTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPNPQELPLKNVTEDFNMWKNSMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLNCSN---------------INKNVTNG---TDIDMMKNCSFNMTTE | |
| IRDKKQKVYSLFYKLDIVPISEGNST------SNN-----SQYILINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCRDPKFNGKGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEQ | |
| EAMIRSENITDNTKTIIVQLNQSVIINCTRPNNNTRKSVRI---GPGQSFYATGDIIGDI | |
| RQAHCNVSKGDWNKALQEVVTQLGEHFG-NK-TIKFNSSA-GGDLEITTHSFNCGGEFFY | |
| CNTSGLFNSTW----FSNGS-RGNESMEDDTNITH-------ITLPCRIRQIVNMWQRAG | |
| QAMYAPPIQGVIKCTSNITGILLTRDGG---YNISNNDTEIFRPGGGNMKDNWRSELYKY | |
| KVVKVEPLGIAPTRAKRRVVEREKRAV--G-IGAV-FIGFLGAAGSTMGAASITLTAQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAMEGYLRDQQLLGIWGCSGKL | |
| ICTTTVPWNSSWS-NKSYTEIWNNMTWLQWDKEVSNYTQEIYKLIEESQNQQEKNEQDLL | |
| ALDKWANLWNWFDISNWLWYIKIFIMIVGGLIGLRIVFAVLAIINRVRQGYSPLSLQTLY | |
| PNPRGRDRPGEIKEEGGEQDRDRSIRLVSGFLALAWDDLRSLCLFSYHQLRDFILI---- | |
| ---LGHSSLKGLRQGREGLKYLGNLLLYWGRELKISAVNLLDTIAIAVAGWTDRIIEVGQ | |
| RIGRAIIHIPVRIRQGLERALL- | |
| >A1.CM.03.CM54_7.KU168305 | |
| MRVMGTQTSYQNL-WRWGT-IILGMIIICSV----AEERWVTVYYGVPVWRDAETTLFCA | |
| SDAKAYDTEMHNVWATHACVPTDPNPQEILLGNVTEDFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLHCRN---------------IPNVTS----------MTNCSYNTTTE | |
| LRDKRQKVYSLFYKLDXVPINENNSQ----------------YXLINCNTSAXTQACPKV | |
| TFEPIPIHYCAPAGFAILKCKDPEFNGTGPCKNVSSVQCTHGIKPVVSTQLLLNGSLAED | |
| KVMIRSENITDNAKTIIVQFNQSVEINCTRPNNNTRKSIRI---GPGQSFYAT-DIIGDI | |
| RQASCTVKRADWEKTLQEVVKQLGEHFK-NRTTIKFNSSS-GGDLEVTTHSFNCGGEFFY | |
| CNTSGLFNSTWKTNGTSTWK-ETNGTGSQENSNDN-------ITLPCRIKQIINMWQRAG | |
| QAMYAPPIAGVIKCNSNITGLLLTRDGG---SNNNSQE-ETFRPGGGNMKDNWRSELYRY | |
| KVVQIEPLGIAPTRARRRVVGREKRAV--G-LGAV-FIGFLGAAGSTMGAASITLTAQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNSSWS-NKTQNEIWNNMTWLQWDKEINNYTQEIYRLIEESQNQQEKNEQDLL | |
| ALDKWSNLWNWFDISKWLWYIRIFIMIVGGLIGLRIVFAVLSIINRVRQGYSPLSFQTLT | |
| PNPRGLDRPGRIEEEGGEQDRDRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGREGLKYLWNLLLYWGRELRTSAVNLLDTIAIAVAGWTDWVIEIGQ | |
| RICRAVINIPTRIRQGFERALL- | |
| >A1.CM.08.886_24.KP718928 | |
| MRVMGTQMNWQGL-WRWGT-IILGMIMICSV----AGNLWVTVYYGVPVWRDAETTLFCA | |
| SDAKAYDTEMHNVWATHACVPTDPDPQEINLENVTEDFNMWKNSMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLNCSS---------------IITNSTVN---ETRQGMRNCSFNTTTA | |
| LRDKRQRVYSLFYKLDIVPINGDNST--------------NTYMLINCNTSAITQACPKV | |
| TFEPIPIHYCTPAGFAILKCKDPTFNGTGPCRNVSSVQCTHGIKPVVSTQLLLNGSLAEQ | |
| KVMIRSENITDNTKTIIVQLNQSVVINCSRPNNNTRRSIRI---GPGQSFYATGEIIGDI | |
| REARCNVNGTEWNKALQKVVIQLREHFG-NK-TIKFNSSS-GGDLEITTHSFNCAGEFFY | |
| CNTSGLFNSTW----HSNGT-A------NGTENAT-------ITLPCRIKQIINLWQRVG | |
| QAMYAPPIPGIINCTSNITGLLLTRDGG----NASEET-ETFRPGGGNMKDNWRSELYKY | |
| KVVKIEPLGVAPTRAKRRVVEREKRAV--G-IGAV-FIGFLGAAGSTMGAASITLTAQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNSSWS-NKSQDDIWKNMTWLQWDREISNYTQEIYKLIEESQNQQEKNEQDLL | |
| ALDKWATLWSWFDISNWLWYIRIFVIIVGGLIGLRIVFAVLSIIKRVRQGYSPLSFQILT | |
| PNPRGVDRPGGIEGEGGEPDRDRSIRLANGFLALAWDDLRSLCLFSYHRLRDFILIVART | |
| VELLGHSSLKGLRLGWEGLKHLWNLLLYWGRELKNSAVNLLDTIAIAVAGWTDWVIELGQ | |
| RICRAIRNIPRRIRQGLERALL- | |
| >A1.CM.97.97CM_MP582.AM279343 | |
| MXAMGIQMNYQNL-WKWGT-MILGMLIICST----AEKLWVTVYYGVPVWKDADTTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPDPREMPLKNVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLDCHDSIFNTTSNSTTNSTNSPRNDTAERI-EMQREIQNCSYNMTTE | |
| LRDKKKKMYSLFYRLDLVQINDDSSN---NSTYSN-----STYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNNIEFNGTGPCTNVSTVQCTHGIRPVISTQLLLNGSLAEG | |
| EVRIRSENITNNAKTIIVQLDEGVHINCTRPNNNTRKSVHI---APGQAFYATGAIIGDI | |
| RRAYCQINGTRWNETLHKIVKQLRKHFN-NR-TIIFNSSS-GGDLEITTHSFNCGGEFFY | |
| CNTSGLFNSTW---FNSTWN-D-TISNNNTGSNDT-------IYLPCRIKQIINMWQRTG | |
| QAMYAPPIRGIIQCNSTITGLLLTRDGG---INNNSTN-ETFRPGGGNMRDNWRSELYKY | |
| KVVKIEPLGVAPTKARRRVVEREKRAV--G-LGAV-FIGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQNNLLRAIEAQQHLLKLTVWGIKQLQARLLAVERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNSSWS-NKSQSEIWDNMTWLQWDKEISNYTDIIYNLIEESQIQQEKNEQDLL | |
| ALDKWANLWNWFDITNWLWYIKIFIMIVGGLIGLRIVFAVLAIINRVRQGYSPLSFQILN | |
| PNPGGLDRPGRIEEEGGEQGRGRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIAART | |
| VELLGHSCLKGLRLGWESLKYLWNLLLYWGRELKISAINLLDTIAVAVAGWTDRVIEIGQ | |
| RICRAIRNIPRRIRQGAERALV- | |
| >A1.CY.09.CY243.JF683789 | |
| MKVKGIQMNLHCL-LTWG--MILGMITFCSA----ARKLWVTVYYGVPVWKDAKTTLFCA | |
| SDAKAYSTEKHNVWATHACVPTDPNPQEMHLENVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLNCSY---NITSKVNKTFIDDINSTI-----DMKTEIKNCSFNTTTK | |
| IKNKVQKVHSLFYKLDIVPMGSDNSS----------------YRLINCNTSTITQACPKI | |
| TFEPIPIHYCAPAGFAILKCNDNNFNGTGPCTSVSAVQCPRGIKPVVSTQLLINGSLAEN | |
| ETMIRSENITNNAKNIIIQLKEPVRINCTRPNNNTRKSVRI---GPGQAFYATDEIIGDI | |
| RQARCEVNETEWNRTLHEVVKQLRTYFV-NK-TIAFNKSS-GGDLEITTHSFNCGGEFFY | |
| CNTSKLFNSIW----HPNDT-M-QEE-TNTNPNAN-------ITLPCRIKQIINLWQRVG | |
| KAIYAPPIRGRIECVSNITGLIITRDGG----NNTNNT-EIFRPAGGDMRDNWRSELYKY | |
| KVVQIEPLGIAPTEARRRVVQREKRAI--G-LGAM-FIGFLGAAGSTMGAASVTLTVQAR | |
| QLLSGIVQQQSNLLMAIEAQQHLLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNKTWS-NRTKEEIWNNMTWMQWEKEIDNYTGLIYNLIEKSQNQQEINEKELL | |
| ELDKWDSLWSWFSITNWLWYIKIFIMIVGGLIGLRIVFAVLSIIRRVRQGYSPLPFQIHT | |
| PNPGGLDRPGRIEEEGGEQDRDRSIRLANRFLALAWDDLRNLCLVSYHRLRDFILIVART | |
| VELVGQSSLKGLRLGWEGLKYLGNLLVYWIRDLKISAINLLDTIAIAVAGWTDTVIEIGQ | |
| RIGRAILNIPRRIRQGLERALL- | |
| >A1.AU.04.PS1044_Day177.DQ676873 | |
| MRAKGIQMNLHCL-LKWGT-MILGMILICSA----AEQRWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPNPQEINLKNVTEEFNMWKNNMVEQMQEDIISLWDQS | |
| LKPCVKLTPLCVTLNCSH---EVIFNSTLNNSTXSNXTLNNNTIEMKEEVRNCSYNVTTV | |
| LRDKKQKIYSLFYRLDVVPIGNNSDS---------------EYILINCNTSTITQACPKV | |
| SFEPIPIHYCTPAGYAILKCNDKDFNGTGPCKNVSTVQCTHGIKPVVTTQLLLNGSLAEN | |
| RTMIRSKNITDNKENIIVQLTEPVNITCIRPNNNTRKSVRI---GPGQTFYATGEIIGDI | |
| RKAHCVVNKTEWNKNLKKVVVQLRTYFK-NK-TISFTNHS-GGDPEVTTHSFNCGGEFFY | |
| CNTSELFNRTW----NATDQ-L-NSTEDSTALNET-------IILPCRIKQVINMWQTPG | |
| QAMYAPPIRGAIRCESNITGLILTRDGG---NDNTSTN-ETFRPGGGDMRDNWRSELYKY | |
| KVVRIEPLGIAPTTAKRRVVQREKRAV--G-IGAV-FIGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLKLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNNTWS-NKNKSEIWDKMTWLQWDKEISNYTQIIYNLIEESQTQQEINEQELL | |
| ALDKWANLWNWFDISQWLWYIKIFIMIVGGLIGLRIVFAVLSIISRVRQGYSPLSFQTHT | |
| PNPEGLDRPGRTEEEGGEQGRDRSIRLVSGFLALXWDDLRSLCLFSYHRLRDLLSIVTRT | |
| VELLGHSSLKGLRLGWEGLKYLWNLLVYWSQELKISAVNLYDTIAIAVAGWTDRVIEIGQ | |
| GICRAILNIPRRIRQGLERALL- | |
| >A.CM.98.98CM_MP1014.AM279354 | |
| MRVRGIQRNYAPL-WRWGM-IFLGMIIICKA----TENLWVTVXYGVPVWRDAETTLFCA | |
| SDAKAYDXEVHNVWATHACVPTDPNPQEIELKNVTEKFNMWKNSMVEQMHADIISLWDQS | |
| LXPCVKLTPLCVTLRCHD-------FNSSNSNTSSASNISSGMQDMQGEIKNCSFNMTTE | |
| LRDKQQKVSALFYRLDVVEINNNKSE----------------YRLINCNTSAITQACPKV | |
| TFEPIPIHYCAPAGYAILKCNDXNFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEG | |
| NVXIRSENLTNNAKTIIVQLADPVNITCIRPNNNTRKSVHI---GPGQAFYATGDIIGDI | |
| RQAHCNVXRXXWNNTLHKVAEQLRQYFX-NK-TIAFNKSS-GGDLEITTHSFNCGGEFXY | |
| CNTSGLFNSTW----NGTGS-A-----NNTGLNGX-------ITLPCRIRQIVKMWQXVG | |
| QAMYAPPIQGIIRCESNITGLLLTRDGG----NNNNTV-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTRAKRRVVEREKRAVV-G-LGAV-FLGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQQLLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNSSWS-NKSQNEIWXNMTWLQWDKEIDNYTXIIYRLLEESQNQQEKNEQDLL | |
| ALDKWANLWTWFDISNWLWYIKIFIMVVGGLIGLRIVFAVLSIINRVRQGYSPLSFQTHT | |
| PNPEGPDRPERIEEEGGRQDRDRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIVARI | |
| VELLGHNSLKGLRLGREGLKYLWNLLLYWGRELKSSAINLLNTIAIAVANWTDRVIEIGQ | |
| RAGRAILNIPRRIRQGLERALI- | |
| >A1.ES.06.X2110.FJ670523 | |
| MRAKGIQRNSQDL-LTWGT-MILGLIILCSA----ADNLWVTVYYGVPVWKDADTTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPNPQEIPLVNVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLNCGH---NDT-------LTNXTAPVNN---TMREEVRNCSYNMTTE | |
| LRDKQKKVFSLFYKLDVVSINNSSSQ----------------YRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCRDNKFNGTGPCRNVSTVQCTHGIRPVASTQLLLNGSLAEE | |
| EVMIRSENISNNAKNIIVQLKEPVNITCARPGNNTRTSVRI---GPGQAFYATGDIIGDI | |
| RQAHCNVSRAAWNKTLQEVVKQLRKYFV-NE-TITFTNSS-GGDPEIVTHSFNCGGEFFY | |
| CNTSGLFNSTW---PNSTWN-A-NTSIQESNSTDN-------ITLQCRIKQIINLWQRAG | |
| KAIYAPPIQGAIQCISNITGLILTRDGG----NNGTNNTEIFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPSRAKRRVVGREKRAV--T-IGAV-FLGFLGAAGSTMGAASLTLTVQAR | |
| QLLSGIVQQQSNLLQAIEAQQHLLKLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKI | |
| ICPTAVPWNYTWSNNKSYDEIWKNMTWLQWDKEVSSYTDQIYNLIEKSQNQQEINEQDLL | |
| ALDKWADLWNWFDISKWLWYIRIFIMIVGGLIGLRIVFAVLSIIKRVRQGYSPLSFQTLT | |
| PNPRELDRPRRIEEEGGEQGRGRSIRLVSGFLALAWDDLRSLCLFSYHQLRDFVLIVTRA | |
| VELLGHSSLKGLRLGWEGLKYLGNLLIYWIRELKISAISLLDTTAIVIAGWTDRIIEIGQ | |
| GIGRAILNVPRRIRQGLERSLL- | |
| >A1.CY.06.CY164.FJ388946 | |
| MKAKGIQRNSHGL-LRWGM-MILGMFMICSA----TENLWVTVYYGVPVWREADTTLFCA | |
| SDAKAYEPEVHNVWATHACVPTDPNPQEINMKNVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLECRDV--NVNSTNTTTNATIERRGEIA---EEPGEIKNCSFNMTTE | |
| LRDKRQKVYSLFYRLDIVPINSNSIN---SSSSDS-----SEYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEN | |
| RTMIRSENISDNAKNIIVQFTEPVNITCIRPNNNTRKSVRI---GPGQAFYATGDIIGNI | |
| RQAYCEVNGSQWNKALQKVVNQLKTHFE-NATTITFNKSS-GGDLEITTHSFNCGGEFFY | |
| CNTSGLFNRTW----STNTS-M-QVS-NSTELNGP-------IILQCRIKQIINMWQRVG | |
| QAIYAPPIPGVIRCESNITGLILTRDGG----NNNTGN-QTFRPVGGDMKDNWRSELYKY | |
| KVVKIEPLGVAPSKAKRRVVEREKRAI--G-IGAV-FIGFLGAAGSTMGAASVTLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLNLTVWGIKQLQARVLALERYLRDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKSLDEIWKNMTWLQWDKEINNYTQLIYNLIEESQNQQAINEKELL | |
| ELDKWASLWSWFDITNWLWYIKIFIMIVGGLIGLRIVFAVLAVINRVRQGYSPLSFQIHT | |
| PTPRGLHRPRRLVEEGGEQGSGSSIRLVSGFLSLASYDLLSLCLFIYHRLINFILIAATT | |
| IELLVHSSLNKLRLVWEDLNYLGNLLAYWILELKISTINFLDTITIIVAAWTDKIIKIIQ | |
| NICR------------------- | |
| >A1.CY.05.CY023.FJ388894 | |
| MRAKGMQMNLHCL-LRWGT-MILGMIIICRA----VENTWVTVYYGVPVWRDAETTLFCA | |
| SDAKAYKSEVHNVWATHACVPTDPNPQEINLENVTEKFNMWKNNMVEQMHIDIISLWDES | |
| LKPCVKLTPLCVTLECSN------HVMSTNASTNATANINS---DMREEIKNCSHNITTE | |
| LRDKKQKVHSLFYRLDIVPINSNNDN-----NNTS-----KEYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDKMFNGTGICRNVSTVQCTHGIRPVVSTQLLLNGSLAEK | |
| EIMIRSENITNNAKNIIVQLTKPVNITCIRPNNNTRKSIHI---GPGQAFYATGDIIGDI | |
| RQAHCNVSGTVWYETLQNVTEQLRKHFM-NK-TINFTKSS-GGDPEITTHSFNCGGEFFY | |
| CNTSSLFNSTW-NI-NTIWN-N-TMS-NSTESNGT-------IVLPCRIKQIVNVWQRAG | |
| QAIYAPPIQGIIQCVSNITGLILTRDGG---NNNNTNNTEIFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTKARRRVVGREKRAV--G-LGAV-FLGFLGTAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKSLDDIWNNMTWLQWDEEINNYTEQIYRLIEESQNQQEKNEKELL | |
| ELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFAVLSIINRVRQGYSPLSLQIPA | |
| PETAGLDRLRRIEEEGGEQDRGRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIVTRT | |
| VEILGHNSLKGLRLGWEGLKYLWNLLVYWTRELKISAINLFNTIAITVAGWTDRVIEIGQ | |
| RLCRAIFNIPRRIRQGLERALL- | |
| >A1.CY.07.CY182.JF683737 | |
| MRAKGIQRNSHYL-LTWGT-MILGMIIICSA-----TNMWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYKTEVHNVWATHACVPTDPNPQEINMENVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLECSN----------------VTTNITG---EMKEEINSCSFDVTTV | |
| LRDKRKKSYSLFYILDIPPVNSNSNS----DNKNS-----MEYRLINCNTSVITQGCPKV | |
| SFDPIPIHYCAPAGFAILKCDDKEFNGTGPCNNVSTQQCTHGIRPVVSTQLLLNGSLAEN | |
| KTMIRSENITNNAKNIIVQLTKPVNITCIRPGNNTRQSIHI---GPGQAFYSRDDITGDI | |
| RKAHCEVNGTEWDKTLQEVAKQLRTYFE-NK-TIIFNGSS-GGDLEITTHSFNCRGEFFY | |
| CNTSGLFNSTW----NASDI--------TQGLNDT-------ITLQCRIKQIINMWQRVG | |
| QAMYAPPIQGEIRCESNITGLILTRDGG----NGNGTN-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTRAKRRVVEREKRAV--G-LGAV-FIGFLGAAGSTMGAASVTLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKSLDEIWDNMTWLQWDREISNYTQIIYNLIEESQTQQEMNEKDLL | |
| ALDKWANLWSWFDISNWLWYIKIFIMIVGGLIGLRIVFAVLSVIKKVRKGYSPLSFQTHT | |
| PNPRDLDRPGRIEEEDGEQDKGRSIRLVSGFLALVWDDLRSLCLFSYHHLRDFILIVART | |
| VELLGHR-------GWESLKYLGNLLAYWSRELKISAISLLNTTAIVIAGWTDRVIEIIQ | |
| RIYTAIFNIPRRIRQGLERALL- | |
| >A1.CY.08.CY235.JF683782 | |
| MRVRGIQMNSHCL-LRWGT-MILGLIIICSA----VEKTWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYTTEMHNVWATHACVPTDPNPQEINLENVTEEFNMWKLNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLDCGY-----------NVSINNTYSIND---TMETDLRNCSFDVTTK | |
| LRDKRQNVYSLFYRLDIVHIDSNSNN--------------SHYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDKEFSGKGPCKNVSTVHCTHGIRPVVSTQLLLNGSLAEN | |
| RTMIRSENITNNAKNIIVQLTEPVNITCIRPSNNTRKSVHI---GPGQAFFATGDIIGDI | |
| RKAHCEVNETEWNKALTKVVEQLRTYFR-NK-TITFKGPS-GGDLEITTHSFNCGGEFFY | |
| CNTSKLFNTTW----NANGS-V-QES-VNTAGNTT-------IFLPCRIKQIIRMWQRAG | |
| QAIYAPPIQGRIRCESNITGLLLTRDGG----GNANNT-EIFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTKARRRVVQREKRAV--G-LGAV-FLGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQQMLRLTVWGIKQLQARVLAVERYLGDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKSLDKIWNNMTWMQWDKEISNYTQLIYTLIEQSQNQQEINEQELL | |
| ELDKWANLWNWFDISHWLWYIKIFIMIVGGLIGLRIVFAVLSIIRRVRQGYSPLSFQTHF | |
| PNPGGLDRPGGIEGEGGEQDRGRSIRLVSGFLALAWEDLRNLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYIGNILIYWSRELKISAISLLDTIAIAVANWTDRIIEIGQ | |
| GICRAIINIPRRIRQGLERALL- | |
| >A1.CY.08.CY236.JF683783 | |
| MRVRGIQMNSHCL-LRWGT-MILGMIIICSA----VEKTWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYTTEAHNIWATHACVPTDPNPQEINLENVTEEFNMWKLNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLDCRH---NVTIHNNVTNNNNITSGIND---TIATEVKNCSFNTTTE | |
| LKDKRQNVYSLFYRLDIVQIDSNSNN--------------SHYRLINCNTSTITQACPKV | |
| TFKPIPIHYCAPAGFAILKCNDKKFSGKRPCRNVSTVQWTHGIRPVVSTQLLLNGSLAEN | |
| RTMIRSENITNNAKNIIVQLTEPVNITCIRPSNNTRKSIRI---GPGQAFYATGDIIGNI | |
| RKAHCEVNGTEWNKALKGVVEQLRTYFS-NK-TIAFNDSS-GGDLEITTHSFNCGGEFFY | |
| CNTSKLFNTTW----NVTDS-------IEESGNTI-------IVLPCKIKQIINMWQRAG | |
| QAIYPPPIRGIIRCESNITGLLLTRDGG----DTENTT-EIFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTEARRRVVQREKRAV--G-IGAV-FLGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQQMLRLTVWGIKQLQARVLAVERYLGDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKSLDKIWNNMTWMQWDKEISNYTQLIYTLIEESQNQQEINEQDLL | |
| ALDKWANLWNWFDISHWLWYIKIFIMIVGGLIGLRIVFAVLSIIRRVRQGYSPLSFQTHT | |
| PNPGGLDRPGRIEGEGGEQDRSRSIRLVSGFLALAWDDLRNLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYLENLLVYWSRELKISAINLFDTIAIAVAGWTDRVIEIVQ | |
| GIGRAIINIPRRIRQGLERALL- | |
| >A1.CY.07.CY208.JF683760 | |
| MKVKGIQMNSHSL-LRWGT-MILGMIIICSA----AEKTWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYKTEVHNVWATHACVPTDPNPQEMHLENVTEEFNMWKNNMVEQMHTDIIRLWDPS | |
| PQPCVKLTPLCVTLNCSY---------NITSNVTVDMNDTI---NMREEIKNCSFYTTTE | |
| IRDNRQKVYSLFYRLDIVPIGDRNNN--------------HSYRLINCNTSAITQACPKV | |
| TFEPIPIHYCAPAGFAILKCNDKNFNGAGSCKNVSTVQCTHGIKPVVSTQLLLNGSLAEN | |
| ETMIRSENITNNVKNIIVQFNESVKINCTRPNNNTRKSVHI---GPGQAFYATGEIVGDI | |
| RQARCEVNKTEWNKALKRVAHQLEKYFK-NK-TIAFNKSP-GGDLEITTHSFNCGGEFFY | |
| CNTSKLFNSTW----DPNNT-S---TQESNSTNDN-------IILPCRIRQIINMWQRAG | |
| QAIYAPPIQGIINCVSNITGLILTRDGG----VGNNAK-EVFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTGARRRVVQREKRAV--G-LGAV-FIGFLGAAGSTMGAASMTLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLRLTVWGIKQLQARVLAVERYLGDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKTRREIWDNMTWMQWDKEISNYTQVIYTLIEESQNQQEKNEQDLL | |
| ALGKWDSLWSWFSITNWLWYIKIFIMIVGGLIGLRIVFAVISIIHRVRQGYSPLSFQIHT | |
| PNPGGLDRPGRIEEVGGEQDRHNWIRLVSGLLALAWDDLRSLCLFSFLRLRDFIVIVART | |
| VELVGHSSLKGLRLGWEGLKYLGNLLVYWSRELKISDISLLDSIAIAVAAGTDRVIEIGQ | |
| RICRAIVIIHSRIRYGLERALL- | |
| >A1.CY.07.CY209.JF683761 | |
| MKVKGIQMNSHSL-LRWGT-MILGMIIICSA----ADKMWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYKTEVHNVWATHACVPTDPNPQEMHLENVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLNCSYITSNVTADITSNVTADMNDAI-----NMTAEIRNCSFNITTE | |
| IRDKIQKVYSLFYRLDIVPIDRNDSN--------------ASYRLINCNTSAITQACPKV | |
| TFEPIPIHYCAPAGFAILKCNDKDFNGTGPCRNVSTVQCTHGIKPVVSTQLLLNGSLAEN | |
| ETMIRSENITNNAKNIIVQLNEPVKINCTRPNNNTRKSIRI---GPGQAFYATGDIVGNI | |
| RQAHCEVNKTEWNKALKRVADQLRKYF--NK-TIAFNKSS-GGDLEITTHSFNCGGEFFY | |
| CNTSKLFNSTW----NNTST---QES-NSTNPNDN-------ITLPCRIKQIINMWQRAG | |
| QAIYAPPIQGKINCVSNITGLILTRDGG-----GNSTE-EVFRPGGGDMRDNWRSELYKY | |
| KVVKIEPIGVAPTEARRRVVQREKRAV--G-LGAV-FIGFLGAAGSTMGGASMTRTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLRLTVWGIKQLQARVLAVERYLGDQQLLGLWGCSGKL | |
| ICTTNVPWNSTWS-NKSHKAIWDNMTWMQWDKEISDYTQVIYTLIEESQNQQEKNEQDLL | |
| ALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFAVISIIRRVRQGYSPLSFQIHT | |
| PNPGGLDRPGRIEEEGGEQDRGKSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYLGNLLAYWSRELKISAISLLDTTAIAVAGWTDRVIETGQ | |
| TICRAIVNIPRRIRQGLERALL- | |
| >A1.CY.05.CY121.FJ388932 | |
| MKAKGIQRNSHGL-LRWGI-MILGMIMICSATEKVAENLWVTVYYGVPVWKEANTTLFCA | |
| SDAKAYKTEVHNVWATHACVPTDPNPQEIDIKNVTEKFNMWKNNMVEQMNTDIISLWDQS | |
| LKPCVKLTPLCVTLECRD------------ASNTTNATFTE---GMDREIKNCSYNMTTE | |
| LRDKRQKVSSLFYRLDIVPIDSNSRN---SSSSNS-----SEYKLINCSTSSITQACPKV | |
| SFEPILIHYCAPAGVAILKSNDKEVNGAGPCRNVGTVQCRPGIRPVVSTQLLLNGSLAES | |
| KIMIRSENISNNAKNILVQFTEPVNITCIRPGNNTRRGVHI---GPGQAFYAVGDIIGNI | |
| RQAHCNVSRRKWEETLQKVASQLRTYFV-NK-TIIFTKSS-GGDLEITTHSFNCGGEFLY | |
| CNTSGLFNSTW----PANNS-T-QGS-NSTESNDT-------VILQCRIKQIINMWQRVG | |
| QAIYAPPIPGEIKCVSNITGLILTRDGG---SSNNTEN-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTRAKRRVVQREKRAVLGG-LGAV-FVGFLGAAGSTMGAASVTLTVQAR | |
| KLLTGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLALERYLRDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWSKNKSHDEIWNNMTWLQWEKEIDIYTQDIYTLIEESQNQQEINEKELL | |
| ELDKWANLWNWFNITNWLWYIKIFIIIVGGLIGLRIVFAVLAVINRVRQGYSPLSFQIHT | |
| PNPGGLDRPGRIEEEGGEQGRDRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYLGNLLAYWIRELKISAINLLDTIAIAVAGWTDRVIEVGQ | |
| SICRAIFNIPR------------ | |
| >A1.CY.07.CY207.JF683759 | |
| MKAKGIQMSSHGL-LRWGM-MILGMIIICSA----AGNLWVTVYYGVPVWKDADTTLFCA | |
| SDAKAIKTEVHNVWATHACVPTDPNPQEINLENVTEDFNMWKNNMVEQMQTDIISLWDQS | |
| LKPCVKLTPLCVTLDCSH---------NITSNNTDNNPNNT---KVEVEMRNCSFNTTTE | |
| IRDRTQKVYSLFYKVDVVEIDSNSNN------SNT-----NNYRLINCNTSVITQACPKV | |
| TFEPIPIHYCAPAGFAILKCNDKEFNGTGPCKNVSSVQCTHGIKPVVSTQLLLNGSLAEN | |
| KTMIRSENITNNAKNIIVQLTKPVQINCTRPNNNTRKSVRI---GPGQAFYATGEIIGDI | |
| RQAHCNVSKAEWHGALQEVGKQLGTYFK-NK-TIIFTNSS-GGDLEITTHSFNCGGEFFY | |
| CDTSGLFNSTW----NTTDT-M-HEE-TNTEANST-------ITLPCRIKQIINMWQRAG | |
| QAIYAPPIPGVIQCKSNITGLILTRDGG----SNSSTN-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTKARRRVVQREKRAV--G-LGAV-FIGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKSQDEIWDNMTWLQWDKEISNYTQAIYTLIEESQNQQEMNEKELL | |
| ELDKWASLWNWFDISNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSFQIQT | |
| PNPGGPDRPGRIEGEGGEQDRDRSIRLVSGFLGLAWDDLRSLCLFSYHRLRDFILIVART | |
| VELLGHSSLKGLRLGWEALKYLGNLLAYWSRELKNSAINLVDTIAITVAGWTDRVIEVGQ | |
| RICRAIINIPRRIRQGLERALL- | |
| >A1.CY.05.CY051.FJ388903 | |
| MKAKGIQRNSHSL-LGWGM-VILGMIIICST----AENLWVTVYYGVPVWKEADTTLFCA | |
| SDAKAYKTEVHNVWATHACVPTDPNPQEINMENVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVELTPLCVTLECRN------------VYTTNITNITK---EMQGEIKNCSFNMTTE | |
| LRDKRQKVYSLFYKLDIVQINSNSSN----SSSDS-----SEYRLINCNTSAITQACPKV | |
| SFEPIPIHYCAPAGFAILKCNDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEN | |
| KTMIRSENITNNAKNIIVQFTEPVNITCIRPNNNTRKSVRI---GPGQAFYAAGDIIGDI | |
| RQAHCNVSKEKWNRTLQEVAQQLGIHFE-NK-TIIFANSS-GGDLEITTHSFNCGGEFFY | |
| CNTSGLFNSQY-NTSGLVNN-T-QES-GSTESNDTESIVTDNITLQIRIKQIINQWQRVA | |
| QATYAPPIPGVIKCVSNITGLILTRDGG-----SSSGN-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTRAKRRVVEREKRAV--G-IGAV-FIGFLGAAGSTMGAASMTLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHLLKLTVWGIKQLQARVLALERYLRDQQLLGIWGCSGKL | |
| ICTTTVPWNSTWS-NKSLDEIWDNMTWLQWDKEINNYTQLIYTLIEESQNQQEINEKELL | |
| ELDKWANLWNWFDITSWLWYIRIFIMIVGGLIGLRIVFAVLAIINRVRQGYSPLSLQTHT | |
| PNPGGLDRPGRIEEEGGEQDRGRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYLGNLLAYWSQELKISAINLLDTIAIAVAGWTDRVIERGQ | |
| SICRTI--------RGFERALL- | |
| >A1.CY.05.CY140.FJ388938 | |
| MRAKGIQRNSHCL-LKWGT-MILGLIIICSA----ADNLWVTVYYGVPVWKDAKTTLFCA | |
| SDAKAYKTEMHNVWATHACVPTDPNPQEINLENVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLNCTN----------------IKNITDD---EMRREIKNCSFNMTTE | |
| LRDKQKKVYSLFYRLDVVPIRNNKNNSSETNSSEA-----GEYRLINCNTSAITQACPKV | |
| SFEPIPIHYCTPAGFAILKCNDKEFNGTGLCRNVSTVQCTHGIRPVVSTHLLLNGSLAEN | |
| RTMIRSENITNNAKNIIVQLTEPVNITCIRPNNNTRKSVHI---GPGQAFYATDDIIGDI | |
| RKAHCNVSRTKWNNTLKEVVNQLRKYFGNNK-TIIFNSSS-GGDLEITTHSFNCGGEFFY | |
| CNTSGLFNSTW----NGT-T-M-QES-NNTESNDTES--NDIITLRCRIRQIIRMWQRAG | |
| QAMYAPPIQGIIKCESNITGLILARDGG-----NRNET-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTKARRRVVQREKRAV--G-IGAV-FIGFLGAAGSTMGAASITLTVQAR | |
| QLLSGIVQQQSNLLKAIEAQQHLLKLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKTQEEIWDNMTWLQWDKEISNYTKTIYELIEKSQNQQEINEQDLL | |
| ALDKWANLWTWFDISNWLWYIRIFVMIVGGLIGLRIVFAVLNIINRVRKGYSPLSFQTHT | |
| PSPGGLDRPGRIEEEGGEQDRSRSIRLVSGFLALAWDDLRSLCLFSYHRLRDFILIAART | |
| VELLGHSSLKGLRLGWEGLKYLGNLLIYWSRELKISAISLLDTIAIAVAGWTDRVIEIGQ | |
| RICRAICNIPRRIRQGLERALL- | |
| >A1.CY.05.CY106.FJ388925 | |
| MRAKGIRRNSHCL-LRWGT-MILGMIIICSA----AENLWVTVYYGVPVWKEAKTTLFCA | |
| SDAKAYKTEVHNVWATHACVPTDPNPQEINLENVTEEFNMWKNNMVEQMHTDIISLWDQS | |
| LKPCVKLTPLCVTLNCSH---NVT---KVTNNGTATANITG---EMKGEIKNCSFNITTE | |
| LRDKTQKIYSLFYRLDVVEIDKNSSN----------------YRLINCNTSAITQACPKV | |
| TFEPIPIHYCAPAGFAILKCNDKEFNGTGPCRDVSTVQCTHGIKPVVSTQLLLNGSLAEN | |
| KTMIRSENITNNAKNIIVQLTEPVNITCIRPNNNTRKSVHI---GPGQAFYATGEIIGDI | |
| RQAHCNVSETEWNNTLQKVTNQLRTYFG-NK-TIIFANSS-GGDPEIITHSFNCGGEFFY | |
| CNTSGLFNSTW----NATAS-M-QES-NSTESNDT------TITLPCRIKQIINMWQRAG | |
| QAIYAPPIRGVIRCESNITGLILTRDGG----NSNSTN-ETFRPGGGDMRDNWRSELYKY | |
| KVVKIEPLGVAPTRARRRVVEREKRAV--G-IGAV-FIGFLGAAGSTMGAASIALTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLKLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGEL | |
| ICTTNVPWNSTWS-NKSLNEIWDNMTWLQWDKEISNYTQLIYDLIEESQNQQEKNEQDLL | |
| ALDKWASLWSWFNISKWLWYIKIFIMIVGGLIGLRIVFAVLSIIRRVRQGYSPVSFQIHA | |
| PNPGGLDRPGRIEGEGGEQDRGRSIRLVSGFFALAWDDLRSLCLFSYHRLRDFILIVART | |
| VELLGHSSLKGLRLGWEGLKYLGNLLVYWSRELKISAINLLDTIAIAVAGWTDRVIEIGQ | |
| GIGRAIINIPRRIRQGLERALL- | |
| >A1.CY.05.CY153.FJ388942 | |
| MRAKGIQRSLRSL-LRWGT-MILGMIIICSA----AENLWVTVYYGVPVWKDAETTLFCA | |
| SDAKAYDTEVHNVWATHACVPTDPNPQEINLENVTEEFNMWKNNMVEQMHTDIVSLWDQS | |
| LKPCVELTPLCVTLNCSH-----------NVTANDTVSIKE---GMEGEIKNCSFNVTTE | |
| LRDKTQKVYSLFYRPDVEQIDNSSS-----------------YRLINCNTSAIAKACPKV | |
| TFEPIPIHYCAPAGFAILKCNDKEFNGTGPCRNVSTVQCTHGIRPVVSTQLLLNGSLAEN | |
| KTMIRSENITSNTKNIIVQLTEPVNITCIRPNNNTRKSIHM---GPGRAFYATGEIIGDI | |
| RQAHCNVSRAKWNNTLQKVVDQLRTYFG-NK-TITFTSNAPGGDLEITTHSFNCGGEFFY | |
| CNTSGLFNSSW-LKSNRTGP-S-TEP-NNTEPNNT------IITLPCKIKQIINMWQRTG | |
| QAMYAPPIPGVIRCESNITGLILTRDGG----NSSNSN-ETFRPGGGNMRDNWRSELYKY | |
| KVVKIEPLGVAPTRARRRVVEREKRAV--G-IGAV-FIGFLGAAGSTMGAASMTLTVQAR | |
| QLLSGIVQQQSNLLRAIEAQQHMLKLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKL | |
| ICTTNVPWNSTWS-NKSLDDIWENMTWMQWDKEISNYTQLIYNLIEESQNQQEKNEKDLL | |
| ALDKWASLWNWFNISNWLWYIKIFIMIVGGLIGLRIVFAVLSIIRRVRQGYSPLSFQIHT | |
| PNPEGLDRPGRIEEEGGEQGRSRSIRLASGFLALAWDDLRSLCLFSYRRLRDFVLIAART | |
| VELLGHSSLKGLRLGWEGLKYLGNLLVYWSQELKISAINLFDTIAIAVAGWTDRVIEIGQ | |
| RICRAIINIPRRIRQGLERALLX |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment