Skip to content

Commit

Permalink
Fix issue with numeric gene names in `emapper2gbk genes` (issue #10).
Browse files Browse the repository at this point in the history
Note: the issue is still present in `emapper2gbk genomes`.
  • Loading branch information
ArnaudBelcour committed Sep 20, 2022
1 parent 1aa3fd3 commit 9025e08
Show file tree
Hide file tree
Showing 6 changed files with 263 additions and 11 deletions.
5 changes: 4 additions & 1 deletion emapper2gbk/genes_to_gbk.py
Original file line number Diff line number Diff line change
Expand Up @@ -68,7 +68,10 @@ def faa_to_gbk(nucleic_fasta:str, protein_fasta:str, annot:Union[str, dict],
gene_protein_seqs = OrderedDict()

for record in SeqIO.parse(protein_fasta, "fasta"):
gene_protein_seqs[record.id] = record.seq
protein_id = record.id
if protein_id.isnumeric():
protein_id = f"gene_{protein_id}"
gene_protein_seqs[protein_id] = record.seq

# Create a taxonomy dictionary by querying the EBI.
if ete_option:
Expand Down
7 changes: 7 additions & 0 deletions emapper2gbk/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -413,9 +413,16 @@ def read_annotation(eggnog_outfile:str):
# Assign the headers
annotation_data.columns = headers_row
if 'query_name' in annotation_data.columns:
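# If any gene IDs are numeric, prefix them with 'gene_'.
# NOTE(review): pd.to_numeric also treats IDs such as '1.5', '-5' or '1e5' as numeric, whereas the FASTA side (genes_to_gbk.py) uses str.isnumeric(), which rejects them - confirm both sides rename the same IDs.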
numeric_row_dataframe = pd.to_numeric(annotation_data['query_name'], errors='coerce').notnull()
if bool(numeric_row_dataframe.any()) is True:
annotation_data.loc[numeric_row_dataframe, 'query_name'] = 'gene_' + annotation_data.loc[numeric_row_dataframe, 'query_name']
annotation_dict = annotation_data.set_index('query_name')[to_extract_annotations].to_dict('index')
# 'query' added for compatibility with eggnog-mapper 2.1.2
elif 'query' in annotation_data.columns:
numeric_row_dataframe = pd.to_numeric(annotation_data['query'], errors='coerce').notnull()
if bool(numeric_row_dataframe.any()) is True:
annotation_data.loc[numeric_row_dataframe, 'query'] = 'gene_' + annotation_data.loc[numeric_row_dataframe, 'query']
annotation_dict = annotation_data.set_index('query')[to_extract_annotations].to_dict('index')
for key in annotation_dict:
yield key, annotation_dict[key]
Expand Down
14 changes: 14 additions & 0 deletions tests/numeric/betaox_annotation.tsv
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
# emapper version: emapper-1.0.3-35-g63c274b emapper DB: 2.0
# command: ./emapper.py --cpu 6 -i /data/shared/emapper_jobs/user_data/MM_hn50pfy_/query_seqs.fa --output query_seqs.fa --output_dir /data/shared/emapper_jobs/user_data/MM_hn50pfy_ -m diamond -d none --tax_scope auto --go_evidence non-electronic --target_orthologs all --seed_ortholog_evalue 0.001 --seed_ortholog_score 60 --query-cover 20 --subject-cover 0 --override --temp_dir /data/shared/emapper_jobs/user_data/MM_hn50pfy_
# time: Fri May 15 14:00:48 2020
#query_name seed_eggNOG_ortholog seed_ortholog_evalue seed_ortholog_score best_tax_level Preferred_name GOs EC KEGG_ko KEGG_Pathway KEGG_Module KEGG_Reaction KEGG_rclass BRITE KEGG_TC CAZy BiGG_Reaction
226 316407.85674387 0 1627.5 Escherichia fadE GO:0003674,GO:0003824,GO:0003995,GO:0005575,GO:0005623,GO:0005886,GO:0006082,GO:0006629,GO:0006631,GO:0006635,GO:0008150,GO:0008152,GO:0009056,GO:0009062,GO:0009987,GO:0016020,GO:0016042,GO:0016054,GO:0016491,GO:0016627,GO:0019395,GO:0019752,GO:0030258,GO:0032787,GO:0033539,GO:0034440,GO:0043436,GO:0044237,GO:0044238,GO:0044242,GO:0044248,GO:0044255,GO:0044281,GO:0044282,GO:0044464,GO:0046395,GO:0055114,GO:0071704,GO:0071944,GO:0072329,GO:1901575 ko:K06445 ko00071,ko01100,ko01212,map00071,map01100,map01212 M00087 R01175,R01279,R03777,R03857,R03990,R04751,R04754 RC00052,RC00076 ko00000,ko00001,ko00002,ko01000 iSbBS512_1146.SbBS512_E0217 Bacteria 1MUDR@1224,1RPM5@1236,3XNAM@561,COG1960@1,COG1960@2 NA|NA|NA I Catalyzes the dehydrogenation of acyl-coenzymes A (acyl- CoAs) to 2-enoyl-CoAs, the first step of the beta-oxidation cycle of fatty acid degradation. Is required for
1781 316407.85675083 0 1149.8 Escherichia fadK GO:0003674,GO:0003824,GO:0005575,GO:0005623,GO:0005886,GO:0015645,GO:0016020,GO:0016405,GO:0016874,GO:0016877,GO:0016878,GO:0031956,GO:0044464,GO:0071944 ko:K12507 ko00000,ko01000,ko01004 iECIAI1_1343.ECIAI1_1755 Bacteria 1MU6G@1224,1RMQ4@1236,3XMA2@561,COG0318@1,COG0318@2 NA|NA|NA IQ Catalyzes the esterification, concomitant with transport, of exogenous fatty acids into metabolically active CoA thioesters for subsequent degradation or incorporation into phospholipids. Is maximally active on C6 0, C8 0 and C12 0 fatty acids, while has a low activity on C14-C18 chain length fatty acids. Is involved in the anaerobic beta-oxidative degradation of fatty acids, which allows anaerobic growth of E.coli on fatty acids as a sole carbon and energy source in the presence of nitrate or fumarate as a terminal electron acceptor. Can functionally replace FadD under anaerobic conditions
1887 199310.c2209 0 1128.2 Escherichia fadD GO:0001676,GO:0003674,GO:0003824,GO:0004467,GO:0005488,GO:0005504,GO:0005575,GO:0005622,GO:0005623,GO:0005737,GO:0005829,GO:0005886,GO:0006082,GO:0006139,GO:0006163,GO:0006629,GO:0006631,GO:0006635,GO:0006637,GO:0006644,GO:0006725,GO:0006732,GO:0006753,GO:0006790,GO:0006793,GO:0006796,GO:0006807,GO:0008150,GO:0008152,GO:0008289,GO:0008610,GO:0008654,GO:0009056,GO:0009058,GO:0009062,GO:0009117,GO:0009150,GO:0009259,GO:0009314,GO:0009411,GO:0009416,GO:0009628,GO:0009898,GO:0009987,GO:0015645,GO:0016020,GO:0016042,GO:0016054,GO:0016405,GO:0016874,GO:0016877,GO:0016878,GO:0019395,GO:0019637,GO:0019693,GO:0019752,GO:0030258,GO:0031406,GO:0032787,GO:0033293,GO:0033865,GO:0033875,GO:0034032,GO:0034440,GO:0034641,GO:0035383,GO:0036041,GO:0036094,GO:0043167,GO:0043168,GO:0043177,GO:0043436,GO:0043603,GO:0044237,GO:0044238,GO:0044242,GO:0044248,GO:0044249,GO:0044255,GO:0044281,GO:0044282,GO:0044424,GO:0044425,GO:0044444,GO:0044459,GO:0044464,GO:0046395,GO:0046483,GO:0050896,GO:0051186,GO:0055086,GO:0055114,GO:0070538,GO:0071704,GO:0071944,GO:0072329,GO:0072521,GO:0090407,GO:0098552,GO:0098562,GO:1901135,GO:1901360,GO:1901564,GO:1901575,GO:1901576 6.2.1.3 ko:K01897 ko00061,ko00071,ko01100,ko01212,ko02024,ko03320,ko04146,ko04216,ko04714,ko04920,map00061,map00071,map01100,map01212,map02024,map03320,map04146,map04216,map04714,map04920 M00086 R01280 RC00004,RC00014 ko00000,ko00001,ko00002,ko01000,ko01004,ko04147 4.C.1.1 iSF_1195.SF1423,iSFxv_1172.SFxv_1611,iS_1188.S1538 Bacteria 1MU6G@1224,1RMQ4@1236,3XMU8@561,COG0318@1,COG0318@2 NA|NA|NA IQ Catalyzes the esterification, concomitant with transport, of exogenous long-chain fatty acids into metabolically active CoA thioesters for subsequent degradation or incorporation into phospholipids
2441 316407.1799732 0 1398.6 Escherichia fadJ GO:0003674,GO:0003824,GO:0003857,GO:0004165,GO:0004300,GO:0006082,GO:0006629,GO:0006631,GO:0006635,GO:0006725,GO:0006805,GO:0008150,GO:0008152,GO:0008691,GO:0008692,GO:0009056,GO:0009062,GO:0009404,GO:0009407,GO:0009410,GO:0009636,GO:0009850,GO:0009852,GO:0009987,GO:0010124,GO:0010817,GO:0016042,GO:0016054,GO:0016491,GO:0016614,GO:0016616,GO:0016829,GO:0016835,GO:0016836,GO:0016853,GO:0016854,GO:0016856,GO:0016860,GO:0016863,GO:0019395,GO:0019439,GO:0019748,GO:0019752,GO:0030258,GO:0032787,GO:0034440,GO:0042178,GO:0042221,GO:0042445,GO:0042447,GO:0042537,GO:0043436,GO:0044237,GO:0044238,GO:0044242,GO:0044248,GO:0044255,GO:0044281,GO:0044282,GO:0046395,GO:0050896,GO:0051716,GO:0055114,GO:0065007,GO:0065008,GO:0070887,GO:0071466,GO:0071704,GO:0072329,GO:0098754,GO:1901360,GO:1901361,GO:1901575 1.1.1.157,1.1.1.35,4.2.1.17,5.1.2.3,5.3.3.8 ko:K00074,ko:K01782,ko:K01825 ko00071,ko00280,ko00281,ko00310,ko00360,ko00362,ko00380,ko00410,ko00640,ko00650,ko00903,ko00930,ko01040,ko01100,ko01110,ko01120,ko01130,ko01200,ko01212,map00071,map00280,map00281,map00310,map00360,map00362,map00380,map00410,map00640,map00650,map00903,map00930,map01040,map01100,map01110,map01120,map01130,map01200,map01212 M00032,M00087 R01975,R01976,R03026,R03045,R03276,R04137,R04170,R04203,R04204,R04224,R04737,R04738,R04739,R04740,R04741,R04744,R04745,R04746,R04748,R04749,R04756,R05066,R05305,R05576,R06411,R06412,R06941,R06942,R07935,R07951,R08093,R08094 RC00029,RC00099,RC00117,RC00241,RC00525,RC00831,RC00834,RC00896,RC01078,RC01086,RC01095,RC01098,RC01103,RC01217,RC02115 ko00000,ko00001,ko00002,ko01000 iECABU_c1320.ECABU_c26730,iECO103_1326.ECO103_1532,iETEC_1333.ETEC_2476,iEcE24377_1341.EcE24377A_2637,iLF82_1304.LF82_0614,iNRG857_1313.NRG857_19200,ic_1306.c2886 Bacteria 1MU9P@1224,1RMZ8@1236,3XMJZ@561,COG1024@1,COG1024@2,COG1250@1,COG1250@2 NA|NA|NA I Catalyzes the formation of a hydroxyacyl-CoA by addition of water on enoyl-CoA. 
Also exhibits 3-hydroxyacyl-CoA epimerase and 3-hydroxyacyl-CoA dehydrogenase activities
2442 316407.85675365 5.1E-240 836.6 Escherichia fadI GO:0003674,GO:0003824,GO:0003857,GO:0003988,GO:0004300,GO:0005575,GO:0005622,GO:0005623,GO:0005737,GO:0005829,GO:0006082,GO:0006629,GO:0006631,GO:0006635,GO:0008150,GO:0008152,GO:0009056,GO:0009062,GO:0009987,GO:0016042,GO:0016054,GO:0016408,GO:0016491,GO:0016614,GO:0016616,GO:0016740,GO:0016746,GO:0016747,GO:0016829,GO:0016835,GO:0016836,GO:0019395,GO:0019752,GO:0030258,GO:0032787,GO:0033542,GO:0034440,GO:0043436,GO:0044237,GO:0044238,GO:0044242,GO:0044248,GO:0044255,GO:0044281,GO:0044282,GO:0044424,GO:0044444,GO:0044464,GO:0046395,GO:0055114,GO:0071704,GO:0072329,GO:1901575 2.3.1.16 ko:K00632 ko00071,ko00280,ko00281,ko00362,ko00592,ko00642,ko01100,ko01110,ko01120,ko01130,ko01212,map00071,map00280,map00281,map00362,map00592,map00642,map01100,map01110,map01120,map01130,map01212 M00087,M00113 R00829,R00927,R01177,R03778,R03858,R03991,R04546,R04742,R04747,R05506,R05586,R07891,R07895,R07899,R08091,R08095 RC00004,RC00326,RC00405,RC01702,RC02728,RC02898,RC02955 ko00000,ko00001,ko00002,ko01000 iECO103_1326.ECO103_2806,iEcHS_1320.EcHS_A2493 Bacteria 1MU5G@1224,1RNGU@1236,3XMTM@561,COG0183@1,COG0183@2 NA|NA|NA I Catalyzes the final step of fatty acid oxidation in which acetyl-CoA is released and the CoA ester of a fatty acid two carbons shorter is formed
3987 316407.85676208 7.1E-217 759.6 Escherichia fadA GO:0003674,GO:0003824,GO:0003988,GO:0005575,GO:0005622,GO:0005623,GO:0005737,GO:0006082,GO:0006629,GO:0006631,GO:0006635,GO:0008150,GO:0008152,GO:0009056,GO:0009062,GO:0009987,GO:0016042,GO:0016054,GO:0016408,GO:0016740,GO:0016746,GO:0016747,GO:0019395,GO:0019752,GO:0030258,GO:0032787,GO:0034440,GO:0043436,GO:0044237,GO:0044238,GO:0044242,GO:0044248,GO:0044255,GO:0044281,GO:0044282,GO:0044424,GO:0044464,GO:0046395,GO:0055114,GO:0071704,GO:0072329,GO:1901575 2.3.1.16 ko:K00632 ko00071,ko00280,ko00281,ko00362,ko00592,ko00642,ko01100,ko01110,ko01120,ko01130,ko01212,map00071,map00280,map00281,map00362,map00592,map00642,map01100,map01110,map01120,map01130,map01212 M00087,M00113 R00829,R00927,R01177,R03778,R03858,R03991,R04546,R04742,R04747,R05506,R05586,R07891,R07895,R07899,R08091,R08095 RC00004,RC00326,RC00405,RC01702,RC02728,RC02898,RC02955 ko00000,ko00001,ko00002,ko01000 iAPECO1_1312.APECO1_2612,iECNA114_1301.ECNA114_4154,iECOK1_1307.ECOK1_4314,iECP_1309.ECP_4058,iECS88_1305.ECS88_4293,iECSF_1327.ECSF_3702,iEcE24377_1341.EcE24377A_4364,iLF82_1304.LF82_0613,iNRG857_1313.NRG857_19195,iPC815.YPO3767 Bacteria 1MU5G@1224,1RM93@1236,3XM40@561,COG0183@1,COG0183@2 NA|NA|NA I Catalyzes the final step of fatty acid oxidation in which acetyl-CoA is released and the CoA ester of a fatty acid two carbons shorter is formed
398 316407.85676207 0 1449.1 Escherichia fadB GO:0003674,GO:0003824,GO:0003857,GO:0004165,GO:0004300,GO:0006082,GO:0006629,GO:0006631,GO:0006635,GO:0006725,GO:0006805,GO:0008150,GO:0008152,GO:0008691,GO:0008692,GO:0009056,GO:0009062,GO:0009404,GO:0009407,GO:0009410,GO:0009636,GO:0009850,GO:0009852,GO:0009987,GO:0010124,GO:0010817,GO:0016042,GO:0016054,GO:0016491,GO:0016614,GO:0016616,GO:0016829,GO:0016835,GO:0016836,GO:0016853,GO:0016854,GO:0016856,GO:0016860,GO:0016863,GO:0019395,GO:0019439,GO:0019748,GO:0019752,GO:0030258,GO:0032787,GO:0034440,GO:0042178,GO:0042221,GO:0042445,GO:0042447,GO:0042537,GO:0043436,GO:0044237,GO:0044238,GO:0044242,GO:0044248,GO:0044255,GO:0044281,GO:0044282,GO:0046395,GO:0050896,GO:0051716,GO:0055114,GO:0065007,GO:0065008,GO:0070887,GO:0071466,GO:0071704,GO:0072329,GO:0098754,GO:1901360,GO:1901361,GO:1901575 1.1.1.157,1.1.1.35,4.2.1.17,5.1.2.3,5.3.3.8 ko:K00074,ko:K01782,ko:K01825 ko00071,ko00280,ko00281,ko00310,ko00360,ko00362,ko00380,ko00410,ko00640,ko00650,ko00903,ko00930,ko01040,ko01100,ko01110,ko01120,ko01130,ko01200,ko01212,map00071,map00280,map00281,map00310,map00360,map00362,map00380,map00410,map00640,map00650,map00903,map00930,map01040,map01100,map01110,map01120,map01130,map01200,map01212 M00032,M00087 R01975,R01976,R03026,R03045,R03276,R04137,R04170,R04203,R04204,R04224,R04737,R04738,R04739,R04740,R04741,R04744,R04745,R04746,R04748,R04749,R04756,R05066,R05305,R05576,R06411,R06412,R06941,R06942,R07935,R07951,R08093,R08094 RC00029,RC00099,RC00117,RC00241,RC00525,RC00831,RC00834,RC00896,RC01078,RC01086,RC01095,RC01098,RC01103,RC01217,RC02115 ko00000,ko00001,ko00002,ko01000 iECO103_1326.ECO103_1532,iETEC_1333.ETEC_2476,iLF82_1304.LF82_0614,iNRG857_1313.NRG857_19200 Bacteria 1MU9P@1224,1RMZ8@1236,3XMBN@561,COG1024@1,COG1024@2,COG1250@1,COG1250@2 NA|NA|NA I Involved in the aerobic and anaerobic degradation of long-chain fatty acids via beta-oxidation cycle. 
Catalyzes the formation of 3-oxoacyl-CoA from enoyl-CoA via L-3-hydroxyacyl-CoA. It can also use D-3-hydroxyacyl-CoA and cis-3-enoyl-CoA as substrate
# 7 queries scanned
# Total time (seconds): 3.29501509666
# Rate: 2.12 q/s
14 changes: 14 additions & 0 deletions tests/numeric/betaox_genes.faa
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
>226
MMILSILATVVLLGALFYHRVSLFISSLILLAWTAALGVAGLWSAWVLVPLAIILVPFNFAPMRKSMISAPVFRGFRKVMPPMSRTEKEAIDAGTTWWEGDLFQGKPDWKKLHNYPQPRLTAEEQAFLDGPVEEACRMANDFQITHELADLPPELWAYLKEHRFFAMIIKKEYGGLEFSAYAQSRVLQKLSGVSGILAITVGVPNSLGPGELLQHYGTDEQKDHYLPRLARGQEIPCFALTSPEAGSDAGAIPDTGIVCMGEWQGQQVLGMRLTWNKRYITLAPIATVLGLAFKLSDPEKLLGGAEDLGITCALIPTTTPGVEIGRRHFPLNVPFQNGPTRGKDVFVPIDYIIGGPKMAGQGWRMLVECLSVGRGITLPSNSTGGVKSVALATGAYAHIRRQFKISIGKMEGIEEPLARIAGNAYVMDAAASLITYGIMLGEKPAVLSAIVKYHCTHRGQQSIIDAMDITGGKGIMLGQSNFLARAYQGAPIAITVEGANILTRSMMIFGQGAIRCHPYVLEEMEAAKNNDVNAFDKLLFKHIGHVGSNKVRSFWLGLTRGLTSSTPTGDATKRYYQHLNRLSANLALLSDVSMAVLGGSLKRRERISARLGDILSQLYLASAVLKRYDDEGRNEADLPLVHWGVQDALYQAEQAMDDLLQNFPNRVVAGLLNVVIFPTGRHYLAPSDKLDHKVAKILQVPNATRSRIGRGQYLTPSEHNPVGLLEEALVDVIAADPIHQRICKELGKNLPFTRLDELAHNALVKGLIDKDEAAILVKAEESRLRSINVDDFDPEELATKPVKLPEKVRKVEAA
>1781
MHPTGPHLGPDVLFRESNMKVTLTFNEQRRAAYRQQGLWGDASLADYWQQTARAMPDKIAVVDNHGASYTYSALDHAASCLANWMLAKGIESGDRIAFQLPGWCEFTVIYLACLKIGAVSVPLLPSWREAELVWVLNKCQAKMFFAPTLFKQTRPVDLILPLQNQLPQLQQIVGVDKLAPATSSLSLSQIIADNTSLTTAITTHGDELAAVLFTSGTEGLPKGVMLTHNNILASERAYCARLNLTWQDVFMMPAPLGHATGFLHGVTAPFLIGARSVLLDIFTPDACLALLEQQRCTCMLGATPFVYDLLNVLEKQPADLSALRFFLCGGTTIPKKVARECQQRGIKLLSVYGSTESSPHAVVNLDDPLSRFMHTDGYAAAGVEIKVVDDARKTLPPGCEGEEASRGPNVFMGYFDEPELTARALDEEGWYYSGDLCRMDEAGYIKITGRKKDIIVRGGENISSREVEDILLQHPKIHDACVVAMSDERLGERSCAYVVLKAPHHSLSLEEVVAFFSRKRVAKYKYPEHIVVIEKLPRTTSGKIQKFLLRKDIMRRLTQDVCEEIE
>1887
LKKVWLNRYPADVPTEINPDRYQSLVDMFEQSVARYADQPAFVNMGEVMTFRKLEERSRAFAAYLQQGLGLKKGDRVALMMPNLLQYPVALFGILRAGMIVVNVNPLYTPRELEHQLNDSGASAIVIVSNFAHTLEKVVDKTAVQHVILTRMGDQLSTAKGTVVNFVVKYIKRLVPKYHLPDAISFRSALHNGYRMQYVKPELVPEDLAFLQYTGGTTGVAKGAMLTHRNMLANLEQVNATYGPLLHPGKELVVTALPLYHIFALTINCLLFIELGGQNLLITNPRDIPGLVKELAKYPFTAITGVNTLFNALLNNKEFQQLDFSSLHLSAGGGMPVQQVVAERWVKLTGQYLLEGYGLTECAPLVSVNPYDIDYHSGSIGLPVPSTEAKLVDDDDNEVPPGQPGELCVKGPQVMLGYWQRPDATDEIIKNGWLHTGDIAVMDEEGFLRIVDRKKDMILVSGFNVYPNEIEDVVMQHPGVQEVAAVGVPSGSSGEAVKIFVVKKDPSLTEESLVTFCRRQLTGYKVPKLVEFRDELPKSNVGKILRRELRDEARGKVDNKA
>2441
MEMTSAFTLNVRLDNIAVITIDVPGEKMNTLKAEFASQVRAIIKQLRENKELRGVVFVSAKPDNFIAGADINMIGNCKTAQEAEALARQGQQLMAEIHALPIQVIAAIHGACLGGGLELALACHGRVCTDDPKTVLGLPEVQLGLLPGSGGTQRLPRLIGVSTALEMILTGKQLRAKQALKLGLVDDVVPHSILLEAAVELAKKERPSSRPLPVRERILAGPLGRALLFKMVGKKTEHKTQGNYPATERILEVVETGLAQGTSSGYDAEARAFGELAMTPQSQALRSIFFASTDVKKDPGSDAPPAPLNSVGILGGGLMGGGIAYVTACKAGIPVRIKDINPQGINHALKYSWDQLEGKVRRRHLKASERDKQLALISGTTDYRGFAHRDLIIEAVFENLELKQQMVAEVEQNCAAHTIFASNTSSLPIGDIAAHATRPEQVIGLHFFSPVEKMPLVEIIPHAGTSAQTIATTVKLAKKQGKTPIVVRDKAGFYVNRILAPYINEAIRMLTQGERVEHIDAALVKFGFPVGPIQLLDEVGIDTGTKIIPVLEAAYGERFSAPANVVSSILNDDRKGRKNGRGFYLYGQKGRKSKKQVDPAIYPLIGTQGQGRISAPQVAERCVMLMLNEAVRCVDEQVIRSVRDGDIGAVFGIGFPPFLGGPFRYIDSLGAGEVVAIMQRLATQYGSRFTPCERLVEMGARGESFWKTTATDLQ
>2442
MGQVLPLVTRQGDRIAIVSGLRTPFARQATAFHGIPAVDLGKMVVGELLARSEIPAEVIEQLVFGQVVQMPEAPNIAREIVLGTGMNVHTDAYSVSRACATSFQAVANVAESLMAGTIRAGIAGGADSSSVLPIGVSKKLARVLVDVNKARTMSQRLKLFSRLRLRDLMPVPPAVAEYSTGLRMGDTAEQMAKTYGITREQQDALAHRSHQRAAQAWSDGKLKEEVMTAFIPPYKQPLVEDNNIRGNSSLADYAKLRPAFDRKHGTVTAANSTPLTDGAAAVILMTESRAKELGLVPLGYLRSYAFTAIDVWQDMLLGPAWSTPLALERAGLTMSDLTLIDMHEAFAAQTLANIQLLGSERFAREALGRAHATGEVDDSKFNVLGGSIAYGHPFAATGARMITQTLHELRRRGGGFGLVTACAAGGLGAAMVLEAE
>3987
MEQVVIVDAIRTPMGRSKGGAFRNVRAEDLSAHLMRSLLARNPALEAAALDDIYWGCVQQTLEQGFNIARNAALLAEVPHSVPAVTVNRLCGSSMQALHDAARMIMTGDAQACLVGGVEHMGHVPMSHGVDFHPGLSRNVAKAAGMMGLTAEMLARMHGISREMQDAFAARSHARAWAATQSAAFKNEIIPTGGHDADGVLKQFNYDEVIRPETTVEALATLRPAFDPVNGMVTAGTSSALSDGAAAMLVMSESRAHELGLKPRARVRSMAVVGCDPSIMGYGPVPASKLALKKAGLSASDIGVFEMNEAFAAQILPCIKDLGLIEQIDEKINLNGGAIALGHPLGCSGARISTTLLNLMERKDVQFGLATMCIGLGQGIATVFERV
>3988
MLYKGDTLYLDWLEDGIAELVFDAPGSVNKLDTATVASLGEAIGVLEQQSDLKGLLLRSNKAAFIVGADITEFLSLFLVPEEQLSQWLHFANSVFNRLEDLPVPTIAAVNGYALGGGCECVLATDYRLATPDLRIGLPETKLGIMPGFGGSVRMPRMLGADSALEIIAAGKDVGADQALKIGLVDGVVKAEKLVEGAKAVLRQAINGDLDWKAKRQPKLEPLKLSKIEATMSFTIAKGMVAQTAGKHYPAPITAVKTIEAAARFGREEALNLENKSFVPLAHTNEARALVGIFLNDQYVKGKAKKLTKDVETPKQAAVLGAGIMGGGIAYQSAWKGVPVVMKDINDKSLTLGMTEAAKLLNKQLERGKIDGLKLAGVISTIHPTLDYAGFDRVDIVVEAVVENPKVKKAVLAETEQKVRQDTVLASNTSTIPISELANALERPENFCGMHFFNPVHRMPLVEIIRGEKSSDETIAKVVAWASKMGKTPIVVNDCPGFFVNRVLFPYFAGFSQLLRDGADFRKIDKVMEKQFGWPMGPAYLLDVVGIDTAHHAQAVMAAGFPQRMQKDYRDAIDALFDANRFGQKNGLGFWRYKEDSKGKPKKEEDAAVEDLLAEVSQPKRDFSEEEIIARMMIPMVNEVVRCLEEGIIATPAEADMALVYGLGFPPFHGGAFRWLDTLGSAKYLDMAQQYQHLGPLYEVPEGLRNKARHNEPYYPPVEPARPVGDLKTA
Loading

0 comments on commit 9025e08

Please sign in to comment.