cds/tools/chlorodb added
Former-commit-id: 0579e878a69b7c285ca71870e9ca5730649a2fda Former-commit-id: 7cced5b488441d87bf070a9a444317db0e048880
This commit is contained in:
@ -1,5 +1,7 @@
|
||||
#!/bin/csh -f
|
||||
|
||||
setenv Verbose 1
|
||||
|
||||
setenv ORG_HOME `dirname $0`/../../..
|
||||
source $ORG_HOME/scripts/csh_init.sh
|
||||
|
||||
@ -8,9 +10,9 @@ echo "+ testing CDS"
|
||||
setenv TMP_CLEANUP 0
|
||||
setenv PASS1_SPEEDUP 1
|
||||
setenv PASS1_SLOWDOWN 0
|
||||
setenv PASS1_BLASTX_FILTER_NBMAX 10
|
||||
setenv PASS1_BLASTX_FILTER_NBMAX 5
|
||||
|
||||
`dirname $0`/../bin/go_cds.sh test.fst > test.bak
|
||||
`dirname $0`/../bin/go_cds.sh test.fst test.db > test.bak
|
||||
|
||||
diff -q test.bak test.ref >& /dev/null
|
||||
|
||||
@ -18,7 +20,7 @@ set stat = $status
|
||||
|
||||
if ($stat == 0) then
|
||||
echo "+ $VTC[3]CDS test Ok$VTC[1]"
|
||||
\rm -r test.bak test.tmp
|
||||
\rm -r test.bak test.tmp test.db/*.fst.p??
|
||||
else
|
||||
echo "* $VTC[2]CDS test Failure$VTC[1]"
|
||||
endif
|
||||
|
18
detectors/cds/test/test.db/Annot.lst
Normal file
18
detectors/cds/test/test.db/Annot.lst
Normal file
@ -0,0 +1,18 @@
|
||||
atpf atpF 483 1:80_2:401_3:1_4:1 POLYEX ATP_synthase_CF0_B_subunit
|
||||
ccsa ccsA 477 1:476_2:1 POLYEX cytochrome_c_biogenesis_protein
|
||||
ndha ndhA 384 1:9_2:375 POLYEX NADH_dehydrogenase_subunit_1
|
||||
ndhb ndhB 699 1:5_2:693_3:1 POLYEX NADH_dehydrogenase_subunit_2
|
||||
ndhd ndhD 383 1:383 MONEX NADH_dehydrogenase_subunit_4
|
||||
ndhe ndhE 395 1:395 MONEX NADH_dehydrogenase_subunit_4L
|
||||
ndhf ndhF 384 1:384 MONEX NADH_dehydrogenase_subunit_5
|
||||
ndhg ndhG 386 1:386 MONEX NADH_dehydrogenase_subunit_6
|
||||
ndhh ndhH 406 1:400_2:6 POLYEX NADH_dehydrogenase_subunit_7
|
||||
ndhi ndhI 386 1:386 MONEX NADH_dehydrogenase_subunit_I
|
||||
psac psaC 498 1:491_2:4_3:3 POLYEX photosystem_I_subunit_VII
|
||||
rpl2 rpl2 800 1:101_2:698_5:1 POLYEX ribosomal_protein_L2
|
||||
rpl23 rpl23 787 1:782_2:2_3:1_4:2 POLYEX ribosomal_protein_L23
|
||||
rpl32 rpl32 474 1:474 MONEX ribosomal_protein_L32
|
||||
rps15 rps15 480 1:479_2:1 POLYEX ribosomal_protein_S15
|
||||
rps7 rps7 853 1:853 MONEX ribosomal_protein_S7
|
||||
ycf1 ycf1 408 1:406_2:2 POLYEX hypothetical_chloroplast_RF1
|
||||
ycf2 ycf2 654 1:649_2:5 POLYEX Ycf2
|
50
detectors/cds/test/test.db/atpf.fst
Normal file
50
detectors/cds/test/test.db/atpf.fst
Normal file
@ -0,0 +1,50 @@
|
||||
>AC_000188@LyesCp071@atpf@11803@13043@R@2@185 ATP_synthase_CF0_B_chain
|
||||
MKNVTDSFVSLGHWPSAGSFGFNTDILATNPINLSVVLGVLIFFGKGVLS
|
||||
DLLDNRKQRILNTIRNSEELRGGAIEQLEKARSRLRKVETEAEQFRVNGY
|
||||
SEIEREKLNLINSTYKTLEQLENYKNETIQFEQQRAINQVRQRVFQQALR
|
||||
GALGTLNSCLNNELHLRTISANIGMLGTMKEITD
|
||||
>NC_000925@PopuCp059@atpf@45392@45943@R@1@184 ATP_synthase_CF0_B_subunit
|
||||
MNSIVNITPIIIILSEHSSEHTFGFNSDIFEANVINILLLLFGLIYVLKQ
|
||||
SLGSTLNERQLKVLAAIQESEERLEQASSRLSESEKQLAQTQIIINQIKK
|
||||
EAQLTAEKVRSSILAQGQIDIERLAITGKSNIETAEKQIRRQIQQQIAFL
|
||||
ALKKVTLQLENQMSSDIQLRIIDNNIAKLGDQL
|
||||
>NC_000926@GuthCp075@atpf@65505@66053@R@1@183 ATP_synthase_CF0_B_subunit
|
||||
MDIISGFYNTINLAELSNAKTFGFNPNILEANVLNIAILLSGVIYLGRNF
|
||||
LTSALESRQQKVTEAIQEAEERLQQANVKLLDAEKQLTQAQTVIEQIKKE
|
||||
AEKTARTVKETILAQGKLDIERLTNNGKSSIEKAELQIKKQIQQHITDLA
|
||||
IKKVSAQMETFMTDNLQVKVIDTNIASLGGKI
|
||||
>NC_000927@NeolCp025@atpf@19121@19651@R@1@177 ATP_synthase_CF0_B_chain
|
||||
MFHFLALTPLAHSEGFGLNTNILETNILNLAAVFALLAYVGTDFVSSLLK
|
||||
TRKESILKSLRDADERYQDAVNQLKQALQELETARTNAAEIRRQSEINAE
|
||||
AIRQRLELLTQEEMARLEEAKETIIKLEEEKAVAEVCTKVISMALVRAEK
|
||||
KIISSMDEAMHRRVMDMYLNLLREVY
|
||||
>NC_000932@ArthCp008@atpf@11529@12798@R@2@185 ATP_synthase_CF0_B_subunit
|
||||
MKNLTDSFVYLGHWPSAGSFGFNTDILATNPINLSVVFGVLIFFGKGVLN
|
||||
DLLDNRKQRILNTIRNSEELREGAIQQLENARARLRNVETEADKFRVNGY
|
||||
SEIEREKLNLINSTYKTLKQLENYKNETILFEQQRTINQVRERVFQQALQ
|
||||
GAIGTLNSCLSNELHLRTINANIGMFGTMKEITD
|
||||
>NC_001319@MapoCp012@atpf@18468@19609@D@2@185 ATP_synthase_CF0_B_subunit
|
||||
MENGTYFIISSNFWTIAGSFGLNTNLLETNLINLGVVLGLLVYFGKGVLS
|
||||
NLLNNRKLTILNTIQDAEERYKEATDKLNQARTRLQQAKQKADDIRINGL
|
||||
SQMEKEKQDLINAADEDSKRLEDSKNATIRFEKQRAIEQVRQQVSRLALE
|
||||
RALETLKSRLNSELHLRMIDYHIGLLRAMESTIE
|
||||
>NC_001320@OrsajCp021@atpf@32741@34111@D@2@181 ATP_synthase_CF0_B_subunit
|
||||
MKNVTHSFVFLAHWPSAGSFGLNTDILATNLINLTVVVGVLIYFGKGVLK
|
||||
DLLDNRKQRILSTIRNSEELRRGTIEQLEKARIRLQKVELEADEYRMNGY
|
||||
SEIEREKANLINATSISLEQLEKSKNETLYFEKQRAMNQVRQRVFQQAVQ
|
||||
GALGTLNSCLNTELHFRTIRANISILGAME
|
||||
>NC_001603@EugrCp038@atpf@64813@66970@D@4@184 ATP_synthase_CF0_B_chain
|
||||
MVIDNFNIFTIISNAKTFGINTNVFETNIINLAIVVGTLFYYGKLTLSDL
|
||||
LKTRKKTIIKNILDIDEKIRSSQSSLYLAELEFENAAKKASLIRSNGTTF
|
||||
CLKSFDIIRSSVNEDIKRLKQSKRLILRTEDKKSVREIFKNLYSQACQKA
|
||||
KATIIKRLNSKIHKKIILKKMEKMSLKKLKPKY
|
||||
>NC_001631@PithCp015@atpf@11663@12972@R@2@185 ATP_synthase_CF0_B_subunit
|
||||
MKNVIDPFISLSYWPSAGGFGSNTNILETNIINSSVVLSVLIYFGKGVLS
|
||||
NLLDNRKQKILETIRNSEELCKGAIDQLEKARACLRNVEMIADEIQVNGN
|
||||
SQIEREKEDLLNTASDNLEQLEDPKNETIYSEQQRAFDQIRQQVSRQALR
|
||||
RAIGTLNSRLNTELHLRTIDHNIGLLRTMMNTND
|
||||
>NC_001666@ZemaCp019@atpf@35097@36479@D@2@184 ATP_synthase_CF0_B_subunit
|
||||
MKNVTHSFVFLAHWPFAGSFGLNTDILATNLINLTVVVGVLIFFGKGVLK
|
||||
DLLDNRKQRILSTIRNSEELRKGTLEQLEKARIRLQKVELEADEYRMNGY
|
||||
SEIEREKENLINATSISLEQLEKSKNETLYFEKQRAMNQVRQQGFQQAVQ
|
||||
GALGTLNSCLNTELHFRTIRANIGILGAIEWKR
|
78
detectors/cds/test/test.db/ccsa.fst
Normal file
78
detectors/cds/test/test.db/ccsa.fst
Normal file
@ -0,0 +1,78 @@
|
||||
>AC_000188@LyesCp084@ccsa@115765@116706@D@1@314 cytochrome_c_biogenesis_protein
|
||||
MIFSTLEHILTHISFSIVSIVITIHLITFLVDEIVKLYDSSEKGIIVTFF
|
||||
CITGLLVTRWVSSGHFPLSDLYESLIFLSWSFSLIHIIPYFKKNVLILSK
|
||||
ITGPSAILTQGFATSGILTEIHQSGILVPALQSEWLIMHVSMMILGYAAL
|
||||
LCGSLLSVALLVITFRKNRKLFSKSNVFLNESFFLGENVVENTSFFCTKN
|
||||
YYRSQLIQQLDYWSYRVISLGFTFLTIGILSGAVWANEAWGSYWNWDPKE
|
||||
TWAFITWIVFAIYLHTRTNRNLRGPNSAIVASIGFLIIWICYFGVNLLGI
|
||||
GLHSYGSFPSTFN
|
||||
>NC_000925@PopuCp184@ccsa@160407@161366@D@1@320 cytochrome_c_biogenesis_protein
|
||||
MNLEMMQNSCVNFAFGGLLTAMLVYWSSLAFPRISGLNKLAALITLLVNI
|
||||
ALALTLSSRWFANGYFPLSNLYESLLFLAWGLTFVHLFIESKTKSRLIGA
|
||||
VSIPVAMFVTAFASLALPIEMQKASPLVPALKSNWLMMHVSIMMISYSIL
|
||||
ILGSLLSILFLIITRGQDINLKGSSVGTGSYTVKSLDSNPSFAFSNPSGI
|
||||
VQEQSNMLINSTRMNLLESIDNLSYRIIGLGFPLLTIGIVAGAVWANEAW
|
||||
GSYWSWDPKETWALITWLIFAAYLHCRITKSWQGKRPAILASVGFLVVWI
|
||||
CYLGVNFLGKGLHSYGWLA
|
||||
>NC_000926@GuthCp037@ccsa@33657@34562@R@1@302 cytochrome_c_biogenesis_protein
|
||||
MFNVQFDIFNFSNNITFLTLLISLISYWLGLIFKKIKNVFYIGYGSTILA
|
||||
CITITIILGTRWIESGYFPLSNLYESLMFLTWGLLFSAIYLEYKTNLYLI
|
||||
GAIVSPISLFIVSFSTLSLPQDMQKAAPLVPALKSNWLMMHVSVMMLSYS
|
||||
TLIIGSLLAILYLVLIKAQQKKHSLKDFAFANLEFTFPKSTNSTNFNLLE
|
||||
TLDNLSYRTIGFGFPLLTIGIIAGAVWANEAWGTYWSWDPKETWALITWL
|
||||
VFAAYLHARITKSWTGERPAYLAALGFVVVWICYLGVNFLGKGLHSYGWL
|
||||
N
|
||||
>NC_000927@NeolCp108@ccsa@128438@129259@D@1@274 cytochrome_c_biogenesis_protein
|
||||
MSTFSILSLVAFATLFVTMLLYFFQRQPLARQSMWIAHTSLAGLLLLRWV
|
||||
QSGHFPLSNLYESCLFLSWAVTLGHFVVEKDASRAGFLDLGIFTAPMAFF
|
||||
VYAFATFSLPPTMQEAGPLVPALRSHWLMMHVTLMILSYAALLFGSVLSL
|
||||
AFLVITTGPRKNSEKLQSLASTFDTLSYRTLGIGFPLLTVGILSGAVWAN
|
||||
EAWGSYWSWDPKETWALITWLIFAIYLHSRLTYGWNGQKAALIASVGFFL
|
||||
IWICYLGVNLLGKGLHSYGWLTS
|
||||
>NC_000927@NeolCp129@ccsa@163667@164488@R@1@274 cytochrome_c_biogenesis_protein
|
||||
MSTFSILSLVAFATLFVTMLLYFFQRQPLARQSMWIAHTSLAGLLLLRWV
|
||||
QSGHFPLSNLYESCLFLSWAVTLGHFVVEKDASRAGFLDLGIFTAPMAFF
|
||||
VYAFATFSLPPTMQEAGPLVPALRSHWLMMHVTLMILSYAALLFGSVLSL
|
||||
AFLVITTGPRKNSEKLQSLASTFDTLSYRTLGIGFPLLTVGILSGAVWAN
|
||||
EAWGSYWSWDPKETWALITWLIFAIYLHSRLTYGWNGQKAALIASVGFFL
|
||||
IWICYLGVNLLGKGLHSYGWLTS
|
||||
>NC_000932@ArthCp073@ccsa@114461@115447@D@1@329 cytochrome_c_biogenesis_protein
|
||||
MIFSILEHILTHISFSVVSIVLTIYFLTLLVNLDEIIGFFDSSDKGIIIT
|
||||
FFGITGLLLTRWIYSGHFPLSNLYESLIFLSWAFSIIHMVSYFNKKQQNK
|
||||
LNTITAPSVIFIQGFATSGLLNKMPQSAILVPALQSQWLMMHVSMMILGY
|
||||
GALLCGSLLSIALLVITFRKVGPTFWKKNIKKNFLLNELFSFDVLYYINE
|
||||
RNSILLQQNINFSFSRNYYRYQLIQQLDFWSFRIISLGFIFLTVGILSGA
|
||||
VWANETWGSYWNWDPKETWAFITWTIFAIYLHIKTNRNVRGINSAIVALI
|
||||
GFILIWICYFGVNLLGIGLHSYGSFTSN
|
||||
>NC_001319@MapoCp078@ccsa@95482@96444@D@1@321 cytochrome_c_biogenesis_protein
|
||||
MPFITLERILAHTSFFLLFFVTFIYWGKFLYINIKPITILGEISMKIACF
|
||||
FITTFLLIRWSSSGHFPLSNLYESSMFLSWSFTLIHLILENKSKNTWLGI
|
||||
ITAPSAMLTHGFATLSLPKEMQESVFLVPALQSHWLMMHVTMMMLSYSTL
|
||||
LCGSLLAITILIITLTKQKNLPILTSYFNFPFNSFIFKNLLQPMENEILS
|
||||
YKTQKVFSFINFRKWQLIKELDNWSYRVISLGFPLLTIGILSGAVWANEA
|
||||
WGSYWNWDPKETWALITWLIFAIYLHTRMIKGWQGKKPAIIASLGFFIVW
|
||||
ICYLGVNLLGKGLHSYGWLI
|
||||
>NC_001320@OrsajCp087@ccsa@105236@106201@D@1@322 cytochrome_c_biogenesis_protein
|
||||
MLFATLEHILTHISFSTISIVITIHLITLLVRELGGLRDSSEKGMIATFF
|
||||
CITGFLVSRWASSGHFPLSNLYESLIFLSWALYILHMIPKIQNSKNDLST
|
||||
ITTPSTILTQGFATSGLLTEMHQSTILVPALQSQWLMMHVSMMLLSYATL
|
||||
LCGSLLSAALLMIRFRKNLDFFSKKKKNVLSKTFFFNEIEYFYAKRSALK
|
||||
STFFPLFPNYYKYQLIERLDSWSYRVISLGFTLLTIGILCGAVWANEAWG
|
||||
SYWNWDPKETWAFITWTIFAIYLHSRTNPNWKGTKSAFVASIGFLIIWIC
|
||||
YFGINLLGIGLHSYGSFTLPI
|
||||
>NC_001631@PithCp147@ccsa@104925@105887@R@1@321 cytochrome_c_biogenesis_protein
|
||||
MIFITLEHILAHISFSLILVVTLIYWGTLVYRIEGLSSSGGKGMIVTFLC
|
||||
TTGLLINRWLYSGHLPLSNLYESFMFLSWSSSVFHILLEVRSRDDRWLGA
|
||||
ITAPSAMLTHGFATLGLPEEMQRSGMLVPALQSHWSMMHVSMILFSYATL
|
||||
LCGSLASIALLVIMSGVNRQVIFGAMDNLFSRAILPNENFYSHEKQKSDL
|
||||
QYTVYFSSTNYRKCQLIKQLDHWSYRAIGLGFSLSTIGTLSGAIWANEAW
|
||||
GSYWSWDPKETWALITWTIFAIYLHTRMNKGWQGEEPAIVASLGFFIVWI
|
||||
RYLGVNLLGIGLHSYGWLEP
|
||||
>NC_001666@ZemaCp085@ccsa@108995@109960@D@1@322 cytochrome_c_biogenesis_protein
|
||||
MLFATLEHILTHISFSTISIVITIHLITLLVRELRGLRDSSEKGMIATFF
|
||||
SITGFLVSRWVSSGHFPLSNLYESLIFLSWTLYILHTIPKIQNSKNDLST
|
||||
ITTPSTILTQGFATSGLLTEMHQSTILVPALQSQWLMMHVSMMLLSYATL
|
||||
LCGSLLSAALLIIRFRKNFDFFSLKKNVFLKTFFFSEIEYLYAKRSALKN
|
||||
TSFPVFPNYYKYQLTERLDSWSYRVISLGFTLLTVGILCGAVWANEAWGS
|
||||
YWNWDPKETWAFITWTIFAIYLHSRKNPNWKGTNSALVASIGFLIIWICY
|
||||
FGINLLGIGLHSYGSFTLPSK
|
90
detectors/cds/test/test.db/ndha.fst
Normal file
90
detectors/cds/test/test.db/ndha.fst
Normal file
@ -0,0 +1,90 @@
|
||||
>AC_000188@LyesCp085@ndha@121113@123337@R@2@364 NADH_dehydrogenase_subunit_1
|
||||
MIIDTTEIETINSFSKLESLKEVYGIIWMLVPIVTLVLGITIGVLVIVWL
|
||||
EREISAGIQQRIGPEYAGPLGILQALADGTKLLLKENLIPSTGDTRLFSI
|
||||
GPSIAVISIFLSYSVIPFGDHLVLADLSIGVFFWIAISSIAPVGLLMSGY
|
||||
GSNNKYSFLGGLRAAAQSISYEIPLALCVLSISLLSNSLSTVDIVEAQSK
|
||||
YGFWGWNLWRQPIGFIVFLISSLAECERLPFDLPEAEEELVAGYQTEYSG
|
||||
IKFGLFYIASYLNLLVSSLFVTVLYLGGWNLSIPYIFVPDIFGINKGGKV
|
||||
FGTLIGIFITLAKTYLFLFIPIATRWTLPRLRMDQLLNLGWKFLLPISLG
|
||||
NLLLTTSSQLLSL
|
||||
>NC_000927@NeolCp116@ndha@144380@145468@D@1@363 NADH_dehydrogenase_subunit_1
|
||||
MTYVLDLKRSFLDACTWLIGDNFRDLGSVLWVPLPILSLVIVATLGVLVI
|
||||
VWLERKISAGVQQRVGPEYGGALGLLQPLADGLKLVFKEDVVPAKSDTWL
|
||||
FTLGPAVVVIPIFLAYLVVPFGQQLIIADLRIGIFFWIAISSIAPIGLLM
|
||||
SGYGSNNKYSFLGGLRAAAQSISYELPLAICVLSVCLLADSLSTVDIVES
|
||||
QSSWGILTWNIWRQPIGFVAFLIAALAECERLPFDLPEAEEELVAGYQTE
|
||||
YTGMKFGLFYVGSYVNLLVSGCFVTVLYLGGWHGPFAIDGILPDSPPFQV
|
||||
LDAFLGITWTLLKTFLFLFAAILTRWTLPRVRIDQLLDLGWKFLLPVSLG
|
||||
NLLLTASLKLLF
|
||||
>NC_000932@ArthCp079@ndha@119847@122009@R@2@361 NADH_dehydrogenase_subunit_1
|
||||
MIIYATAVQTINSFVKLESLKEVYGLIWIFVPIFSLVLGIITGVLVIVWL
|
||||
EREISAGIQQRIGPEYAGPLGILQALADGTKLLFKENLRPSRGNTPLFSI
|
||||
GPSIAVISILLSYSVIPFSNHLVLADLNIGIFLWIAISSIAPIGLLMSGY
|
||||
GSNNKYSFLGGLRAAAQSISYEIPLTLCVLSISLLSNSLSTVDIVEAQSK
|
||||
YGFWGWNLWRQPIGFIIFLISSLAECERLPFDLPEAEEELIAGYQTEYSG
|
||||
IKFGLFYVASYLNLLISSLFVTVLYLGGWNISIPYISILELFQRDQIFGT
|
||||
TIGIFITLAKTYLFLFVSIATRWTLPRLRMDQLLNLGWKFLLPISLGNLL
|
||||
LTTSFQLFSL
|
||||
>NC_001319@MapoCp084@ndha@100382@102200@R@2@369 NADH_dehydrogenase_subunit_1
|
||||
MISNINLEDKFFSFFFTLGFSKEFFNFLWIIFSILILMLGVTIGVLVLVW
|
||||
LERKISAAIQQRIGPEYAGPLGIIQALADGIKLFLKEDIVPAQGDVWLFN
|
||||
IGPILVLIPVFLSYLVIPFEYNVILANFSIGVFFWIAVSSVVPLGLLMAG
|
||||
YGSNNKYSFLGGLRAAAQSISYEIPLALSVLSIALLSNSLSTVDIVEAQS
|
||||
KYGFLSWNLWRQPIGFIVFFIASLAECERLPFDLPEAEEELVAGYQTEYS
|
||||
GMKFAFFYLASYLNLLVSSLFVTILYLGGWHFSIPFFSLFKNFEWNLMSN
|
||||
GISEVISIIIGIVITLVKSYLFLFISIMTRWTLPRIRIDQLLNLGWKFLL
|
||||
PIALGNLLLTTSFQLFLL
|
||||
>NC_001320@OrsajCp093@ndha@110631@112706@R@2@363 NADH_dehydrogenase_subunit_1
|
||||
MIIDRVQVEAINSFSNLELLKEVYGLIWILPILTLLLGITIEVLVIVWLE
|
||||
REISASIQQRIGPEYAGPLGLLQAIADGTKLLFKEDILPSRGDIPLFSIG
|
||||
PSIAVISILLSFLVIPLGYRFVLADLSIGVFLWIAISSIAPIGLLMAGYS
|
||||
SNNKYSFSGGLRAAAQSISYEIPLTFCVLAISLLSNSSSTVDIVEAQSKY
|
||||
GFFGWNLWRQPIGFLVFLISSLAECERLPFDLPEAEEELVAGYQTEYSGI
|
||||
KYGLFYLVSYLNLLVSSLFVTVLYLGGWNLSIPYISFFGFFQMNKMVGIL
|
||||
EMTMSIFITLTKAYLFLFISITIRWTLPRMRMDQLLNLGWKFLLPISLGN
|
||||
LLLTTSSQLVSL
|
||||
>NC_001666@ZemaCp091@ndha@114343@116454@R@2@363 NADH_dehydrogenase_subunit_1
|
||||
MIIDRVEVETINSFSKSELFKEIYGLIWILPIFALLLGITIEVLVIVWLE
|
||||
REISASIQQRIGPEYAGPLGLLQAIADGTKLLLKEDILPSRGDIPLFSIG
|
||||
PSIAVISILLSFLVIPLGYRFVLADLSIGVFLWIAISSIAPIGLLMAGYS
|
||||
SNNKYSFSGGLRAAAQSISYEIPLTFCVLAISLLSNSSSTVDIVEAQSKY
|
||||
GFFGWNLWRQPIGFLVFLISSLAECERLPFDLPEAEEELVAGYQTEYSGI
|
||||
KYGLFYLVSYLNLLVSSLFVTVLYLGGWNFSIPYISFFGFFQMNKIIGIL
|
||||
EMVIGIFITLTKAYLFLFISITIRWTLPRMRMDQLLNLGWKFLLPISLGN
|
||||
LLLTTSSQLVSL
|
||||
>NC_001879@NitaCp088@ndha@121696@123935@R@2@364 NADH_dehydrogenase_subunit_1
|
||||
MIIDTTEIETINSFSKLESLKEVYGIIWMLFPILTLVLGITIGVLVIVWL
|
||||
EREISAGIQQRIGPEYAGPLGILQALADGTKLLLKENLIPSTGDTRLFSI
|
||||
GPSIAVISIFLSYSVIPFGDHLVLADLSIGVFFWIAISSIAPVGLLMSGY
|
||||
GSNNKYSFLGGLRAAAQSISYEIPLALCVLSISLLSNSLSTVDIVEAQSK
|
||||
YGFWGWNLWRQPIGFIVFLISSLAECERLPFDLPEAEEELVAGYQTEYSG
|
||||
IKFGLFYIASYLNLLVSSLFVTVLYLGGWNLSIPYIFVPELFGINKRGKV
|
||||
FGTLIGIFITLAKTYLFLFIPIATRWTLPRLRMDQLLNLGWKFLLPISLG
|
||||
NLLLTTSSQLLSL
|
||||
>NC_002186@MeviCp102@ndha@106489@107592@R@1@368 NADH_dehydrogenase_subunit_1
|
||||
MLLTINLKDSFLTFFSNLGFSNEFSKALWIPLPILLLIILAVVGVLVVVW
|
||||
LERKISAAVQQRIGPEYAGPLGVLQPLADGLKLAFKEDIIPSKGDVLLFT
|
||||
LGPAIVVIPIFLSYLIVPFGENLIVSNINLGIFFWITVSSVAPLGLLMSG
|
||||
YGSNNKYSFLGGLRATAQSLSYEIPLALCVLSICLLSDSLSTIDIVQKQS
|
||||
TYGILGWNIWRQPIGFIAFIIAALAECERLPFDLPEAEEELVAGYQTEYT
|
||||
GMKFGLFYIGSYVNLLVSALFASVLYLGGWSLPIPIEFLLNKMSLNASDS
|
||||
EVQVISAFLGIGMTLLKTYLFLFLSILTRWTMPRVRIDQLLDLGWKFLLP
|
||||
ISLGNLLLTASLKIALL
|
||||
>NC_002202@SpolCp090@ndha@117598@119774@R@2@366 NADH_dehydrogenase_subunit_1
|
||||
MIIDTTTTKVQAINSFSRLEFLKEVYETIWMLFPILILVLGITIGVLVIV
|
||||
WLEREISASIQQRIGPEYAGPLGILQALADGTKLLFKENLLPSRGDTYLF
|
||||
SIGPSIAVISILLGYLIIPFGSRLVLADLSIGVFLWIAVSSIAPIGLLMS
|
||||
GYGSNNKYSFLGGLRAAAQSISYEIPLTLCVLSISLLSNSSSTVDIVEAQ
|
||||
SKYGFWGWNLWRQPIGFIVFIISSLAECERLPFDLPEAEEELVAGYQTEY
|
||||
SGIKFGLFYVASYLNLLISSLFVTVLYLGGWNLSIPYIFISEFFEINKID
|
||||
GVFGTTIGIFITLAKTFLFLFIPITTRWTLPRLRMDQLLNLGWKFLLPIS
|
||||
LGNLLLTTSSQLFSL
|
||||
>NC_002693@OeelhCp102@ndha@125123@127258@R@2@364 NADH_dehydrogenase_subunit_1
|
||||
MIIDTTAVQDMNSFSRLQSLKEVSGIIWMLVPILSLVLGITLGVLVIVWL
|
||||
EREISAGIQQRIGPEYAGPMGILQALADGIKLIFKENLLPSRGDTRLFSI
|
||||
GPSIAVISILLSYSVIPFSSHLVLSDLNIGVFLWIAVSSIAPIGLLMSGY
|
||||
GSNNKYSFLGGLRAAAQSISYEIPLTLCLLSISLLSNSSSTVDIVEAQSK
|
||||
YGLWGWNLWRQPIGFLVFLISSLAECERLPFDLPEAEEELVAGYQTEYSG
|
||||
IKFGLFYVASYLNLLVSSLFVTVLYLGGWNISISYIFVPGLFEITKVGRV
|
||||
FGTTIGIFTTLAKTYLFLFISITTRWTLPRLRMDQLLNLGWKFLLPISLG
|
||||
NLLLTTSSQLLSL
|
120
detectors/cds/test/test.db/ndhb.fst
Normal file
120
detectors/cds/test/test.db/ndhb.fst
Normal file
@ -0,0 +1,120 @@
|
||||
>AC_000188@LyesCp066@ndhb@96224@98435@R@2@511 NADH_dehydrogenase_subunit_2
|
||||
MIWHVQNENFILDSTRIFMKAFHLLLFDGSLIFPECILIFGLILLLMIDS
|
||||
TSDQKDIPWLYFISSTSLVMSITALLFRWREEPMISFSGNFQTNNFNEIF
|
||||
QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI
|
||||
TIFVAPECFSLCSYLLSGYTKKDVRSNEATMKYLLMGGASSSILVHGFSW
|
||||
LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGIGFKLSPAPSH
|
||||
QWTPDVYEGSPTPVVAFLSVTSKVAASASATRIFNIPFYFSSNEWHLLLE
|
||||
ILAILSMILGNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS
|
||||
MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL
|
||||
CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVLIGLLTSVVSIYYYLKI
|
||||
IKLLMTGRNQEITPHVRNYRRSPLRSNNSIELSMIVCVIASTIPGISMNP
|
||||
IIAIAQDSLF
|
||||
>AC_000188@LyesCp086@ndhb@142909@145120@D@2@511 NADH_dehydrogenase_subunit_2
|
||||
MIWHVQNENFILDSTRIFMKAFHLLLFDGSLIFPECILIFGLILLLMIDS
|
||||
TSDQKDIPWLYFISSTSLVMSITALLFRWREEPMISFSGNFQTNNFNEIF
|
||||
QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI
|
||||
TIFVAPECFSLCSYLLSGYTKKDVRSNEATMKYLLMGGASSSILVHGFSW
|
||||
LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGIGFKLSPAPSH
|
||||
QWTPDVYEGSPTPVVAFLSVTSKVAASASATRIFNIPFYFSSNEWHLLLE
|
||||
ILAILSMILGNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS
|
||||
MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL
|
||||
CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVLIGLLTSVVSIYYYLKI
|
||||
IKLLMTGRNQEITPHVRNYRRSPLRSNNSIELSMIVCVIASTIPGISMNP
|
||||
IIAIAQDSLF
|
||||
>NC_000927@NeolCp033@ndhb@28430@29950@D@1@507 NADH_dehydrogenase_subunit_2
|
||||
MELSDILASFHASNLIPEGIVACTILLVLLLDLVYSRTCHAWLAWVAMAG
|
||||
LSLASVLLGQQWYQLMNLPTATMTFGGSFQADSLSLVFRAIIAMSCVLCI
|
||||
LLSIDYVESTGTAPSEFLVLIATASLGGMLVAGSNDLLMMFVSLETLGLA
|
||||
SYLLTGYMKRDVRSNEASLKYLLVGAASSGLFLYGISWMYGISGGHMELN
|
||||
SIAHAIVSLDETKTTTCALALVLMTVGVGFKVAAAPFHQWTPDVYQGSPT
|
||||
PVVAFLSVGSKAAGFILAVRMCTTLFPSFNTEWHLIFTILSILSMIVGNF
|
||||
IAVTQTSLKRMLGYSSVGQAGVMMIGMLTDSPDGYASLIVYLLIYLFMNL
|
||||
GAFACVILFGLRTGTDQIQDYSGLLARDPFLALCLSLCLLSLGGIPPLAG
|
||||
FFGKMYLFLAAWDAGQYSLVWVGLITSVVSIYYYLSVVKIMLVPATQEMS
|
||||
LAVREYPRRAWSLEPIQPLEVGIFVCVLGSILVGVAGNSMVNLMTITMSQ
|
||||
APSLGV
|
||||
>NC_000932@ArthCp068@ndhb@94941@97164@R@2@513 NADH_dehydrogenase_subunit_2
|
||||
MIWHVQNENFILDSTRIFMKAFHLLLFDGSFIFPECILIFGLILLLMIDS
|
||||
TSDQKDIPWLYFISSTSFVMSITALLFRWREEPMISFSGNFQTNNFNEIF
|
||||
QFLILLCSTLCIPLSVEYIECTEMAITEFLLFILTATLGGMFLCGANDLI
|
||||
TIFVAPECFSLCSYLLSGYTKKDIRSNEATMKYLLMGGASSSILVHGFSW
|
||||
LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGIGFKLSLAPSH
|
||||
QWTPDVYEGSPTPVVAFLSVTSKVAASASATRIFDIPFYFSSNEWHLLLE
|
||||
ILAILSMIFGNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNGGYAS
|
||||
MITYMLFYIAMNLGTFACIILFGLRTGTDNIRDYAGLYTKDPFLALSLAL
|
||||
CLLSLGGLPPLAGFFGKLHLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI
|
||||
IKLLMTGRNQEITPHMRNYRISPLRSNNSIELSMIVCVIASTIPGISMNP
|
||||
IIAIAQDTLFSF
|
||||
>NC_000932@ArthCp086@ndhb@141485@143708@D@2@513 NADH_dehydrogenase_subunit_2
|
||||
MIWHVQNENFILDSTRIFMKAFHLLLFDGSFIFPECILIFGLILLLMIDS
|
||||
TSDQKDIPWLYFISSTSFVMSITALLFRWREEPMISFSGNFQTNNFNEIF
|
||||
QFLILLCSTLCIPLSVEYIECTEMAITEFLLFILTATLGGMFLCGANDLI
|
||||
TIFVAPECFSLCSYLLSGYTKKDIRSNEATMKYLLMGGASSSILVHGFSW
|
||||
LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGIGFKLSLAPSH
|
||||
QWTPDVYEGSPTPVVAFLSVTSKVAASASATRIFDIPFYFSSNEWHLLLE
|
||||
ILAILSMIFGNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNGGYAS
|
||||
MITYMLFYIAMNLGTFACIILFGLRTGTDNIRDYAGLYTKDPFLALSLAL
|
||||
CLLSLGGLPPLAGFFGKLHLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI
|
||||
IKLLMTGRNQEITPHMRNYRISPLRSNNSIELSMIVCVIASTIPGISMNP
|
||||
IIAIAQDTLFSF
|
||||
>NC_001319@MapoCp003@ndhb@1514@3555@D@2@502 NADH_dehydrogenase_subunit_2
|
||||
MKLELDMFFLYGSTILPECILIFSLLIILIIDLTFPKKDTIWLYFISLTS
|
||||
LLISIIILLFQYKTDPIISFLGSFQTDSFNRIFQSFIVFCSILCIPLSIE
|
||||
YIKCAKMAIPEFLIFILTATVGGMFLCGANDLVTIFVSLECLSLCSYLLC
|
||||
GYTKRDIRSNEAAIKYLLIGGTSSSILAYGFSWLYGLSGGETNIQKITNG
|
||||
LLNAETYNSSGTFIAFICILVGLAFKLSLVPFHQWTPDIYEGSPTPVVAF
|
||||
LSVTSKIAGLALATRILNILFSFSPNEWKIFLEILAILSMILGNLVAITQ
|
||||
TSMKRMLAYSSISQIGYILIGLITGDLKGYTSMTIYVFFYIFMNLGTFAC
|
||||
IILYSLRTGTDNIRDYAGLYIKDPLLSFSLTLCLLSLGGLPPLTGFFGKL
|
||||
YLFWCGWQSGFYLLVFIALITSVISLYYYLKIIKLILTKKNNEINPYIQA
|
||||
YIITSPTFFSKNPIEFVMIFCVLGSTFLGIIINPIFSFFQDSLSLSVFFI
|
||||
K
|
||||
>NC_001320@OrsajCp075@ndhb@85395@87639@R@2@511 NADH_dehydrogenase_subunit_2
|
||||
MIWHVQNENFILDSTRIFMKAFHLLLFQGSFIFPECILIFGLILLLMIDL
|
||||
TSDQKDRPWFYFISSTSLVISITALLFRWREEPIISFSGNFQTNNFNEIF
|
||||
QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI
|
||||
TIFVAPECFSLCSYLLSGYTKRDLRSNEATMKYLLMGGASSSILVHGFSW
|
||||
LYGSSGGEIELQEIVNGLINTQMYNSPGISIALISITVGLGFKLSPAPFH
|
||||
QWTPDVYEGSPTPVVAFLSVTSKVAASASATRILDIPFYFSSNEWHLLLE
|
||||
ILAILSMILGNLLAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS
|
||||
MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL
|
||||
CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI
|
||||
VKLLMTGRNQEITPYVRNYRRSPLRSNNSIELSMTVCVIASTIPGISMNP
|
||||
ILAIAQDTLF
|
||||
>NC_001320@OrsajCp104@ndhb@127479@129723@D@2@511 NADH_dehydrogenase_subunit_2
|
||||
MIWHVQNENFILDSTRIFMKAFHLLLFQGSFIFPECILIFGLILLLMIDL
|
||||
TSDQKDRPWFYFISSTSLVISITALLFRWREEPIISFSGNFQTNNFNEIF
|
||||
QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI
|
||||
TIFVAPECFSLCSYLLSGYTKRDLRSNEATMKYLLMGGASSSILVHGFSW
|
||||
LYGSSGGEIELQEIVNGLINTQMYNSPGISIALISITVGLGFKLSPAPFH
|
||||
QWTPDVYEGSPTPVVAFLSVTSKVAASASATRILDIPFYFSSNEWHLLLE
|
||||
ILAILSMILGNLLAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS
|
||||
MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL
|
||||
CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI
|
||||
VKLLMTGRNQEITPYVRNYRRSPLRSNNSIELSMTVCVIASTIPGISMNP
|
||||
ILAIAQDTLF
|
||||
>NC_001666@ZemaCp075@ndhb@89236@91472@R@2@511 NADH_dehydrogenase_subunit_2
|
||||
MIWHVQNENFILDSTRIFMKAFHLLLFHGSFIFPECILIFGLILLLMIDL
|
||||
TSDQKDRPWFYFISSTSLVISITALLFRWREEPIISFSGNFQTNNFNEIF
|
||||
QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI
|
||||
TIFVAPECFSLCSYLLSGYTKRDLRSNEATMKYLLMGGASSSILVHGFSW
|
||||
LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGLGFKLSPAPFH
|
||||
QWTPDVYEGSPTPVVAFLSVTSKVAASALATRILDIPFYFSSNEWHLLLE
|
||||
ILAILSMILGNLLAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS
|
||||
MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL
|
||||
CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI
|
||||
IKLLMTGRNQEITPYVRNYRRSPLRSNNSIELSMTVCVIASTIPGISMNP
|
||||
ILAIAQDTLF
|
||||
>NC_001666@ZemaCp101@ndhb@131265@133501@D@2@511 NADH_dehydrogenase_subunit_2
|
||||
MIWHVQNENFILDSTRIFMKAFHLLLFHGSFIFPECILIFGLILLLMIDL
|
||||
TSDQKDRPWFYFISSTSLVISITALLFRWREEPIISFSGNFQTNNFNEIF
|
||||
QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI
|
||||
TIFVAPECFSLCSYLLSGYTKRDLRSNEATMKYLLMGGASSSILVHGFSW
|
||||
LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGLGFKLSPAPFH
|
||||
QWTPDVYEGSPTPVVAFLSVTSKVAASALATRILDIPFYFSSNEWHLLLE
|
||||
ILAILSMILGNLLAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS
|
||||
MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL
|
||||
CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI
|
||||
IKLLMTGRNQEITPYVRNYRRSPLRSNNSIELSMTVCVIASTIPGISMNP
|
||||
ILAIAQDTLF
|
113
detectors/cds/test/test.db/ndhd.fst
Normal file
113
detectors/cds/test/test.db/ndhd.fst
Normal file
@ -0,0 +1,113 @@
|
||||
>AC_000188@LyesCp081@ndhd@116944@118446@R@1@501 NADH_dehydrogenase_subunit_4
|
||||
MNYFPWLTIIVVFPIFAGSLIFFLPHKGNRVIRWYTICICILELLLTTYA
|
||||
FCYHFQSDDPLIQLVEDYKWIDFFDFHWRLGIDGLSIGPILLTGFITTLA
|
||||
TLAAWPVTRDSRLFHFLMLAMYSGQIGLFSSRDLLLFFIMWELELIPVYL
|
||||
LLAMWGGKKRLYSATKFILYTAGGSVFLLMGVLGVALYGSNEPTLNFETS
|
||||
VNQSYPVVLEIIFYIGFFIAFAVKSPIIPLHTWLPDTHGEAHYSTCMLLA
|
||||
GILLKMGAYGLIRINMELLPHAHSIFSPWLMIIGTIQIIYAASTSLGQRN
|
||||
LKKRIAYSSVSHMGFIIIGISSLTDTGLNGALLQIISHGFIGAALFFLAG
|
||||
TTYDRIRLVYLDEMGGIAIPMPKMFTMFSSFSMASLALPGMSGFVAELIV
|
||||
FFGIITGQKYLLMPKLLITFVMAIGIILTPIYSLSMPRQMFYGYKLFNAP
|
||||
KDSFFDSGPRELFLSISIFLPVIGIGIYPDFVLSLAVDKVEVILSNFFYR
|
||||
>NC_000927@NeolCp113@ndhd@139299@140801@D@1@501 NADH_dehydrogenase_subunit_4
|
||||
MTHFPWLSTIVLFPLLASLAIPWLPDRKGTTVRWYALGVGLIDFSLIAYM
|
||||
FGRYYDFEQTSLQFVEDITWIDRLHLHWSLGVDGLSMPLVLLTGFITTLA
|
||||
TLAAWPVTKNPRLFYFLMLAMYTGQLGVFVVQDLLLFFLMWELELIPVYL
|
||||
LVSCWGGKKRLYAATKFILYTALGSIFILLGALTMPFMGIQGVTFDMSTL
|
||||
AYREYSLPVEILLYTGFLIAYGVKLPAIPVHTWLPDTHGEAHYSTCMLLA
|
||||
GILLKMGGYALIRINMNMLPHAHALFSPWLIGVGVVNIIYAALTSFAQRN
|
||||
LKRKIAYSSVSHMGFVLIGIGSLSEAGLNGAMLQMISHGLIGASLFFLAG
|
||||
TTYDRTRTLVLEEMGGLATFMPKTFALFTACSLASLALPGMSGFFAELLV
|
||||
FLGLVTSEAYSPTFRAIMTVFEAIGILLTPIYLLSMLRQLFYGRSIGRPK
|
||||
ALIDAGPREVFVVSCLLVPILGIGIYPKLATAIYVNTTDHVVQHVLSALR
|
||||
>NC_000932@ArthCp074@ndhd@115665@117167@R@1@501 NADH_dehydrogenase_subunit_4
|
||||
MNDFPWLTIIVVFPISAGSLMLFLPHRGNKVNKWYTICICILELLLTTYA
|
||||
FCYNFKMDDPLIQLSEDYKWIDFFDFYWRMGIDGLSIGTILLTGFITTLA
|
||||
TLAAFPVTRDSRFFHFLMLAMYSGQIGSFSSRDLLLFFIMWELELIPVYL
|
||||
LLSMWGGKKRLYSATKFILYTAGSSIFLLIGVLGISLYGSNEPTLNLELL
|
||||
ANKSYPVTLEILFYIGFLIAFAVKSPIIPLHTWLPDTHGEAHYSTCMLLA
|
||||
GILLKMGAYGLVRINMELLPHAHSMFSPWLLVVGTIQIIYAASTSPGQRN
|
||||
LKKRIAYSSVSHMGFIIIGISSITDPGLNGAILQIISHGFIGAALFFLAG
|
||||
TSYDRIRLVYLDEMGGMAISIPKIFTMFTILSMASLALPGMSGFIAEFIV
|
||||
FFGIITSQKYFLISKIFIIFVMAIGMILTPIYLLSMLRQMFYGYKLINIK
|
||||
NFSFFDSGPRELFLSISILLPIIGIGIYPDFVLSLASDKVESILSNYFYG
|
||||
>NC_001319@MapoCp079@ndhd@96665@98164@R@1@500 NADH_dehydrogenase_subunit_4
|
||||
MNHFPWLTIIVLFPISAGLVIPFLPSTGNKIIRWYTLGVCLLEFLLITYI
|
||||
FCYHYQFNDHLIQLKEDYNWISFINFHWRLGIDGFSIGLILLTGFITTLA
|
||||
TLAAWPVTRNPRLFYFLMLAMYSGQIGLFASQDILLFFFMWELELLPVYL
|
||||
LLAMWGGKRRLYAATKFILYTAAGSLFILIGGLIMAFYNSNEFTFDFQFL
|
||||
INKKYPLELEIIIYLSFLIAYAVKLPIIPFHTWLPDTHGEAHYSTCMLLA
|
||||
GILLKMGAYGLIRINMELLPHAHSFFAPWLVIVGAIQIVYAALTSLSQRN
|
||||
LKRRIAYSSVSHMGFVLIGIGSITNLGLNGAILQMISHGLIGASLFFLAG
|
||||
ISYDRTRTLVLDQMGGIGNSMPKIFTLFTSCSMASLALPGMSGFIAELMI
|
||||
FLGVIDNPNYSSLFKIIIIIIQGIGIILTPIYLLSMLRQMFYGYKFSNTL
|
||||
EPYFMDAGPREIFILICLFFPIISIGIYPNFVLSIWNSKVNFLLSNNFF
|
||||
>NC_001320@OrsajCp088@ndhd@106398@107900@R@1@501 NADH_dehydrogenase_subunit_4
|
||||
MSSFPWLTILVVLPIFAGSLIFFLPHRGNKIVRWYTMSICLLEFLLMTYA
|
||||
FCYHFQLEDPLIQLKEDSKWIDVFNFHWRLGIDGLSLGSILLTGFMTTLA
|
||||
TLAAWPVTRNSRLFYFLMLAMYSGQIGLFSSRDLLLFFIMWELELIPVYL
|
||||
LLSMWGGKRRLYSATKFILYTAGGSIFFLIGVLGMGLYGSNEPRLDLERL
|
||||
INQSYPATLEILFYFGFLIAYAVKLPIIPLHTWLPDTHGEAHYSTCMLLA
|
||||
GILLKMGAYGLIRINMELLPHAHYLFSPWLVIIGAMQIIYAASTSLGQRN
|
||||
FKKRIAYSSVSHMGFIIIGIGSITNIGLNGAILQILSHGFIGATLFFLAG
|
||||
TACDRMRLVYLEELGGASIPMPKIFTMFSSFSMASLALPGMSGFVAELVV
|
||||
FFGLITSPKFLLMPKMLITFVMAIGMILTPIYLLSMLRQMFYGYKLFHVP
|
||||
NENFEDSGPRELFLLICIFLPVIGIGIYPDFVLSLSVDRVEALLSNYYPK
|
||||
>NC_001666@ZemaCp086@ndhd@110138@111640@R@1@501 NADH_dehydrogenase_subunit_4
|
||||
MSYFPWLTILVVLPIFAGSLIFFLPHKGNKIVRWYTIAICLLEFLLMTYA
|
||||
FCYHFQLEDPLIQLKEDSKWIDVFDFHWRLGIDPLSLGSILLTGFITTLA
|
||||
TLAAWPVTRNSQLFYFLMLAMYSGQIGLFSSRDLLLFFIMWELELIPVYL
|
||||
LLSMWGGKRRLYSATKFILYTAGGSIFFLIGVLGMGLYGSNEPGLDLERL
|
||||
INQSYPTTWEILLYFGFLIAYAVKLPIIPLHTWLPYTHGEAHYSTCMLLA
|
||||
GILLKMGAYGLIRVNMELLPHAHYLFSPWLVIIGAVQIIYAASTSLGQRN
|
||||
FKKRIAYSSVSHMGFIIIGIGSITNIGLNGAILQILSHGFIGATLFFLAG
|
||||
TACDRMRLVYLEELGGISIPMPKIFTMFSSFSMASLALPGMSGFVAELVV
|
||||
FFGLITSPKFMLMPKMLITFVMAIGMILTPIYLLSMLRQMFYGYKLFHVP
|
||||
NKNFVDSGPRELFLLICIFLPVIGIGIYPDLVLSLSVDRVEVLLSNYYTK
|
||||
>NC_001879@NitaCp083@ndhd@117525@119027@R@1@501 NADH_dehydrogenase_subunit_4
|
||||
MNYFPWLTIIVVFPIFAGSLIFFLPHKGNRVIRWYTICICILELLLTTYA
|
||||
FCYHFQSDDPLIQLVEDYKWINFFDFHWRLGIDGLSIGPILLTGFITTLA
|
||||
TLAAWPVTRDSRLFHFLMLAMYSGQIGSFSSRDLLLFFIMWELELIPVYL
|
||||
LLCMWGGKKRLYSATKFILYTAGGSVFLLMGVLGLALYGSNEPTLNFETS
|
||||
VNQSYPVVLEIIFYIGFFIAFAVKSPIIPLHTWLPDTHGEAHYSTCMLLA
|
||||
GILLKMGAYGLIRINMELLPHAHSIFSPWLMIIGTIQIIYAALTSLGQRN
|
||||
LKKRIAYSSVSHMGFIIIGISSLTDTGLNGALLQIISHGFIGAALFFLAG
|
||||
TTYDRIRLVYLDEMGGIAIPMPKMFTMFSSFSMASLALPGMSGFVAELIV
|
||||
FFGIITGQKYLLIPKILITFVMAIGMILTPIYSLSMSRQMFYGYKLFNAP
|
||||
KDSFFDSGPRELFLSISIFLPVIGIGIYPDFVLSLAVDKVEVILSNFFYR
|
||||
>NC_002186@MeviCp085@ndhd@90277@91800@D@1@508 NADH_dehydrogenase_subunit_4
|
||||
MNNFPWITSIVMLPILAGLLIPFIPDENGKNVRWYALGIGLLDFLLISYI
|
||||
FGYKYNIQDTSLQLIDDYEWISSINFHWRLGIDGLSIPLILLTGFITTLA
|
||||
MLGAWPIQKNAKLFYFLMLAMYSGQLGVFASQDLLLFFLMWELELIPIYI
|
||||
LLIIWGGKKRLYAATKFILYTALGSIFILIAAFGMAFYGENMSFDMQILG
|
||||
EKEYPINLEILFYICFLIAYAVKLPAFPVHTWLPDTHGEAHYSTCMLLAG
|
||||
ILLKMGGYALIRINMNMLPNAHIYFAPYLAIIGVINIIYAALTSFAQRNI
|
||||
KRKIAYSSISHMGFVLIGISSFTDIGLSGAMLQMVSHGLIGASLFFLAGT
|
||||
TYDRTRTLILEDMGGIAKYMPKIFAMFTTCSLASLALPGMSGFVAELMVF
|
||||
LGFANSNAYSIEFRGIITFLEAIGIIVTPIYLLSMLRQVFYGSENLKLLK
|
||||
VNNLIDASAREIFIISCLLVPVIGIGIYPRILTQIYDLKTNAIIEHLEII
|
||||
RSNSQIM
|
||||
>NC_002202@SpolCp085@ndhd@113491@114996@R@1@502 NADH_dehydrogenase_subunit_4
|
||||
MTNSFPWLTTIVVLPIFAGSLIFLFPHRGNKVIRWYTICISMIELLLMTY
|
||||
VFFYHFQPDDPLIQLVEDYKWINFFDFHWRLGIDGLSIGPILLTGFITTL
|
||||
ATLAAWPVTRNSQLFHFLMLAMYSAQIGLFSSRDLLLFFIMWELELIPVY
|
||||
LLLSMWGGKKRLYSATKFILYTAGGSIFLLMGVLGVGLYGSNEPTLNLET
|
||||
LVNQSYPVALEIIFYIGFFIAFAVKLPIIPLHTWLPDTHGEAHYSTCMLL
|
||||
AGILLKMGAYGLVRINMELLPHAHSIFSPWLMIIGTMQIIYAASTSPGQR
|
||||
NLKKRIAYSSVSHMGFIIIGISSITDTGLNGAILQIISHGFIGAALFFLA
|
||||
GTSYDRIRLVYLDEMGGIAIPMPKIFTLFSSFSMASLALPGMSGFIAELI
|
||||
VFFGLITSQKYLLIPKLLITFGMAIGMILTPIYLLSMSRQMFYGYKLFNI
|
||||
SNSSFFDSGPRELFVSTSIFLPVIGIGVYPDLVLSLSVEKVEAILSNYFY
|
||||
R
|
||||
>NC_002693@OeelhCp097@ndhd@121124@122647@R@1@508 NADH_dehydrogenase_subunit_4
|
||||
MNSFPWLTIIVVFPILTGSLIFLLPHRGNKVMKWYTLCICILELLLTTYT
|
||||
FCYHFQLDDPLTQLTENYKWIHFFDFYWRLGIDGLSIGPILLTGFITTLA
|
||||
TLAAWPVTRDAQLFHFLMLAMYSGQIGSFSSRDLLLFFLMWEFELIPVYL
|
||||
LLSMWGGKKRLYSATKFILYTAGGSIFLLIGVLGIGLYGSNEPTLNFETL
|
||||
ANQSYPVALEVIFYVGFLIAFAVKLPIIPFHTWLPDTHGEAHYSTCMLLA
|
||||
GILLKMGAYGLVRINMELLPHAHCLFSPGLIIVGAIQIIYAASTSPGQLN
|
||||
LKKRIAYSSISHMGFIIIGIGSLSDTGLNGAILQIISHGFIGAALFFLAG
|
||||
TSYDRIRLLYLDEMGGMAIPLPKLFTMLSILSMASLALPGLSGFVAELLV
|
||||
FFGIITSQKYLLMPKILIAFLMAIGMILTPIYSLSMLRQMFYGYKLFNVP
|
||||
NYYFFDSGPRELFVSISLLLPIIGIGIYPDFVLSLSVEKVEAIISHFFFS
|
||||
IVFKKKE
|
39
detectors/cds/test/test.db/ndhe.fst
Normal file
39
detectors/cds/test/test.db/ndhe.fst
Normal file
@ -0,0 +1,39 @@
|
||||
>AC_000188@LyesCp080@ndhe@119061@119366@R@1@102 NADH_dehydrogenase_subunit_4
|
||||
MILEHVLVLSAYLFSIGIYGLITSRNMVRALMCLELILNAVNINFVTFSD
|
||||
FFDNRQLKGDIFSIFVIAIAAAEAAIGLAIVSSIYRNRKSTRINQSNLLN
|
||||
N
|
||||
>NC_000927@NeolCp119@ndhe@147326@147631@D@1@102 NADH_dehydrogenase_subunit_4L
|
||||
MIFQSYLLIAASMFCIGLYGLLTSRNVVRVLMSLELLLNAVNLNLLTFSN
|
||||
FVDSHEMKGQVLALFVIALAAAEAAIGLAIILSIYRNQRTVDPEQFNLLK
|
||||
W
|
||||
>NC_000932@ArthCp076@ndhe@117804@118109@R@1@102 NADH_dehydrogenase_subunit_4L
|
||||
MILEHVLVLSAYLFLIGLYGLITSRNMVRALMCLELILNAVNMNFVTFSD
|
||||
FFDNSQLKGEIFCIFVIAIAAAEAAIGLAIVSSIYRNRKSIRINQSTLLN
|
||||
K
|
||||
>NC_001319@MapoCp081@ndhe@98757@99059@R@1@101 NADH_dehydrogenase_subunit_4L
|
||||
MLEHILTLSAFLFCIGVFGLITSRNMVRALMCLELIFNAVNINLVAFSNF
|
||||
LDSSQIKGEIFSIFIIAIAAAEATIGLAIVLAIYRNRKSTRIDQFNLLKW
|
||||
>NC_001320@OrsajCp090@ndhe@108712@109017@R@1@102 NADH_dehydrogenase_subunit_4L
|
||||
MMFEHVLFLSVYLFSIGIYGLITSRNMVRALICLELILNSINLNLVTFSD
|
||||
LFDSRQLKGDIFAIFVIALAAAEAAIGLSILSSIHRNRKSTRINQSNFLN
|
||||
N
|
||||
>NC_001666@ZemaCp088@ndhe@112473@112778@R@1@102 NADH_dehydrogenase_subunit_4L
|
||||
MMFERVLFLSVYLFSIGIYGLITSRNMVRALICLELILNSINLNLVTFSD
|
||||
LFDSRQLKGDIFAIFVIALAAAEAAIGLSILSSIHRNRKSTRINQSNFLN
|
||||
N
|
||||
>NC_001879@NitaCp085@ndhe@119652@119957@R@1@102 NADH_dehydrogenase_subunit_4L
|
||||
MILEHVLVLSAYLFSIGIYGLITSRNMVRALMCLELILNAVNINFVTFSD
|
||||
FFDNRQLKGDIFSIFVIAIAAAEAAIGLAIVSSIYRNRKSTRINQSNLLN
|
||||
N
|
||||
>NC_002186@MeviCp099@ndhe@104916@105221@R@1@102 NADH_dehydrogenase_subunit_4L
|
||||
MYIENFLLLASALFCIGIYGLLTSRNIVRVLMCLELCLNAININFIAFSN
|
||||
FIDYEKINGQVIAIFIMTIAAAEAAIGLALVLTIYRNRETVDIENFDLLK
|
||||
G
|
||||
>NC_002202@SpolCp087@ndhe@115663@115968@R@1@102 NADH_dehydrogenase_subunit_4L
|
||||
MILEHVLVLSAFLFSIGIYGLVTSRNLVRALMCLELILNAVNLNFVTFSD
|
||||
FFDSRQLKGNIFSIFVIAIAAAEAAIGPAIVSSIYRNRKSIRINQSNLLN
|
||||
K
|
||||
>NC_002693@OeelhCp099@ndhe@123298@123603@R@1@102 NADH_dehydrogenase_subunit_4L
|
||||
MILEHVLVLSAYLFSIGIYGLITSRNMVRALMCLELILNSVNLNFVTFSD
|
||||
FFDSRQLKGDIFSIFIIAIAAAEAAIGLAIVSSIYRNRKSIRINQSNLLN
|
||||
K
|
157
detectors/cds/test/test.db/ndhf.fst
Normal file
157
detectors/cds/test/test.db/ndhf.fst
Normal file
@ -0,0 +1,157 @@
|
||||
>AC_000188@LyesCp073@ndhf@111508@113721@R@1@738 NADH_dehydrogenase_subunit_5
|
||||
MEQTYEYAWIIPFIPLPVPMLIGAGLILFPTATKRFRRMWAFQSVLLLSI
|
||||
VMIFSIYLSIQQINSSSVYQYVWSWIINNDFSLDFGYLIDPLTSIMSILI
|
||||
TTVGIMVLIYSDNYMAHDQGYLRFFAYMSFFSTSMLGLVTSSNLIQIYIF
|
||||
WELVGLCSYLLIGFWFTRPVAANACQKAFVTNRVGDFGLLLGILGFYWIT
|
||||
GSFEFRDLFEIFNNLIYNNELNFLFVTLCAVLLFAGAVAKSAQFPLHVWL
|
||||
PDAMEGPTPISALIHAATMVAAGIFLVARLLPLFRVIPYIMYLISVIGII
|
||||
TVLLGATLALAQKDIKRGLAYSTMSQLGYMMLALGMGSYRSALFHLITHA
|
||||
YSKALLFLGSGSIIHSMETIVGYSPAKSQNMGLMGGLRKHVPITKITFLL
|
||||
GTLSLCGIPPLACFWSKDEILNDSWLYSPIFAIIAWATAGLTAFYMFRIY
|
||||
LLTFEGHLNAHFQNYGGKQKIPFYSISLWGKNGVKKNSCLLTMNNNESTY
|
||||
FLSKTKYPIAKNGRKMTRPFMTIAHFKHKAVSSYPYESDNTMLFPIFVLG
|
||||
LFTLFVGAIGIPFNQEGVNLDILSKWLAPSINLLHPKSNNSLDWNEFLKD
|
||||
AVVSVSIAYFGIFIASFLYKPIYSSLKNLEFINSFVKKGPKRILWDKILN
|
||||
GIYDWSYNRAYIDAFYTRFFVGGIRGLAEFTHFVDRRVIDGMTNGVGVIS
|
||||
FIVGEGIKYIGGGRISSYLFLYLAYVSVFLLVYYLLF
|
||||
>NC_000927@NeolCp114@ndhf@140837@142783@R@1@649 NADH_dehydrogenase_subunit_5
|
||||
MEIFHQAIWLIPVLPLSASMLSGIGLLTFRETTSDLRRLHGALAIGAMAL
|
||||
SFVVSLGVLWNQLHGIAPVRWIIEWMLTDTFRLEIGYWVDPLTSTMLVVV
|
||||
TSVALLVMIYSDEYMHVDEGYVRFFVYLSIFTTSMLGLVLSPNLVQVYGF
|
||||
WELVGMCSYLLVGFWFTRPTAAEASQKAFITNRVGDFGLLLGILALYWMT
|
||||
GSFEFASIADRLGDLLIAIPSLRTIACIACILVFMGPIAKSAQFPLHVWL
|
||||
PDAMEGPTPISALIHAATMVAAGVFLVARMFPVFDQLPLVMELIAWTGTL
|
||||
TAFLGATMALTQSDIKKGLAYSTMSQLGYMIMALGTGAYSEALFHLTTHA
|
||||
YSKALLFLAAGSVIHGMEPVVGFSPMQNQNMHRMGGLRKYMPLTAMTFLL
|
||||
GTCSICGIPPLACFWSKDAILAEVFATHPTCWLIAWLTAGMTGFYMFRIY
|
||||
FLTFEGSFRSDLGRAKPKESHLGMVAPLIILAIPTVAIGSLGTPFAPVWE
|
||||
TFVHAPGQLSSLDEEFDLAEFLEMAGSSVGIGLLGISLSSLMYRNYAIDA
|
||||
TRISEYFSPLNRLFASKWYIDDLYAQVIVQGTRTIAQTLLIFDQRIIDGA
|
||||
VNLTAFGTLSAADTLKYWENGRVQFYILSIIFGVLFGSWLLTTHLSSL
|
||||
>NC_000932@ArthCp071@ndhf@110398@112638@R@1@747 NADH_dehydrogenase_subunit_5
|
||||
MEHTYQYSWIIPFIPLPVPILLGVGLLLFPTATKNLRRMWTFLSIFLLSI
|
||||
VMIFSIYLSIQQIFLSCIHQNVWSWTINNEFSFEFGYFIDPLTSIMSILI
|
||||
TTVGILVLIYSDNYMSHDQGYLRFFAYMGFFNTSMLGLVTSSNLIQVYFF
|
||||
WELVGMCSYLLIGFWFTRPIAANACQKAFVTNRVGDFGLLLGILGLYWIT
|
||||
GSFEFQDLFEIFNNLILNNRVNLLFLTLCAFLLFVGPIAKSAQFPLHVWL
|
||||
PDAMEGPTPISALIHAATMVAAGIFLVARLLPLFIVIPSIMYIISLIGII
|
||||
TVLLGATLALAQKDIKRGLAYSTMSQLGYMMLALGMGSYRSALFHLITHA
|
||||
YSKALLFLGSGSIIHSMEAIVGYSPDKSQNMILMGGLTKHVPITKTAFLI
|
||||
GTLSLCGIPPLACFWSKDEILNDSLLFSPIFAIIACSTAGLTAFYMFRIY
|
||||
LLTFEGHLNTYFLNYSGKKSGSFYSLSLWGKEEEKKLNKNFGLVPLLTMN
|
||||
NTKRASFFCNKTYKISNNVRNQIFITVENFGLNTRTFYYPHESDNTILFP
|
||||
MLILVLFTLFIGAIGIPFNQEGIDFDILSKFFTPSINLLHKNSQNFVDWY
|
||||
EFLRNATFSVSIAFFGIFIAYCLYKPFYSSLLNLTLLNSFQKWNSKRIHW
|
||||
EKLINFVYNWSYNRGYIDSFFKTSLIESIRRLAKQTTFFDKRIIDGITNG
|
||||
VGITSFFVGEVTKYIGGSRISSYLFLYLSYVLIFLMILFFFYFEKF
|
||||
>NC_001319@MapoCp074@ndhf@91101@93179@R@1@693 NADH_dehydrogenase_subunit_5
|
||||
MELIFQNVWFVPLFPFLASILLGIGLFFFPNSIKKFRRLSSFISIMFLNI
|
||||
AMLLSFHFFWQQITGSPIHRYLWSWVLYKNFVLEIGYLLDPLTSIMLVLV
|
||||
TTVAVMVMIYSDSYMFYDEGYIKFFCYLSLFTASMLGLVLSPNLIQVYIF
|
||||
WELVGMCSYLLIGFWFTRPSAANACQKAFVTNRIGDFGLLLGILGFYWIT
|
||||
GSFDFQQLSKRFFELLSYNQINLVFATLCALFLFLGPVAKSAQFPLHIWL
|
||||
PDAMEGPTPISALIHAATMVAAGIFLVARMFPLFQMLPFVMSIISWTGAI
|
||||
TALLGATIALAQKDLKKGLAYSTMSQLGYMMLALGIGSYKAGLFHLITHA
|
||||
YSKALLFLGSGSVIHSMEPIVGYHPNKSQNMIFMGGLRQYMPITAITFLF
|
||||
GTLSLCGIPPFACFWSKDEILVNSWLHFPILGSIAFFTAGLTAFYMFRIY
|
||||
FLTFEGDFRGHFFDDVKKLSSISIWGSLEFNKEQFKLDKKSTLYPKEANN
|
||||
IMLFPLIILTIPTVFIGFIGILFDENKMNVDSLSYWLTLSINSFNYSNSE
|
||||
KFLEFLFNAIPSVSIAFFGILIAFYLYGPNFSFLKKEKKKLQLKSEIDIV
|
||||
LKSFSNFIYNWSYYRAYIDGFYSSFFIKGLRFLIKIVSFIDRWIIDGIIN
|
||||
GIGIFSFFGGESLKYIEGGRISSYLFFIIFCMFLFFLYSYII
|
||||
>NC_001320@OrsajCp085@ndhf@101433@103637@R@1@735 NADH_dehydrogenase_subunit_5
|
||||
MEHTYQYAWVIPLLPLPVIMSMGFGLFLVPTATKNLRRIWAFPSVLLLSI
|
||||
AMVFSVHLSIQQINGSSIYQYLWSWTVNNDFSLEFGYLIDPLTSIMLILI
|
||||
TTVGILVLIYSDDYMSHDEGYLRFFVYISFFNTSMLGLVTSSNLIQIYFF
|
||||
WELVGMCSYLLIGFWFTRPIAASACQKAFVTNRVGDFGLLLGILGFFWIT
|
||||
GSLEFRDLFKIANNWIPNNEINSLLTILCAFLLFLGAVAKSAQFPLHVWL
|
||||
PDAMEGPTPISALIHATTMVAAGIFLIARLLPLFISLPLIMSFISLIGTL
|
||||
TLFLGATLALAQRDIKRSLAYSTMSQLGYMMLALGIGSYQAALFHLITHA
|
||||
YSKALLFLGSGSVIHSMEPLVGYSPDKSQNMVLMGGLRKYIPITRTCFLW
|
||||
GTLSLCGIPPLACFWSKDEILSNSWLYSPFFGIIASFTAGLTAFYMFRIY
|
||||
LLTFDGYLRVHFQNYSSTKEDSLYSISLWGKRISKGVNRDFVLSTAKSGV
|
||||
SFFSQNLSKIHVNTGNRIGSFSTSLGTKNTFVYPHEPGNTMLFPLLILLL
|
||||
CTLFIGSIGIHFDNEIGELTILSKWLTPSINFFQESSNSSINSYEFITNA
|
||||
ISSVSLAIFGLFIGIYVLWICLLFFSEFDLINSFVKGGPKKYFFHQLKKK
|
||||
IYSWSYNRGYIDIFYTRTFTLGIRGLTELTQFFDKGVIDGITNGVGLASF
|
||||
CIGEEIKYVGGGRISSYLFFFLCYVSVFLFFFLS
|
||||
>NC_001666@ZemaCp083@ndhf@105072@107288@R@1@739 NADH_dehydrogenase_subunit_5
|
||||
MEHTYQYAWVIPLLPLPVIMSMGFGLFLIPTATKNLRRIWAFPSILLLSI
|
||||
AMVFSLHLSIQQINGSSIYQYLWSWTINNDFSLEFGYLVDPLTSIMLILI
|
||||
TTVGILVLIYSDDYMSHDEGYLRFFVYISFFNTSMLGLVTSSNLIQIYFF
|
||||
WELVGMCSYLLIGFWFTRPIAASACQKAFVTNRVGDFGLLLGILGFFWIT
|
||||
GSLEFRDLFKIANNWIPNNGINSLLTTLCAFLLFLGAVAKSAQFPLHVWL
|
||||
PDAMEGPTPISALIHAATMVAAGIFLLARLLPLFISLPWIMSFISLIGTI
|
||||
TLFLGATLALAQRDIKRSLAYSTMSQLGYMMLALGIGSYQAALFHLITHA
|
||||
YSKALLFLGSGSVIHSMEPLVGYSPDKSQNMVLMGGLRKYVPITRTTFLC
|
||||
GTLSLCGIPPLACFWSKDEILSNSWLYSPFFGIIASFTAGLTAFYMFRIY
|
||||
LLTFDGYLRVHFQNYSSTKEGSLYSISLWGKSISKGVNRDFVLSTMKSGV
|
||||
SFFSQNIPKIPANTRNKIGSFSTPFGAKNTFVYPHETGNTMLFPLLILLL
|
||||
FTLFIGSIGIHFDNGVKDNRILELTILSKWLTPSINLFQENSNSSINSYE
|
||||
FLTNAISSVSLAIFGLFIAYIFYGSAYSFFQNLNFQNSLVKKNPKKSFLD
|
||||
EVKKKIYSWSYNRGYIDFFYTRVFILGIRKLAELTHFFDKGVIDGITNGV
|
||||
GLAGFCIGEEIKYVGGGRISSYLFFFLCYVSLFLFFIP
|
||||
>NC_001879@NitaCp080@ndhf@112072@114294@R@1@741 NADH_dehydrogenase_subunit_5
|
||||
MEQTYEYAWIIPFIPLPVPMLIGAGLFLFPTATKSFRRMWAFQSVLLLSI
|
||||
VMVFSIYLSIQQINSSSFYQYVWSWIINNDFSLDFGYLIDPLTSIMSILI
|
||||
TTVGIMVLIYSDNYMAHDQGYLRFFAYMSFFSTSMLGLVTSSNLIQIYIF
|
||||
WELVGLCSYLLIGFWFTRPVAANACQKAFVTNRVGDFGLLLGILGFYWIT
|
||||
GSFEFRDLFEIFNNLIYNNEVDFLFVTLCAVLLFAGAVAKSAQFPLHVWL
|
||||
PDAMEGPTPISALIHAATMVAAGIFLVARLLPLFRVIPYIMYLISVIGII
|
||||
TVLLGATLALAQKDIKRGLAYSTMSQLGYMMLALGMGSYRSALFHLITHA
|
||||
YSKALLFLGSGSIIHSMETIVGYSPAKSQNMGLMGGLRKHVPISKITFLL
|
||||
GTLSLCGIPPLACFWSKDEILNDSWLYSPIFAIIAWATAGLTAFYMFRIY
|
||||
LLTFEGHLNAHFPNYGGKQKTPFYSISLWGKNGVKKNSCLLTMNNNESTY
|
||||
FFAKTKYPIDKNGRKMTRPFMTIAHFEHKAVYSYPYESDNTMLFPIFVLG
|
||||
LFTLFVGSIGIPFNQEGGNLDILSKWLAPSINLLHQKSNNSMDWNEFLKD
|
||||
AVLSVSIAYFGIFIASFLYKPIYSSLKNFELINSFVKKGPKRILWDKIIN
|
||||
GIYDWSYNRAYIDAFYTRFLVGGIRGLAEFTHFFDRRVIDGMTNGVGVIS
|
||||
FIVGEGIKYIGGGRISSYLFLYLAYVSIFLLVYYLLFSTL
|
||||
>NC_002186@MeviCp105@ndhf@109803@111761@D@1@653 NADH_dehydrogenase_subunit_5
|
||||
MESISQYAWLIPIFPLAGSLLIGIGLISFRRATNILRWRYSFLIIALLGI
|
||||
SLILSCLILFSQINATPSYQWIFQWIVTNNFLLEIGYFVDPLTAVMLVIV
|
||||
TTVAILVLIYTDGYMSYDEGYVRFFAYLSLFTTSMLGLVLSPNLLQIYVF
|
||||
WELVGMCSYLLIGFWFTRPAAADACQKAFVTNRVGDFGLLLGILGFYWMT
|
||||
GSFEFDVISMKLLQLAEYDNFNTQLAIFFGFLIFLGPVAKSAQFPLHVWL
|
||||
PDAMEGPTPISALIHAATMVAAGVFLVARMFPIFSQFPFLMDLIAWTGAI
|
||||
TAIIGATIAVTQVDLKKGLAYSTMSQLGYMIMAMGMGSYTASLFHLMTHA
|
||||
YSKALLFLSAGSTIHGMEPIVGFNPAKNQNMSLMGGIRKYMPITGNAFLI
|
||||
GTLSLCGIPPLACFWSKDAILSNAFVHSPLLWFIGWSTAGLTSFYMFRMY
|
||||
FLVFEGEFRGNSVNQEKIRSNKLPKESNTKMTLPLIILTLFSITIGWIGT
|
||||
PFNNQFMFLIHTINQEIEPFDINEFLFIAGSSVGIALLGCYTAYLIYIKD
|
||||
KNTDKFANLLQPFYQLSFNKWYIDDIYEYIFVKGNRQLAQQTLLFDKKII
|
||||
DGFVNLTGLITLVSSESLRSIENGKIQSYILMIIFTLLTILGISQTYYSL
|
||||
IL
|
||||
>NC_002202@SpolCp080@ndhf@107770@109998@R@1@743 NADH_dehydrogenase_subunit_5
|
||||
MEHIYQYAWIIPFLPLPVPLLIGAGLLFFPTATKNLRRIWAFSSISLLSI
|
||||
VMIFSMKLAIQQINSNSIYQYLWSWTINNDFSLEFGYLMDPLTSIMSMLI
|
||||
TTVAILVLIYSDNYMSHDQGYLRFFAYMSFFNTSMLGLVTSSNLIQIYIF
|
||||
WELVGMCSYLLIGFWFTRPIAANACQKAFVTNRVGDFGLLLGILGLYWIT
|
||||
GSFEFRDLFEIFNNLIKNNEVNSLFCILCAFLLFAGAVAKSAQFPLHVWL
|
||||
PDAMEGPTPISALIHAATMVAAGIFLVARLLPLFVVIPYIMYVISFIGII
|
||||
TVLLGATLALAQKDIKRSLAYYTMSQLGYMMLALGMGSYRTALFHLITHA
|
||||
YSKALLFLASGSLIHSMGTIVGYSPDKSQNMVLMGGLTKHVPITKTSFLI
|
||||
GTLSLCGIPPLACFWSKDEILNDSWVYSPIFAIIAYFTAGLTAFYMFRIY
|
||||
LLTFEGHLNFFCKNYSGKKSSSFYSISLWGKKELKTINQKISLLNLLTMN
|
||||
NKERASFFSKKPYEINVKLTKLLRSFITITYFENKNISLYPYESDNTMLF
|
||||
PLIILIMFTLFVGFIGIPFNQEGMDLDILTKWLTPSINLLHSNSENFVDW
|
||||
YEFVINAIFSISIAFFGIFIAFFFYKPIYSSLKNFDLINSFDKRGQKRIL
|
||||
GDNIITIIYNWSANRGYIDAFYSTFLIKGIRSLSELVSFFDRRIIDGIPN
|
||||
GFGVTSFFVGEGIKYVGGGRISSYLFWYLLYVSIFLFIFTFT
|
||||
>NC_002693@OeelhCp094@ndhf@115809@118142@R@1@778 NADH_dehydrogenase_subunit_5
|
||||
MEYTYQYSWIIPFIPLPVPILIGMGLLLFPTATKNHRRVWSFPSILLLSM
|
||||
VMLLSVYLSIQQINRSFIYQYVWSWTINNDFSLEFGHLIDPLASIMLILI
|
||||
TTVGILVLFYSDNYMSHDQGYLRFFAYLSFFNTSMLGLVTSSNLIQIYIF
|
||||
WELVGMCSYLLIGFWFTRPIAATACQKAFVTNRVGDFGLLLGILGLYWIT
|
||||
GSFEFRDLFEIVNNLIDNNNQVHFLFVTLCSFLLFAGAVAKSAQFPLHVW
|
||||
LPDAMEGPTPISALIHAATMVAAGIFLVARLLPLFVITPYIMNLISLIGI
|
||||
ITVLLGATLALAQKDIKRSLAYSTMSQLGYMMLALGMGSYRAALFHLITH
|
||||
AYSKALLFLGSGSIIHSMESIVGYSPDKSQNMVLMGGLKKHVPITKTAFL
|
||||
VGTLSLCGIPPLACFWSKDEILNDSWLYSPIFAIIACSTAGFTAFYMFRV
|
||||
YLLTFDGHLNVHFQNYSGQKSSSVYSISLWGKQVPKRIQNPFCLLNLLTM
|
||||
NNNESTSFFWNNKCKLDGNVKKRIRPFITVTHFPNRKTFSYPHESDNTML
|
||||
FSLFVLVLFTLFVAAIGIPFNQEGSDCDILSKLLNPSINLLHQNSNNFTD
|
||||
WYEFVTNASFSVSIALLGIFIATFLYKPIYSSLQNFNLLNSFYKRSANRV
|
||||
MWDKIQNWIYDWSYNRGYIDSFYTISLTGGIRGLAELSHFFDRRVIDGIL
|
||||
NGFGLTSFFLGESLKYFGGGRISSYLLLYSIFIFIFLLMDSFFTNLPFFV
|
||||
LCQFLDSSFSMSISGFLLYENFLYENF
|
50
detectors/cds/test/test.db/ndhg.fst
Normal file
50
detectors/cds/test/test.db/ndhg.fst
Normal file
@ -0,0 +1,50 @@
|
||||
>AC_000188@LyesCp077@ndhg@119590@120120@R@1@177 NADH_degydrogenase_subunit_6
|
||||
MDLSEPIHDFLLVFLGSGLILGGLGVVLLPNPIYSAFSLGLVLVCTSLFY
|
||||
ILSNAYFVAAAQLLIYVGAINVLIIFAVMFMNGSEYYKDFHLWTVGDGIT
|
||||
SMVCISLFISLITTISDTSWYGIIWTTRSNQIIEQDFLSNSQQIGIHLST
|
||||
DFFLPFELISIILLVALIGAIAVARQ
|
||||
>NC_000927@NeolCp118@ndhg@146302@146811@D@1@170 NADH_dehydrogenase_subunit_6
|
||||
MEIVQNFSSAALTTGILLGCLGVIFLPSIVYAAFLLGAVFFCLAGIYVLL
|
||||
HADFVAAAQVLVYVGAINVLILFAIMLVNPQDAPPRALDSPPLIPGIACI
|
||||
GLLGVLVQMISTTSWLTPPWTPEPNSLPVLGGHLFSDCLLAFEVMSLVLL
|
||||
VALVGAIVLARREPVERSS
|
||||
>NC_000932@ArthCp077@ndhg@118377@118907@R@1@177 NADH_dehydrogenase_subunit_6
|
||||
MDLPGPIHDFLLVFLGSGLLVGGLGVVLLPNPIFSAFSLGFVLVCISLLY
|
||||
ILSNSHFVAAAQLLIYVGAINVLIIFAVMFMNDSEYSTDFNLWTIGNGIT
|
||||
SLVCTTILFLLMSTILDTSWYGVIWTTKLNQILEQDLISNSQQIGIHLST
|
||||
DFFLPFELISIILLVALIGAISVARQ
|
||||
>NC_001319@MapoCp082@ndhg@99113@99688@R@1@192 NADH_dehydrogenase_subunit_6
|
||||
MKLPESFYETIFLFLESGLILGSLGVILLTNIVYSALFLGFVFVCISLLY
|
||||
LLLNADFVAAAQILIYVGAVNVLIIFAVMLINKKQYSNFFVYWTIGDGIT
|
||||
LTLCTSIFLLLNNFISNTSWSKIFLMTKPNLVVKDIILINTVRHIGSELL
|
||||
TEFLLPFELMSIILLVALIGAITLARREKKIELEKNDFFNF
|
||||
>NC_001320@OrsajCp091@ndhg@109227@109757@R@1@177 NADH_dehydrogenase_subunit_6
|
||||
MDLPGPIHEILVLFGGFVLLLGGLGVVLLTNPTFSAFSLGLVLVCISLFY
|
||||
ILLNSYFVAVAQLLIYVGAINVLIIFAVMFVNGSEWSKDKNFWTIGDGFT
|
||||
SLVCITIPFSLMTTIPDTSWYGILWTTRSNQIVEQGLINNVQQIGIHLAT
|
||||
DFYLPFELISIILLVSLIGAITMARQ
|
||||
>NC_001666@ZemaCp089@ndhg@112993@113523@R@1@177 NADH_dehydrogenase_subunit_6
|
||||
MDLPGPIHEILVLFGGFGLLLGGLGVVLLTNPIYSAFSLGLVLVCISLFY
|
||||
FLLNSYFVAVAQLLIYVGAINVLIIFAVMFVNGSEWSKDKNYWTIGDGFT
|
||||
LLLCITIPFSLMTTIPDTSWYGILWTTRSNQIVEQGLINNVQQIGIHLAT
|
||||
DFYLPFELISLILLVSLIGAITMARQ
|
||||
>NC_001879@NitaCp086@ndhg@120181@120711@R@1@177 NADH_dehydrogenase_subunit_6
|
||||
MDLSEPIHDFLLVFLGSGLILGGLGVVLLPNPIYSAFSLGLVLVCTSLFY
|
||||
ILSNSYFVAAAQLLIYVGAINVLIIFAVMFMNGSEYYKDFHLWTVGDGIT
|
||||
SMVCISLFISLITTISDTSWYGIIWTTRSNQIIEQDFISNSQQIGIHLST
|
||||
DFFLPFELISIILLVALIGAIAVARQ
|
||||
>NC_002186@MeviCp100@ndhg@105252@105821@R@1@190 NADH_dehydrogenase_subunit_6
|
||||
MSFSEQIQNLSLLLLEIGTIIGALGVVLLPNILYSGFLLGGVLICIAGIY
|
||||
LLLNAEFIAAAQVLIYVGAINVIILFAIMLVNKIENLNPSNNQMMRNGLS
|
||||
SFICFSFFILLSNMIFDTQWIDTVGVSTKYSISIIGNHIFSDFLLPFEIV
|
||||
SVLLLVTLVGAVFIARKEDASEIEISKISFLNLPDPSKK
|
||||
>NC_002202@SpolCp088@ndhg@116164@116694@R@1@177 NADH_dehydrogenase_subunit_6
|
||||
MDLPGPIHDFLLVFLGSGLILGALGVVLFTNPIFSAFSLGLVLVCISLFY
|
||||
ILANSHFVASAQLLIYVGAINVLIIFSVMFMSGPEYDKKFQLWTVGDGVT
|
||||
SLVCISLFVSLISTILNTSWYGIIWTTKSNQILEQDLINASQQIGIHLST
|
||||
DFFLPFELISIILLVSLIGAIAVARQ
|
||||
>NC_002693@OeelhCp100@ndhg@123796@124326@R@1@177 NADH_dehydrogenase_subunit_6
|
||||
MDLPGPIHDFLLVFLGSGLIVGGLGVVLLTNPIFSAFSLGLVLVCISLFF
|
||||
SLSNSYFVAAAQLLIYVGAINVLILFAVMFMNGSEYSKDLTLWTVGDGIT
|
||||
SLVCTSIFISLITTILDTSWYGIIWTTKSNQIIEQDLIGNSQQIGIHLST
|
||||
DFFLPFELISIILLVSLIGAIAVARQ
|
90
detectors/cds/test/test.db/ndhh.fst
Normal file
90
detectors/cds/test/test.db/ndhh.fst
Normal file
@ -0,0 +1,90 @@
|
||||
>AC_000188@LyesCp078@ndhh@123339@124520@R@1@394 NADH_dehydrogenase_subunit_7
|
||||
MTAPTTRKDLMIVNMGPQHPSMHGVLRLIVTLDGEDVVDCEPILGYLHRG
|
||||
MEKIAENRTIIQYLPYVTRWDYLATMFTEAITINGPEQLGNIQVPKRASY
|
||||
IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYIFRERELIYDLFEAATG
|
||||
MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLTGVAEYQKLITRNPIFL
|
||||
ERVEGVGIIGRDEALNWGLSGPMLRASGIEWDLRKVDHYESYDEFDWQVQ
|
||||
WQREGDSLARYLVRIGEMTESIKIIQQALEGIPGGPYENLEMRRFDRLKD
|
||||
PEWNDFEYRFISKKPSPTFELSKQELYVRVEAPKGELGIFLIGDQSVFPW
|
||||
RWKIRPPGFINLQILPQLVKRMKLADIMTILGSIDIIMGEVDR
|
||||
>NC_000927@NeolCp115@ndhh@143205@144380@D@1@392 NADH_dehydrogenase_subunit_7
|
||||
MIEAKTDPMIVSMGPHHPSMHGVLRLIVTLDGENVLDCEPVVGYLHRGME
|
||||
KIAENRTIVQYLPYVTRWDYLATMFTEAITVNAPERLANIEVPRRASYLR
|
||||
VIMLELSRIASHLLWLGPFMADLGAQTPFFYILREREMIYDLFEAATGMR
|
||||
MMHNYFRVGGVAADVPYGWIDKCLDFCEYFLPKVDEYEALITRNPIFLKR
|
||||
VKGVGTISPQQAINWGLSGPMLRASGVSWDLRKVDRYECYEDFHWSVESE
|
||||
ETGDCLARYLVRIREMRTSTKIVQQALKSIPGGPTENLEARQLSQGRTSP
|
||||
WNEFDYQFLGKKASPTFKMPRQEHYVRVEAPKGELGVFLIGDDHVFPWRW
|
||||
KIRPPGFINVQILPNLVQGMKLADIMTILGSIDIIMGEVDR
|
||||
>NC_000932@ArthCp080@ndhh@122011@123192@R@1@394 NADH_dehydrogenase_subunit_7
|
||||
MKRPVTGKDLMIVNMGPHHPSMHGVLRLIVTLDGEDVVDCEPILGYLHRG
|
||||
MEKIAENRAIIQYLPYVTRWDYLATMFTEAITVNGPEQLGNIQVPKRASY
|
||||
IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYIFREREFVYDLFEAATG
|
||||
MRMMHNFFRIGGIAADLPYGWIDKCLDFCDYFLTEVVEYQKLITRNPIFL
|
||||
ERVEGVGIIGGEEAINWGLSGPMLRASGIPWDLRKIDRYESYDEFEWEIQ
|
||||
WQKQGDSLARYLVRLSEMTESIKIIQQALEGLPGGPYENLESRGFDRKRN
|
||||
PEWNDFEYRFISKKPSPTFELSKQELYVRVEAPKGELGIFLIGDQSGFPW
|
||||
RWKIRPPGFINLQILPELVKRMKLADIMTILGSIDIIMGEVDR
|
||||
>NC_001319@MapoCp085@ndhh@102202@103380@R@1@393 NADH_dehydrogenase_subunit_7
|
||||
MMILTKNKPMIVSMGPHHPSMHGVLRLIVTLDGEDVLDCEPVLGYLHRGM
|
||||
EKIAENRTIVQYLPYVTRWDYLATMFTEAITVNAPEKLTNIQVPKRASYI
|
||||
RIIMLELSRIASHLLWLGPFMADIGAQTPFFYIFREREMIYDLFESATGM
|
||||
RMMHNYFRIGGVAVDLPYGWIDKCLDFCDYFLPKINEYERLITNNPIFLK
|
||||
RVEGIGTVTREEAINWGLSGPMLRASGVQWDLRKVDHYECYDELDWKIQW
|
||||
QKEGDSLARYLVRIGEMKESVKIIQQALKAIPGGPFENLEARRLNQGKNS
|
||||
EWNLFEYQFISKKPSPTFKLPKQEHYVRVEAPKGELGIFLIGDDSVFPWR
|
||||
LKIRSPGFINLQILPQLVKGMKLADIMTILGSIDIIMGEVDR
|
||||
>NC_001320@OrsajCp094@ndhh@112708@113889@R@1@394 NADH_dehydrogenase_subunit_7
|
||||
MSLPLTRKDLMIVNMGPQHPSMHGVLRLIVTLDGEDVIDCEPILGYLHRG
|
||||
MEKIAENRTIIQYLPYVTRWDYLATMFTEAITVNAPEFLENIQIPQRASY
|
||||
IRVIMLELSRIASHLLWLGPFMADLGAQTPFFYIFRERELIYDLFEAATG
|
||||
MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLRGVIEYQQLITQNPIFL
|
||||
ERVEGVGFISGEEAVNWGLSGPMLRASGIQWDLRKVDLYESYNQFDWKVQ
|
||||
WQKEGDSLARYLVRIGEMRESIKIIQQAVEKIPGGPYENLEVRRFKKAKN
|
||||
SEWNDFEYRFLGKKPSPNFELSKQELYARVEAPKGELGIYLVGDDSLFPW
|
||||
RWKIRPPGFINLQILPQLVKKMKLADIMTILGSIDIIMGEVDR
|
||||
>NC_001666@ZemaCp092@ndhh@116456@117637@R@1@394 NADH_dehydrogenase_subunit_7
|
||||
MSLSLKRKDLMIVNMGPQHPSMHGVLRLIVTLDGEDVIDCEPILGYLHRG
|
||||
MEKIAENRSIIQYLPYVTRWDYLATMFTEAITVNAPEFLENIQIPKRASY
|
||||
IRVIMLELSRIASHLLWLGPFMADLGAQTPFFYIFRERELIYDLFEAVTG
|
||||
MRMMHNYFRIGGVAADLPYGWMDKCLDFCDYFLQGVVEYQELITQNPIFL
|
||||
ERVEGVGFISGEEAVNWGLSGPMLRASGIQWDLRKIDPYESYNQFDWKVQ
|
||||
WQKEGDSLARYLVRVGEMRESIKIIQQAVEKIPGGPYENLEARRFKKAKN
|
||||
PEWNDFEYRFLGKKPSPNFELSKQELYVRVEAPKGELGIYLVGDDSLFPW
|
||||
RWKIRPPGFINLQILPQLVKKMKLADIMTILGSIDIIMGEVDR
|
||||
>NC_001879@NitaCp089@ndhh@123937@125118@R@1@394 NADH_dehydrogenase_subunit_7
|
||||
MTAPTTRKDLMIVNMGPQHPSMHGVLRLIVTLDGEDVVDCEPILGYLHRG
|
||||
MEKIAENRTIIQYLPYVTRWDYLATMFTEAITINGPEQLGNIQVPKRASY
|
||||
IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYIFRERELIYDLFEAATG
|
||||
MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLTGVAEYQKLITRNPIFL
|
||||
ERVEGVGIIGGDEALNWGLSGPMLRASGIEWDLRKVDHYESYDEFDWQVQ
|
||||
WQREGDSLARYLVRIGEMTESIKIIQQALEGIPGGPYENLEIRRFDRLKD
|
||||
PEWNDFEYRFISKKPSPTFELSKQELYVRVEAPKGELGIFLIGDQSVFPW
|
||||
RWKIRPPGFINLQILPQLVKRMKLADIMTILGSIDIIMGEVDR
|
||||
>NC_002186@MeviCp103@ndhh@107611@108792@R@1@394 NADH_dehydrogenase_subunit_7
|
||||
MTMLQTKTDPMVISMGPHHPSMHGVLRLIVTLDGENVIDCEPVLGYLHRA
|
||||
MEKIAENRTIVQYLPYVTRWDYLATMFTEAITVNAPEKLANIEVPKRASY
|
||||
IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYILREREMIYDLFEAATG
|
||||
MRMMHNYFRIGGVASDLPYGWVDKCLDFSDYFLPKVDEYERLITNNPIFL
|
||||
KRVRDVGFISREEAINWGLSGPMLRASGVQWDLRKVDNYECYGELDWNVQ
|
||||
WQSDGDCLARYLVRLGEMRESTKIIQQALKAIPGGPYENLEARRLSKGRK
|
||||
SEWNNFEYQFVGKKPSPTFKIPKQEHYVRVEAPKGELGVFLMGDDNVFPW
|
||||
RWKIRSPGFINVQILPELVRGMKLADIMTILGSIDIIMGEVDR
|
||||
>NC_002202@SpolCp091@ndhh@119776@120957@R@1@394 NADH_dehydrogenase_subunit_7
|
||||
MAVPTTRKDLMIVNMGPHHPSMHGVLRLIVTLDGEDVIDCEPIVGYLHRG
|
||||
MEKIAENRTIIQYLPYVTRWDYLATMFTEAITVNGPEQLGNIQVPKRASY
|
||||
IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYILRERELIYDLFEAATG
|
||||
MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLIGLTEYQKLITRNPIFL
|
||||
ERVENVGIIGGEEAINWGLSGPMLRASGIQWDLRKVDHYECYDEFDWEVQ
|
||||
WQKEGDSLARYLIRIGEMAESVKIIQQALEGIPGGPYENLEIRRFNRIKY
|
||||
PEWNDFEYRFISKKPSPAFELSKQELYVRVEAPKGELGIFLIGDQSVFPW
|
||||
RWKIRPPGFINLQILPQLVKKMKLADIMTILGSIDIIMGEVDR
|
||||
>NC_002693@OeelhCp103@ndhh@127260@128441@R@1@394 NADH_dehydrogenase_subunit_7
|
||||
MNVTTTRKDLMIVNMGPHHPSMHGVLRLILTLDGEDVIDCEPILGYLHRG
|
||||
MEKIAENRTVIQYLPYVTRWDYLATMFTEAITINGPEQLGNIQVPKRASY
|
||||
IRIIMLELSRIASHLLWLGPFMADIGAQTPFFYIFRERELVYDLFEAATG
|
||||
MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLTAVSEYQKLITRNPIFL
|
||||
ERVEGVGIIGGEEAINWGLSGPMLRASGIEWDLRKVDRYECYGELDWEIR
|
||||
WQKEGDSLARYLVRMSEMTESIKIIQQALEGIPGGPYENLEIRCFDREKD
|
||||
PEWDGFEYRFISKKPSPTFELPKQELYVRVEAPKGELGIFLIGDQSGFPW
|
||||
RWKIRPPGFINLQILPQLVKRMKLADIMTILGSIDIIMGEVDR
|
50
detectors/cds/test/test.db/ndhi.fst
Normal file
50
detectors/cds/test/test.db/ndhi.fst
Normal file
@ -0,0 +1,50 @@
|
||||
>AC_000188@LyesCp076@ndhi@120525@121028@R@1@168 NADH_dehydrogenase_subunit_I
|
||||
MLPMITEFINYGQQTIRAARYIGQGFMITLSHANRLPVTIQYPYEKLITS
|
||||
ERFRGRIHFEFDKCIACEVCVRVCPIDLPVVDWKLETDIRKKRLLNYSID
|
||||
FGICIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALGRLPMSVI
|
||||
DDYTIRTISNLPQINNE
|
||||
>NC_000927@NeolCp117@ndhi@145747@146268@D@1@174 NADH_dehydrogenase_subunit_I
|
||||
MFDFLTSLQTYRQEAAQAAQYIGQGFGVTFDHMSRRPITIHYPYEKLIPS
|
||||
ERFRGRIHFEFDKCIACEVCVRVCPINLPVVDWDYQKSVKKKQLRSYSID
|
||||
FGVCIFCGNCVEYCPTNCLSMTEEYELSVYDRHELNFDHVALGRVPTSVV
|
||||
QDTLVTPVLGLGYLPKGELSSLP
|
||||
>NC_000932@ArthCp078@ndhi@119244@119762@R@1@173 NADH_dehydrogenase_subunit_I
|
||||
MLPMITGFMNYGQQTLRAARYIGQGFMITLSHTNRLPVTIQYPYEKLITS
|
||||
ERFRGRIHFEFDKCIACEVCVRVCPIDLPVVDWKLETNIRKKRLLNYSID
|
||||
FGICIFCGNCVEYCPTNCLSMTEEYEFSTYDRHELNYNQIALGRLPMSVI
|
||||
DDYTIRTIWNSPQTKNGVNPLI
|
||||
>NC_001319@MapoCp083@ndhi@99779@100330@R@1@184 NADH_dehydrogenase_subunit_I
|
||||
MFSIINGLKNYNQQAIQAARYIGQGFLVTLDHMNRLPTTIQYPYEKLIPS
|
||||
ERFRGRIHFEFDKCIACEVCVRVCPINLPVVDWELKKTIKKKQLKNYSID
|
||||
FGVCIFCGNCVEYCPTNCLSMTEEYELSTYNRHELNYDQIALGRLPISII
|
||||
EDSTIENIFNLTSLPKGKIEGHIYSRNITNIVN
|
||||
>NC_001320@OrsajCp092@ndhi@110000@110536@R@1@179 NADH_dehydrogenase_subunit_I
|
||||
MFPMVTGFMGQQTIRAARYIGQSFIITLSHTNRLPITIHYPYEKSITSER
|
||||
FRGRIHFEFDKCIACEVCVRVCPIDLPLVDWRFEKDIKRKQLLNYSIDFG
|
||||
VCIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALSRLPISIMGD
|
||||
YTIQTIRNSTQSKIDEEKSWNSRTITDY
|
||||
>NC_001666@ZemaCp090@ndhi@113707@114249@R@1@181 NADH_dehydrogenase_subunit_I
|
||||
MFPMLTGFISYGQQTIRAARYIGQSFIITLSHTNRLPITIHYPYEKSITS
|
||||
ERFRGRIHFEFDKCIACEVCVRVCPIDLPLVDWRFEKDIKRKQLLNYSID
|
||||
FGVCIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALSRLPISIM
|
||||
GDYTIQTIRNSPQSKIDEEKSWNSRTITDY
|
||||
>NC_001879@NitaCp087@ndhi@121108@121611@R@1@168 NADH_dehydrogenase_subunit_I
|
||||
MLPMITEFINYGQQTIRAARYIGQGFMITLSHANRLPVTIQYPYEKLITS
|
||||
ERFRGRIHFEFDKCIACEVCVRVCPIDLPVVDWKLETDIRKKRLLNYSID
|
||||
FGICIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALGRLPMSVI
|
||||
DDYTIRTISNLPQIKNE
|
||||
>NC_002186@MeviCp101@ndhi@105946@106476@R@1@177 NADH_dehydrogenase_subunit_I
|
||||
MFNFIDNVQTYSKEALQAAKYIGQGFMVTFDHMNRRAITIQYPYEKLIPS
|
||||
ERFRGRIHFEFDKCIACEVCVRVCPINLPVVNWEFQKEKKKKQLQTYSID
|
||||
FGVCIFCGNCVEYCPTNCLSMTEEYELSVYDRHELNYDNFALGRLPTMVN
|
||||
NDSMVKGIKGLGYLPKGIIEGHIDNQ
|
||||
>NC_002202@SpolCp089@ndhi@116981@117493@R@1@171 NADH_dehydrogenase_subunit_I
|
||||
MFPMVTGFINYGQQTIRAARYIGQSFMITLSHANRLPVTIQYPYEKLITS
|
||||
ERFRGRIHFEFDKCIACEVCVRACPIDLPVVDWKLETDIRKKRLLNYSID
|
||||
FGICIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALGRLPISIT
|
||||
DDYTIRTILNSPQTKEKACD
|
||||
>NC_002693@OeelhCp101@ndhi@124541@125038@R@1@166 NADH_dehydrogenase_subunit_I
|
||||
MFPMVTGFMNYGQQTVRAARYIGQGFMITLSHANRLPVTIQYPYEKLITS
|
||||
ERFRGRIHFEFDKCIACEVCVRVCPIDLPVVDWKLETGVRKKRLLNYSID
|
||||
FGVCIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALGRLPMSVI
|
||||
DDYTIRTILNSAQIK
|
30
detectors/cds/test/test.db/psac.fst
Normal file
30
detectors/cds/test/test.db/psac.fst
Normal file
@ -0,0 +1,30 @@
|
||||
>AC_000188@LyesCp065@psac@118564@118809@R@1@82 photosystem_I_subunit_VII
|
||||
MSHSVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKAKQIASAPRTEDCVG
|
||||
CKRCESACPTDFLSVRVYLWHETTRSMGLAY
|
||||
>NC_000925@PopuCp189@psac@164452@164697@R@1@82 photosystem_I_subunit_VII
|
||||
MAHSVKVYDTCIGCTQCVRACPCDVLEMVPWDGCKAKQIASAPRTEDCIG
|
||||
CKRCETACPTDFLSVRVYLGAETTRSMGLAY
|
||||
>NC_000926@GuthCp035@psac@33008@33253@D@1@82 photosystem_I_subunit_VII
|
||||
MSHSVKVYDTCIGCTQCVRACPCDVLEMVAWDGCKAGQIASAPRTEDCIG
|
||||
CKRCETACPTDFLSVRVYLGGETTRSMGLAY
|
||||
>NC_000927@NeolCp112@psac@138977@139222@D@1@82 photosystem_I_subunit_VII
|
||||
MSHSVKIYDTCIGCTQCVRACPTDVLEMVPWGGCKAAQIASAPRTEDCVG
|
||||
CKRCESACPTDFLSVRVYLGAETTRSMGLAY
|
||||
>NC_000932@ArthCp075@psac@117318@117563@R@1@82 photosystem_I_subunit_VII
|
||||
MSHSVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKAKQIASAPRTEDCVG
|
||||
CKRCESACPTDFLSVRVYLWHETTRSMGLAY
|
||||
>NC_001319@MapoCp080@psac@98289@98534@R@1@82 photosystem_I_subunit_VII
|
||||
MAHAVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKANQIASAPRTEDCVG
|
||||
CKRCESRCPTDFLSVRVYLGNETTRSMGLSY
|
||||
>NC_001320@OrsajCp089@psac@108020@108265@R@1@82 photosystem_I_subunit_VII
|
||||
MSHSVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKAKQIASAPRTEDCVG
|
||||
CKRCESACPTDFLSVRVYLGPETTRSMALSY
|
||||
>NC_001603@EugrCp046@psac@74937@75893@R@3@82 photosystem_I_subunit_VII
|
||||
MSHSVKIYNTCIGCTQCVRACPTDVLEMVPWDGCKAGQIASSPRTEDCVG
|
||||
CKRCESACPTDFLSVRVYLGSETSRSMGLAY
|
||||
>NC_001631@PithCp145@psac@103521@103766@D@1@82 photosystem_I_subunit_VII
|
||||
MAHSVKIYDTCIGCTQCVRACPTDVLEMIPWEGCKAKQIASAPRTEDCAG
|
||||
CKRCESACPTDFLSVRVYLWHETTRSMGLAY
|
||||
>NC_001666@ZemaCp087@psac@111760@112005@R@1@82 photosystem_I_subunit_VII
|
||||
MSHSVKIYDTCIGCTHCVRACPTDVLEMIPWDGCKAKQIASAPRTEDCVG
|
||||
CKRCESACPTDFLSVRVYLGPETTRSMALSY
|
70
detectors/cds/test/test.db/rpl2.fst
Normal file
70
detectors/cds/test/test.db/rpl2.fst
Normal file
@ -0,0 +1,70 @@
|
||||
>AC_000188@LyesCp030@rpl2@86038@87528@R@2@275 ribosomal_protein_L2
|
||||
MAIHLYKTSTPSTRNGTVDSQVKSNPRNNLIYGQRRCGKGRNARGIITAR
|
||||
HRGGGHKRLYRKIDFRRNEKDIYGRIVTIEYDPNRNAYICLIHYGDGEKR
|
||||
YILHPRGAIIGDTIVSGTEVPIKMGNALPLTDMPLGTAIHNIEITLGKGG
|
||||
QLARAAGAVAKLIAKEGKSATLKLPSGEVRLISKNCSATVGQVGNVGVNQ
|
||||
KSLGRAGSKRWLGKRPVVRGVVMNPVDHPHGGGEGRAPIGRKKPTTPWGY
|
||||
PALGRRSRKRNKYSDNLILRRRSK
|
||||
>AC_000188@LyesCp087@rpl2@153816@155306@D@2@275 ribosomal_protein_L2
|
||||
MAIHLYKTSTPSTRNGTVDSQVKSNPRNNLIYGQRRCGKGRNARGIITAR
|
||||
HRGGGHKRLYRKIDFRRNEKDIYGRIVTIEYDPNRNAYICLIHYGDGEKR
|
||||
YILHPRGAIIGDTIVSGTEVPIKMGNALPLTDMPLGTAIHNIEITLGKGG
|
||||
QLARAAGAVAKLIAKEGKSATLKLPSGEVRLISKNCSATVGQVGNVGVNQ
|
||||
KSLGRAGSKRWLGKRPVVRGVVMNPVDHPHGGGEGRAPIGRKKPTTPWGY
|
||||
PALGRRSRKRNKYSDNLILRRRSK
|
||||
>NC_000925@PopuCp126@rpl2@103379@104263@R@1@295 ribosomal_protein_L2
|
||||
MAIRLYRAYTPGTRNRTVSTFSEITTDKPEKSLINKHHFCKGRNNRGVIT
|
||||
CRHKGGGHKQRYRLIDFKRNRHNIIAKVASIEYDPNRNARIALLHYLDGE
|
||||
KRYILHPRSLSVGAIVVSGPMAPIEVGNALPLSTIPLGTAVHNIELRPYC
|
||||
GGQIVRSAGTYAQIVAKEGNFVTVKLPSSEVRMIRKECYATIGQVGNIDA
|
||||
SNITLGKAGRSRWLGKRPTVRGVVMNPVDHPHGGGGEGKSPIGRSRPVTP
|
||||
WGKPALGVKTRNPNKYSNPYVLLVVNKVYLTYNLILKYNVEINT
|
||||
>NC_000926@GuthCp113@rpl2@100540@101367@D@1@276 ribosomal_protein_L2
|
||||
MGIRIYKSYTPGTRNRSSSDFVEITKSKPEKSLLRKKLSCAGRNNRGLIT
|
||||
VRHKGGGHKQRYRLVDFKRNKLDIPAIVASVEYDPNRNARIALLHYQDGE
|
||||
KRYILHPKKLAVGDKIYSGINVPIEIGNAMPLYNVPLGTAVHNVELIPGR
|
||||
GGQIVRSAGTSAQVVAKDGQVVTIKMPSNEVRMIYKNCYATIGEVGNADI
|
||||
KNIRLGKAGRKRWLGIRPSVRGVVMNPCDHPHGGGEGRSPIGRAKPVTPW
|
||||
GKPALGVKTRRQNKYSDFCIIRSRN
|
||||
>NC_000927@NeolCp022@rpl2@15904@16731@R@1@276 ribosomal_protein_L2
|
||||
MGIRFYRAHTPGTRNRSVSDFHEITTSTPTKSLTHANHRARGRNHSGSIT
|
||||
TRWRGGGHKRLYRQIDFRRDKVGVLARVATVEYDPNRSARIALLHYQDGS
|
||||
KRYILHPQGLAIGAEVMSSPEAPISIGNALPLVNMPLGTEVHNIELRPYN
|
||||
GGQLVRAAGAVAQLVAKEGGFGTLRMPSGEVRLVAKDCWATVGQVGHVES
|
||||
INLTLGKAGRSRWLDRRPRVRGSVMNACDHPHGGGEGRCPIGHPGPLTPW
|
||||
GKPALGQRTRARKKYSDALLVRRRK
|
||||
>NC_000932@ArthCp064@rpl2@84337@85843@R@2@275 ribosomal_protein_L2
|
||||
MAIHLYKTSTPSTRNGAVDSQVKSNPRNNLICGQHHCGKGRNARGIITAR
|
||||
HRGGGHKRLYRKIDFRRNAKDIYGRIVTIEYDPNRNAYICLIHYGDGEKR
|
||||
YILHPRGAIIGDTIVSGTEVPIKMGNALPLTDMPLGTAIHNIEITLGRGG
|
||||
QLARAAGAVAKLIAKEGKSATLKLPSGEVRLISKNCSATVGQVGNVGVNQ
|
||||
KSLGRAGSKCWLGKRPVVRGVVMNPVDHPHGGGEGRAPIGRKKPVTPWGY
|
||||
PALGRRTRKRKKYSETLILRRRSK
|
||||
>NC_000932@ArthCp085@rpl2@152806@154312@D@2@275 ribosomal_protein_L2
|
||||
MAIHLYKTSTPSTRNGAVDSQVKSNPRNNLICGQHHCGKGRNARGIITAR
|
||||
HRGGGHKRLYRKIDFRRNAKDIYGRIVTIEYDPNRNAYICLIHYGDGEKR
|
||||
YILHPRGAIIGDTIVSGTEVPIKMGNALPLTDMPLGTAIHNIEITLGRGG
|
||||
QLARAAGAVAKLIAKEGKSATLKLPSGEVRLISKNCSATVGQVGNVGVNQ
|
||||
KSLGRAGSKCWLGKRPVVRGVVMNPVDHPHGGGEGRAPIGRKKPVTPWGY
|
||||
PALGRRTRKRKKYSETLILRRRSK
|
||||
>NC_001319@MapoCp072@rpl2@79137@80514@R@2@278 ribosomal_protein_L2
|
||||
MAIRLYRAYTPGTRNRSVPKFDEIVKCQPQKKLTYNKHIKKGRNNRGIIT
|
||||
SQHRGGGHKRLYRKIDFQRNKKYITGKIKTIEYDPNRNTYICLINYEDGE
|
||||
KRYILYPRGIKLDDTIISSEEAPILIGNTLPLTNMPLGTAIHNIEITPGK
|
||||
GGQLVRAAGTVAKIIAKEGQLVTLRLPSGEIRLISQKCLATIGQIGNVDV
|
||||
NNLRIGKAGSKRWLGKRPKVRGVVMNPIDHPHGGGEGRAPIGRKKPLTPW
|
||||
GHPALGKRSRKNNKYSDTLILRRRKNS
|
||||
>NC_001320@OrsajCp069@rpl2@81180@82664@R@2@274 ribosomal_protein_L2
|
||||
MAKHLYKTPIPSTRKGTIDRQVKSNPRNNLIHGRHRCGKGRNSRGIITAR
|
||||
HRGGGHKRLYRKIDFRRNQKDISGRIVTIEYDPNRNAYICLIHYGDGEKG
|
||||
YILHPRGAIIGDTIVSGTKVPISMGNALPLTDMPLGTAIHNIEITRGRGG
|
||||
QLARAAGAVAKLIAKEGKSATLRLPSGEVRLVSQNCLATVGQVGNVGVNQ
|
||||
KSLGRAGSKCWLGKRPVVRGVVMNPVDHPHGGGEGKAPIGRKKPTTPWGY
|
||||
PALGRRTRKRKKYSDSFILRRRK
|
||||
>NC_001320@OrsajCp109@rpl2@132454@133938@D@2@274 ribosomal_protein_L2
|
||||
MAKHLYKTPIPSTRKGTIDRQVKSNPRNNLIHGRHRCGKGRNSRGIITAR
|
||||
HRGGGHKRLYRKIDFRRNQKDISGRIVTIEYDPNRNAYICLIHYGDGEKG
|
||||
YILHPRGAIIGDTIVSGTKVPISMGNALPLTDMPLGTAIHNIEITRGRGG
|
||||
QLARAAGAVAKLIAKEGKSATLRLPSGEVRLVSQNCLATVGQVGNVGVNQ
|
||||
KSLGRAGSKCWLGKRPVVRGVVMNPVDHPHGGGEGKAPIGRKKPTTPWGY
|
||||
PALGRRTRKRKKYSDSFILRRRK
|
30
detectors/cds/test/test.db/rpl23.fst
Normal file
30
detectors/cds/test/test.db/rpl23.fst
Normal file
@ -0,0 +1,30 @@
|
||||
>AC_000188@LyesCp026@rpl23@87547@87828@R@1@94 ribosomal_protein_L23
|
||||
MDGIKYAVFTDKSIRLLGKNQYTSNVESGSTRTEIKHWVELFFGVKVIAM
|
||||
NSHRLPGKSRRMGPIMGHTMHYRRMIITLQPGYSIPPLRKKRT
|
||||
>AC_000188@LyesCp083@rpl23@153516@153797@D@1@94 ribosomal_protein_L23
|
||||
MDGIKYAVFTDKSIRLLGKNQYTSNVESGSTRTEIKHWVELFFGVKVIAM
|
||||
NSHRLPGKSRRMGPIMGHTMHYRRMIITLQPGYSIPPLRKKRT
|
||||
>NC_000925@PopuCp127@rpl23@104311@104613@R@1@101 ribosomal_protein_L23
|
||||
MDSIDSRDLLDLVKYPIITDKTTKLLEENQYCFAVDPNATKINIKAAIQY
|
||||
IFNVQVTGVNTCHPPKKKRSIGRFIGKRPHYKKAIITLASKDSINLFPET
|
||||
>NC_000926@GuthCp112@rpl23@100237@100524@D@1@96 ribosomal_protein_L23
|
||||
MHALIDLVKYPLITDKATRLLELNQYTFLTSRVATKTDIKNAIEFLFNVK
|
||||
VISINTCLLPLKRKRLGKFVGSKPRYKKAVVTLEKNNTINLFSEN
|
||||
>NC_000927@NeolCp023@rpl23@16871@17149@R@1@93 ribosomal_protein_L23
|
||||
MIIDLVKRPVITEKATRILEKNQYTFDVELSLTKPKIKALIEKAFKVEVV
|
||||
SVNTHRPPRRKRRLGTTQGYLPRYKRAIITLKRGFMIPLTPF
|
||||
>NC_000932@ArthCp065@rpl23@85862@86143@R@1@94 ribosomal_protein_L23
|
||||
MDGIKYAVFTDKSIRLLGKNQYTFNVESGSTRTEIKHWVELFFGVKVIAM
|
||||
NSHRLPGKVKRMGPILGHTMHYRRMIITLQPGYSIPPLRKKRT
|
||||
>NC_000932@ArthCp084@rpl23@152506@152787@D@1@94 ribosomal_protein_L23
|
||||
MDGIKYAVFTDKSIRLLGKNQYTFNVESGSTRTEIKHWVELFFGVKVIAM
|
||||
NSHRLPGKVKRMGPILGHTMHYRRMIITLQPGYSIPPLRKKRT
|
||||
>NC_001319@MapoCp073@rpl23@80550@80825@R@1@92 ribosomal_protein_L23
|
||||
MNQVKYPVLTEKTIRLLEKNQYSFDVNIDSNKTQIKKWIELFFNVKVISV
|
||||
NSHRLPKKKKKIGTTTGYTVRYKRMIIKLQSGYSIPLFSNK
|
||||
>NC_001320@OrsajCp071@rpl23@82683@82964@R@1@94 ribosomal_protein_L23
|
||||
MDGIKYAVFTEKSLRLLGKNQYTFNVESGFTKTEIKHWVELFFGVKVVAV
|
||||
NSHRLPGKGRRMGPILGHTMHYRRMIITLQPGYSIPLLDREKN
|
||||
>NC_001320@OrsajCp108@rpl23@132154@132435@D@1@94 ribosomal_protein_L23
|
||||
MDGIKYAVFTEKSLRLLGKNQYTFNVESGFTKTEIKHWVELFFGVKVVAV
|
||||
NSHRLPGKGRRMGPILGHTMHYRRMIITLQPGYSIPLLDREKN
|
30
detectors/cds/test/test.db/rpl32.fst
Normal file
30
detectors/cds/test/test.db/rpl32.fst
Normal file
@ -0,0 +1,30 @@
|
||||
>AC_000188@LyesCp036@rpl32@114504@114671@D@1@56 ribosomal_protein_L32
|
||||
MAVPKKRTSTSKKRIRKNIWKRKGYWVALKAFSLAKSLSTGNSKSFFVRQ
|
||||
TKINK
|
||||
>NC_000925@PopuCp022@rpl32@16239@16418@D@1@60 ribosomal_protein_L32
|
||||
MAVPKKRTSKAKKNARKANWKNQAKTEAQKALSLAKSVLTGKSNGFVYNT
|
||||
LEVADAIVE
|
||||
>NC_000926@GuthCp026@rpl32@24770@24931@D@1@54 ribosomal_protein_L32
|
||||
MAVPKKRTSRSKTNSRFANWLNKSNLQAQRAISKAKSITNKKNTVNDETI
|
||||
ETE
|
||||
>NC_000927@NeolCp122@rpl32@149220@149447@D@1@76 ribosomal_protein_L32
|
||||
MAVPKKRKSKSRANSQNHVWKREIVKQARRAVSLAKALLGGNTNFLLVSP
|
||||
GPTTPIKPNPKKQTGRRPRSQRRRT
|
||||
>NC_000932@ArthCp072@rpl32@113449@113607@D@1@53 ribosomal_protein_L32
|
||||
MAVPKKRTSISKKRIRKKIWKRKGYWTSLKAFSLGKSLSTGNSKSFFVQQ
|
||||
NK
|
||||
>NC_001319@MapoCp076@rpl32@93886@94095@D@1@70 ribosomal_protein_L32
|
||||
MAVPKKRTSKSKTRIRKAIWKNKANKSALRAFSLAKSILTNRSKSFYYTI
|
||||
NDKLLNSSKSISTSKLDES
|
||||
>NC_001320@OrsajCp086@rpl32@104352@104543@D@1@64 ribosomal_protein_L32
|
||||
MAVPKKRTSMSKKRIRKNLWKKKTYFSIVQSYSLAKSRSFSGVSEHPKPK
|
||||
GFSRQQTNNRVLG
|
||||
>NC_001603@EugrCp047@rpl32@75928@76092@R@1@55 ribosomal_protein_L32
|
||||
MAVPKKKMSKSRRNSRKSNWKKKVLKKVLFALSLGKSFEANTNVNFSFGD
|
||||
KLPQ
|
||||
>NC_001631@PithCp150@rpl32@107399@107611@R@1@71 ribosomal_protein_L32
|
||||
MAVPKKRTSRSKKKIRKNVRKGKAYRAAIKAFSLAKSISTGHSKSFYCIV
|
||||
NDDSSGSSESKLTAIDLDDP
|
||||
>NC_001666@ZemaCp084@rpl32@108127@108306@D@1@60 ribosomal_protein_L32
|
||||
MAVPKKRTSMSKKRIRKNLWKKKTYFSIVQSYSLAKSRSFSRGNEHPKPK
|
||||
GFSGQQANK
|
30
detectors/cds/test/test.db/rps15.fst
Normal file
30
detectors/cds/test/test.db/rps15.fst
Normal file
@ -0,0 +1,30 @@
|
||||
>AC_000188@LyesCp029@rps15@124632@124895@R@1@88 ribosomal_protein_S15
|
||||
MVKNSVISVISQEEKKGSVEFQVFNFTNKIRRLTSHLELHKKDYLSQRGL
|
||||
KKILGKRQRLLAYLAKKNRVRYKELINRLDIRETKTR
|
||||
>NC_000932@ArthCp081@rps15@123296@123562@R@1@89 ribosomal_protein_S15
|
||||
MIKNIVISFEEQKEESRGSVEFQVFSFTNKIRRLTSHLELHRKDYLSQRG
|
||||
LRKILGKRQRLLAYLSKKNRVRYKELINQLNIRELKTR
|
||||
>NC_001319@MapoCp086@rps15@103433@103699@R@1@89 ribosomal_protein_S15
|
||||
MSKNLFMDLSSISEKEKGSVEFQIFRLTNRVVKLTYHFKKHGKDYSSQRG
|
||||
LWKILGKRKRLLAYLFKTNFVSYENLIIQLGIRGLKKN
|
||||
>NC_001320@OrsajCp083@rps15@100818@101090@D@1@91 ribosomal_protein_S15
|
||||
MKKKGGRKIFGFMVKEEKEENWGSVEFQVFSFTNKIRRLASHLELHKKDF
|
||||
SSERGLRRLLGKRQRLLAYLAKKNRVRYKKLISQLDIRER
|
||||
>NC_001320@OrsajCp095@rps15@114028@114300@R@1@91 ribosomal_protein_S15
|
||||
MKKKGGRKIFGFMVKEEKEENWGSVEFQVFSFTNKIRRLASHLELHKKDF
|
||||
SSERGLRRLLGKRQRLLAYLAKKNRVRYKKLISQLDIRER
|
||||
>NC_001631@PithCp139@rps15@101136@101402@D@1@89 ribosomal_protein_S15
|
||||
MINNLSISSSLIPDKQRGSVESQVFYLTNRVLRLTQHLQLHGRDYSSQRG
|
||||
LWKILSKRKQLLVYLSKRDKLRYDDLIGQLGIRGLKTR
|
||||
>NC_001666@ZemaCp082@rps15@104729@104965@D@1@79 ribosomal_protein_S15
|
||||
MVKEEKQENRGSVEFQVFSFTNKIRRLASHLELHKKDFSSERGLRRLLGK
|
||||
RQRLLAYLAKKNRVRYKKLISQLDIREK
|
||||
>NC_001666@ZemaCp093@rps15@117772@118008@R@1@79 ribosomal_protein_S15
|
||||
MVKEEKQENRGSVEFQVFSFTNKIRRLASHLELHKKDFSSERGLRRLLGK
|
||||
RQRLLAYLAKKNRVRYKKLISQLDIREK
|
||||
>NC_001879@NitaCp090@rps15@125230@125493@R@1@88 ribosomal_protein_S15
|
||||
MVKNSVISVISQEEKRGSVEFQVFNFTNKIRRLTSHLELHKKDYLSQRGL
|
||||
KKILGKRQRLLAYLSKKNRVRYKELINQLDIRETKTR
|
||||
>NC_002186@MeviCp104@rps15@109145@109417@R@1@91 ribosomal_protein_S15
|
||||
MLKKKIIKTHANHTNDTGSTQVQVSLLSSRVAQLTKHLNNHKNDYSSQRG
|
||||
LKKLLGQRKRLLKYLFVKDPLGYNNLIIQLGIRPGKSLVN
|
50
detectors/cds/test/test.db/rps7.fst
Normal file
50
detectors/cds/test/test.db/rps7.fst
Normal file
@ -0,0 +1,50 @@
|
||||
>AC_000188@LyesCp008@rps7@98721@99188@R@1@156 ribosomal_protein_S7
|
||||
MSRRGTAEKKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYRAVKKI
|
||||
QQKTETNPLSVLRQAIRGVTPDITVKARRVGGSTHQVPIEIGSTQGKALA
|
||||
IRWLLAASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRA
|
||||
FAHFR
|
||||
>AC_000188@LyesCp022@rps7@142156@142623@D@1@156 ribosomal_protein_S7
|
||||
MSRRGTAEKKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYRAVKKI
|
||||
QQKTETNPLSVLRQAIRGVTPDITVKARRVGGSTHQVPIEIGSTQGKALA
|
||||
IRWLLAASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRA
|
||||
FAHFR
|
||||
>NC_000925@PopuCp103@rps7@92209@92679@R@1@157 ribosomal_protein_S7
|
||||
MSRRNTAKKRFASPDPLYKSRLVSMLTVRILKSGKKTLAQRIIYQALDIV
|
||||
KERTETDPLNVLEKAIRNITPLVEVKARRVGGSTYQVPIEVRAYRGTNLA
|
||||
LRWITRFSRERSGKSMSMKLANEIMDAANETGNSIRKREETHRMAEANKA
|
||||
FAHYRY
|
||||
>NC_000926@GuthCp136@rps7@111745@112215@D@1@157 ribosomal_protein_S7
|
||||
MSRRSTTKKKLALPDPIYNSRLVNMLTVRILKEGKKHLAQRIIYNAFDII
|
||||
KQRTGEDAILVFESAIKKVTPLVEVKARRIGGSTYQVPMEVRAFRGTNLA
|
||||
LRWITKYARERAGKSMSMKLANEIMDAANETGSSIRKREEIHRMAEANKA
|
||||
FAHYRF
|
||||
>NC_000927@NeolCp044@rps7@48318@48788@D@1@157 ribosomal_protein_S7
|
||||
MSRRNTAVKRSISSDPVYNSQLIHMMISHILKEGKKALAYRLMYDAMKRI
|
||||
EKTTQQDPILVVERAVRNATPTIEVKARRMGGSIYQVPLEVKPERGTALA
|
||||
LRWILLAARNRTGRDMVAKLSNELMDASNRIGNAVRKRDEMHRMAEANKA
|
||||
FAHIRV
|
||||
>NC_000932@ArthCp069@rps7@97478@97945@R@1@156 ribosomal_protein_S7
|
||||
MSRRGTAEEKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYRALKKI
|
||||
QQKTETNPLSVLRQAIRGVTPDIAVKARRVGGSTHQVPIEIGSTQGKALA
|
||||
IRWLLGASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRA
|
||||
FAHFR
|
||||
>NC_000932@ArthCp088@rps7@140704@141171@D@1@156 ribosomal_protein_S7
|
||||
MSRRGTAEEKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYRALKKI
|
||||
QQKTETNPLSVLRQAIRGVTPDIAVKARRVGGSTHQVPIEIGSTQGKALA
|
||||
IRWLLGASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRA
|
||||
FAHFR
|
||||
>NC_001319@MapoCp002@rps7@892@1359@D@1@156 ribosomal_protein_S7
|
||||
MSRKSIAEKQVAKPDPIYRNRLVNMLVNRILKNGKKSLAYRILYKAMKNI
|
||||
KQKTKKNPLFVLRQAVRKVTPNVTVKARRIDGSTYQVPLEIKSTQGKALA
|
||||
IRWLLGASRKRSGQNMAFKLSYELIDAARDNGIAIRKKEETHKMAEANRA
|
||||
FAHFR
|
||||
>NC_001320@OrsajCp076@rps7@87944@88414@R@1@157 ribosomal_protein_S7
|
||||
MSRRGTAEKRTAKSDPIFRNRLVNMVVNRIMKDGKKSLAYQILYRAVKKI
|
||||
QQKTETNPLLVLRQAIRRVTPNIGVKTRRNKKGSTRKVPIEIGSKQGRAL
|
||||
AIRWLLEASQKRPGRNMAFKLSSELVDAAKGGGGAIRKKEATHRMAEANR
|
||||
ALAHFR
|
||||
>NC_001320@OrsajCp103@rps7@126704@127174@D@1@157 ribosomal_protein_S7
|
||||
MSRRGTAEKRTAKSDPIFRNRLVNMVVNRIMKDGKKSLAYQILYRAVKKI
|
||||
QQKTETNPLLVLRQAIRRVTPNIGVKTRRNKKGSTRKVPIEIGSKQGRAL
|
||||
AIRWLLEASQKRPGRNMAFKLSSELVDAAKGGGGAIRKKEATHRMAEANR
|
||||
ALAHFR
|
353
detectors/cds/test/test.db/ycf1.fst
Normal file
353
detectors/cds/test/test.db/ycf1.fst
Normal file
@ -0,0 +1,353 @@
|
||||
>AC_000188@LyesCp019@ycf1@125297@130972@R@1@1892 ycf1_protein
|
||||
MIFQSFLLGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRALVM
|
||||
EEGTEKKVSATTGFITGQLMMFISIYYAPLHLALGRPHTITVLALPYLLF
|
||||
HFFWNNHKHFFDYGSTTRNSMRNLSIQCVFLNNLIFQLFNHFILPSSMLA
|
||||
RLVNIYLFRCNNKILFVTSGFVGWLIGHILFMKWLGLVLVWIRQNHSIRS
|
||||
NKYIRSNKYLVLELRNSMARIFSILLFITCVYYLGRIPSPILTKKLKEAS
|
||||
KTEERVESEEERDVEIETASEMKGTKQEQEGSTEEDPYPSPSLFSEEGWD
|
||||
PDKIDETEEIRVNGKDKIKDKFHSHLTETGYNNINTSNSPIYDYQDSYLN
|
||||
NNNTGNLENCKLQLLDKKNENQEQDLFWFQKPLVSLLFDYNRWNRPFRYI
|
||||
KNNRFEQAVRTEMSQYFFDTCKSDGKQKISFTYPPSLSTFWKMIKRKIPL
|
||||
LSLQKTLPNELDTQWVSTNKEKSNNLNKEFLNRLEILDKESLSLDILETR
|
||||
TRFCNDDTKKEYVPKMYDPLLNGLYRGTIKKGVSSSIINNTLLENWEKRV
|
||||
RLNRIHTIFLPNIDYQEFEQKAYTIDKKPLSTEIDEFLTLINELGNEAKS
|
||||
SLNLKGLSLFSDQEQRRANSEKRTKFVKFVFNALDPNETKSGKKSIGIKE
|
||||
ISKKVPRWSHKLITELDQQMGEFKDRASMDHQLRSRKAKRVVIFTDNKAT
|
||||
KDAEEEVALISYSQQSDFRRGIITGSMRAQRRKTFISKLFQANVHSPLFV
|
||||
DRITPLRLFSFDISELIKPILKNWTDKEGEFKILESREEQTKREEKKEKD
|
||||
KKEDNKRKEQARIAIEEAWDTIPLAQIIRGYMLITQSILRKYILLPALII
|
||||
AKNIGRMLFLQLPEWSEDLQEWNREMQIKCTYNGVQLSETEFPKNWLRDG
|
||||
IQIKILFPFCLKPWHISKLYPSRRELMKKQKQKDDFCFLTVWGMEAELPF
|
||||
GSPRKRPSFFEPIFKELEKKIGKFKKKYFLTLKILKGKTKLFRKVSKETT
|
||||
KLFIKSIGFLKKIKKELSKVNLIVLFRFKEISESNETKKEKDYLISNQII
|
||||
NESFRQIESGNWPNSSLIETKMKDLTNRTSTIKNKIERITKEKKKVTPEI
|
||||
DINPNKTNNIKKFESPKKIFQILKSRNTRVIWKFHYFLKLFIQRLYINLF
|
||||
LSIINIPRITTQLFLKSTNKLIEKFISNNEINQEKINNKKKIHFMFISTI
|
||||
KKSLYNISKKNSHILCDLSYLSQAYVFYKLSQTQVINFSKFRSVLQYNTT
|
||||
SCFLKTKIKDYFKTLGIFHSELKHKKLQSYRINQWKNWLRWHYQYDLSQI
|
||||
RWSRLMPKKWRTRVNQSCMAQNKNRNLNKWNSYEKDQLLHYKKENDSELY
|
||||
SLSNEKDNFKKCYGYGLLAYKSINYENKSDSFFSRLPFEVQVKKNLEISY
|
||||
NSNTSKHNFVDMPGNLHINNYLRKGNILDRERNLDRKYFDWKIIHFSLRQ
|
||||
KGDIEAWVKIDTNSNPNTKIGINNYQIIDKIEKKGVFYLTTHQNPEKTQK
|
||||
NSKKFFFDWMGMNEKIFNRPILNLEFWFFPEFVLLYNVYKIKPWIIPSKF
|
||||
LLFNLNTNKNVSQNKNQNFFLPSNKKIKIKNRSQEAKEPPSQRERGSDIE
|
||||
NKGNLSPVFSKHQTDLEKDYVESDTKKGKNKKQYKSNTEAELDLFLKRYL
|
||||
LFQLRWNGALNQRMFENIKVYCLLLRLINPTKITISSIQRREMSLDIMLI
|
||||
QANLPLTDLMKKGVLIIEPIRLSVKDNGQFIMYQTIGISLIHKSKHQTNQ
|
||||
RYREQRYVDKKNFDEFILQPQTQRINTEKTHFGLLVPENILWSRRRRELR
|
||||
IRSFFNSWNWNVVDRNSVFCNETNVKNWSQFLGERKPLYKDKNELIKFKF
|
||||
FFWPNYRLEDLACMNRYWFDTNNGSRFSILRIHMYPRLKIN
|
||||
>NC_000932@ArthCp070@ycf1@109405@110436@D@1@344 hypothetical_protein
|
||||
MMVFQSFILGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRARV
|
||||
MDEGEEGTEKKVSATTGFIAGQLMMFISIYYAPLHLALGRPHTITVLALP
|
||||
YLLFHFFWNNHKHFFDYGSTTRNEMRNLRIQCVFLNNLIFQLFNHFILPS
|
||||
SMLARLVNIYMFRCNNKMLFVTSSFVGWLIGHILFMKWVGLVLVWIQQNN
|
||||
SIRSNVVIRSNKYKFLVSELRNSMARIFSILLFITCVYYLGRIPSPIFTK
|
||||
KLKGTSETGGTKQDQEVSTEEAPFPSLFSEEGEDLDKIDEMEEIRVNGKD
|
||||
KINKDDEFHVRTYYNYKTVSENLYGNKENSNLEFFKIKKKEDH
|
||||
>NC_000932@Arthcp087@ycf1@123884@129244@R@1@1787 Ycf1
|
||||
MMVFQSFILGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRARV
|
||||
MDEGEEGTEKKVSATTGFIAGQLMMFISIYYAPLHLALGRPHTITVLALP
|
||||
YLLFHFFWNNHKHFFDYGSTTRNEMRNLRIQCVFLNNLIFQLFNHFILPS
|
||||
SMLARLVNIYMFRCNNKMLFVTSSFVGWLIGHILFMKWVGLVLVWIQQNN
|
||||
SIRSNVVIRSNKYKFLVSELRNSMARIFSILLFITCVYYLGRIPSPIFTK
|
||||
KLKGTSETGGTKQDQEVSTEEAPFPSLFSEEGEDLDKIDEMEEIRVNGKD
|
||||
KINKDDEFHVRTYYNYKTVSENLYGNKENSNLEFFKIKKKEDHFLWFEKP
|
||||
FVTLVFDYKRWNRPNRYIKNDKIENIVRNEMSQYFFYTCQSDGKERISFT
|
||||
YPPNLSTFFEMIQKRIPSFTKEKKTFDQVSTYWSLIHEEKRENLKKEFLN
|
||||
RIEALDKEWSVENILEKTTRFCYNEAKKEYLPKIYDPFLHGISRGRIKKL
|
||||
PPFQIITETYRKNNLGGSWINKIHGLLLKINYKKFEQTIEKFNRKSLSIE
|
||||
KKLSFFSEPQQEEKINSEEEIKTFKFLFDIVRTDSNDQTLIKNFMDFPEI
|
||||
NKKVPRWSYKLISELEELEGENEENVPMEPGIRSRKAKRVVVFTDKEPHG
|
||||
EIYTNLKDNQNSDQNDEMALIRYSQQSDFRREIIKGSMRSQRRKTVIWEF
|
||||
FQAKVHSPLFFDRIDKLFFFSFDIWGLKKKIIKNFIWKKKIDKKEEEQSK
|
||||
REETRRIEIAETWDSFLFAQIIRGSLLVTQSILRKYIILPLLIIIKNSVR
|
||||
MLLFQFPEWSQDLKDWKREMHVKCTYNGVQLSETEFPRNWLTDGIQIKIL
|
||||
FPFYLKPWHKSKFQASQKARLKKTKDKGEKNDFCFLTVWGMETELPFGSA
|
||||
QRKPSFFEPISKELKKRIKKLKKKSFVVLKIFKERAPIFLKVAKETKNWI
|
||||
LKNFIFIKGISKRNLIPLFGPREIYELNEPKKDSIISNQMIHELSVQNKS
|
||||
LEWTNSSLSEKKIKNLIDRKKTIRNQIEEISKEKQNLTNSCTKLRYDSKI
|
||||
IESSKKIWQTFKRKNTRLIRKSIFFFKFCIEQMSIAIFLGIINIPRITTQ
|
||||
LFFESTKKILDKYIYKNEENGEKKKNTLYFISTIKNLISNKKKMSYDLCS
|
||||
LSQAYVFYKLSQIKVSNFCKLKAVLEYNICITSFFVKNKIKVFFQEHGIF
|
||||
HYELKNKTFLNSEVNQWKNWLRSQYQYNLPQISWARLVTQNWKNKINKDS
|
||||
LVLNPSLTKEDSYEKKKFDNYKKQKFFEADSLLNPKHNVKKDSIYNLFCY
|
||||
KSIHSTEKNFDMSIGIALDNCLVSSFLEKYNIRGMGEIRHRKYLDWRILN
|
||||
FWFTKKVTIEPWVDTKSKKKYINTKVQNYQKIDKITQTDLANKKRNFFDW
|
||||
MGMNEEILNQRITNFEFFFFPEFFLFSSTYKMKPWVIPIKLLLLNFNENI
|
||||
NVNKKIIRKKKGFIPSNEKESLRFYNLNKEEKESAGQVELESDKETKRNP
|
||||
EAARLNQEKNIEENFAESTIKKRKNKKQYKSNTEAELDLFLTRYSRFQLR
|
||||
WNCFFNQKILNNVKVYCLLVRLNNPNEIAVSSIERGEMSLDILMIEKNFT
|
||||
FAKLMKKGILIIEPVRLSVQNDGQLIIYRTIGISLVHKNKHKISKRYKKK
|
||||
SYINKKFFEKSITKYQNKTVNKKKNNYDFFVPEKILSPKRRREFRILICF
|
||||
NLKKKNARDTNSRFDKNIQNLTTVLHKKKDLDLDKDKNNLINLKSFLWPN
|
||||
FKLEDLACMNRYWFNTTNGNHFSMIRIRMYTRFPIP
|
||||
>NC_001879@NitaCp151@ycf1@125891@131599@R@1@1903 Ycf1
|
||||
MMIFQSFLLGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRALV
|
||||
MEEGTEKKVSATTGFITGQLMMFISIYYAPLHLALGRPHTITVLALPYLL
|
||||
FHFFWNNHKHFFDYGSTTRNSMRNLSIQCVFLNNLIFQLFNHFILPSSML
|
||||
ARLVNIYLFRCNSKILFVTSGFVGWLIGHILFMKWLGLVLVWIRQNHSIR
|
||||
SNKYIRSNKYLVLELRNSMARIFSILLFITCVYYLGRIPSPILTKKLKEA
|
||||
SKTEERVESEEERDVEIETASEMKGTKQEQEGSTEEDPYPSPSLFSEERW
|
||||
DPDKIDETEEIRVNGKDKIKDKFHSHLTETGYNNINTSNSPIYDYEDSYL
|
||||
NNNNTGNTEIFKLQLLDKKNENKDLFWFQQPLVSLLFDYNRWNRPFRYIK
|
||||
NNRFEQAIRTEMSQYFFNTCKSDGKQRISFTYPPSLSTFWKMIKRRIPLL
|
||||
SLQKTLPNELDNQWISTNKEKSNNLNKEFLNRLEVLDKESFSLDILETRT
|
||||
RLCNDDTKKEYVPKMYDPLLNGPYRGTIKKKFSPSIINNTSLENLKERVR
|
||||
INRIHTIFLPNTDYQELEQKVDTVAKKPLSTEIDEFLTLINEFGNEPKSS
|
||||
LNLKDLSLFSDQEQGRVNSEKRTKFVKFVFNAIAPNGTTSEKKSIGIKEI
|
||||
SKKIPRWSHKLITELEQQSGDYQEGVPLDHQIRSRKAKRVVIFTANNQNN
|
||||
DPDTKDTDTADQDQTKEVALIRYSQQPDFRRGIIKGSMRAQRRKTVIWKL
|
||||
FQANVHSPLFLDRITPPFLFSFDISGLIKPIFRNWSGKEGEFKILESREE
|
||||
QTKREEKKEKDKKGENKRKEKARIEIAEAWDTIPFAQIIRGYMLITQSIL
|
||||
RKYIVLPSLIIAKNLGRMLVLQLPEWSEDLQEWNREMHIKCTYNGVQLSE
|
||||
TEFPKNWLKDGIQIKILFPFCLKPWHISKLYSSRGELMKKKKQKDDFCFL
|
||||
TVWGMEAELPFGSPRKRPSFFEPIFKELEKKIGKFKKKYFITLKVFKGKI
|
||||
KLFRRISKETKKWLIKSSLFIKKMKKELSKVNPIVLFRLKEIDESNETKK
|
||||
EKDSLMSNQIINESFSQIESGNWPNSSLIESKMKDLTDRTSTIKNQIERI
|
||||
TKEKKKVTPEIDISPNKTNNIKKFESPKKIFQILKRRNTRLIWKFHYFLK
|
||||
LFIQRLYIDLFLSIINIPRINTQLFLESTNKLIDKYISNNEINQEKINNQ
|
||||
KKIHFISTIKKSLYNISKKNSHIFFDLSYLSQAYVFYKLSQPQVINLSKL
|
||||
RSVLQYNRTSFFLKTKIKDYFRTLGIFHSELKHKKLQSYRINQWKNWLRR
|
||||
HYQYDLSQIRWSRLMPQKWRNRVNQGCMAQNRNLNKWNSYEKDQLIHYKK
|
||||
ENDSELYSLANQKDNFQKCYRYDLLAYKSINYEKKNDSFISRLPFQVNKN
|
||||
LEISSNSNTSKHNLFDMLGNLHINNYLRKGNILYIERNLDRKYFDWKIIH
|
||||
FSLRQKEDIEAWVKIDTNSNPNTKIGINNYQIIDKIDKKGFFYLTIHQNP
|
||||
ENNQKNSKKAFFDWMGMNEKILNRPILNLEFWFFPEFVPLYNVYKIKPWI
|
||||
IPSKLLLLNLNTNENVSQNKNINKNQKQNFFLRSNKKIKNRIQEAKEPAS
|
||||
QGEKERGSDIENKGNLGPVLSKHQNALKKDYAESDTKKGKKKKQYKSNTE
|
||||
AELDLFLKRYLLFQLRWNDALNQRMIENIKVYCLLLRLINPSKIAISSIQ
|
||||
RREMSLDIMLIQKNLTLTELMKKGILIIEPIRLSVKNNGQFIMYQTIGIS
|
||||
LVHKSKHQTNQRYPEQRYVDKKNFDEFILQPQTQRINTDKNHFDLLVPEN
|
||||
ILWSRRRRELRIRSLFNSLNWNGIDRNSVFCNENNVKNWSQFLDERKPLY
|
||||
KEKNELIKLKFFLWPNYRLEDLACMNRYWFDTNNGSRFSILRIHMYPQLK
|
||||
IN
|
||||
>NC_002202@SpolCp093@ycf1@121596@127097@R@1@1834 ycf1_protein
|
||||
MIFQSFLLGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRAQVM
|
||||
EEGEEGTEKKVSGTTGFIMGQLMMFISIYYTPLHLALGRPHTITVLALPY
|
||||
LLFHFFWNNHKHFFDYGSTSRNSMRNLSIQCVFLNNLIFQLFNYFILPSS
|
||||
MLARLVNIYMFRCNNKMLFVTSSFVGWLIGHILFMKWVGLVLVWIQQNNS
|
||||
IRSNKYLVSELRNSMARIFSILFFITCVYYLGRMPSPIFTNKLKQMLETN
|
||||
EIEEETNLEIEKTSETKETKQEEEGFTEEDPSPSLFSEEKEDPDKIDETE
|
||||
KIRVNGKDKTKDEFHLKEACYKNSPTSYSGNQDISKLEILKKEKKILFWF
|
||||
QKPLIFLLFDYKRWNRPMRYIKNNRFENAVRNEMSQYFFYTCQNDGKQRI
|
||||
SFTYPPSLSIFWEMIQRKISLATTEKFLYDDELYNYWIYTNEQKKNSLSN
|
||||
EFANRITVLDKGLFYIDVLDKKTRLCKSKNEYLQKDHDPLLNGSYRGIIK
|
||||
KTLLPFINNDETTVKKLIDEIFINKIHSVLGNCNNYQEFEYKKDPFKKNP
|
||||
ISSKIRHFVTLMSQFDGESTFNQKGISLLSEHKQICSEDPEIFFKFLVDT
|
||||
IIADSFTQTIPKESIGIKEISKKVPHWSYQLIDESEQEEMENEKQVSWPH
|
||||
QIRSRSGKEVVFFTDKQENTDNPTPNTADISEQADEVVLTRYPQESDFRR
|
||||
DIIKGSMRSQRRKIVIWELFQANIHSPLFLDRTNKSSFFSITFSRLIKRI
|
||||
FKNYMGKNPELDISNYKEEELKKKEKAKEHKKDKEKKQEQIRLDIAETWD
|
||||
TIPGAQIIRSLILLTQSILRKYILLPLLITGKNIGRILLFQLPEWSDDFK
|
||||
EWTSEMHIKCTYNGVQLSEKEFPKNWLTDGMQIKILSPFCLKPWHKSMIR
|
||||
PYHQDKKKKEQNQIDAFCFLTVVGLETDIPFGPPRKRPSFFQPIFKQLDK
|
||||
KIEKLIKGNFQVRKRLKEKILFFLKLQNETNNWIIEIFPFFKKIIRKMST
|
||||
VNTIGVFGLKEASSEIKSEKDSRIKNHMIHESSVQIRFLNQTNSSVTEKK
|
||||
MKDLANRTRIIKNKIEKISNDKLKMSPKKTRYGTKNLGQILKRRNARLIR
|
||||
NSNYILKFFRERIYGDIFLYIINIPKINTQLFLESTKNGIDKSIYNNESI
|
||||
TKTNKNRIQFISTINKKFLPFLSTSKNNSKIISDFSFLSQAYVFYKLSQA
|
||||
KILNLYKLRLVLQYRGISLFLKNEIKDFFGTQGITNSELKTKKLPNSGMN
|
||||
QWKNWLKLKNNYQYNLSQLKWSRLVPQKWRNRVTEHCEVENTNLYQNEEL
|
||||
INSKKHLLLLPDQKYNFQKNYRYDVLSYKFFNYKNKNDSYRYSYGLPFQV
|
||||
NKNQEFSYTYNYNINNNKFIDMWWNIPISNFSYLEKTKIMDIDKNIDRKY
|
||||
LDFKILDFSLRNKIDIEDWIDISTSINENTKTEPRNYQIVEKINKKSLVY
|
||||
STIYQEIKQSDQKNKLFDWMGMNEKILSRPISNLEFWFFSEFFSFYNAYK
|
||||
MKPWVIPINLLFSNSNVSEKFSKNKSINRKKKTNPFIPSNEKKSFELENR
|
||||
NQDEKELVSKEDLGSYVQENYEKDIEEDYISFIDIKKPIKQKQPKSVIEA
|
||||
EFDLFLKRYLLFQLKWADSLNEKLMDNIQVYCLVLRLINPIEILISSIER
|
||||
KELSMDIMLDRKDFNCPNWKQKRVLIIEPIRLSIRGDGQFLLYQTIGISL
|
||||
VHKSKHQNNQKRYSENVDKKFLGERNKNNFDLLAPENLLSPRRRRELRIL
|
||||
LCLNSRNNNGVNTNPMENRVKNCNQFFDEKKDLDRDKNTLRNLKFFLWPN
|
||||
YRLEDLACMNRFWFDTNNGSRFSILRIHMYPQF
|
||||
>NC_002693@OeelhCp105@ycf1@129224@136615@R@1@2464 Ycf1
|
||||
MVNLVYVCMKINNSVVMVGLYYGFISAFSIGSSYLFLLRPRFLNDDPDAI
|
||||
EKKASETAGFFTGQLLIFISILYGPLHLALGRPHTILLLLAPYFFFHYLF
|
||||
SNSGQWPSQRFAFPLLTKSMRNRRFQLVFLNNLLFQLFSLSLLGRPMLTR
|
||||
LSYIYIFRCNNKMLFVLSSFVGWLIGHILVLKWAGLVFVWLLQVIRSKTM
|
||||
KYITCNVLIPATKYIIEKWRNSFVAGLIREILAMKQVESALVRIKNSKLL
|
||||
DDARWWIRGSSLISGLKINIRFYARLILRGFENVYVGAKFRQDMEHLFSI
|
||||
ILFAIFLLYLDQTPLLYADPADKKLQLQRKLSNETQAARAEKKLEERLTK
|
||||
KFEAQRRAQRAAQRQALQEFKQGVVESYLAKQVAKDANQIQAQKDEKQIQ
|
||||
AEQKARRIRAEQVVQYTFWLIEAQRREMEIEAARAMQEAYKGMLAAQEGY
|
||||
VEEGVQEKQEGFPEELISPSPIFHSEEREENPKLLILKEKISILKKKISI
|
||||
LKKKISILKEKNDLFSFEIPIITSLFDPQKPLRPLRYIKTCAGVEKAVKN
|
||||
EMSQYFFYACRSDGKQRICFTYPPSLATFWEMIQRKMASRFPRIYAKAKW
|
||||
RALRWSAPGSYRQWISRNKKKKNSLSTEFQNRIKTLDKKKSLLNVLARRK
|
||||
RSSLLNVLARRKRSSLQNVLETRKRLCNYKTNKTKKEYLPEKEYLPEIAD
|
||||
PFLTGALRGKSDPEVDDGGRKTSDLIKVVFLKNNITMATLRNKNDDDLRE
|
||||
QKNAIALLSRMKNPVNKLHLLFVNERDYPFVKTLVNRINGPAVPKKKKKI
|
||||
SKSKQKNVKSKQKNVKSKQKNVKSKQKNVKSKQNEIKRKVNEIKRKVNEI
|
||||
KRKQNESYPRGVKFGATPKTEINPHGIRFDAATIEKYSFATGYSYSPPSF
|
||||
DDILFHAFVTEPQRNKKAVIELEEEINKKVPRWSYQLIDELEQLEGAEGE
|
||||
TQFSDHEIRILPFKRVAVFTEKDSKKRKPLIDEQGNFVRHRKTYAIRFLG
|
||||
HMSDFRRGLIKGSARQDRRKAYVCRTTQVNARSPLFALGPRTFLDGLVNL
|
||||
AVQVKFFYETRIKGEKIVDDDDDNEKDEFKVMIPDTKSIVAETREMLKQA
|
||||
GAEDGQSYEDVEDDIRIENVTEMWENIDYGQVIRTFILLLHIFLRKKVVF
|
||||
PAFIIGKNIARMLLLQATEWKIDFARLKRERYAICTYNGMKVSEKIAFDQ
|
||||
FPPDWADDGIQILVTNPFYLKPWYRSKTRSIQKDPKKEKDPKKEKGPKKE
|
||||
PWYRFKTRFIQKDPKKEKGPKKEKGPKKEPWYRRFFFQKDPKKEKGPKKG
|
||||
KAQFEGDRGVRFLTSFGILTDRPFGDLITPDWGVFFNPIRNELKKKIRQF
|
||||
EKKHSIILSKRFRNVLKKTKKWFIKSFLFLKRARLKRHPIELSGGRETPE
|
||||
FTRSQKDIDNLKNEQDFRMSRNPRISESLLQGPVRALKDDSLPEEKVADP
|
||||
EKEPSDLDNELRAVWDEIDKVTKERKKIVFTPKPDSPDKLVQAKKNILKK
|
||||
LERIKSRRHKFYFLRIRKSYYVLLFFIKRISRNIKRIYLNPLERAISIRK
|
||||
IHPQRFFEFSKKMIEKSIGIGKTETNKETVYKTKKKKKKKNPFISIFKES
|
||||
LYDKDIRISENDIKLGDTWNGYKYKRKKATDTSDLASMSQAYVFYKLYQT
|
||||
QQTQLIHLDKLRYVLQYDGTSRFLKKELKDYFEAQELFHSKLKHKNSLNS
|
||||
GKNQWKNWLKAQHQYSVSPIIWNSLSPQKWRTKVNQERMDENTDLNKRYS
|
||||
NEKRKQFFEANSLDDEENVVETYLGQRAGDIKNSIKSYSYDLFSYQSINS
|
||||
EDKYVCINNKQKNSYNYNRRKVNLVDSPEGIALSNQFLVQNDLLDLYTFP
|
||||
DRKYVPWRLFPGSLIGGNDKDKDRFVKMWTATNSGNAVKYWTAANGNTSI
|
||||
KPGVFWTFQNSQRTKKQNPLFDWRGMNTELPNRCISDLKGWFFFSELLKL
|
||||
DLRYQVKPWILSKNLLFENLIFENQEENPNLIQNPIEDGRKNVIQNENEN
|
||||
DPIEDGRQNVIQNENENAIQNLIDFFLEKKNSPKDTNQELHAQAKARIWD
|
||||
ALVASLKQKREQKERKNKRIAQLIEKKKQKEIEKQKRKIEKQKRKKEKIE
|
||||
NAKKKIENEKKKIETEEEKIEKEKRKKERKKEKLKKKVAKNIEKLKNKVA
|
||||
KNVAKNIEKLKKQRAKNIARMEEEDKKARKKRKRKVQVQENKIPYTAFGS
|
||||
DKWQRPIAEYPKSGDIRNFQVILPEDDDEDDEEDRLDELKLNAYELSRIQ
|
||||
KITDEKRMKRNLLSSIKRERLKMEFSTRNNSLATIMLTHGIFSIEPLRIS
|
||||
RQNQDASFLIYQLIKISLVEQLDPYDHNDSFELTEKYRARRNFFMPKTNA
|
||||
ETMHKSDSDLFVPETILSTKRRRELRILISFYSRRGKRKNRIYKNPVFWK
|
||||
YVKNCGEVVDNSEKKKKKLIKSFLWPNYRLEDLACMNRYWFNAQNGSRFS
|
||||
MLRIRMYPRLKIR
|
||||
>NC_002694@LocoCp080@ycf1@120497@125878@R@1@1794 hypothetical_protein
|
||||
MIFQSFILDNLVSLCLKIINSVIVVGLYYGFMTTFSTGPSYLFLLRAHVM
|
||||
EEGTEKKISATTGFITGQLVMFISIYYAPLHIALDRPHTITVITLPYLLL
|
||||
YFLGNNQKNFLNYVYKNQNSIRHFSIQRIFFQNLFFQLLNPFFLPSSILM
|
||||
RLANIYIFQSNNKVLFLTSSFVGWLIGHVFFMKWIGLMLVWIQEKNNSIK
|
||||
STVAIRSNKGVLAKFRKSMFQIFLIFFFITCLYYLGRIPPIYFFTPKMSE
|
||||
IKERGEIEKREGEIDIEINSQRAGSKQEQKITAEEKLSPYLFSKKNNNLD
|
||||
KIKEENDIFGFQKPLVTILFDYNRWNRPLRYIKNDRFENVVRNEISQFFF
|
||||
FTCQSDGKERISFTYPPNLSTFQKMMEMKISLFTRDIISYEELSNSWRST
|
||||
NEEKKKKLTNEFLNRVEVLDKESLPVDIFENRIRLCNDEKKQKYLTKEYD
|
||||
PFLNGPCRGQIQKWFSPPIQKETYKKNSLFINKIHGILFSNTNNYPKFEQ
|
||||
KKNIFDRKSLLTDINFFFNLITKFSRKSVSSLNFEGLYLFPKDNKGKMSS
|
||||
KKKKFLFDTIRPDLNDNKIVNLQKCIGINEIVKKLPRWSYNLIDELEQLE
|
||||
GKKKVEYHQIRSRKAKRVVLLTKNSQNDDNYDETTDTDNTEKKKELALIR
|
||||
YSQQPDFRRDIIKGSIRAQRRKTVTCKLFQRSVDSPLFLEKMEKTSFFCF
|
||||
DILDSSKIFFMFKNWIRKKKELKNSDYTDEKAKESQKKEEEKIKKNEKEE
|
||||
KRRIEIGEAWDSIIFAQVIRGCLLITQSILRKYILLPSLIITKNIVRILL
|
||||
FQFPEWSEDFRDWQREMYIKCTYNGVQLSETEFPKKWLTDGIQIKILFPF
|
||||
RLKPWHRSKLRFTEKKKDPLKNKKVKKKNFCFLTIFGMEVELPFSGYPRN
|
||||
RFSFFDPILKELKKKMKKLKNNFFLILKIVNERTKNFITTLKETSKRIIQ
|
||||
SILKKVLFLNKKIKKLYNYLFLFRFKKIDELNQNKKNFPITKNNPIIYES
|
||||
TILIQAINKTNCSLTEKKIKAINAKTKKIIKKIERMTKENKGGFLISEIN
|
||||
SNSKKTSSNTKGLELEKKILQILQRRNVQLTHKLYSFFKFLLNFMKKVYT
|
||||
DIFLCIVSVPRINVQFFLESTKKIINQSIYNKKTNEEIIDKTNQSIIHFI
|
||||
SIINKSSNTKNTNSAANSYEVSALSQAYVFFKISQIQVLNVYKYKFKYVF
|
||||
DYDGRSFFIKDEIKDYFFGIQGIIHSKLRHKNSPVSLKNQWTNWLKVHYQ
|
||||
YDLSQNRWSRLVQKNLKNRINKHRLDQNKDLTKCDSYKKTQLIVSKNKKQ
|
||||
QVDFLVNLLIQKKIKKQSRYDLLLYKFINYAEKKELSIYGYRSPFQANKK
|
||||
RAISYDYNTQKKEFFDRMDDISIKNYIAEDAIRYIEQNRDRKYFDWVVMD
|
||||
VKIQNNSISNLQFSFFFKFLRFYDAYRNKPWIIPIKFLFLHFSVNQNFNK
|
||||
IKNIIEKKRRIDIFKPWKKKKILEVELETPNRAKKEYTSRVDLNKPSLSN
|
||||
QEKDIEEDYGESDSKKGGKDKNKKKYKNKIEAEVNLLLRKYLNFHLNWKG
|
||||
SLNKRVINNVKVYCLLIRLKNIKQIAISSIQRGELSLDIMMIQNEKDSTL
|
||||
TGFRKKKEFIEKGIFIIEPVRLSRKNNEQFFMYETARLLLIHKSKRQINQ
|
||||
RNPEKSDLDKQIFYKNIPPKRDQRITQNKEKKHYALVVIENILSARRRRE
|
||||
LRILICFNPRSINSMPRKTIFDNENKINNCCQVFAKNKDLDKEKKILMNL
|
||||
KLILWPNYRLEDLACINRYWFDTYNGSRFSIVRIHMYPRLKMR
|
||||
>NC_003119@MetrCp012@ycf1@13390@18672@R@1@1761 hypothetical_chloroplast_RF1
|
||||
MIYQLFILDRLVGLWLKILNSAIVMGLYYGFLTTFSIGPSYLFLIRARVM
|
||||
DKGTETEIAATTGFITGQLMMFISIYYAPLHLALIRPHTITVLTLPYLFF
|
||||
NFVYKNNKHYYSADSHFYLDLDYGYKNPNSIRKFRIYKVFFNNLFFQLSN
|
||||
PLLFPSSILLRLMNIYLFRSNNKLLFLTSSFLGWLIGHIFLMKCIGLILL
|
||||
VWSKQKNSIKSKLTMRFDKYILLQLRNYVGQIFVVFSFVIVVHYLGRTPV
|
||||
PYLYTYTDEILEYDEKQKDEINGETEIDVEIDSEQEQNGSIEDEEDILSY
|
||||
LFPKKDKTLENIEQDNNLLALEKPLVTTLFDYRKWNRPLRYIKNDHFERV
|
||||
VRDENSQFFFHICQSDGKERISFTYPPDLSSFLKIMEKKMDLFTKDKISY
|
||||
NDNELSNYWSSNNKEKRKKLSNEFFKRAKVLDKKYKKYKKFIPVDVFENR
|
||||
IRLSNDKRKIKYLTKIYDPFLNGPFRGQSFSPSIQNETYTTNSILINKIH
|
||||
GLLLINSNYPEFDNSNYPEFDNSNYPEFEQKIDQFDRKFLLTEIGFFFNL
|
||||
ISQFSEKSVSSFNFDGLYLFPEHEQVKIYSEEKKRKKKFLFEAIRTDQNN
|
||||
QTIFNRKKCTGINEISKQVPRWSYELIDELEQMTERLTKEFQIRSAKAER
|
||||
MVIFNGNTDSLTLNIGPRNDNDAIPEVDLNHEFFLVNFLREPDFDRDIIK
|
||||
GSMRPLRRKIATTKLSQGNAQPHSPIFLEMIDPLYFIFGDLFDDLSQIFK
|
||||
EMFRKPGTDNSEFVEFQERLEHKYEEDAKDDAEIRRLKIEEDWESILYGL
|
||||
IIRSFVLLIQSFFRKYILLPSLIITKNIIRILLFQNPEWSEDFRDWSREV
|
||||
HIKCTYQGIPVSDKELPKNWFDEGIQIRILNPFVLKAWHKSKVQSTEKKK
|
||||
KKRSTEKKYTENKNFWFLTGYGTLVESYLDEGFPRDPLSIFGPVLKTIRK
|
||||
QLKKDLKKHFFLVLKFLNERKKWFPTMLKKIENWNIKRILKSILFRFKII
|
||||
DELSESKKTSTISKNNSKIEVIEVIEESPVKMESINWTNSSFTEKRIKDL
|
||||
NVKTKTIIKQIETMTEEKKEGILTSEINLNSNKTTYDAKRLELQKNNLQI
|
||||
LQRRFVRLIRKSYSFFKIFIEGVYIDILLCISSIARIHRQRFLDFLESTD
|
||||
KILNVKKPIYDKKKKMEEMEERFENLSVSRLISILEKSENITNMNSQNSW
|
||||
DVSSLSSLSQEYVFYKLSQIQFSNGSKFKIRSILESPGRSFFLKNEIKDY
|
||||
FFRMQGTYNSKLRHKKRSDSLMNPWTNWFKVLYQYDLPEKRWSRLVSQNW
|
||||
RNRINEHRVAQNKDLVEYDSYEKNQLIWKELILSKKQEQEGDLLKIEIKN
|
||||
KIKKQYRYDLFSYQYLNFANKKKSSIYGYRSPNKNQAISYNYNISIQNYL
|
||||
EEYDILDMEKNLEKNLDRKYFNWMGMNVKRKKTSRPKDKFLIPGFWFFSK
|
||||
LSKLYCAYKMNPWILPIKFFVLQLDNLELTTEEYVNTVDEDLKSVSYYYK
|
||||
GSDSKYRTDLKGERDFLLSKYLGFYLHCDSSDEEIGMDNTNLFCLLLRMK
|
||||
KFNKIVIMSIKKLELDIEMLVDSRTKDFCYTECRDTEDLKERLIFFIEPI
|
||||
RLPRKKHEQSLLYQTIRLPLIHKSKTRKSWSWKKKKSRVDQKITENKDKN
|
||||
LYDLFVPENLLSTRRRRELRILTCFNPRNRNTVHRKTINDNENQIKNVSQ
|
||||
VLTKNKDLDSETKKLMNFKLFLWPNYRLEDLACINRYWFNTHNGSHFSIL
|
||||
RIHMYPRLKD
|
||||
>NC_003386@PsnuCp088@ycf1@112439@117550@R@1@1704 hypothetical_protein
|
||||
MIGRLYMKKLKNLFLFLSSLCPVFPWISQISLVMPFGLYYGFLTALPIGP
|
||||
SQILSIRTFFLEGNRSGIICILGSMMGQFVILLSIYCSPLYVMLVKPHLM
|
||||
TLLVIPYMFYYWYRTKNPSRYYILHPIKSLTHAHTRNLLLDSFIFQLLNP
|
||||
ILLPNPVLTRLLNLFLFRYSSNVFFLTSSLLGWLCGHILFINSIKLLLFR
|
||||
IEHDSPIIYILMKRSISRTFSILISITFFLYLGRSPVPLITKKFADEITL
|
||||
SDQKIKENLWEESLWLYRPWPTSFFDQYRWNRPIRYIPNSKSSHNGFVKK
|
||||
QVSKFFYDECITDGKNAISFASQPSLSIFKKQLMNYLHNSDISISTKDSY
|
||||
KGWIETKREKRDALNNEFKDRIQFVYNSSTIEEAMENKTGFSHDRNHFLV
|
||||
KVNDPFLSGSSRIRIPNKKYSSSLLKLHDSKDQTMKISKKTKRKHTRNKM
|
||||
RNWIFNKHKKWQHNKFPLPWEPIPTKAEKVFWRILNESENPIILEMLTTL
|
||||
NSIKEKNYQFRITWEHIFQLPRIEKAIFLFRSKQEIEDSIFRYPSHLSLK
|
||||
NLTLFNIFTRSKNIFYSAKIAVSPILQIEEMQKELPRYNSRLRSDRIDAV
|
||||
NVDVDIRQRKIKNLGPRKGKLEDKEKEKEKAAQTQTEVKKEREKEKEERV
|
||||
IKRFQNQSDFRRKLVKGSIRARRRKTGIWRLYQSGTHSPFFLRMKEIPIS
|
||||
FQSSINALRLNKMKDERAILGIGKELRPFNLYKKRSKADRLTIAARFDFP
|
||||
IAHAGRGVLLIIQSNIRKYVILPILIICKNIGRIMLFQSPEWKEDWAEWN
|
||||
QEIHIKCTYDGIEVSHRHLPAHWFKEGLQIKILYPFHLKPWHIHRTNNIN
|
||||
DLRNEAQIQKEISDFGKQRKLSFSYLTIWGYQTSSVFGSMKKRPSFWRPI
|
||||
ANALKKKLQRNLFSKLTWISHFFYEIILLSRTFIISKKPNNIPEMSIQSN
|
||||
ELRYDVSDYELIQKYPNSNEKNDYVVMNEISIESNNRNGKEISHESQDQY
|
||||
KDNFNNIRSFNDIETLLTDISGTSVEESYRDRIETYLRLNKKNHRYAINI
|
||||
RLIWNKQLVQTQQEFSRFRRIIMQFMHKGYRLAKRFLTKFYREIFRRFTF
|
||||
SIQLSIQLVLRLTKNITKLSEKNKVYQNLNLLKKNEQNLKIDSSRNKPVL
|
||||
SQAYVFQKLWHARTRTKIDVHYLVQSLEREIVNSIENNELKASKLKDLKW
|
||||
NEHNYLNDHIKDLLEIQGLLKETQTFTEKNWKEWLHCFTRYQISSKIEYG
|
||||
IVPQKWKNEVKKRWKSNTNKLDKNKEYKTLEKENKYSLYETNNMLKQRIN
|
||||
NRNNYCEFYNLLYSFIDSTKASNIIKLPIQQKGKEDPIQYINDINKIHEN
|
||||
IHLNSKKKYKRPQFQSISTEKGDIDSNLMLWLLPNLLDTKPESVTNSLDS
|
||||
YSFEMYLSQNEDKDSLKKEIRFNAKKLNLDTKEPTSDAMKPTSDTKELIS
|
||||
DTNEPTSDIKSDDQSENQNKPLKEKSIRERKHHRPIPQVKWKSKSVEKKM
|
||||
QRINNLTSFLSVIEDRKNMENYIISFCMKMGIDIDLLNSFFTNTEDELSI
|
||||
QLLDDSAHRLPRLLNDQTLVRKMVSILLNFEKQFEEGITSKISSQSISSI
|
||||
YRTEKKYSVNSYNLEDIMLSRRYRELRILNSLILEKQYVNFDHWIDKSEK
|
||||
YPFLNLPSQVQIIKRFLWPTYRLEDLACMNRFWFNTNNGSRFAMLKLRMY
|
||||
CPD
|
||||
>NC_004115@ChglCp095@ycf1@114383@118735@R@1@1451 hypothetical_chloroplast_RF1
|
||||
MITTYSTFLFNFLSQFQYLVNIPEPLILFGLYYGFLTTLPISFSHIVVIR
|
||||
NRLIEGKTSSVMAFCGLITGQLCMIGTIYYTPLYKLFIKPHLILLLSIIY
|
||||
SFFYWQRLRNNQNYDDLREAQSLINVRNFFSFFDSFVFQILNPILLPTPI
|
||||
FFRLNNVFLFRYSNNLNFFLSFFIGSLIGNFLFFNALNWIRYRFEQDSNV
|
||||
IYPVLKLLINKSIIPIVFCICLIPIAKYSHIPFCTMKQKEGQSSYSFDKN
|
||||
WPNIIFDSNQPHRPIRIFSETKTDDNLNINDNLSKKQTSQFFFKECISDG
|
||||
NVRISYTYPSTLANFQTDLSSSFQDFSLSEQSFDNLYSNWKLEKLSRKDN
|
||||
LNNLLLTKIKLLNNKKEWFYKHFQNKFGTFIKDDNNYNKFVKKSNDVRLK
|
||||
QSSKIQIKKSKLLTSDIRDISTTQSGFYDLKKNKLKSFISQKFKMNSNNS
|
||||
TLPVWNHLNKQLLQNELKRIKKQLQDKTKNIKENDFNNLKLLKSNIETID
|
||||
NTINDIHHNKIKQITSVDLIKIFATNNKTLLLETLAFNKKITQKDNFNFN
|
||||
KLFQHKNKKFTTNSGNENTYLNLNDIFKNIKRLPKWRTFSKHVVYDEVSD
|
||||
IRRRAIKSNSKLKIANKDSDIIIFEYKKSLNFRARLPKGSLRARRKNKFT
|
||||
WKLFHNNLNSPFFIRSKQLLNKTDIPFLKYNENYLNFFKNFISPDKNINY
|
||||
LNNDISEMRRQELLFKWDKTNVHILRSMVLVGQAFFRKYIKLPIFIFFKN
|
||||
LSRQLLYQPSEWTKDWSNWMNEWYIFCYYDGTELAKDQWPEMWLQRGIQI
|
||||
KLINPFYIKPWYIQKSFIKNKQNKKTRTSYLTVFGSQQELPFGKKIRMPS
|
||||
FWKPVRREVSKSIKLKLYFPFLTLQKNTIILFEKVFNKKRINEDNKTIEK
|
||||
SILNKKNEQLILKKDEVIPNNKSIAGKLSKLDFHNQNITKTSIKNATKQI
|
||||
LIKNEYNSLLKENKNLFTKNKIVFLKIKNILNKLNLKLIKVKINFTYKIK
|
||||
TVLKIISRNLLKFYSIIQFQLENLGRNNSNDLSYKNQLSYQKDFPNFNNF
|
||||
CLNQANIIQNLCKNNILKHKKLNQNFQINSKNLNQTNIIDVNPENIKAQD
|
||||
FKNLLENIYTFTPTINLWDKLSTNNWKISVQNNWKQKSYNNYDLTKKALV
|
||||
SKNLNFISYFYQNNLINNLNKKIKHTKIFNLSKNYLSLNNLNQNQIKNFD
|
||||
FQNSLNNNITYKKNIKNFTIRQNVPSQLRRWDWKNNKIKKFVNRLLQKNT
|
||||
ILLKEEVFNLIPFFDRFTIQNPMIRNWSHPISSILDDEIFTYELLDTFLQ
|
||||
INKNIDFLHTKQIEDNLSSNSNQAIASLPLSSTTAENFLYYLTTVEDLIS
|
||||
IEDKKELKILNSLNFNKSTPNYIKTNVVEKSLNENLSKNLQSILSKETLD
|
||||
SINNTQILKKFLWASYRCEDLACMNRFWFSTNNGSRFGTLRLRLYPNLKN
|
466
detectors/cds/test/test.db/ycf2.fst
Normal file
466
detectors/cds/test/test.db/ycf2.fst
Normal file
@ -0,0 +1,466 @@
|
||||
>AC_000188@LyesCp004@ycf2@88196@95032@D@1@2279 Ycf2_protein
|
||||
MRGHQFKSWIFELREILREIKNSHHFLDSWTQFNSVGSFIHIFFHQERFL
|
||||
KLFDPRIWSILLSRNSQGSPSNRYFTIKGVILFVVAVLIYRINNRNMVER
|
||||
KNLYLIGLLPIPMNSIGPRNDTLEESVGSSNINRLIVSLLYLPKGKKISE
|
||||
SCFLNPKESTWVLPITKKCSMPESNWGSRWWRNWIGKKRDSSCKISNETV
|
||||
AGIEILFKEKDLKYLEFLFVYYMDDPIRKDHDWELFDRLSLRKSRNRINL
|
||||
NSGPLFEILVKHWISYLMSAFREKIPIEVEGFFKQQGAGSTIQSNDIEHV
|
||||
SHLFSRNKWAISLQNCAQFHMWQFRQDLFVSWGKNPPESDFLRNVSRENW
|
||||
IWLDNVWLVNKDRFFSKVQNVSSNIQYDSTRSSFVQVTDSSQLKGSSDQS
|
||||
RDHLDSISNEDSEYHTLINQREIQQRKERSILWDPSFLQTERKEIESGRF
|
||||
PKCLSGYSSMSRLFTEREKQMINHLFPEEIEEFLGNPTRSVRSFFSDRWS
|
||||
ELHLGSNPTERSTRDQKLLKKQQDLSFVPSRRSEKKEMVNIFKIITYLQN
|
||||
TVSIHPISSDPGCDMVPKDEPDMDSSNKISFLNKNPFFDLFHLFHDRNRG
|
||||
GYTLHYDFASEERFQEMADLFTLSITEPDLVYHKGFAFSIDSCGLDQKQF
|
||||
LNEARDESKKKSLLVLPPIFYEENESFSRRIRKKWVRISCGNDLEDPKPK
|
||||
IVVFASNNIMEAVTQYRLIRNLIQIQYSTYGYIRNVLNRFFLMNRSDRNF
|
||||
EYGIQRDQIGKDTLNHRTIMKYTINQYLSNLKKSQKKWFEPLILISRTER
|
||||
SMNRDPDAYRYKWSNGSKSFQEHLEQSVSKQKSRFQVVFDRLRINQYSID
|
||||
WSEVIDKKDLSKSLRFFLSKSLLFLSKLLLFLSNSLPFFCVSFGNIPIHR
|
||||
SEIYIYEELKGPNDQLCNQLLESIGLQIVHLKKLKPFLLDDHDTSQKSKF
|
||||
LINGGTISPFLFNKIPKWMIDSFHTRNNRRKSFDNPDSYFSMIFHDQDNW
|
||||
LNPVKPFHRSSLISSFYKANRLRFLNNPHHFCFYWNTRFPFSVEKARINN
|
||||
SDFTYGQFLNILFIRNKIFSLCVGKKKHAFWGRDTISPIESQVSNIFIPN
|
||||
DFPQSGDETYNLYKSFHFPSRSDPFVRRAIYSIADISGTPLTEGQIVNFE
|
||||
RTYCQPLSDMNLSDSEGKNLHQYLNFNSNMGLIHTPCSEKDLSSEKRKKW
|
||||
SLCLKKCVEKGQTYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNL
|
||||
IFLDTFSDLLPILSSSQKFVSIFPDIMHGSGISWRILQKKLCLPQWNLIS
|
||||
EISSKCLHNLLLSEEMIHRNNESPLISTHLRSPNAREFLYSILFLLLVAG
|
||||
YLVRTHLLFVSRASSELQTEFERVKSLMTPSSMIELRKLLDRYPTSEPNS
|
||||
FWLKNLFLVALEQLGDSLEEIRGSASGGNMLGPAYGVKSIRSKKKDWNIN
|
||||
LIEIIDLIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKNVNGDWIDEKI
|
||||
ESWVANSDSIDDEEREFLVQFSTLTTENRIDQILLSLTHSDHLSKNDSGY
|
||||
QMIEQPGAIYLRYLVDIHKKHLMNYEFNPSCLAERRIFLAHYQTITYSQT
|
||||
SCGENSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATNSY
|
||||
VPFITVFLNKFLDNKSKGFLLDEIDIDDSDDIDDSDNLDASDDIDRDLDT
|
||||
ELELLTRMNGLTVDMMPEIDRFYITLQFELAKAMSPCIIWIPNIHDLDVN
|
||||
ESNDLSLGLLVNHLSRDCERCSTRNILVIASTHIPQKVDPALIAPNKLNT
|
||||
CIKIRRLLIPQQRKHFFTLSYTRGFHLEKKMFHTNGFGSITMGSNARDLV
|
||||
ALTNEVLSISITQKKSIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQ
|
||||
IGRAVAQNVLLSNCPIDPISIYMKKKSCNEGDSYLYKWYFELGTSMKRLT
|
||||
ILLYLLSCSAGSVAQDLWSLSVPDEKNGITSYGLVENDSDLVHGLLEVEG
|
||||
ALVGSSRTEKDCSQFDNDRVTLLLRPEPRNPLDMMQKGSWSILDQRFLYE
|
||||
KYESEFEEGEGEGALDPQEDLFNHIVWAPRIWRPWGFLFDCIERPNELGF
|
||||
PYWSRSFRGKRIIYDEEDELQENDSGFLQSGTMQYQTRDRSQGLFRISQF
|
||||
IWDPADPLFFLFKDQPPGSVFSHRELFADEEMSKGLLTSQTDPPTSLYKR
|
||||
WFIKNTQEKHFELLINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLFLS
|
||||
NGTLLDQMPKTLLRKRWLFPDEMKIGFM
|
||||
>AC_000188@LyesCp055@ycf2@146312@153148@R@1@2279 Ycf2_protein
|
||||
MRGHQFKSWIFELREILREIKNSHHFLDSWTQFNSVGSFIHIFFHQERFL
|
||||
KLFDPRIWSILLSRNSQGSPSNRYFTIKGVILFVVAVLIYRINNRNMVER
|
||||
KNLYLIGLLPIPMNSIGPRNDTLEESVGSSNINRLIVSLLYLPKGKKISE
|
||||
SCFLNPKESTWVLPITKKCSMPESNWGSRWWRNWIGKKRDSSCKISNETV
|
||||
AGIEILFKEKDLKYLEFLFVYYMDDPIRKDHDWELFDRLSLRKSRNRINL
|
||||
NSGPLFEILVKHWISYLMSAFREKIPIEVEGFFKQQGAGSTIQSNDIEHV
|
||||
SHLFSRNKWAISLQNCAQFHMWQFRQDLFVSWGKNPPESDFLRNVSRENW
|
||||
IWLDNVWLVNKDRFFSKVQNVSSNIQYDSTRSSFVQVTDSSQLKGSSDQS
|
||||
RDHLDSISNEDSEYHTLINQREIQQRKERSILWDPSFLQTERKEIESGRF
|
||||
PKCLSGYSSMSRLFTEREKQMINHLFPEEIEEFLGNPTRSVRSFFSDRWS
|
||||
ELHLGSNPTERSTRDQKLLKKQQDLSFVPSRRSEKKEMVNIFKIITYLQN
|
||||
TVSIHPISSDPGCDMVPKDEPDMDSSNKISFLNKNPFFDLFHLFHDRNRG
|
||||
GYTLHYDFASEERFQEMADLFTLSITEPDLVYHKGFAFSIDSCGLDQKQF
|
||||
LNEARDESKKKSLLVLPPIFYEENESFSRRIRKKWVRISCGNDLEDPKPK
|
||||
IVVFASNNIMEAVTQYRLIRNLIQIQYSTYGYIRNVLNRFFLMNRSDRNF
|
||||
EYGIQRDQIGKDTLNHRTIMKYTINQYLSNLKKSQKKWFEPLILISRTER
|
||||
SMNRDPDAYRYKWSNGSKSFQEHLEQSVSKQKSRFQVVFDRLRINQYSID
|
||||
WSEVIDKKDLSKSLRFFLSKSLLFLSKLLLFLSNSLPFFCVSFGNIPIHR
|
||||
SEIYIYEELKGPNDQLCNQLLESIGLQIVHLKKLKPFLLDDHDTSQKSKF
|
||||
LINGGTISPFLFNKIPKWMIDSFHTRNNRRKSFDNPDSYFSMIFHDQDNW
|
||||
LNPVKPFHRSSLISSFYKANRLRFLNNPHHFCFYWNTRFPFSVEKARINN
|
||||
SDFTYGQFLNILFIRNKIFSLCVGKKKHAFWGRDTISPIESQVSNIFIPN
|
||||
DFPQSGDETYNLYKSFHFPSRSDPFVRRAIYSIADISGTPLTEGQIVNFE
|
||||
RTYCQPLSDMNLSDSEGKNLHQYLNFNSNMGLIHTPCSEKDLSSEKRKKW
|
||||
SLCLKKCVEKGQTYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNL
|
||||
IFLDTFSDLLPILSSSQKFVSIFPDIMHGSGISWRILQKKLCLPQWNLIS
|
||||
EISSKCLHNLLLSEEMIHRNNESPLISTHLRSPNAREFLYSILFLLLVAG
|
||||
YLVRTHLLFVSRASSELQTEFERVKSLMTPSSMIELRKLLDRYPTSEPNS
|
||||
FWLKNLFLVALEQLGDSLEEIRGSASGGNMLGPAYGVKSIRSKKKDWNIN
|
||||
LIEIIDLIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKNVNGDWIDEKI
|
||||
ESWVANSDSIDDEEREFLVQFSTLTTENRIDQILLSLTHSDHLSKNDSGY
|
||||
QMIEQPGAIYLRYLVDIHKKHLMNYEFNPSCLAERRIFLAHYQTITYSQT
|
||||
SCGENSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATNSY
|
||||
VPFITVFLNKFLDNKSKGFLLDEIDIDDSDDIDDSDNLDASDDIDRDLDT
|
||||
ELELLTRMNGLTVDMMPEIDRFYITLQFELAKAMSPCIIWIPNIHDLDVN
|
||||
ESNDLSLGLLVNHLSRDCERCSTRNILVIASTHIPQKVDPALIAPNKLNT
|
||||
CIKIRRLLIPQQRKHFFTLSYTRGFHLEKKMFHTNGFGSITMGSNARDLV
|
||||
ALTNEVLSISITQKKSIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQ
|
||||
IGRAVAQNVLLSNCPIDPISIYMKKKSCNEGDSYLYKWYFELGTSMKRLT
|
||||
ILLYLLSCSAGSVAQDLWSLSVPDEKNGITSYGLVENDSDLVHGLLEVEG
|
||||
ALVGSSRTEKDCSQFDNDRVTLLLRPEPRNPLDMMQKGSWSILDQRFLYE
|
||||
KYESEFEEGEGEGALDPQEDLFNHIVWAPRIWRPWGFLFDCIERPNELGF
|
||||
PYWSRSFRGKRIIYDEEDELQENDSGFLQSGTMQYQTRDRSQGLFRISQF
|
||||
IWDPADPLFFLFKDQPPGSVFSHRELFADEEMSKGLLTSQTDPPTSLYKR
|
||||
WFIKNTQEKHFELLINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLFLS
|
||||
NGTLLDQMPKTLLRKRWLFPDEMKIGFM
|
||||
>NC_000932@ArthCp066@ycf2@86474@93358@D@1@2295 Ycf2
|
||||
MKGHQFKSWIFELREIVREIKNAHYFLDSWTQFNSVGSFIHIFFHQERFR
|
||||
KLLDPRIFSILLLRNSQGSTSNRYFTIKGVVLFVVAALLYRINNRNMVES
|
||||
KNLYLKGLLPIPMNSIGPRNDTSEESFGSCNINRLIVSLLYLTKGKKISE
|
||||
SCFRDPKESTWVLPITQKCIMPESNWSSRWWRNWIGKKRGFCCKISNETV
|
||||
AGIDISFKEKDIKYLEFLFVYYMDDPIRKGHDWELFDRLSPSKRRNIINL
|
||||
NSGQLFEILVKDWICYLMFAFREKIPIEVEGFCKQQGAGSTIQSNDIEHV
|
||||
SHLFSRNKWAISLQNCAQFHMWQFHQDLFVSWGKNPHESDFFRKISRENW
|
||||
IWLDNVWLVNKDRFFSKVRNVSSNIQYDSTRSSFVQVTDSSQLNGSSDQF
|
||||
IDPFDSISNEDSEYHYHTLINQREIQQLKERSILLDPSFIQTEGREIESD
|
||||
RFPKYLSGYSSMPRLFTEREKRMNNHLLPEESEEFLGNPTRAIRSFFSDR
|
||||
WSELHLGSNPTERSTRDQKLLKKEQDVSFVPSRRSENKEIVNIFKIITYL
|
||||
QNTVSIHPISSDLGCDMVPKDELDMDSSNKISFLNKNPFFDLFHLFHERK
|
||||
RGGYTLRHESEERFQEMADLFTLSITEPDLVYHKGFAFSIDSYGLDQRQF
|
||||
LKEVFNFRDESKKKSLLVLPPIFYEENESFYRRLRKIWVRISCGNYLEDQ
|
||||
KRVVFASNNIMEAVNQYRLIRNMIQIQFQYSPYGYIRNVLNRFFLMKRPD
|
||||
RNFEYGIQRDLIGNDTLNHRTIMKDTINQHLSNLKKSQKKWFDPLIFLSQ
|
||||
TERSINRDPNAYRYKWSNGSKNFQEHLEHFVSERKSRFQVVFDQLCINQY
|
||||
SIDWSEVIDKKDLSKSLRFFLSKLLRFFLSKLLLFLSKLLLFLSNSLPFF
|
||||
FVSFENIPIHRSEIHIYELKGPNDQLCNQLLESIGLQIVHLKKLKPFLLD
|
||||
DHNTSQKSKFLINGGTISPFLFNKIPKWMIDSFHTRKNRRKSFDNTDSAY
|
||||
FSIVSHDQDNWLNPVKPFQRSSLISSFSKANRLRFLNNPHHFCFYCNKRF
|
||||
PFYVEKARLNNSDFTFTYGQFLTILFIHNKTFSSCGGKKKHAFLERDTIS
|
||||
PSSIESQVSNIFISNDFPQSGDERYNLYKSFHFPIRSDPLVRRAIYSIAD
|
||||
ISGTPLIEGQRVNFERTYCQTLSDMNLSDSEEKSLHQYLNFNSNMGLIHT
|
||||
PCSEKYLQRKKRSLCLKKCVDKGQMDRTFQRDSAFSTLSKWNLFQTYMPW
|
||||
FFTSTGYKYLNLIFLDTFSDLLRILSSSQKFVSIFHDIMHGLDISWRILQ
|
||||
KKLCLPQRNLISEISSKSLHNLLLSEEMIHRNNESSLISTHLRSPNVREV
|
||||
LYSILFLLLVAGYIVRTHLLFVSRAYSELQTEFEKIKSLMIPSYMIELRK
|
||||
LLDRYPTSELNSFWLKNLFLVALEQLGDCLEEIRGSGGNMLWGGDPAYGV
|
||||
KSIRSKKKDLKINFIDIIDLISIIPNPINRITFSRNTRHLSHTSKEIYSL
|
||||
IRKRKNVSGDWIDDKIESWVANSDSIDDKEREFLVQFSTLRAEKRIDQIL
|
||||
LSLTHSDHLSKNDSGYQMIEQPGTIYLRYLVDIHKKYLMNYEFNTSCLAE
|
||||
RRIFLAHYQTITYSQTSCGANSFHFPSHGKPFSLRLALSPSRSILVIGSI
|
||||
GTGRSYLVKYLATNSYVPFITVFLNKFLDNKPKGFFIDDIDIDDSDDIDA
|
||||
SNDIDRELDTELELLTMMNALTMDMMLEIDRFYITLQFELAKAMSPCIIW
|
||||
IPNIHDLDVNESSYLALGLLVNSLSRDCERCSTRNILVIASTHIPQKVDP
|
||||
ALIAPNKLNTCIKIRRLLIPQQRKHFFTLSYTRGFHLEKKMFHTNGFESI
|
||||
TMGSSARDLVALTNEALSISITQKKSIIDTNTIRSALHRQTWDLRSQVRS
|
||||
VQDHGILFYQIGRAVAQNVLISNCPIDPISIYMKKKSCNEGDSYLYKWYF
|
||||
ELGTSMKKFTILLYLLSCSAGSVAQDLWSLPVPDEKNRITSYGFVENDSD
|
||||
LVHGLLEVQGALVGSSRTEKDCSQFDNDRVTLLFRSEPRDPLYMMQDGSC
|
||||
SIVDQRFLYEKYESEFEEGEGEGVLDPQQIEEDLFNHIVWAPRIWRPRGF
|
||||
LFDCIERPNELGFPYSAGSFRGKRIIYDEKYELQENDSEFLQSGTMQYQR
|
||||
RDRSSKEQGFFRISQFIWDPADPLFFLFKDQPFVSVFSHREFFADEEMSK
|
||||
GLLTSQTDPPTSIYKRWFIKNTQEKHFELLIQRQRWLRTNSSLSNGFFRS
|
||||
NTRSESYQYLSNLFISNGTLLDRMTKTLLKKRWLFSDEMKIGFM
|
||||
>NC_000932@ArthCp083@ycf2@145291@152175@R@1@2295 Ycf2
|
||||
MKGHQFKSWIFELREIVREIKNAHYFLDSWTQFNSVGSFIHIFFHQERFR
|
||||
KLLDPRIFSILLLRNSQGSTSNRYFTIKGVVLFVVAALLYRINNRNMVES
|
||||
KNLYLKGLLPIPMNSIGPRNDTSEESFGSCNINRLIVSLLYLTKGKKISE
|
||||
SCFRDPKESTWVLPITQKCIMPESNWSSRWWRNWIGKKRGFCCKISNETV
|
||||
AGIDISFKEKDIKYLEFLFVYYMDDPIRKGHDWELFDRLSPSKRRNIINL
|
||||
NSGQLFEILVKDWICYLMFAFREKIPIEVEGFCKQQGAGSTIQSNDIEHV
|
||||
SHLFSRNKWAISLQNCAQFHMWQFHQDLFVSWGKNPHESDFFRKISRENW
|
||||
IWLDNVWLVNKDRFFSKVRNVSSNIQYDSTRSSFVQVTDSSQLNGSSDQF
|
||||
IDPFDSISNEDSEYHYHTLINQREIQQLKERSILLDPSFIQTEGREIESD
|
||||
RFPKYLSGYSSMPRLFTEREKRMNNHLLPEESEEFLGNPTRAIRSFFSDR
|
||||
WSELHLGSNPTERSTRDQKLLKKEQDVSFVPSRRSENKEIVNIFKIITYL
|
||||
QNTVSIHPISSDLGCDMVPKDELDMDSSNKISFLNKNPFFDLFHLFHERK
|
||||
RGGYTLRHESEERFQEMADLFTLSITEPDLVYHKGFAFSIDSYGLDQRQF
|
||||
LKEVFNFRDESKKKSLLVLPPIFYEENESFYRRLRKIWVRISCGNYLEDQ
|
||||
KRVVFASNNIMEAVNQYRLIRNMIQIQFQYSPYGYIRNVLNRFFLMKRPD
|
||||
RNFEYGIQRDLIGNDTLNHRTIMKDTINQHLSNLKKSQKKWFDPLIFLSQ
|
||||
TERSINRDPNAYRYKWSNGSKNFQEHLEHFVSERKSRFQVVFDQLCINQY
|
||||
SIDWSEVIDKKDLSKSLRFFLSKLLRFFLSKLLLFLSKLLLFLSNSLPFF
|
||||
FVSFENIPIHRSEIHIYELKGPNDQLCNQLLESIGLQIVHLKKLKPFLLD
|
||||
DHNTSQKSKFLINGGTISPFLFNKIPKWMIDSFHTRKNRRKSFDNTDSAY
|
||||
FSIVSHDQDNWLNPVKPFQRSSLISSFSKANRLRFLNNPHHFCFYCNKRF
|
||||
PFYVEKARLNNSDFTFTYGQFLTILFIHNKTFSSCGGKKKHAFLERDTIS
|
||||
PSSIESQVSNIFISNDFPQSGDERYNLYKSFHFPIRSDPLVRRAIYSIAD
|
||||
ISGTPLIEGQRVNFERTYCQTLSDMNLSDSEEKSLHQYLNFNSNMGLIHT
|
||||
PCSEKYLQRKKRSLCLKKCVDKGQMDRTFQRDSAFSTLSKWNLFQTYMPW
|
||||
FFTSTGYKYLNLIFLDTFSDLLRILSSSQKFVSIFHDIMHGLDISWRILQ
|
||||
KKLCLPQRNLISEISSKSLHNLLLSEEMIHRNNESSLISTHLRSPNVREV
|
||||
LYSILFLLLVAGYIVRTHLLFVSRAYSELQTEFEKIKSLMIPSYMIELRK
|
||||
LLDRYPTSELNSFWLKNLFLVALEQLGDCLEEIRGSGGNMLWGGDPAYGV
|
||||
KSIRSKKKDLKINFIDIIDLISIIPNPINRITFSRNTRHLSHTSKEIYSL
|
||||
IRKRKNVSGDWIDDKIESWVANSDSIDDKEREFLVQFSTLRAEKRIDQIL
|
||||
LSLTHSDHLSKNDSGYQMIEQPGTIYLRYLVDIHKKYLMNYEFNTSCLAE
|
||||
RRIFLAHYQTITYSQTSCGANSFHFPSHGKPFSLRLALSPSRSILVIGSI
|
||||
GTGRSYLVKYLATNSYVPFITVFLNKFLDNKPKGFFIDDIDIDDSDDIDA
|
||||
SNDIDRELDTELELLTMMNALTMDMMLEIDRFYITLQFELAKAMSPCIIW
|
||||
IPNIHDLDVNESSYLALGLLVNSLSRDCERCSTRNILVIASTHIPQKVDP
|
||||
ALIAPNKLNTCIKIRRLLIPQQRKHFFTLSYTRGFHLEKKMFHTNGFESI
|
||||
TMGSSARDLVALTNEALSISITQKKSIIDTNTIRSALHRQTWDLRSQVRS
|
||||
VQDHGILFYQIGRAVAQNVLISNCPIDPISIYMKKKSCNEGDSYLYKWYF
|
||||
ELGTSMKKFTILLYLLSCSAGSVAQDLWSLPVPDEKNRITSYGFVENDSD
|
||||
LVHGLLEVQGALVGSSRTEKDCSQFDNDRVTLLFRSEPRDPLYMMQDGSC
|
||||
SIVDQRFLYEKYESEFEEGEGEGVLDPQQIEEDLFNHIVWAPRIWRPRGF
|
||||
LFDCIERPNELGFPYSAGSFRGKRIIYDEKYELQENDSEFLQSGTMQYQR
|
||||
RDRSSKEQGFFRISQFIWDPADPLFFLFKDQPFVSVFSHREFFADEEMSK
|
||||
GLLTSQTDPPTSIYKRWFIKNTQEKHFELLIQRQRWLRTNSSLSNGFFRS
|
||||
NTRSESYQYLSNLFISNGTLLDRMTKTLLKKRWLFSDEMKIGFM
|
||||
>NC_001568@EpviCp27@ycf2@22045@28695@D@1@2217 Ycf2
|
||||
MKEHPFPYKSWILELREIKNSHYFLDSWTKFNSVGSYINIFSHQERFIKL
|
||||
FDPRILSILLSRNSQGSTSNRYFTIKGVILFVVAVLIYRINNRNMVEIKN
|
||||
IYWRGLLPIPMNSIGPRNDTLEELVGSYNINRFIVSLLYLTKGKNISESF
|
||||
FLNLKESTLVLPITKKCSMPESNWGSRWWRNWTGKNRDYSCKISNETVAG
|
||||
IEILFKEKDKKYLEFIFFYYMDDPIRKDRDWELFDRLSPSKRLNKINFYS
|
||||
GPLFEILVKRRIYYLMSAFREKIPIEVVKGFFKQQKVGSTIQSNDIEHVS
|
||||
HFFSRNKRAISLKNSAQFNMWQFRQDLLVSWGENPHESDFLRNVSRANWI
|
||||
WLNNVWLVNKYRFCRKVRNVSSNIKYKYDSTRSRSSFVQVTDSSQLKGSY
|
||||
YKSSGHFYSVISNEDSEYHTLINQREIKPLKSIFFDPSFLQTEATEIESD
|
||||
QLQKRPSGYSSTLFTEHEKQMINHMLPEEIEEFIGNPTRLVHSFLSDRWS
|
||||
ELHLGSNPTERSTRDHKLLKKQQDLSFVPSRRSENKELVNILKIITYLKN
|
||||
TVSIHPISSDPGCDGVLKDEPDMDSSNKISVFNKNTFIYLFHLFHDWNRV
|
||||
GYTLNLHHDFELEERFQEKADLFTLSITEPDLVYHKGFSFSIYMDQKQKM
|
||||
VVFASNNIMEAVNQSRFIRNMIKIQYSTYGYIRNVLHRFFLMNRSDHNLE
|
||||
YEIKRDQIGKDTLNHRTIIKYMINQHLSNFKKSQNKWFNPILFFSRTERS
|
||||
VNRNPDAYRYKRSNGSNNFLEHLEHFVSEQKSHFKFKIVFDLIRFNQYSI
|
||||
DWSAFIDTKDLSKPLRFFLSKLLFFLSNSLPFFCVSFGNIPIHRSEIYIY
|
||||
ELKDPNDQLCNQFLEPIDLKIVHLKKRKPFLLGYHGTSRKLKLLITGGRP
|
||||
FLFNKIPRCMIDSFHTINNRSKSFDNTDSYLSMIFHNKDNWLNLVKPFHR
|
||||
SSLISYFYKANRLQFLNNPHNFCFYCNTRLPFYVEKAHIHNYYFTYGQFL
|
||||
NILFIRNKIFSLCVDKKKHAFWGGRDTISPIESQVSKIFIPKNFPQSGDE
|
||||
TYNLSQPFHFPSRYDPFVRLIANIYGTPLTEGQIVNLGRTYCQPLSDMNL
|
||||
SDSEGKNFHQYLNFNSNMGLIHTPCSDKYLPSEKRKKRSLCINKYKCVEK
|
||||
GQMYRTFQRKVAFSTLSKWNLFQTYMPWFLTSAGYKYINLIFLDTFSELL
|
||||
SILSSSKKFVSIFNNIMHGSGISWRIINKKRCLPQWNLISEISSKCLHNL
|
||||
LLSEETIRQNNESPLISTHLRSPNVREFLYSILFLLLVVGYLVRTHLLFV
|
||||
SRASSELQTEFKRVKSLMIPSSMIELRKLLNRYPTPASNSFWLKNLFIVA
|
||||
MEQLVYSLEEIRASGGNLLGPAYGVKSICSKNKYFNINLIDLIPNPINRI
|
||||
IFSRNMRHLSHTSKEIYSLIRKRKNVNGDWIDDIIESWVANSDSIDDEER
|
||||
EFLVQFSALTTEKRIYQILLSLTHSDHLSKNDSGYKMIEQPGAIYLRYLV
|
||||
DIHKKYLLNYECNTSCLVERRVFLAHSQTITYSQTSRGTNTLHFPSQGKP
|
||||
FSISLALSPSKGILVIGSIGTGRSFLVKYLATNSYVPFITVFLNKFLDNK
|
||||
PKGFLVDDNDDNDSSDDIYASDDINSDLDTELELITMMNALTMDMMLELD
|
||||
RFFTTLQLELAKAMSPWIIWIPNIHDLDVNESNYLSFGLLVNHLSERCST
|
||||
NNIIVIASTHIPKKVDPALLAPNKLNTCIKIRRLLIPQQRKHFCTLSYTR
|
||||
GFHLENKIFHTNGFGSITMGSSARDLVALTNEALSISITQNKSILDTNTI
|
||||
RSALHRQTWDLRSGVRSFQDNGILSYQIGRAITQNVLLSNCPIDPISIYM
|
||||
KKKSCTCNGGDYYFYKWYFGLGTSMKKLTILLYLLSCSAGSVAQDLWSLP
|
||||
GPAEKNGITSYGLVENDSDLVRGLLEVEGALVGSSRTEKDCSPFDNDRVI
|
||||
FTLILRPEPGNPLDIIKKGSCSIFDHRFIYEKYESEFEEGYGEGALDPQQ
|
||||
IEEDLFNHIVWAPRIWRPWGFIFYCIERPNELGFPYWSRSFRGKRIVYDK
|
||||
DEEGELQENDSELLKSGTVQYQTRDRSSKEQGLLKINQFIWDPADPLFFL
|
||||
LKDQPPGSVFSHRRFFADEEMSKGLLTSQKDPPTSIYKRWFIKNTQEQHF
|
||||
ELLINRQRWLRTKSSLSKSNGSFRSNTLFESYQYLSTLFLSNGTLFDKMT
|
||||
KTLLIKRWLFPDEMQM
|
||||
>NC_001568@EpviCp32@ycf2@61133@67783@R@1@2217 Ycf2
|
||||
MKEHPFPYKSWILELREIKNSHYFLDSWTKFNSVGSYINIFSHQERFIKL
|
||||
FDPRILSILLSRNSQGSTSNRYFTIKGVILFVVAVLIYRINNRNMVEIKN
|
||||
IYWRGLLPIPMNSIGPRNDTLEELVGSYNINRFIVSLLYLTKGKNISESF
|
||||
FLNLKESTLVLPITKKCSMPESNWGSRWWRNWTGKNRDYSCKISNETVAG
|
||||
IEILFKEKDKKYLEFIFFYYMDDPIRKDRDWELFDRLSPSKRLNKINFYS
|
||||
GPLFEILVKRRIYYLMSAFREKIPIEVVKGFFKQQKVGSTIQSNDIEHVS
|
||||
HFFSRNKRAISLKNSAQFNMWQFRQDLLVSWGENPHESDFLRNVSRANWI
|
||||
WLNNVWLVNKYRFCRKVRNVSSNIKYKYDSTRSRSSFVQVTDSSQLKGSY
|
||||
YKSSGHFYSVISNEDSEYHTLINQREIKPLKSIFFDPSFLQTEATEIESD
|
||||
QLQKRPSGYSSTLFTEHEKQMINHMLPEEIEEFIGNPTRLVHSFLSDRWS
|
||||
ELHLGSNPTERSTRDHKLLKKQQDLSFVPSRRSENKELVNILKIITYLKN
|
||||
TVSIHPISSDPGCDGVLKDEPDMDSSNKISVFNKNTFIYLFHLFHDWNRV
|
||||
GYTLNLHHDFELEERFQEKADLFTLSITEPDLVYHKGFSFSIYMDQKQKM
|
||||
VVFASNNIMEAVNQSRFIRNMIKIQYSTYGYIRNVLHRFFLMNRSDHNLE
|
||||
YEIKRDQIGKDTLNHRTIIKYMINQHLSNFKKSQNKWFNPILFFSRTERS
|
||||
VNRNPDAYRYKRSNGSNNFLEHLEHFVSEQKSHFKFKIVFDLIRFNQYSI
|
||||
DWSAFIDTKDLSKPLRFFLSKLLFFLSNSLPFFCVSFGNIPIHRSEIYIY
|
||||
ELKDPNDQLCNQFLEPIDLKIVHLKKRKPFLLGYHGTSRKLKLLITGGRP
|
||||
FLFNKIPRCMIDSFHTINNRSKSFDNTDSYLSMIFHNKDNWLNLVKPFHR
|
||||
SSLISYFYKANRLQFLNNPHNFCFYCNTRLPFYVEKAHIHNYYFTYGQFL
|
||||
NILFIRNKIFSLCVDKKKHAFWGGRDTISPIESQVSKIFIPKNFPQSGDE
|
||||
TYNLSQPFHFPSRYDPFVRLIANIYGTPLTEGQIVNLGRTYCQPLSDMNL
|
||||
SDSEGKNFHQYLNFNSNMGLIHTPCSDKYLPSEKRKKRSLCINKYKCVEK
|
||||
GQMYRTFQRKVAFSTLSKWNLFQTYMPWFLTSAGYKYINLIFLDTFSELL
|
||||
SILSSSKKFVSIFNNIMHGSGISWRIINKKRCLPQWNLISEISSKCLHNL
|
||||
LLSEETIRQNNESPLISTHLRSPNVREFLYSILFLLLVVGYLVRTHLLFV
|
||||
SRASSELQTEFKRVKSLMIPSSMIELRKLLNRYPTPASNSFWLKNLFIVA
|
||||
MEQLVYSLEEIRASGGNLLGPAYGVKSICSKNKYFNINLIDLIPNPINRI
|
||||
IFSRNMRHLSHTSKEIYSLIRKRKNVNGDWIDDIIESWVANSDSIDDEER
|
||||
EFLVQFSALTTEKRIYQILLSLTHSDHLSKNDSGYKMIEQPGAIYLRYLV
|
||||
DIHKKYLLNYECNTSCLVERRVFLAHSQTITYSQTSRGTNTLHFPSQGKP
|
||||
FSISLALSPSKGILVIGSIGTGRSFLVKYLATNSYVPFITVFLNKFLDNK
|
||||
PKGFLVDDNDDNDSSDDIYASDDINSDLDTELELITMMNALTMDMMLELD
|
||||
RFFTTLQLELAKAMSPWIIWIPNIHDLDVNESNYLSFGLLVNHLSERCST
|
||||
NNIIVIASTHIPKKVDPALLAPNKLNTCIKIRRLLIPQQRKHFCTLSYTR
|
||||
GFHLENKIFHTNGFGSITMGSSARDLVALTNEALSISITQNKSILDTNTI
|
||||
RSALHRQTWDLRSGVRSFQDNGILSYQIGRAITQNVLLSNCPIDPISIYM
|
||||
KKKSCTCNGGDYYFYKWYFGLGTSMKKLTILLYLLSCSAGSVAQDLWSLP
|
||||
GPAEKNGITSYGLVENDSDLVRGLLEVEGALVGSSRTEKDCSPFDNDRVI
|
||||
FTLILRPEPGNPLDIIKKGSCSIFDHRFIYEKYESEFEEGYGEGALDPQQ
|
||||
IEEDLFNHIVWAPRIWRPWGFIFYCIERPNELGFPYWSRSFRGKRIVYDK
|
||||
DEEGELQENDSELLKSGTVQYQTRDRSSKEQGLLKINQFIWDPADPLFFL
|
||||
LKDQPPGSVFSHRRFFADEEMSKGLLTSQKDPPTSIYKRWFIKNTQEQHF
|
||||
ELLINRQRWLRTKSSLSKSNGSFRSNTLFESYQYLSTLFLSNGTLFDKMT
|
||||
KTLLIKRWLFPDEMQM
|
||||
>NC_001879@NitaCp068@ycf2@88885@95727@D@1@2281 Ycf2
|
||||
MRGHQFKSWIFELREILREIKNSHHFLDSWTQFNSAGSFIHIFFHQERFL
|
||||
KLFDPRIWSILLSRNSQGSTSNRYFTIKGVILFVVAVLIYRINNRNMVER
|
||||
KNLYLIGLLPIPMNSIGPRNDTLEESVGSSNINRLIVSLLYLPKGKKISE
|
||||
SCFLNPKESTWVLPITKKCSMPESNWGSRWWRNWIGKKRDSSCKISNETV
|
||||
AGIEILFKEKDLKYLEFLFVYYMDDPIRKDHDWELFDRLSLRKSRNRINL
|
||||
NSGPLFEILVKHWISYLMSAFREKIPIEVEGFFKQQGAGSTIQSNDIEHV
|
||||
SHLFSRNKWAISLQNCAQFHMWQFRQDLFVSWGKNPPESDFLRNVSRENW
|
||||
IWLDNVWLVNKDRFFSKVQNVSSNIQYDSTRSSFVQVTDSSQLKGSSDQS
|
||||
RDHLDSISNEDSEYHTLINQREIQQRKERSILWDPSFLQTERKEIESGRF
|
||||
PKCLSGYSSMSRLFTEREKQMINHLFPEEIEEFLGNPTRSVRSFFSDRWS
|
||||
ELHLGSNPTERSTRDQKLLKKQQDLSFVPSKRSENKEMVNIFKIITYLQN
|
||||
TVSIHPISSDPGCDMVPKDEPDMDSSNKISFLNKNPFFDLFHLFHDRNRG
|
||||
GYTLHYDFESEERFQEMADLFTLSITEPDLVYHKGFAFSIDSCGLDQKQF
|
||||
LNEARDESKKKSLLVLPPIFYEENESFSRRIRKKWVRISCGNDLEDPKPK
|
||||
IVVFASNNIMEAVTQYRLIRNLIQIQYSTYGYIRNVLNRFFLMNRSDRNF
|
||||
EYGIQRDQIGKDTLNHRTIMKYTINQYLSNLKKSQKKWFEPLILISRTER
|
||||
SMNRDPDAYRYKWSNGSKNFQEHLEQSVSEQKSRFQVVFDRLRINQYSID
|
||||
WSEVIDKKDLSKPLRFFLSKSLLFLSKLLFFLSNSLPFFCVSFGNIPIHR
|
||||
SEIYIYELKGPNDQLCNQLLESIGLQIVHLKKWKPFLLDDHDTSQKSKFL
|
||||
INGGTISPFLFNKIPKWMIDSFHTRNNRRKSFDNPDSYFSMIFHDQDNWL
|
||||
NPVKPFHRSSLISSFYKANRLRFLNNPHHFCFYWNTRFPFSVEKARINNS
|
||||
DFTYGQFLNILFIRNKIFSLCVGKKKHAFWGRDTISPIESQVSNIFIPND
|
||||
FPQSGDETYNLYKSFHFPSRSDPFVRRAIYSIADISGTPLTEGQIVNFER
|
||||
TYCQPLSDMNLSDSEGKNLHQYLNFNSNMGLIHTPCSEKDLSSEKRKKRS
|
||||
LCLKKCVEKGQMYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNLI
|
||||
FLDTFSDLLPILSSSQKFVPIFHDIMHGSGISWRILQKKLCLPQWNLISE
|
||||
ISSKCLHNLLLSEEMIHRNNESPLISTHLRSPNAREFLYSILFLLLVAGY
|
||||
LVRTHLLFVSRASSELQTEFEKVKSLMIPSSMIELRKLLDRYPTSEPNSF
|
||||
WLKNLFLVALEQLGDSLEEIRGSASGGNMLGPAYGVKSIRSKKKDWNINL
|
||||
IEIIDLIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKNVNGDWIDDKIE
|
||||
SWVANSDSIDDEEREFLVQFSTLTTENRIDQILLSLTHSDRLSKNDSGYQ
|
||||
MIEQPGAIYLRYLVDIHKKHLMNYEFNPSCLAERRIFLAHYQTITYSQTS
|
||||
CGENSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATNSYV
|
||||
PFITVFLNKFLDNKPKGFLLDEIDIDDSDDIDDSDNLDASDDIDRDLDTE
|
||||
LKLLTRMNGLTMDMMPEIDRFYITLQFELAKAMSPCIIWIPNIHDLDVNE
|
||||
SNDLALGLLVNHLSRDCERCSTRNILVIASTHIPQKVDPALIAPNKLNTC
|
||||
IKIRRLLLPQQRKHFFTLSYTRGFHLEKKMFHTNGFGSITMGSNARDLVA
|
||||
LTNEVLSISITQKKSIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQI
|
||||
GRAVAQNVLLSNCPIDPISIYMKKKSCNEGDSYLYKWYFELGTSMKRLTI
|
||||
LLYLLSCSAGSVAQDLWSLSGPDEKNGITSYGLVENDSDLVHGLLEVEGA
|
||||
LVGSSRTEKDCSQFDNDRVTLLLRPEPRNPLDMMQNGSCSILDQRFLYEK
|
||||
YESEFEEGEGEGALDPQEDLFNHIVWAPRIWRPWGFLFDCIERPNELGFP
|
||||
YWSRSFRGKRIIYDEEDELQENDSEFLQSGTMQYQTRDRSSKEQGLFRIS
|
||||
QFIWDPADPLFFLFKDQPPGSVFSHRELFADEEMSKGLLTSQTDPPTSIY
|
||||
KRWFIKNTQEKHFELLINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLF
|
||||
LSNGTLLDQMTKTLLRKRWLFPDEMKIGFM
|
||||
>NC_001879@NitaCp102@ycf2@146903@153745@R@1@2281 Ycf2
|
||||
MRGHQFKSWIFELREILREIKNSHHFLDSWTQFNSAGSFIHIFFHQERFL
|
||||
KLFDPRIWSILLSRNSQGSTSNRYFTIKGVILFVVAVLIYRINNRNMVER
|
||||
KNLYLIGLLPIPMNSIGPRNDTLEESVGSSNINRLIVSLLYLPKGKKISE
|
||||
SCFLNPKESTWVLPITKKCSMPESNWGSRWWRNWIGKKRDSSCKISNETV
|
||||
AGIEILFKEKDLKYLEFLFVYYMDDPIRKDHDWELFDRLSLRKSRNRINL
|
||||
NSGPLFEILVKHWISYLMSAFREKIPIEVEGFFKQQGAGSTIQSNDIEHV
|
||||
SHLFSRNKWAISLQNCAQFHMWQFRQDLFVSWGKNPPESDFLRNVSRENW
|
||||
IWLDNVWLVNKDRFFSKVQNVSSNIQYDSTRSSFVQVTDSSQLKGSSDQS
|
||||
RDHLDSISNEDSEYHTLINQREIQQRKERSILWDPSFLQTERKEIESGRF
|
||||
PKCLSGYSSMSRLFTEREKQMINHLFPEEIEEFLGNPTRSVRSFFSDRWS
|
||||
ELHLGSNPTERSTRDQKLLKKQQDLSFVPSKRSENKEMVNIFKIITYLQN
|
||||
TVSIHPISSDPGCDMVPKDEPDMDSSNKISFLNKNPFFDLFHLFHDRNRG
|
||||
GYTLHYDFESEERFQEMADLFTLSITEPDLVYHKGFAFSIDSCGLDQKQF
|
||||
LNEARDESKKKSLLVLPPIFYEENESFSRRIRKKWVRISCGNDLEDPKPK
|
||||
IVVFASNNIMEAVTQYRLIRNLIQIQYSTYGYIRNVLNRFFLMNRSDRNF
|
||||
EYGIQRDQIGKDTLNHRTIMKYTINQYLSNLKKSQKKWFEPLILISRTER
|
||||
SMNRDPDAYRYKWSNGSKNFQEHLEQSVSEQKSRFQVVFDRLRINQYSID
|
||||
WSEVIDKKDLSKPLRFFLSKSLLFLSKLLFFLSNSLPFFCVSFGNIPIHR
|
||||
SEIYIYELKGPNDQLCNQLLESIGLQIVHLKKWKPFLLDDHDTSQKSKFL
|
||||
INGGTISPFLFNKIPKWMIDSFHTRNNRRKSFDNPDSYFSMIFHDQDNWL
|
||||
NPVKPFHRSSLISSFYKANRLRFLNNPHHFCFYWNTRFPFSVEKARINNS
|
||||
DFTYGQFLNILFIRNKIFSLCVGKKKHAFWGRDTISPIESQVSNIFIPND
|
||||
FPQSGDETYNLYKSFHFPSRSDPFVRRAIYSIADISGTPLTEGQIVNFER
|
||||
TYCQPLSDMNLSDSEGKNLHQYLNFNSNMGLIHTPCSEKDLSSEKRKKRS
|
||||
LCLKKCVEKGQMYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNLI
|
||||
FLDTFSDLLPILSSSQKFVPIFHDIMHGSGISWRILQKKLCLPQWNLISE
|
||||
ISSKCLHNLLLSEEMIHRNNESPLISTHLRSPNAREFLYSILFLLLVAGY
|
||||
LVRTHLLFVSRASSELQTEFEKVKSLMIPSSMIELRKLLDRYPTSEPNSF
|
||||
WLKNLFLVALEQLGDSLEEIRGSASGGNMLGPAYGVKSIRSKKKDWNINL
|
||||
IEIIDLIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKNVNGDWIDDKIE
|
||||
SWVANSDSIDDEEREFLVQFSTLTTENRIDQILLSLTHSDRLSKNDSGYQ
|
||||
MIEQPGAIYLRYLVDIHKKHLMNYEFNPSCLAERRIFLAHYQTITYSQTS
|
||||
CGENSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATNSYV
|
||||
PFITVFLNKFLDNKPKGFLLDEIDIDDSDDIDDSDNLDASDDIDRDLDTE
|
||||
LKLLTRMNGLTMDMMPEIDRFYITLQFELAKAMSPCIIWIPNIHDLDVNE
|
||||
SNDLALGLLVNHLSRDCERCSTRNILVIASTHIPQKVDPALIAPNKLNTC
|
||||
IKIRRLLLPQQRKHFFTLSYTRGFHLEKKMFHTNGFGSITMGSNARDLVA
|
||||
LTNEVLSISITQKKSIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQI
|
||||
GRAVAQNVLLSNCPIDPISIYMKKKSCNEGDSYLYKWYFELGTSMKRLTI
|
||||
LLYLLSCSAGSVAQDLWSLSGPDEKNGITSYGLVENDSDLVHGLLEVEGA
|
||||
LVGSSRTEKDCSQFDNDRVTLLLRPEPRNPLDMMQNGSCSILDQRFLYEK
|
||||
YESEFEEGEGEGALDPQEDLFNHIVWAPRIWRPWGFLFDCIERPNELGFP
|
||||
YWSRSFRGKRIIYDEEDELQENDSEFLQSGTMQYQTRDRSSKEQGLFRIS
|
||||
QFIWDPADPLFFLFKDQPPGSVFSHRELFADEEMSKGLLTSQTDPPTSIY
|
||||
KRWFIKNTQEKHFELLINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLF
|
||||
LSNGTLLDQMTKTLLRKRWLFPDEMKIGFM
|
||||
>NC_002202@SpolCp103@ycf2@142690@149085@R@1@2132 Ycf2
|
||||
MKGHQFKSWIFELREILREIKNSHYFLDSWTQFNSVGSFIHIFFYQERFL
|
||||
KLFDPRIWSILLSPNSQGSTSNRYFTIKGVVLFVVVVLIYRITNRNMVER
|
||||
KNLYLIGLFPIPMNSIGPRNDTLEKSFGSSNINRLIVSLLYLPKGKKISE
|
||||
SYFLDPKESTWFLPITKKCIMPESNRGSRWWRNWIGKRRDSSCKISNETV
|
||||
AGIEISFKEKDIQYLEFPFVYYMDDPIRKDHDWELFDCLSLFLRNVSREN
|
||||
WIWLDNVRLVNKDRFFSKVRNVSSNIQYDFTRSSFVQVTDSSQLKESSDQ
|
||||
SRDRSNSISNADSEYHTLINKREIQQLKERSILRDPSFLQTEGTEIESDR
|
||||
FPKCLSGYSSMPRLFTAREKQMIIHLLPEEIEQLLENPTRSIRSFFSGRW
|
||||
SELHLGSNPTERSTRDPQLLKKQQDVSFAPSRQSENKEMVNIFKIIKYLQ
|
||||
NTVSIHPISSDPGCDMVPKDELDMDSSDKISFLNKNSFFDLFHLFHDRNR
|
||||
GGYALHHDFESEEKFQEMADLFTLSITDPDLVYHRGFSFSIDSCGLDQKQ
|
||||
FLNEVFNSRDESKKKSLLVLSPIFYEENESFYRRIRKKGVRISRNVLNRF
|
||||
FLINRSDRSFEYGIQRDQIGNDTLNHRTIRKYMINQDFSNLKKSQKKWFD
|
||||
PLIFLSRTERFMNRDPDAYRYKWFNGSKNFQEHLEHFVSEQKSRFQVVFD
|
||||
QLRINQYSIDWSEVIDKKDLSKSLRFFLSKSLRFFLSKLLLFLSNSLPFF
|
||||
FVSFGNIPINRSEIRIYELKGPNDQLYNPLVESIGLQIVHLKKWKAFLLD
|
||||
DHDTFQKSKFLINGGTISPFLFNKIPKWMIDSFHTRNNSGKSFDNTDSYF
|
||||
SMISHDQNNWLNPVKPFHRSSLISSFYKANQLRFLNNPHHFCFYCNKRFP
|
||||
FYMEKARINNSDFTYRQFLNILFIHNKLFSLCVGKKKHAFLERDTISPIE
|
||||
SQVSNIFLPNDFPIRSDLLVRRTIYSIADISGTPLTEGQLVHFERTYCQP
|
||||
LSDMNLSDSEKKNLHQYLNFNSNMGFIYTPCSEKYLLSEKRKKRSLCLKK
|
||||
CVEKGQMYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNFLFLDTF
|
||||
SDLLPILSSSQKFLSILHDIMHGSGISWRILQKKLCLPPWNLISEISSKC
|
||||
LHNLLLPEEMIHRNNESPLIWTHLASPNVREFFYSILFLLFVAGYLVRTH
|
||||
LLFVFRASSELQTEFERVKSLMIPSYMIELRKLLDRYPTSEPNSFWLKNL
|
||||
FLVALEQLGDSLEEIRGSASGDNMLLGGGPGPAYGFKSIRSKKKYLNINL
|
||||
IDILDLISIIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKRVNGDWIDD
|
||||
KIESWVASSDSIDDEEREFLVQFSTLTTEKRIDQILLSLTHSDHLSKNDS
|
||||
GYQLIEQPGAIYLRYLVDIHKKYLMNYEFNTSCLAERRVFLAHYQTITYS
|
||||
QTSCGANSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATN
|
||||
SYVPFITVFLNKFLDNKPKGSLIDASDDIDRDLDTELELLTMMNALTMDM
|
||||
MPEIDQFSITLQFELAKAMSPCIIWIPNIHDLDVNESNYLSLGLFVNYLS
|
||||
RDCERGSTRNILVIASTHIPQKVDPALIAPNQLNTCIKIRRLRIPQQRKH
|
||||
FFTLSYTRGFHLEKKMFHTNGFGSITMGSNVRDLVAFINEALSISITQKK
|
||||
SIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQIGRAVAQNVLLSNCP
|
||||
IDPISTYMKKKSCNEGDSYLYKWYFELGTSMKKLTILLYLLSCSAGSVAQ
|
||||
DLWSLPGPDEKNGITSYGLVENDSYLVHGLLEVEGALVGSSRIEKACSQN
|
||||
DRVTLFLRPELRNPLDMMQNGSCSILDHRFLYEKYESELEEGEGALDPQQ
|
||||
IEEDLFNHIVWAPRIWNPWGFLFDCIERPNELGFPYWARSFRGKRSIYDK
|
||||
EDELQENDSEFLQSGTMQYQTRDRSSKEQGFFRISQFIWDPADPLFFLFK
|
||||
DQPFVSVFSHREFFADEEISKGLLTSQMNPPISIFQRWFIKNTQEKHFEL
|
||||
LINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLFLSNGTLLDQMTKTLL
|
||||
RKRWLFPDEMKIGFMQEEKDFPFLSRKDMWP
|
||||
>NC_002693@OeelhCp081@ycf2@92143@99165@D@1@2341 Ycf2
|
||||
MGNQRNRVNLNPFRFWVFELREILREIKNSRYPFNSVGSFIHIFVHQERF
|
||||
LKLLDPRIWSVLRSQGSTGVVLFLVAVLIYRINNRNMIERKNIYLTGLLP
|
||||
IPTNFAGPRNETLEESFLSSNINRLIVSLLHLPKGKRLSESCFLDPKEST
|
||||
RVLPITKWRNWIGKRRDSSQLKGSSDQSRDHFDSIGTEDSEYHTLINQRE
|
||||
IQQRKERSSLLDPSFLQTERTEIESDRFSKGLSGSSSKSRLFTEGEKEMN
|
||||
NHLPPEEIEEFLGNPTRSILSFFSDEWSELHLGSNPTERSTVDQKLLKKE
|
||||
QEVSFAPFRRSETKEIVNLFKTMAYLQKTVSIHPISSDPGCDMVPKDELD
|
||||
SEERFQEMADLFTLSITEPDLVYHKGFAFSIDSSVLDQKQFLAEARDESK
|
||||
KKSLLVLPPVFYQENESFYRRIRKRGVQISCGNDLEDPKPKIVVFASNNI
|
||||
VEAVNQYRWIRNLIQIQYSTHGYIRNVLNRFFLMNRSDRNFEYGIQRDQI
|
||||
GNDTLNHRTFMKYTINQHLSNLKKSQKKGSDPLILISRTERSVNRDPNAY
|
||||
RYKWSKGSKNFQEHLEHFVSEQKSRFQVVFDRYRSIRNRYRSIRNRYRSR
|
||||
INQYSSDRSEVSDKKDNRYRSRINQYSSDRSEVSDQKNLAKFRSFVFSKL
|
||||
LLFLSNSLPFFFVSFGNTPPIQRSEIRVSELKGPNDRLCNQFLESIGLQL
|
||||
VYLKKLKPFLLDDHETSQKSKLLFNKKPEGMIDSFHTRNNRGKSLDSYFS
|
||||
MISHDQDNWLNPVKPFHRSSLISSFYKANRLRFLNNPHDFGFFCNKRFPF
|
||||
YVDIKNLDFTYGQFLNILFIRNTKFSLCGDKKKHAFLERDTISSIESQVS
|
||||
NLFKDFPQSGDERYNFYKYFHLAMRSDPLVRRAIYSIADISGTPLTEGQR
|
||||
VNFERTYCQPLSDMNLSDSEGKNLYQYLNFNSNMGLIYSEKCFSSEKRKK
|
||||
KKPEKRKEKKPEKRKEKKPEKRKEKKPEKRKEKKPEKRKEKKPEKRKEKK
|
||||
PEKRKEKKQSLYLKQWVEKVQMDRALQGERVSLILSNWNLFKTYVMPFSL
|
||||
TSTGYNLLKLMFLDTLGSYVMPLLRSSPKFVSICYAISDPCGISWRILQK
|
||||
KLCLLQWNWISAISNKCFHKLLLSEESIHRNNESPSMTDLRWPNLGAFLY
|
||||
SILFLLFVAGHLVFSHLLFLSQDFSELQRDFARAQSLMIPSYIVELRELL
|
||||
DMYPAPRSFKKLFLAAREKLVNYLRWGGGRKSFLIHLFELLNITPNPIDR
|
||||
IAFLKNTRHLSHTSKELYSLITELGDFSSLCSGQRYRYDQIIENVNGPCC
|
||||
LIDDKIESWISNCDAIEDKEREFLVPFCNFTRETRIDQILLSLTHSDHLS
|
||||
NNDSASQMSEEPGAFYLRHLVDIHKKGLMNYECNTSCLAERRIFLAHYQT
|
||||
ITYSPCGDNRSHFPSHGKTFSLRLPLHPSRATLVIGSIGSGRSYLVKSLA
|
||||
TNSYVPLITVVLNKFLKNWTPQGFDIHESGVYDEYGDDAEEANDYGASFF
|
||||
DFLDNDSDDYEDRDSDDYDEPGASDDYEDRDMEDFVDSEMTEWLTKTNVP
|
||||
LVYQLLDDEIDEFYITLQFELAKAMSPCILWIPNIHDLDAKESDYLSLGL
|
||||
LVNHLSRDCGRRSTKNEILVIASTHIPQKVDPSLIGPDGLSTCIKTRRLL
|
||||
VPQQQQCLFTLSYTRGFHLENKMFHTHTNEFESTILGPSVPDLVALTNEA
|
||||
LSISITQKKSIIDTTTIRYALHRKTWDLEADRNLSPAKEHGTLFYQVGRA
|
||||
FAHTVLLRNCPIDPISIYIKKNLCEAGDSSLYKWYFELGTSMKKLTILLY
|
||||
LLTCSAGSIAQDLLSPPGPDEQNLITSYGLVENDSDLVHGLSDIVHGLLE
|
||||
LEGALVGSSPTEEEVEGTEEEVEGTEEEVEGTEEEVEGTEEEVEGTEEEV
|
||||
EGTEEEVEGTEDEEGEGTEEEVEGTEDEEGEGTEEEVEGTEDEEGEGTEE
|
||||
EVEGTEDEEGEGTEDEEGEGTEEEVEGTEEEVEGTEDEEGEGTEKDSSQF
|
||||
DNDRVTLLLRPKPRNPLDIQRLIYQHQKYESELEEDDDDDEDVFAPQKML
|
||||
EDLFSELVWSPRIWHPWDFILDCEAEIPAEEIPEEEDPLPEEALETEVAV
|
||||
WGEEEEGEADDEEDERLEAQQEDELLEEEDEELKEEEDELHEEEEEEEEE
|
||||
EEEEEEDELHEEEEEEEEEDELQENDSEFFRSETQQPQARDGFSEEEGCF
|
||||
RISQFMWVPGDPLSFLYKDTPFVEVLSYPEEATEISKELLRLLNPKTKRD
|
||||
APKRARQRWWTKKKQDKHYELVLDRQRWLITKSSLSKSNGFFRSNTPSES
|
||||
YQYLSNLFLSNRRLLDQITKTFFRKKWLFPDEMKIGFMEQ
|
@ -45,28 +45,27 @@ FT AAAQSISYEIPLALCVLSISLRVIR"
|
||||
FT gene 42910..45121
|
||||
FT /gene="ndhB"
|
||||
FT /locus_tag=""
|
||||
FT CDS join(42910..43780,44367..45121)
|
||||
FT CDS join(42910..43685,44365..45121)
|
||||
FT /codon_start=1
|
||||
FT /transl_table=11
|
||||
FT /gene="ndhB"
|
||||
FT /locus_tag=""
|
||||
FT /product="NADH dehydrogenase subunit 2"
|
||||
FT /inference="similar to DNA sequence:NC_008535:CoarCp067"
|
||||
FT /inference="similar to DNA sequence:AC_000188:LyesCp066"
|
||||
FT /translation="MIWHVQNENFILDSTRIFMKAFHLLLFDGSLIFPECILIFGLILL
|
||||
FT LMIDSTSDQKDIPWLYFISSTSLVMSITALLFRWREEPMISFSGNFQTNNFNEIFQFLI
|
||||
FT LLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLITIFVAPECFSLCS
|
||||
FT YLLSGYTKKDVRSNEATMKYLLMGGASSSILVHGFSWLYGSSGGEIELQEIVNGLINTQ
|
||||
FT MYNSPGISIALIFITVGIGFKLSPAPSHQWTPDVYEGVRFVREIPTSLSISEMFGFFKT
|
||||
FT PWTCRREMLSPTPVVAFLSVTSKVAASASATRIFNIPFYFSSNEWHLLLEILAILSMIL
|
||||
FT GNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYASMITYMLFYISMNLGTFAC
|
||||
FT IVLFGLRTGTDNIRDYAGLYTKDPFLALSLALCLLSLGGLPPLAGFFGKLYLFWCGWQA
|
||||
FT GLYFLVLIGLLTSVVSIYYYLKIIKLLMTGRNQEITPHVRNYRRSPLRSNNSIELSMIV
|
||||
FT CVIASTIPGISMNPIIAIAQDSLF"
|
||||
FT exon 42910..43780
|
||||
FT MYNSPGISIALIFITVGIGFKLSPAPSHQWTPDVYEGSPTPVVAFLSVTSKVAASASAT
|
||||
FT RIFNIPFYFSSNEWHLLLEILAILSMILGNLIAITQTSMKRMLAYSSIGQIGYVIIGII
|
||||
FT VGDSNDGYASMITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLA
|
||||
FT LCLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVLIGLLTSVVSIYYYLKIIKLLMTGR
|
||||
FT NQEITPHVRNYRRSPLRSNNSIELSMIVCVIASTIPGISMNPIIAIAQDSLF"
|
||||
FT exon 42910..43685
|
||||
FT /gene="ndhB"
|
||||
FT /locus_tag=""
|
||||
FT /number=1
|
||||
FT exon 44367..45121
|
||||
FT exon 44365..45121
|
||||
FT /gene="ndhB"
|
||||
FT /locus_tag=""
|
||||
FT /number=2
|
||||
@ -79,7 +78,7 @@ FT /transl_table=11
|
||||
FT /gene="ndhD"
|
||||
FT /locus_tag=""
|
||||
FT /product="NADH dehydrogenase subunit 4"
|
||||
FT /inference="similar to DNA sequence:NC_007898:LyesC2p017"
|
||||
FT /inference="similar to DNA sequence:AC_000188:LyesCp081"
|
||||
FT /translation="MNYFPWLTIIVVFPIFAGSLIFFLPHKGNRVIRWYTICICILELL
|
||||
FT LTTYAFCYHFQSDDPLIQLVEDYKWIDFFDFHWRLGIDGLSIGPILLTGFITTLATLAA
|
||||
FT WPVTRDSRLFHFLMLAMYSGQIGLFSSRDLLLFFIMWELELIPVYLLLAMWGGKKRLYS
|
||||
@ -98,7 +97,7 @@ FT /transl_table=11
|
||||
FT /gene="ndhE"
|
||||
FT /locus_tag=""
|
||||
FT /product="NADH dehydrogenase subunit 4L"
|
||||
FT /inference="similar to DNA sequence:NC_001879:NitaCp085"
|
||||
FT /inference="similar to DNA sequence:AC_000188:LyesCp080"
|
||||
FT /translation="MILEHVLVLSAYLFSIGIYGLITSRNMVRALMCLELILNAVNINF
|
||||
FT VTFSDFFDNRQLKGDIFSIFVIAIAAAEAAIGLAIVSSIYRNRKSTRINQSNLLNN"
|
||||
FT gene complement(11509..13722)
|
||||
@ -178,7 +177,7 @@ FT /transl_table=11
|
||||
FT /gene="psaC"
|
||||
FT /locus_tag=""
|
||||
FT /product="photosystem I subunit VII"
|
||||
FT /inference="similar to DNA sequence:NC_023792:CP89_p014"
|
||||
FT /inference="similar to DNA sequence:AC_000188:LyesCp065"
|
||||
FT /translation="MSHSVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKAKQIASAPRT
|
||||
FT EDCVGCKRCESACPTDFLSVRVYLWHETTRSMGLAY"
|
||||
FT gene 53817..55307
|
||||
@ -190,7 +189,7 @@ FT /transl_table=11
|
||||
FT /gene="rpl2"
|
||||
FT /locus_tag=""
|
||||
FT /product="ribosomal protein L2"
|
||||
FT /inference="similar to DNA sequence:NC_007898:LyesC2p002"
|
||||
FT /inference="similar to DNA sequence:AC_000188:LyesCp030"
|
||||
FT /translation="MAIHLYKTSTPSTRNGTVDSQVKSNPRNNLIYGQRRCGKGRNARG
|
||||
FT IITARHRGGGHKRLYRKIDFRRNEKDIYGRIVTIEYDPNRNAYICLIHYGDGEKRYILH
|
||||
FT PRGAIIGDTIVSGTEVPIKMGNALPSTDMPLGTAIHNIEITLGKGGQLARAAGAVAKLI
|
||||
@ -213,7 +212,7 @@ FT /transl_table=11
|
||||
FT /gene="rpl23"
|
||||
FT /locus_tag=""
|
||||
FT /product="ribosomal protein L23"
|
||||
FT /inference="similar to DNA sequence:NC_007898:LyesC2p003"
|
||||
FT /inference="similar to DNA sequence:AC_000188:LyesCp026"
|
||||
FT /translation="MDGIKYAVFTDKSIRLLGKNQYTSNVESGSTRTEIKHWVELFFGV
|
||||
FT KVIAMNSHRLPGKSRRMGPIMGHTMHYRRMIITLQPGYSIPPLRKKRT"
|
||||
FT gene 14505..14672
|
||||
@ -249,7 +248,7 @@ FT /transl_table=11
|
||||
FT /gene="rps7"
|
||||
FT /locus_tag=""
|
||||
FT /product="ribosomal protein S7"
|
||||
FT /inference="similar to DNA sequence:NC_007898:LyesC2p007"
|
||||
FT /inference="similar to DNA sequence:AC_000188:LyesCp008"
|
||||
FT /translation="MSRRGTAEKKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYR
|
||||
FT AVKKIQQKTETNPLSVLRQAIRGVTPDITVKARRVGGSTHQVPIEIGSTQGKALAIRWL
|
||||
FT LAASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRAFAHFR"
|
||||
|
Reference in New Issue
Block a user