Files
annotate/data/cds/chlorodb/core/psbb.fst
alain viari 8dab2d56b2 CDS detector added
Former-commit-id: 93fac7a70052d06c2a12bf8af59820c653edd31b
Former-commit-id: 0869fdad0f550941a0f78f1e4c57f4fcdb3f6076
2015-11-08 14:28:05 +01:00

5829 lines
284 KiB
Plaintext

>AC_000188@LyesCp048@psbb@74341@75867@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_000925@PopuCp137@psbb@111415@112944@D@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSNPGLWSLEGVALTH
IVLSGMLFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLSSLLC
FGFGAFHVTGLFGPGMWVSDGYGVTGKVLPVAPAWGPEGFNPFNPGGVAS
HHIAAGTVGILAGVFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFSAF
ITCGTMWYGSATTPIELFGPTRYQWDSGYFQQEIEKRVENAIADGAAPSE
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGVAEAWLGHPVFQDKE
GRELSVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTAS
FYGGKLNGQVFNDAPSVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
FTFGHANFALIFFFGHLWHGSRTIFRDVFAGIGAEVTEQVEFGAFQKLGD
RSSKKQGAV
>NC_000926@GuthCp140@psbb@114454@115983@D@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMYVMPFMARIGVTDSWGGWSITGESVSNPGFWSFEGVALAH
IGLSGLLFLAAVWHWVYWDLELFRDPRTGNPALDLPKIFGIHLVLAGLLC
FGFGAFHVTGAWGPGIWVSDAYGITGKVQPVAPTWGPEGFNPFNPSGVAS
HHIAAGILGFIAGIFHIAVRPPQRLYRALRMGNIETVLSSSIAAVFFAAF
ITTGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSLNEGLSLSE
AWSRIPDKLAFYDYVGNNPAKGGLFRAGPMNKGDGIAEAWLGHPVFQDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSVEQVGVTVS
FYGGKLNGQTYTDAPTVKKYARKAQLGEVLEFDRTTLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGSRTLFRDVFSGIGAEVTEQVEFGAFQKLGD
RSTKKQGAV
>NC_000927@NeolCp076@psbb@82794@84320@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYEISVFDPSDP
VLNPMWRQGMFVIPFMTRLGVTKSWGGWSITGESVSNPGIWSYEGVATAH
ILLSGALFMAAIWHWVFWDLELFRDPRTGEPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLYGPGIWVSDPYGITGSVQPVEPAWGPEGFDPFNPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKALRMGNVETVLSSSIAAVFWAAF
VVSGTMWYGSAATPIELFGPTRYQWDQGFFQQEIEKRVQGSLASGASLSD
AWAKIPEKLSFYDYIGNNPAKGGLFRAGAMNSGDGIAAGWLGHPVFTDKA
GNELFVRRMPTFFETFPVLLVDKDGVVRADVPFRRAESKYSIEQVGVSVT
FYGGELDGVTFNDPSTVKKYARRAQLGSVFEFDRATLQSDGVFRSSPRGW
FTFGHLWFALLFFFGHIWHGARTIFRDVFGGIDPDLDDQVEFGAFQKLGD
VTTRRQAV
>NC_000932@ArthCp049@psbb@72371@73897@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_001319@MapoCp055@psbb@69026@70552@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITKSWGGWSITGETVTNAGIWSYEGVAAVH
IVLSGLLFLAAIWHWVYWDLELFRDERTGKPSLDLPKIFGIHLFLSGVLC
FAFGAFHVTGLFGPGIWISDPYGLTGKVQPVAPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNVETVLSSSIAAVFFAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIDRRIRSSKAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFKDKE
GNELFVRRMPTFFETFPVVLVDEQGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVI
>NC_001320@OrsajCp053@psbb@68799@70325@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFADVFAGIDPDLDAQVEFGAIQKRGD
PTTGRQPV
>NC_001603@EugrCp058@psbb@97098@100368@R@5@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRFISVHLMHTALVSGWAGSMALYELAIFDPSDV
ALNPMWPQGMFVLPFMTRLGVTKSWGAWSVTGESFSDPGIWSYEGVAVAH
IILSGLLFLAAIWHWVYWDLDLFRDPASGELKLDLPRVFGVHLFLSGALC
LAFGVFHVTGVFGPGIWVSDPYGLSGKIEPVIPSWGAEGFDPYNVGAIAS
HHIAAGLLGLIAGGFHVLVRPSQRLFVLLRMGNIETVLSSSIAAVFWSAF
VVSGTMWYGSASTPIELFGPTRYQWDKGYFQEEIERRVQASLSDGCSLSE
AWGAISPKLAFYDYIGNNPAKGGLFRSGPMNNGDGIATAWLGHAVFIDKE
GNSLFVRRMPTFFETFPVILLDQNGVVRADIPFRRAESKYSIEQVGVTVR
FFGGSFDTLSFNDPATVKRYARHAQLGEIFDFNRSILQSDGVFRSSPRGW
FTFGHLSFALIFFFGHIWHGARTLFKYLLAGIDPHLEEEIEFGTFEKLGD
DTTKKELV
>NC_001631@PithCp083@psbb@52424@53950@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWNITGETVINPGIWSYEGVAVAH
IVFSGLCFLAAIWHWVYWDLDIFCDERTGKRCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGARTLFRDVFAGIDSDLDDRIEFGAFQKLGD
PTTKRQVV
>NC_001666@ZemaCp048@psbb@70706@72232@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAA
>NC_001675@CypaCp030@psbb@33290@34819@R@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYEIAVFDPSDP
VLNPMWRQGMFVLPFMVRLGITNSWGGWTINGENVTDPGFWSFEGVAAAH
IGLSGLLFLAAIWHWVYWDLELFRDPRTGEPALDLPKMFGIHLFLSGLLC
FGFGAFHLTGLFGPGMWVSDAYSITGRVQPVAPAWGPEGFNPFNPGGVVS
HHIAAGIVGILAGLFHLSVRPPQRLYKALRMGNIETVLSSSISAVFFAAF
IVAGTMWYGSAATPVELFGPTRYQWDQEYFHQEMERRVQKDVAAGASLSE
AWNRIPAKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAESWLGHATFKDKE
GRELTVRRMPTFFETFPVVLIDKDGVLRADIPFRRAESKYSIEQMGVTVS
FYGGKLDGQTFTDAPTVKKYARKAQLGEAFEFDRETLKSDGVFRSSARGW
FTFGHASFALIFFFGHLWHGGRTLFRDVFAGIGEEVTEQVEFGAFQKVGD
KTTRKQEAG
>NC_001713@OdsiCp084@psbb@76048@77577@D@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGITDSWGGWSITGESVSNPGIWSFEGVALSH
IILSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDAYGVTGKVQPVAPAWGADGFNPFNPGGIAA
HHIAAGIFGIFAGIFHLTVRPPQRLYRALRMGNIETVLSSSIAAVFFAAF
VTSGTMWYGAAATPIELFGPTRYQWDSGYFQQEIERQVETSVSEGLSESQ
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFRDKD
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVD
FYGGKLNGQTFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALLFFFGHLWHGGRTIFRDVFTGIGAEVTEQVEFGAFQKLGD
KSTKKQGAV
>NC_001840@CycaCp083@psbb@72055@73584@R@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSNPGLWSFEGVALTH
IVLSGLLFLASIWHWVYWDLDLFRDPRTLEPALDLPKVFGIHLVLSSLLC
FGFGAFHVTGLFGPGIWISDAYGLTGRIQSVAPAWGPEGFNPFNPGGIAS
HHIAAGTVGILAGVFHLNVRPPQRLYRALRMGNIETVLSSSIAAVFFASF
VVSGTMWYGAASTPIELFGPTRYQWDSGYFQQEIEKRVEESLSNGLSLPE
AWSNIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPVFQDKE
GHELIVRRMPAFFENFPIILVDKDGIIRADIPFRRAESKYSIEQVGVTCS
FYGGKLNNQSFKDASTVKKYARKAQFGEVFEFDRTILDSDGVFRSSPRGW
FTFGHANFALLFFFGHLWHGSRTLFRDVFAGIGAEVTEQVEFGVFQKVGD
KTTKKQGYV
>NC_001865@ChvulCp090@psbb@75950@77476@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTSLVSGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGITQSWGGWTISGETAANPGVWSYEGVAAAH
IVLSGLLFAASIWHWVYWDLELFRDPRTSNPALDLPKIFGIHLFLSGVLC
FGFGAFHVTGIFGPGIWVSDPYGITGTVQAVAPSWDATGFDPYNPGGISA
HHIAAGILGVLAGLFHLCVRPPQRLYNGLRMGNIETVLSSSIAAVFWAAF
VVSGTMWYGSAATPIELFGPTRYQWDLGFFQQEIERRVQTNLSEGKSASQ
AWAEIPEKLAFYDYIGNNPAKGGLFRAGAMNSGDGIAVGWLGHAVFKEKQ
GNELFVRRMPTFFETFPVVLVDKDGVVRADVPFRRSESKYSIEQVGVSVT
FYGGELDGVTFNDPATVKKYARRAQLGEIFEFDRATLQSDGVFRASPRGW
FTFAHLCFALLFFFGHIWHGARTIFRDVFAGIDADLDEQVEFGAFLKLGD
TSTRRQSV
>NC_001879@NitaCp052@psbb@74956@76482@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_002186@MeviCp006@psbb@7825@9351@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTGLVSGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGISKSWGGWDINGDSITDPGLWSYEGVAATH
IILAGLMFLASMWHWVYWDLELFRDPRTGKPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGITGRVQPIEPSWGADGFDPFNPGGIAS
HHIAAGILGILAGLFHLSVRPSFRLYKALRMGNVETVLSSSIAAVFWAAF
VVSGTMWYGSAATPIELFGPTRYQWDLGYFNKEINKRVQASIASGSTASE
AWSRIPEKLAFYDYIGNNPAKGGLFRAGAMNNGDGIAAGWLGHAVFKDKE
GRELFVRRMPTFFETFPVVLLDKDGIVRADIPFRRAESKYSIEQVGVSVA
FYGGELDGVTFKDPTTVKKYARRAQLGEIFEFDRARLKSDGVFRSSPRGW
FTFGHLCFALLFFFGHIWHGARTIFRDVFAGIDPDLDEQVEFGAFQKLGD
ASTRKQAV
>NC_002202@SpolCp052@psbb@71047@72573@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITDPGIWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSFSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLIDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDVQVEFGAFQKIGD
PTTRRQGV
>NC_002693@OeelhCp063@psbb@77298@78824@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGSH
ILFSGLCFLAAIWHWVYWDLAIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGEVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTIE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDTQVEFGAFQKLGD
PTTRRQAV
>NC_002694@LocoCp049@psbb@70038@71564@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQPVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSFSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDSQVEFGAFQKLGD
PTTRRQVV
>NC_002762@TraeCp048@psbb@68672@70198@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGTH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAA
>NC_003119@MetrCp033@psbb@52372@53898@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLFGPGIWVSDPYGLTGRVQSVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FFGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQAV
>NC_003386@PsnuCp051@psbb@71406@72932@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGITKSWGGWSITGDTVSDAGIWSFEGVAAAH
ITLSGLLFLSAIWHWVYWDLDLFRDERTGKPSLDLPKIFGIHLFLSGVLC
FGFGAFHITGLFGPGIWISDPYGLTGKVQPVDPAWGAEGFDPFIPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKALRMGNVETVLSSSIAAVFFAAF
VVSGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRIRASRAEGLSLSE
AWSRIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAIGWLGHAAFKDKE
GHELFVRRMPTFFETFPVVLVDEEGIVRADAPFRRAESKYSVEQVGVTVE
FYGGELNGVGFNDPSTVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALIFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTERQGI
>NC_004115@ChglCp030@psbb@34370@35896@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFITRLGVTKSWGGWSITGETVTNAGLWSYEGVAAVH
IILSGLLFLAAIWHWVFWDLELFRDERTGKPSLDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGLTGSVQPVSPAWGAEGFDPFNAGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNVETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGYFEQEIDKRVGTSLSEGLTLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHASFKDKE
GRELFVRRMPSFFETFPVVLLDSEGIVRADVPFRRAESKYSIEQVGVTVQ
FYGGELDGVSFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHANFALLFFFGHIWHGGRTLFRDVFAGIDPDLDAQVEFGLFQKLGD
PSTRREAV
>NC_004543@AnfoCp054@psbb@91107@92633@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITKSWGGWSITGETVTNAGIWSYEGVAAVH
IVLSGLLFLAAIWHWVYWDLELFRDERTGKPSLDLPKIFGIHLFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGKVEPVAPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNVETVLSSSIAAVFFAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIDRRIRSSKAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFKDKE
GHELFVRRMPTFFETFPVVLVDEEGIVRADIPFRRAESKYSVEQVGVIVE
FYGGELDGVSFSDPVTVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDSDLDAQVEFGAFEKLGD
PTTKRQVV
>NC_004561@AtbeCp048@psbb@75183@76709@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_004677@PikoCp063@psbb@51198@52724@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWNITGETVINPGIWSYEGVAGAH
IMFSGLMFLAAIWHWVYWDLEIFYDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDSRIEFGAFQKLGD
PTTKRQVV
>NC_004766@AdcaCp050@psbb@67792@69318@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGVSKSWGGWIITGDTSTDAGIWSYEGVAAAH
IILSGLLFLAAIWHWVYWDLDLFRDDRTGKPSLDLPKIFGIHLFLSGVLC
FSFGAFHVTGLFGPGIWISDPYGLTGKVEPVDPAWGAEGFDPFIPGGIAS
HHIAAGVLGILAGLFHLSVRPPQRLYKALRMGNVETVLSSSIAAVFFAAF
VVSGTMWYGSAATPIELFGPTRYQWDQGYFQQEIERRIRLGEAENLSLSQ
VWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHALFKDRE
GRELFVRRMPTFFETFPVVLVDGEGVVRADVPFRRAESKYSVEQVGVTVD
FFGGELDGASFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHTTFALIFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PSTKKQAV
>NC_004799@CymeCp103@psbb@80909@82438@D@1@510 photosystem_II_47_kDa_protein
MALPWYRVHIVVLNDPGRLISVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSVTGENVVNPGLWSFEGVALTH
IVLSGLLFLASIWHWVYWDLELFRDARTGEPALDLPKIFGIHLLLASLLC
FGFGAFHVTGVFGPGIWVSDAYGLTGKVQPVAPAWGPEGFNPYNPGGVAS
HHIAAGTVGILAGVFHLNVRPPQRLYRALRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDSGYFQQEMERRVQANVSQGASLAE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAQAWLGHAVFQDKQ
GRELTVRRMPAFFETFPVILVDKDGIVRADIPFRRAESKYSIEQVGVTCQ
FYGGKFNGQKFTDAASVKRYARKAQLGEVFEFDRSSLDSDGVFRTSPRGW
FTFAHANFALLFFFGHLWHGARTIFRDVFAGIGAEVTEQVEFGVFQKVGD
RSTKKQASV
>NC_004993@CafeCp049@psbb@73734@75260@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_005086@AmtrCp049@psbb@79044@80570@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLASIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGTGLAENLSLSE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNRVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKIGD
PTTRRQIV
>NC_005087@PhpapaCp012@psbb@9785@11323@R@1@513 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGITKSWGGWSITGETVNNAGIWSYEGVAAVH
IVLSGLLFLAAIWHWVYWDLELFRDERTGKPSLDLPKIFGIHLFLSGVLC
FAFGAFHVTGLFGPGIWVSDPYGLTGKVQPVVPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNVETVLSSSIAAVFFAAF
VVAGTMWYGSAATPVELFGPTRYQWDQGFFQQEIDRRIRASKSENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFKDRE
GHELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQIITRLI
>NC_005353@ChreCp032@psbb@80277@81803@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVINDPGRLISVHLMHTALVSGWAGSMALFEISVFDPSDP
VLNPMWRQGMFVLPFMTRLGITQSWGGWTISGETATNPGIWSYEGVAAAH
IILSGALFLASVWHWTYWDLELFRDPRTGKTALDLPKIFGIHLFLSGLLC
FGFGAFHVTGVFGPGIWVSDPYGLTGRVQPVAPSWGADGFDPYNPGGIAS
HHIAAGILGVLAGLFHLCVRPSIRLYFGLSMGSIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIQKRVQASLAEGASLSD
AWSRIPEKLAFYDYIGNNPAKGGLFRTGAMNSGDGIAVGWLGHASFKDQE
GRELFVRRMPTFFETFPVLLLDKDGIVRADVPFRKAESKYSIEQVGVSVT
FYGGELDGLTFTDPATVKKYARKAQLGEIFEFDRSTLQSDGVFRSSPRGW
FTFGHVCFALLFFFGHIWHGARTIFRDVFAGIDDDINDQVEFGKYKKLGD
TSSLREAF
>NC_005878@PS151@psbb@132967@134493@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAA
>NC_005973@OrniCp051@psbb@68730@70256@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQPV
>NC_006050@NyalCp050@psbb@78188@79714@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPSWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKALRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVNAGLAENLSLSE
SWSKIPDKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSYNDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_006084@SaofCp049@psbb@71341@72867@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAA
>NC_006137@Grc000070@psbb@67611@69140@R@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMSRLGVTDSWGGWSITGESVSNPGLWSFEGVAITH
IVLSGMLFLASIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLSSLLC
FGFGAFHATGLFGPGIWISDGYGITGKVQPIAPAWGPDGFNPFNPGGVAS
HHIAAGTVGILAGLFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFSAF
VTCGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSLNEGATPEE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGPMDKGDGIAEAWLGHPIFQDGE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVS
FYGGKLNGKVFTDAPSVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
FTFGHANFALIFFFGHLWHGSRTIFRDVFAGIGAEVTEQVEFGAFQKLGD
RSSKKQGAV
>NC_006290@PSC0743@psbb@74363@75889@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSVTGGAIPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_006861@HupaCp018@psbb@12842@14368@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGLFVVPFMTRLGITKSWGGWSITGETVNDAGVWSYEGVAAAH
IVLSGLFFLAAIWHWVFWDLDLFRDPRTGKPTLDLPKIFGIHLFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGKVQPVAPVWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKALRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIDRRIRSSRAENLSLSE
AWSEIPQKLAFYDYIGNNPAKGGLFRAGPMDNGDGIAVGWLGHAVFKDKE
GHELFVRRMPTLFETFPVVLADGEGIVRADVPFRRAESKYSIEQVGVTVE
FYGGELDGVSFSDPATVKKYARRAQLGEIFESDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDSDAQVEFGTFQKLGD
PTTRRPVV
>NC_007144@CsCp068@psbb@74652@76178@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMQTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPSMTRLGITNSWGGWSITGGIITNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGLGC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSTGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDTQVEFGAFQKTWR
SNYKKSLV
>NC_007288@EmhuCp034@psbb@39140@40669@D@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSNPGIWSFEGVALTH
IVLSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLSSLLC
FGFGAFHVTGTFGPGIWVSDAYGITGRVQAVAPAWGAEGFNPFNPGGIAS
HHIAAGILGLLAGVFHLTIRPPQRLYRALRMGNIETVLSSSISAVFFAAF
ITSGTMWYGAATTPIELFGPTRYQWDSGYFQQEIERRVESSLSEGLSLSQ
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPVFQDKE
GRELTVRRMPAFFETFPVILVDKDGIVRADIPFRRAESKYSIEQVGVSCN
FYGGKLNGQVFTDAPTVKKYARKSQLGEVFEFDRTTLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGGRTLFRDVFAGIGAEVLEQVEFGAFQKLGD
KSTKKQGIV
>NC_007407@AccaCp049@psbb@72204@73730@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKIGD
PTTRRQAV
>NC_007499@PhapfoPp059@psbb@73940@75466@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGIAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDADGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_007500@NisyCp060@psbb@74954@76480@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_007578@LasaCp048@psbb@72372@73898@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQIG
>NC_007602@NitoCp059@psbb@74763@76289@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_007898@LyesC2p044@psbb@74338@75864@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_007932@PoyeCp137@psbb@112182@113711@D@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSNPGLWSFEGVALTH
IVLSGMLFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLSSLLC
FGFGAFHVTGLFGPGMWVSDGYGVTGKVLPVAPAWGPEGFNPFNPGGVAS
HHIAAGTVGILAGVFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFSAF
VTCGTMWYGSATTPIELFGPTRYQWDSGYFQQEIEKRVENAIADGAAPSE
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGVAEAWLGHPVFQDKE
GRELSVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTAS
FYGGKLNGQVFNDAPSVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
FTFGHANFALIFFFGHLWHGSRTIFRDVFAGIGAEVTEQVEFGAFQKLGD
RSSKKQGAV
>NC_007942@GlmaCp047@psbb@71019@72545@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVIVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_007943@SobuCp048@psbb@74255@75781@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_007944@GohiCp048@psbb@76792@78318@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_007957@ViviCp048@psbb@77362@78888@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_007977@HeanCp048@psbb@71779@73305@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_008096@SotuCp048@psbb@74183@75709@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_008097@ChvuCp069@psbb@112833@114359@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGITKSWGGWSITGETITNPGIWSYEGVAAVH
IILSGLLFLAAIWHWVYWDLELFRDERTGKPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWISDPYGITGKVQSVSPAWGAEGFDPFNPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKALRMGNVETVLSSSIAAVFFAAF
IVSGTMWYGSAATPIELFGPTRYQWDQGYFQQEIDRRVRLSTSQGFSISE
AWSRIPEKLAFYDYIGNNPAKGGLFRAGPMDNGDGIAVGWLGHAVFKDKE
GHELFVRRMPTFFETFPVVLVDEEGIIRADLPFRRAESKYSIEQVGVTVE
FYGGELDNVSFSDPATVKKYARRAQLGEIFEFDRTTLKSDGVFRSSPRGW
FTFGHLCFALLFFFGHIWHGARTLFRDVFAGIDPDIDSQIEFGIFQKLGD
PTTKKQTV
>NC_008099@OlviCp008@psbb@8761@10287@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTSLVSGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGISQSWGGWTISGETASNPGIWSYEGVAASH
IVLSGALFMAAVWHWVFWDLELFRDPRTGNPALDLPKIFGIHLFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGSVQPVSPAWGPEGFDPYNPGGVAS
HHIAAGILGILAGLFHLCVRPPQRLYNGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSAATPVELFGPTRYQWDKGFFQEEIQKRVQSSLAEGKSLSE
AWAEIPEKLAFYDYIGNNPAKGGLFRAGAMNSGDGIAVGWLGHAVFTDKA
GNELFVRRMPTFFETFPVILLDKDGVVRADVPFRRAESKYSIEQVGVSVT
FYGGELDGVTFSDPATVKKYARRSQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHLSFALLFFFGHIWHGARTIFRDVFAGIDDDLEEQVEFGAFLKLGD
TSTRRQSV
>NC_008101@ScobCp029@psbb@57410@58936@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVINDPGRLISVHLMHTALVAGWAGSMTLFEIAVFDPSDP
VLNPMWRQGMFVLPFMTRLGVTQSWGGWTISGETATNPGIWSYEGVAASH
IILSGLLFLASVWHWVYWDLELFRDPRTGKTALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGLTGSVQPVAPSWGADGFDPFNPGGIAA
HHIAAGILGVLAGLFHLCVRPSIRLYFGLSMGSIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIQKRVQTSLAGGSSLSD
AWSKIPEKLAFYDYIGNNPAKGGLFRTGAMNSGDGIAVGWLGHAVFKDQD
GRELYVRRMPTFFETFPVLLIDKDGVVRADVPFRRAESKYSIEQVGVSVT
FYGGELDGLTFNDPATVKKYARKAQLGEIFEFDRSTLQSDGVFRSSPRGW
FTFGHVCFALLFFFGHIWHGARTIFRDVFAGIDDDLNESLEFGKYKKLGD
TSSVREAF
>NC_008114@PsakCp061@psbb@111476@116480@D@4@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGISQSWGGWTISGETATNAGIWSYEGVAVSH
IVLSGALFLAAIWHWVNWDLELFRDPRTGNPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGLTGSVQPVAPSWGPDGFDPYNPGGVAS
HHIAAGILGILAGLFHLCVRPPQRLYNGLRMGNVETVLSSSIAAVFWAAF
VVAGTAWYGSATTPIELFGPTRYQWDLGFFQQEIDKRVQTSLSEGKSLQE
AWSQIPEKLAFYDYIGNNPAKGGLFRTGAMNSGDGIAVGWLGHAVFKDKD
GNELFVRRMPTFFETFPVILLDKDGVVRADVPFRRAESKYSIEQVGVSVT
FFGGELDGVSFNNPTTVKKYARRAQLGEIFEFDRSTLQSDGVFRSSPRGW
FTFGHLSFALLFFFGHIWHGARTIFRDVFAGIDEGIDEQIEFGAFLKLGD
DSTRRQSV
>NC_008115@EuglglCp048@psbb@77207@78733@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_008116@StpuCp072@psbb@101879@103405@R@1@509 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGVTKSWGGWSITGETITNAGLWSYEGVAATH
IILSGLLFLAAIWHWVYWDLELFRDERTGKPSLDLPKIFGIHLFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGNVQPVIPAWGAEGFDPFNPGGIAS
HHIAAGILGIIAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPVELFGPTRYQWDQGYFQQEIERRIRTSLDEGLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFKDKE
GNELFVRRMPTFFETFPVVLLDKDGVVRADVPFRRAESKYSIEQVGVSVE
FYGGELNGVSFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHANFALLFFFGHIWHGSRTLFRDVFSGIDPDLESQVEFGLFQKLGD
PTTRKQAV
>NC_008117@ZyciCp004@psbb@7207@8733@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGVTQSWGGWSITGETVTNAGLWSYEGVAAVH
IVLSGLLFLAAIWHWVYWDLELFRDERTGKPSLDLPKIFGIHLFLSGVLC
FGFGAFHVTGLFGPGVWVSDPYGLTGRVQPVAPAWGAEGFDPFNPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNVETVLSSSIAAVFFAAF
VVAGTMWYGCAATPVELFGPTRYQWDQGYFQQEIDRRIRNSVAENVSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFKDKE
GNELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSIEQVGVSVE
FYGGELNGVSFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHACFALLFFFGHLWHGSRTLFRDVFAGIDPDLDSQVEFGLFQKLGD
PTTRKQTV
>NC_008155@OrsaiCp33@psbb@68751@70277@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPVWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQPV
>NC_008235@PoalCp047@psbb@72881@74407@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGTGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAIGWLGHPLFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_008289@OstapCp04@psbb@2759@4090@R@1@444 PsbB
MTRLGVTNSWGGWTISGESTSNPGLWSYEGVAASHIILSGLLFLAAIWHW
VFWDLELFRDPRTQQPALDLPKIFGIHLFLSGVLCFGFGAFHVTGLFGPG
IWVSDPYGLTGAVEPVAPAWGAEGFDPYNPGGIAAHHIAAGIVGILAGLF
HLSVRPPQRLYKALRMGNVETVLSSSIAAVFWAAFVVGGTMWYGCAATPI
ELFGPTRYQWDQGFFQQEIEKRVQTSVAGGASLSTAWSTIPEKLAFYDYI
GNNPAKGGLFRSGPMDNGDGIAAGWLGHATFTDKNGRELFVRRMPTFFET
FPVILIDGDGVVRADVPFRRAESKYSIEQVGVNVTFYGGELDGLTFTDPA
TVKKYARRAQLGEVFEFDRATLQSDGVFRSSPRAWFTFAHVSFALLFFFG
HIWHGARTIFRDVFAGIDPDLDEQVEFGAFQKLGDVTTRRQAV
>NC_008325@DacaCp048@psbb@72588@74114@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITSSWGGWSITGGATPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWTYWDLAIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQTV
>NC_008326@LituCp048@psbb@76397@77923@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_008334@CisiCp048@psbb@76568@78094@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLAIFVDDRTGKRSLDLPKIFGIHLFLSGVAC
FGFGTFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGVFQKLGD
PTTRRQVV
>NC_008335@PlocCp048@psbb@80213@81739@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGTGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_008336@NadoCp048@psbb@73739@75265@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFRDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLAE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_008359@MoinCp047@psbb@75637@77163@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENKSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELYVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_008372@StheCp012@psbb@46845@48371@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAVFDPSDP
ILNPMFRQGMFVLPFMTRLGITKSWGGWSISGETVTTGFEWTYEAVAASH
IILSGALFLASIWHWVYWDLDLFRDPREGKPALDLPKIFGIHLFLAGILC
FSFGAFHVTGLYGPGIWVSDPYGLTGSVQPVSPSWGADGFDPYNPGGIAA
HHVAAGILGILAGLFHLCVRPSLRLYLGLSMGSIESVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIEKRVASSLANGSSVSE
AWATIPEKLAFYDYIGNNPAKGGLFRSGAMNSGDGIAVGWLGHAIFTDSE
GRELYVRRMPTFFETFPVILLDKDGVVRADVPFRRAESKYSIEQVGVSVT
FSGGELDGVKFSDPATVKKYARRAQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHVCFALLFFFGHIWHGARTLARDRFAGIDEDLNDQVEFGKFQKVGD
PSSSRQAV
>NC_008407@JNC0808@psbb@80859@82385@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGSH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGVFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENKSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTLE
FYGGELNGVSYSDPAVVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRREVV
>NC_008408@BinaPp48@psbb@52200@53726@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHLMHTSLVSGWAGSMAFYELALFDPSDP
ILNPMWRQGMFVLPFMTRIGITQSWSNWSISGDSVVNPGIWSYEGVAASH
IILSGLLFMAAIWHWVYWDLELFIDKRTMFPVLDLPKIFGIHLLLSGILC
FGFGAFHVTGLFGPGIWVSDPYGLTGKVQQISPAWGADGFDPFNPGGVAS
HHIAAGILGIIAGLFHLSVRPSQRLYDALKMGNIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGYFQQEIERRVQANIDNGNSIDK
AWSLIPEKLAFYDYIGNNPAKGGLFRVGAMNSGDGIAVGWLGHPIFKDKL
GNELFVRRMPTFFETFPVLLVDENGIVKADIPFRRAESKYSIEQVGVSAT
FYGGELNNATFTDPATVKKYARRAQLGEIFEFDRTTLKSDGVFRSSPRAW
FTFGHLIFALLFFFGHIWHGARTLFRQVFAGIDPDLDEQIEFGTFLKLGD
TSTRRQSV
>NC_008454@PehoCp091@psbb@118096@119622@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNSGIWSYEGVAGAH
IVLSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVGGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRAALKSDGVFRSSPRGW
FTFGHVSFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_008454@PehoCp114@psbb@158031@159557@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNSGIWSYEGVAGAH
IVLSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVGGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRAALKSDGVFRSSPRGW
FTFGHVSFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_008456@DrgrCp048@psbb@76690@78216@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVTC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGTEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYGDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_008457@PiceCp048@psbb@75567@77093@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMVLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IMLSGLCFLAAIWHWVYWDLEIFRDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPSWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDSQVEFGTFQKIGD
PTTRRQAV
>NC_008535@CoarCp048@psbb@73541@75067@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNAGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAIGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKIGD
PTTRRQAV
>NC_008588@PhtrCp030@psbb@19018@20547@R@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGITDSWGGWSITGESVSNPGLWSFEGVALSH
IVLSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDAYGITGKVQPVAPSWGADGFNPFNPGGIAA
HHIAAGLFGILAGVFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFAAF
VTSGTMWYGAAATPIELFGPTRYQWDSGYFQQEIERQVEASVSEGLSESQ
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFRDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVD
FYGGKLNGQTFKDAPTVKKFARKSQLGEVFEFDRTSLESDGVFRSSPRGW
YTYGHANFALLFFFGHLWHGGRTIFRDVFTGIGAEVTEQVEFGVFQKLGD
KTTKKQGAV
>NC_008589@ThpsCp018@psbb@17275@18804@D@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLISVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGITDSWGGWSITGESVSNPGLWSFEGVALSH
IVLSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLSGLLC
FGFGAFHVTGLFGPGIWVSDAYGITGKVQPVAPSWGADGFNPFNPGGIAA
HHIAAGIFGIFAGIFHLTVRPPQRLYRALRMGNIETVLSSSISAVFWAAF
VTSGTMWYGAAATPIELFGPTRYQWDSGYFQQEIERQVESSVTEGLSESQ
AWSRIPDKLAFYDYIGNNPAKGGLFRSGPMDKGDGIAEAWLGHPIFRDKD
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVD
FYGGKLNGQTFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGGRTIFRDVFTGIGAEVTEQVEFGAFQKLGD
KTTKKQGAV
>NC_008590@HvsvCp049@psbb@69411@70937@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAATH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVNYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTKKQAV
>NC_008591@AgstCp049@psbb@69359@70885@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_008602@SobiCp049@psbb@71523@73049@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAA
>NC_008641@GobaCp049@psbb@76835@78361@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPCGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_008788@NuadCp048@psbb@78498@80024@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPSWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKALRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVNAGLAENLSLSE
SWSKIPDKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSYNDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_008796@RamaCp050@psbb@72557@74083@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLQIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENKSLSD
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_008822@ChatCp010@psbb@13435@14961@D@1@509 photosystem_II_47_kDa_protein
MGLPWFRVHTVVLNDPGRLISVHLMHTALVSGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGITKSWGGWNISGESISDPGLWSYEGVAATH
IVLSGLLFLASIWHWVYWDLELFRDPRTGKPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGITGRVQPVAPAWGAEGFDPFNPGGIAS
HHIAAGILGILAGLFHLTVRPPFRLYKALRMGNIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDLGFFQQEIEKRVQASLAGGASLSE
AWSSIPEKLAFYDYIGNNPAKGGLFRAGPMNNGDGIAAGWLGHAVFKDKE
GRELFVRRMPTFFETFPVLLLDKDGVVKADVPFRRAESKYSVEQVGVTVT
FYGGELDGVTFKDPATVKKYARRAQLGEVFEFDRARLKSDGVFRSSPRGW
FTFGHLCFALLFFFGHIWHGARTIFRDVFAGIDPDLDEQVEFGAYQKLGD
PSTRKQAV
>NC_008829@AnevCp053@psbb@76067@77593@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGITKSWGGWSITGDTVNDAGIWSYEGVAASH
IVLSGLLFLAAIWHWVYWDLDLFRDERTGKPSLDLPKIFGIHLFLSGVLC
FGFGAFHITGLFGPGIWVSDPYGLTGKVQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKALRMGNVETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRIRASKAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHATFKDKE
GHELFVRRMPTFFETFPVVLVDEEGVVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALIFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009143@Poptr_cp049@psbb@73334@74860@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGTGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAIGWLGHPLFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_009259@PhvuCp50@psbb@71441@72967@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGAITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQNLTE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGISYSDPTTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_009265@AecoCp047@psbb@71681@73207@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENPSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009266@AegrCp047@psbb@71742@73268@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYEWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRAYVPFRRAESKYSVEQVGVTVE
LYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_009267@OlpuCp048@psbb@72067@73593@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSD
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009268@ArhiCp047@psbb@70996@72522@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSVSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009269@BaveCp048@psbb@71601@73127@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009270@CabupaCp048@psbb@71944@73470@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009271@CrmaCp048@psbb@72260@73786@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009272@DrneCp047@psbb@70567@72093@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPARLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQTVNPTWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSVSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFDTFPVVLVYGFGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYAIRAQLGEIFELDPATLKSYGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009273@LeviCp048@psbb@72256@73782@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009274@LomaCp047@psbb@70589@72115@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSVSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009275@NaofCp048@psbb@72469@73995@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEVFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_009573@RhsaCp141@psbb@125316@126845@D@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARIGVTDSWGGWSITGESVANPGFWSFEGVALAH
IGLSGLLFLAAVWHWVYWDLELFRDPRTGNPALDLPKIFGIHLLLSGVLC
FGFGAFHVTGAWGPGIWVSDAYGITGKVQPVAPAWGPEGFNPFNPSGVAS
HHIAAGILGFAAGIFHIAVRPPQRLYRALRMGNIETVLSSSIAAVFWSAF
ITTGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSLNEGLSLSE
AWSRIPDKLAFYDYVGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFQDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTTS
FYGGKLNGQVFTDAPTVKKYARKAQLGEVMEFDRTTLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGSRTLFRDVFSGIGAEVTEQVEFGAFQKLGD
RSTKKQGAV
>NC_009598@ChspCp048@psbb@75183@76709@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGTGLSENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGPMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_009599@BumiCp048@psbb@76387@77913@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGVSLAENKSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_009600@IlolCp048@psbb@76324@77850@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGTGLAENLSLSE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYGDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_009601@CielCp047@psbb@70931@72457@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGSITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSINPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGVGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDVDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPTTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKIGD
PTTRRQAV
>NC_009618@CYtaCp067@psbb@76344@77870@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSITGETVTNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGSGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATAPVELFGPTRYQWDQGYFQQEIDRRVRAGLSENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQXLGD
PTTKRQIV
>NC_009681@LeteCp033@psbb@76152@77678@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTSLVSGWAGSMAFYELGVFDASDP
VLNPMWRQGMFVLPFMTRLGITQSWGGWTISGETATNPGIWSYEGVAAAH
IVLSGALFSAAIWHWVYWDLELFRDPRTGNPVLDLPKIFGIHLFLSGLLC
FSFGAFHVTGLFGPGIWVSDPYGITGSVQPVAPAWGADGFDPYNPGGIAS
HHIAAGILGVLAGLFHLCVRPPQRLYKGLCMGNIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDLGYFQQAIETRVQTSLAEGKSLSE
AWSQIPEKLAFYDYIGNNPAKGGLFRAGAMNSGDGIAVGWLGHAVFKDKQ
GNELFVRRMPTFFETFPVLLIDKDGVVKADVPFRRAESKYSIEQVGVSVT
FYGGELDGVTFTDPATVKKYARRAQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHLSFALLFFFGHIWHGARTIFRDVFAGIDSDLDDQVEFGAFQKLGD
SSTRRQTV
>NC_009765@CugrCp39@psbb@39302@40828@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTILLNDPGRLLSVHIMHTALVAGWAGSTALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGITTSWAGWDITGGPITTPGLWSYEGVAGAH
IFFSGLCFLAAIWHWVYWDLEVFFDQRTGKPSLDLPKIFGIHLFLAGLTC
FGFGTFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGIEGFDPLVPGGIAS
HHIAAGTLGLLAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VTAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRISVGLADKQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDKGDGIAIGWLGHPIFRDKE
GRELFVRRMPTFFETFPVILVDSGGVVRADVPFRRAESKYSVEQVGVTVS
FYGGELNGLTYSDPTTVKKYARRAQFGEIFELDRATLKSDGVFRSSPRGW
FTFSHVSFALLFFFGHIWHGARTLFRDVFAGINPDLDLQVEFGAFQKLGD
PTTRKLGI
>NC_009766@CureCp044@psbb@62662@64188@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWGIAGGTVTNPGLWSYEGVAGAH
IAFSGLCFLAAIWHWVYWDLEVFYDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPIKPTWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
TWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDNE
GRELFVRRMPTFFETFPIILVDGDGIVRADVPFRRAESKYSVEQVGVTVA
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQGA
>NC_009808@Ippucp048@psbb@75011@76537@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVA
FYGGELNGVSYSDPTTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFLKLGD
PTTKRQAA
>NC_009949@CuobCp39@psbb@38622@40148@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTILLNDPGRLLSVHIMHTALVAGWAGSTALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGITTSWAGWDITGEPIKIPGLWSYEGVAGAH
IFFSGLCFLAAIWHWVYWDLEVFFDQRTGKPSLDLPKIFGIHLFLAGLMC
FGFGTFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGIEGFDPLVPGGIAS
HHIAAGTLGLLAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VTAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRISVELADKQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDKGDGIAIGWLGHPIFRDKE
GRELFVRRMPTFFETFPVILVDSGGVVRADVPFRRAESKYSVEQVGVTVS
FYGGELNGLTYSDPTTVKKYARRAQFGEIFELDRATLKSDGVFRSSPRGW
FTFSHVSFALLFFFGHIWHGARTLFRDVFAGINPDLDLQVEFGAFQKLGD
PTTRKLGV
>NC_009950@LopeCp067@psbb@68457@69983@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLAIFSDDRTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_009962@CedeCp048@psbb@74803@76329@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGLWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGNGLSENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDNE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_009963@CuexCp045@psbb@65214@66740@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWGIAGGTVTNPGLWSYEGVAGAH
IAFSGLCFLAAIWHWVYWDLEVFYDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPLKPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
TWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVLLVDGDGIVRADVPFRRAESKYSVEQVGVTVA
FYGGELNDVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAV
>NC_010093@AcamCp047@psbb@71880@73406@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKIGD
PTTRRQAV
>NC_010109@LemiCp048@psbb@77386@78912@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRISAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAIGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_010323@CapaCp048@psbb@76916@78442@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_010358@OearCp048@psbb@76525@78051@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGSH
ILFSGLCFLAAIWHWVYWDLAIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGEVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDTQVEFGAFQKLGD
PTTRRQAV
>NC_010360@OeglCp048@psbb@77585@79111@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGSH
ILFSGLCFLAAIWHWVYWDLAIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGEVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTIE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDTQVEFGAFQKLGD
PTTRRQAV
>NC_010361@OebiCp048@psbb@76970@78496@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGSH
ILFSGLCFLAAIWHWVYWDLAIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGEVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTIE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDTQVEFGAFQKLGD
PTTRRQAV
>NC_010362@OepaCp048@psbb@75730@77256@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGSH
ILFSGLCFLAAIWHWVYWDLAIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGEVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDTQVEFGAFQKLGD
PTTRRQAV
>NC_010433@MaesCp048@psbb@77269@78795@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_010442@TrCaCp027@psbb@27068@28594@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTIVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIINSWGGWGITGGTITYPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFTDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQYVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSTGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGAGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYNDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_010548@CrjaCp005@psbb@4013@5539@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETGSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDSRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKN
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_010601@GuabC_p048@psbb@71841@73367@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTTTNPGIWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAV
>NC_010654@WemiC_p045@psbb@56136@57662@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDS
VLDPMWRQGMFILPFMTRLGIKESWGGWSITGEPIANPGLWSYEGVAGAH
IVFSGLCFLSATWHWVYWDLEIFSDPRTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPFGLTGKIQPVSPAWGAEGFDPFVPGGIAS
HHVAAGLLGIIAGLFHLSVRPPQRLYRGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVQAGLAENLSLSE
AWSRIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGVIKADIPFRRAESKYSVEQVGVTVE
FYGGELNGVSFSDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDIFAGIDPELDIQVEFGAFQKIGD
PTTKRQVV
>NC_010772@Heak293_Cp153@psbb@155992@157521@R@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGVTDSWGGWTITGDSASNPGIWSYEGVALTH
IVLSGLLFLAAIWHWVYWDLELFRDPRTGETGLDLPKIFGIHLLLSGLLC
FGFGAFHVTGLFGPGIWVSDAYGLTGKVQPVAPAWGPDGFNPFNPGGVAS
HHIAAGTFGILAGVFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFAAF
VTSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVETSLNEDLSESE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGPMDKGDGIAEAWLGHPIFRDRE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVNVS
FYGGKLNGQSFKDAPTVKKYARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALLFFFGHLWHGSRTLFRDVFTGIGAEVTEQVEFGSFQKLGD
RTTRKQGAV
>NC_010776@FaesanCp048@psbb@73391@74917@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTDPGIWSYEGVAGSH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLIDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDSQVEFGAFQKLGD
PTTRRQAV
>NC_011031@OecaC_p071@psbb@129608@131931@R@2@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTSLVSGWAGAMALYELAVFDPSDP
VLNPMWRQGTFVLPFMTRLGVTQSWGGWTISGETIGNTGFQWTYETVAAA
HIILSGLLFLAAIWHWIYWDLDLFRDPREKKPALDLPKIFGIHLFLAGLL
CFSFGAFHITGLYGPGIWVSDPYGITGSVQPVAPSWGADGFDPFNPGGIA
AHHIAAGVLGILAGLFHLCVRPSLRLYLGLSMGSIESVLSSSIAAVFWAA
FVVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIEKRVQSTIAAGSSLS
EAWSQIPEKLSFYDYIGNNPAKGGLFRSGAMNSGDGIAVGWLGHAVFKDQ
EGRELYVRRMPTFFETFPVLLLDKDGIVRADVPFRRAESKYSIEQVGVSV
TFYGGELDGVTFSDPATVKKYARRAQLGEIFEFDRATLQSDGVFRSSPRG
WFTFGHVTFALLFFFGHIWHGARTLARDRFAGIDEDITDQVEFGKFQKVG
DPSSFRGAV
>NC_011032@BrdiC_p051@psbb@67711@69237@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGTH
IVFSGLCFLAAIWHWVYWDLAIFSDDRTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLSENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_011152@CLPGMS-5045@psbb@52710@54236@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWNITGETVINPGIWSYEGVAXXX
XXXXXXXFLAAIWHWVYWDLEIFYDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSXXXXX
XXXXXXXXXXXFFSGHIWHGSRTLFRDVFAGIDPDLDARIEFGAFQKLGD
PTTKRQVV
>NC_011153@CLPGMS-2245@psbb@52529@54055@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWTGWNITGETVINPGIWSYEGVAVAH
IVFSGLCFLAAIWHWVYWDLDIFCDERTGKRCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSXXXXX
XXXGHATFALLFFSGHIWHGSRTLFRDVFAGIDSDLDSRIEFGAFQKLGD
PTTKRQVV
>NC_011154@CLPGMS-2645@psbb@51916@53442@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWNITGETVINPGIWSYEGVAGAH
IMFSGLMFLAAIWHWVYWDLEIFYDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSXXXXX
XXXGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDSRIEFGAFQKLGD
PTTKRQVV
>NC_011155@CLPGMS-2845@psbb@51836@53362@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWNITGETVINPGIWSYEGVAGAH
IMFSGLMFLAAIWHWVYWDLEIFYDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSXXXXX
XXXGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDSRIEFGAFQKLGD
PTTKRQVV
>NC_011156@CLPGMS-3245@psbb@51343@52869@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWNITGETVINPGIWSYEGVAGAH
IMFSGLMFLAAIWHWVYWDLEIFYDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSXXXXX
XXXGHAXFALLFFSGHIWHGARTLFRDVFAGIDPDLDSRIEFGAFQKLGD
PTTKRQVV
>NC_011158@CLPGMS-4045@psbb@51517@53043@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWTGWNITGETVINPGIWSYEGVAVAH
IIFSGLMFLAAIWHWVYWDLEIFYDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSXXXXX
XXXGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDSRIEFGAFQKLGD
PTTKRQVV
>NC_011159@CLPGMS-4445@psbb@51718@53244@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWTGWNITGETVINPGIWSYEGVAGAH
IMFSGLMFLAAIWHWVYWDLEIFYDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSXXXXX
XXXGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDSRIEFGAFQKLGD
PTTKRQVV
>NC_011163@CiarC_p045@psbb@70243@71772@D@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVGC
FGFGAFHVTGLFGPGIWVSDPYGLTGRVQSVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHVSFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PSTKKPVVS
>NC_011600@ValiC_p047@psbb@42451@43980@D@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGVTDSWGGWSITGESVSNPGIWSFEGVALTH
IVLSGLCFLAAIWHWVYWDLELFRDLRTGEPTLDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDAYGITGKIQPVAPAWGPEGFNPFNPGGIAS
HHIAAGTFGILAGVFHLTIRPPQRLYRALRIGNIETVLSSSISAVFFAAF
ITSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVELSLNEGLSESE
TWANIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFRDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESXYSIEQVGVNVS
FYGGKLNGQSFKDAQTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHVNFGLLFFLGHLWHGSRTIFRDVFTGIGAEVTEQVEFGAFQKLGD
ESTRKQGIV
>NC_011713@FearC_p043@psbb@69030@70562@D@1@511 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFRSGIGIA
SHHIAAGTWGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIPAVFFAA
FVVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLS
EAWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIPVGWLGHPVFIDK
EGRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTV
EFYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRG
WFTFGHATFAFALLFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKV
GDPTTRKQAV
>NC_011828@TrsuC_p015@psbb@16797@18323@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVGC
FGFGAFHVTGLFGPGIWVSDPYGLTGRVQSVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQNLSE
AWSKIPEKLVFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_011930@KedaC_p057@psbb@91794@93320@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKNSWSGWSITGETVINPGIWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLELFCDERTGKLCLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYIGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVCFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRTSPRGW
FTFGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDARIEFGAFQKLGD
PTTKRQVV
>NC_011942@GnpaC_p033@psbb@68467@69993@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFILPFMTRLGIKESWGGWSITGESAVNPGLWSYEGVAGAH
IVFSGLCFLSAIWHWVYWDLEIFSDPRTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPFGLTGRIQPVSPAWGAEGFDPFVPGGIAS
HHIAAGLLGIIAGLFHLSVRPPQRLYRGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLTEKLSLSE
AWSRIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFRDKE
GNELFVRRMPTFFETFPVVLVNKEGIVKADVPFRRSESKYSVEQVGVTVE
FYGGELNGVSFSDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDIFAGIDPELDAQVEFGAFQKLGD
PTTKRQVV
>NC_011954@EpeqC_p044@psbb@48900@50426@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHIVFLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFILPFMTRLGIKESWGGWSITGETEANPGFWSYEGVAGAH
IVFSGLCFLSAIWHWVYWDLEIFTDPRTGKPSLDLPKIFGIHLFLSGVVC
FGFGAFHVTGLYGPGIWISDPFGLTGKIQPVSPAWGAEGFDPFVPGGIAS
HHVAAGLLGIIAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFASF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLNKNLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAIGWLGHPIFKDKD
GNELFVRRMPTFFETFPVVLVDKEGVVKADVPFRRSESKYSVEQVGVTVE
FYGGELDGVSFSDPTIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGSRTLFRDIFAGIDPELNAQVEFGAFQKLGD
PTTKKQVI
>NC_012052@Syruc_p017@psbb@10711@12237@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGITKSWGGWSITGETINNAGLWSYEGVAAVH
IVLSGLLFLAAIWHWVYWDLELFRDERTGKPSLDLPKIFGIHLFLSGVLC
FAFGAFHVTGLFGPGIWVSDPYGLTGKVQPVVPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNVETVLSSSIAAVFFAAF
VVAGTMWYGSAATPVELFGPTRYQWDQGFFQQEIDRRIRASKNENLSLSE
SWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAIFKDRE
GHELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQIV
>NC_012097@PyprC_p056@psbb@65650@67176@R@1@509 photosystem_II_47_kDa_protein
MGLPWFRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELSVFDPSDP
VLNPMWRQGMFVLPFMTRLGVTKSWGGWDINGDTITSPGIWSYEGVAASH
IILSGLLFLAAIWHWVFWDLELFRDPRTGDPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGITGSVQPVAPAWGAEGFDPYNPGGIAS
HHIAAGILGILAGLFHLTVRPPQRLYKGLRMGNIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFAQEIEKRVQANLAAGDNLST
AWSKIPEKLSFYDYIGNNPAKGGLFRSGPMDNGDGIAIGWLGHAVFTDTT
GNELFVRRMPTFFETFPVLLVDKDGVVRADVPFRRAESKYSIEQVGVSVT
FYGGELDGVTFNDPATVKKYARRAQLGEIFEFDRAILQSDGVFRSSPRGW
FTFGHLNFALLFFFGHIWHGARTIFRDVFAGIDPDLDEQVEFGAFQKLGD
TSTRRQTV
>NC_012099@PypaC_p009@psbb@10646@12172@R@1@509 CP47_chlorophyll_apoprotein_of_photosystem_II
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVIPFMTRLGVTKSWGGWSISGETITNPGIWSYEGVAASH
IVLSGLLFLAAIWHWVYWDLELFRDPRTGDPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGITGSVQPVSPAWGPEGFDPYNPGGVAS
HHIAAGVLGIIAGLFHLTVRPPQRLYKALRMGNIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQEEIERRVQKSVASGKSLSQ
AWSTIPEKLAFYDYIGNNPAKGGLFRSGPMDNGDGIAAGWLGHAVFSDKE
GRELFIRRMPTFFETFPVLLLDKDGVVRADVPFRRAESKYSVEQVGVNVT
FYGGELDGVSFSDPATVKKYARRAQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHLCFALLFFFGHIWHGARTIFRDVFAGIDPDLDEQIEFGAFQKLGD
ITTKRQAV
>NC_012101@MoOKC_p055@psbb@83425@84951@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHNVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGVTGSWGGWSITGETIGNPGIWSYEGVAASH
IILSGLLFLAAVWHWTFWDLELFRDPRTGDPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGFFGPGIWVSDPYGITGSVQPVAPAWGPEGFDPYNPGGIAS
HHVAAGILGILAGLFHLTVRPPQRLYKGLRMGNIETVLSSSIAAVFWAAF
VVSGTMWYGSAATPIELFGPTRYQWDQGFFQAEIDKRVQKSLSEGKNLST
AWASIPEKLAFYDYIGNNPAKGGLFRSGPMDNGDGIAAGWLGHAVFTDKD
GRELTTRRMPTFFETFPVILVDQDGIVRADVPFRRAESKYSIEQVGVSVT
FYGGELDGITFNDPATVKKYARRAQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHLCFALLFFFGHIWHGARTIFRDVFAGIDPDLDEQVEFGAFQKLGD
VTTRRQAV
>NC_012224@JacuC_p046@psbb@78922@80448@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEVFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_012615@MesaC_p048@psbb@76517@78043@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLSENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVNYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQGV
>NC_012818@AlspC_p052@psbb@71811@73337@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGVTKSWGGWSITGDTVTDAGIWSYEGVAAAH
IILSGLLFLAAIWHWVYRDLDLFRDDRTGKPSLDLPKIFGIHLFLSGVLC
FAFGAFHVTGLFGPGIWVSDPYGLTGKVEPVDPAWGAEGFDPFVPGGIAS
HHIAAGVLGILAGLFHLSVRPPQRLYKALRMGNVETVSSSSIAAVFFAAF
VVSGTMWYGSAATPIELFGPTRYQWDQGYFQQEIDQRIRSSKAENLSLSE
AWSKIPEKSAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAIFKDKE
GHELFVRRMPTFFETFPVVLVDGEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGASFSDPATVKKYARRAQSGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALIFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PSTKRQPI
>NC_012898@AuanCp054@psbb@47880@49418@D@1@513 photosystem_II_p680_chlorophyll_A_apoprotein_(CP-47)
MALPWYRVHTVVLNDPGRLIAVHLMHTSLVAGWAGSMALYELAIFDPSDP
VLNPMWRQGMYVMPFMTRLGVTDSWGGWSITGESVSAPGLWSYEGVALTH
IVLSGLCFLAAIWHWVYWDLDLFRDPRTGEPAIDLPKVFGIHLFLSGLLC
FGFGAFHVTGIFGPGIWVSDAFGVTGKVAGVAPAWGPEGFNPFNPGGVAS
HHIAAGAFGILAGIFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFAAF
VTSGTMWYGCATTPIELFGPTRYQWDSGYFQQEIERQVETSLSEGLSESN
AWSRIPDKLAFYDYIGNNPAKGGLFRSGPMNKGDGIAEAWLGHPVFKDRD
GRELTVRRMPAFFETFPVILVDKDGVIRADIPFRRAESKYSIEQVGVSVD
FYGGKLNGQSFKDAPTVKKFARKAQLGEVFDFDRTSLESDGVFRSSPRGW
YTFGHLNFALLFFFGHLWHGARTLFRDVFTGIGAEITEQIEFGAFQKLGD
VSTDRSRKQGAV
>NC_012903@AulaCp037@psbb@28803@30335@D@1@511 photosystem_II_p680_chlorophyll_A_apoprotein_(CP-47)
MALPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAIYDPSDP
VLNPMWRQGMYVMPFMTRLGVTDSWGGWSITGESVSSPGIWSYEGVALTH
IVLSGLCFLAAIWHWVYWDLDLFRDPRTNEPAIDLPKVFGIHLLLSGLLC
FGFGAFHVTGIFGPGIWVSDAYGVTGKVAGVAPAWGPEGFNPFNPGGVAS
HHIAAGAFGILAGIFHLTVRPSQRLYRALRMGNIETVLSSSISAVFFAAF
VTSGTMWYGCATTPVELFGPTRYQWDSGYFQQEIERQVEESLSQGLSESN
AWSRIPDKLAFYDYIGNNPAKGGLFRSGPMNKGDGIAEAWLGHPIFKDRE
GRELTVRRMPAFFETFPIILVDKDGVIRADIPFRRAESKYSIEQVGVSVD
FYGGKLNGQSFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHLNFALLFFFGHLWHGSRTLFRDVFTGIGAEVTEQVEFGAFQKLGD
ETTARKQGAV
>NC_012978@PakeC_p027@psbb@46182@47708@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMAFYELAVFDPSDP
VLNPLWRQGMFVLPFMTRLGISESWGGWTISGETAVNPGVWSYEGVAAAH
IVLSGLLILASIWHWVYWDLELFRDPRTGDPALDLPKIFGIHLFLSGLLC
FSFGAFHVTGLFGPGIWVSDPYGITGSVQPVSPSWDATGFDPYNPGGIAA
HHIAAGILGVLAGLFHLCVRPPQRLYNGLRMGNIETVLSSSIAAVFWAAF
VVSGTMWYGSAATPIELFGPTRYQWDLGFFQQEIERRIQTSLSQGKSLSQ
AWSEIPEKLAFYDYIGNNPAKGGLFRAGAMNSGDGIAVGWLGHAVFKDKQ
GNELFVRRMPNFFETFPVVLVDKDGIVRADVPFRRAESKYSVEQVGVSVT
FYGGELDGVVFTDPTTVKKYARRAQLGEIFEFDRATLQSDGVFRTSPRGW
FTFAHLCFALLFFFGHIWHGARTIFRDVFAGIDADLDEQVEFGAFQKLGD
SSTRRQSV
>NC_013086@SemoP_p040@psbb@69055@70581@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRAHTVVSNDPGRSLPVHLMHTALVSGWAGPMAPYELAVSDPSDP
ALDPMRRQGMSVIPLTTRPGVTESWSGWSIAGETVTNAGIRSYEGVATAH
IVPPGLLLLAAIWHWVYWDSEISSDERTGTFALDLPKISGVHPSPPGVPR
FGFGASHVTGLLGPGIWVSDPYGLTGRIEPVAPVWTAAGFDPFVPGGIAS
HHIAAGILGILAGLFHPSARPPQRSHKSLRMGNVETVSSSSIAAVPLAAL
VVAGTMWYGSATTPVEPFGPTRYQWDLGFYQQETDRRIRSARAGNIGLPE
AWSKIPEKSASHDHIGSNPAKGGSSRAGATDSGDGIAVGRLGHATPRDKE
GHEPFVRRMPTLLETSPVVLVDEEGIARADVPSRRAESKYSAEQVGVTAE
FCGGELDGVSFSDPATVKKHARRAQLGEIPESDRATSKPDGVPRSSPRGW
STFGHATFALLSSSGHIRHGARTPFRDVLAGTDPDPDAQAELGTSQKSGD
PTTKRQAV
>NC_013088@DelaC_p046@psbb@71159@72685@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_013273@ColajoC_p049@psbb@71096@72622@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAT
>NC_013359@BrhyC_p045@psbb@68461@71091@D@2@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTSLVSGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGITQSWGGWTISGETATNPGIWSYEGVATSH
ILLSGALFAAALWHWVYWDLELFRDPRTGKPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPFGITGSVQAIKPSWGADGFDPFNPGGIAS
HHIAAGILGILAGLFHLCVRPSFRLYLGLSMGNIETVLSSSIAAVFWSAF
VVCGTMWYGSAATPIELFGPTRYQWDNGFFANEIEKRVSESVASGKTLSE
AWSQIPEKLAFYDYIGNNPAKGGLFRAGAMNSGDGIAVGWLGHSVFKDKN
GTELHVRRMPTFFETFPVVLLDDDGIVRADIPFRRAESKYSIEQVGVSVT
FYGGELDGVTFSDPSTVKKYARRSQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHLCFGLLFFFGHIWHGARTIFRDVFAGIDTDLDEQVEFGAFQKVGD
TSTRRQSV
>NC_013498@Es_cpDNA_63@psbb@31225@32757@D@1@511 Photosystem_II_chlorophyll_A_core_antenna_apoprotein_CP47
MALPWYRVHTVVLNDPGRLIAVHLMHTGLVAGWAGSMALYELSIFDFSDP
ILNPMWRQGMFVMPFMTRLGVSDSWTGWDIAGERSEPIASLWCYEGVAYT
HIILSGLCFLAAVWHWVYWDLELFRDPRTGEPSLDLPKIFGIHLFLSGLL
CFGFGAFHVTGFFGPGIWVSDAYGLTGQVQPVAPSWGPSGFNPFNPGGIA
SHHMAAGSFGVLAGGFHLTLRPPQRLYRALRMGNIETVLSSSIAAVFFAA
FITSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVEVSLNEGLSES
EAWSSLPDKLAFYDYIGNNPAKGGLFRSGPMNKGDGIAEAWLGHPIFRDR
EGRELSVRRMPAFFETFPVILIDKDGIIRADIPFRRAESKYSIEQVGVNV
SFYGGKLNGQSFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRG
WYTFGHLNLALLFFLGHLWHGSRTLFRDVFTGIGSEVTEQVEFGAFQKLG
DETTRKQGLV
>NC_013553@PaarC_p044@psbb@72850@74376@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_013707@OleuC_p046@psbb@75065@76591@D@1@509 PSII_47kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_013823@TylaC_p048@psbb@77541@79067@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKVPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFKDKE
GRELFVRRMPTFFETFPVVLVDEDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTKRQVV
>NC_013843@Vrkps_p051@psbb@72446@73972@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGAITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQNLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRPVV
>NC_013991@PhdaC_p048@psbb@74503@76029@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYGDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_014056@OngoraC_p047@psbb@70653@72179@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNISGGTITNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGNVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRTGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_014057@PisaC_p058@psbb@101858@103384@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLFGPGIWVSDPYGLTGRVQSVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGGGLVENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVIVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQGV
>NC_014062@AnmaCp047@psbb@70572@72098@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGCVFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQVV
>NC_014063@LasapC_p029@psbb@36667@38193@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNSGIWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLFGPGIWVSDPYGLTGRVQFVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGSGLVENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVIVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQGV
>NC_014267@KrfoC_p031@psbb@21419@22948@R@1@510 photosystem_II_P680_chlorophyll_A_apoprotein
MALPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGITDSWGGWSITGESVSNPGIWSFEGVALSH
IILSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLSGLAC
FGFGAFHVTGLFGPGIWVSDAYGITGKVQPVAPAWGADGFNPFNPGGIAA
HHIAAGIFGIFAGIFHLTVRPPQRLYRALRMGNIETVLSSSIAAVFFAAF
VTSGTMWYGAAATPIELFGPTRYQWDSGYFQQEIERQVEASVSEGLSESQ
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMDKGDGIAEAWLGHPIFRDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVSVD
FYGGKLNGQTFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGGRTIFRDVFTGIGAEVTEQVEFGAFQKLGD
KSTKKQGAV
>NC_014287@PyulOm_p030@psbb@18811@20340@R@1@510 photosystem_II_chlorophyll_A_core_antenna_apoprotein
MALPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGITDSWGGWSITGESVSNPGIWSFEGVALSH
IILSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLSGLAC
FGFGAFHVTGLFGPGIWVSDAYGITGKVQPVAPAWGADGFNPFNPGGIAA
HHIAAGIFGIFAGIFHLTVRPPQRLYRALRMGNIETVLSSSIAAVFFAAF
VTSGTMWYGAAATPIELFGPTRYQWDSGYFQQEIERQVEASVSEGLSESQ
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMDKGDGIAEAWLGHPIFRDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVD
FYGGKLNGQTFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGGRTIFRDVFTGIGAEVTEQVEFGAFQKLGD
KSTKKQGAV
>NC_014340@CHVEC_p070@psbb@12173@13819@R@1@549 photosystem_II_47_kDa_protein
MGRQRRILPWYRVHSILFNDPGRLISVHLMHTALIAGWAGAMTLYELNIF
DPSDPVLNPMWRQGMYVLPFMARLGITNSSDKWNLFGSQDYYKSDTPNGT
GVLNWWTRTGNQGGWTFESVALAHFGLSGMLILASMWHWYYWNLDLFEND
NVFFQNVTTLDYLLLFSIHLTLASALCFGFGALHLTGTWGPGVWMNDRFG
LNPHLVYVQPEWGGEGFNPFNLSGVPAHHIAAGTLGLLGGYFHLRVRPGL
YLFLWAHMGNIETILASGIAALLFAALLTTASMWYGTVLTPITLFGPTRY
QWDSGFFQTQVDELVTDNLAKYGSLAKAYQQLPDRLLFYDYIGNNPGKGG
LFRAGALNKGDGVAKTWLGHPIFYDGNTNEILTVRRMPTFFETFPVTLTD
RYGVLRVDIPFRRAESKFSIEQQGTVCKYFGGLKDGQELYAVAAVKAAAR
KAVLGEQFDFDRQQFNSDGVFRASPRTWYAFGHAIFAFFFFFGHLWHAGR
TLFEELLTGVDSEVFDFVKFGGMSKVGGKFVYRRAPMTITNYILNNNY
>NC_014345@AlspOC_p032@psbb@28117@29715@R@1@533 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELSVFDPSDP
VLNPMWRQGMFVLPFMARLGVTESWNGWSLLGDTDLEAVPIYAVDESTGV
VDQIFQFLVSRGPGIWSVEGVAVSHIILSGLLFLAAIWHWTFWDLDIFRD
PESNQLVLDLPLVFGIHLALASFLCLGFGGFHVAGLFGPGIWVSDAYGLS
AAVKPVQPEWGPDGFNPFNPGGVAAHHIAAGILGIIASVFHLSVRPSERL
FKLLRMGNIETVLSSSIAAVFFAAFVTSGTMWYGSATTPVDLFGPTRYQW
DSGYFQQEVERQVENNLRRGYSLTEAWSLVPDKLAFYDYVGNNPAKGGLF
RAGPMNKGDGIAQAWLGHPIFRTKDGNELTVRRMPSFFETFPVILVDKDG
VVQADIPFRRAESKYSIEQVGVSVQFLGGKLNGQKFDDPTTVKKFARKAQ
LGEMFQFDRVTLQSDGVFRSSPRGWYTFGHLNLALLFYFGHLWHGGRTLF
RDVLTGIGADVVKQVEFGAFQKLGDETTELSR
>NC_014346@FlteC_p035@psbb@224687@226216@D@1@510 CP47_chlorophyll_apoprotein_of_photosystem_II
MGLPWYRVHTVVLNDPGRLIAVHLMHTSLVSGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGITKSWGGWSISGETIANTGFEWTYESVAAA
HIVLSGALFLAAIWHWTYWDLDLFRDPREKKPALDLPKIFGIHLFLSGLV
CFGFGAFHITGLFGPGIWVSDPYGLTGSVQPVAPSWGSDGFDPFNPGGIA
AHHIAAGILGVLAGLFHLCVRPSLRLYLGLSMGSIETVLSSSIAAVFWAA
FVVAGTMWYGSAATPVELFGPTRYQWDQGFFQQEIEKRVSKSLAAGESVT
EAWAKIPEKLAFYDYIGNNPAKGGLFRSGAMNSGDGIAVGWLGHAVFKDR
DGNELYVRRMPTFFETFPVLLIDKDGLVRADVPFRRAESKYSIEQVGVSV
SFYGGELDGLTFSDPATVKKYARRAQLGEIFEFDRATLQSDGVFRSSPRG
WFTFGHLCFALLFFFGHIWHGARTLARDRFAGIDDDVTDQVEFGKFQKVG
DPSTARQGV
>NC_014348@PTAQ_Cp070@psbb@70211@71740@D@1@510 photosystem_II_CP47_chlorophyll_apoprotein
MGLPRYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMASYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGVTKSWGGWSITGDTATDAGIWSYEGVAAAH
IILSGLLFLAAIRHWVYWDLDLFRDDRTGKPSLDLPKIFGIHLFLSGVLC
FAFGAFHVTGLFGPGIWVSDPYGLTGKVEPVDPAWGAEGFDPFVPGGIAS
HHIAAGVLGILAGLFHLSVRPPQRLYKALRMGNVETVSSSSIAAVFFAAF
VVSGTMWYGSAATPIELFGPTRYQWDQGYFQQEIEKRIRLGEAENLSLSQ
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFKDRE
GHELFVRRMPTFFETFPVVLVDGEGIVRADVPFRRAESKYSVEQVGVTVE
FFGGELDGASFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALIFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PSTKRQAVR
>NC_014569@ErteP_p006@psbb@10401@11927@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLGKNQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GCELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGQLNGVIYSDPATVKKYARRAQLGEIFELDRAALKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDTQVEFGAFQKLGD
PTTKRQAV
>NC_014570@EucgrC_p047@psbb@77076@78602@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_014573@GepaP_p034@psbb@49421@50947@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGETITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVSC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQFVNPAWGVSGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLVKNQSLSE
AWSKIPEKLSFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GYELFVRRMPTFFETFPVVLVDGNGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVIYSDPTTVKKYARRAQLGEIFELDRAALKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
STTKRQAV
>NC_014575@CedeC_p004@psbb@1775@3301@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWSITGETVTNPGIWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLEIFCDERTGKLCLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYIGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDARIEFGAFQKLGD
PTTKRQVV
>NC_014582@MospP_p017@psbb@25806@27332@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
ALDPMWRQGMFVIPFMTRLGISNSWGGWSITGGTLTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQFVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIALGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEEVGVTLE
FYGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKRAV
>NC_014589@CaarC_p023@psbb@21617@23143@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGLFVIPFMTRLGIKDSWTGWNITGETVNNPGIWSYEGVALAH
ILFSGLCFLAAIWHWVYWDLEIFVDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRTGLAEKLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDDRIEFGVFQKLGD
PTTKRQMV
>NC_014592@ChliC_p070@psbb@68703@70229@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGITKSWGGWSITGDTATDAGIWSYEGVAAAH
IILSGLLFLAAIWHWVYWDLDLFRDDRTGKPSLDLPKIFGIHLFLSGVLC
FAFGAFHVTGLFGPGIWVSDPYGLTGKVEPIDPAWGAEGFDPFIPGGVAS
HHIAAGVLGILAGLFHLSVRPPQRLYKALRMGNVETVLSSSIAAVFFAAF
VVSGTMWYGSAATPIELFGPTRYQWDQGYFQQEIERRIRSGKDENLSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFKDRE
GHELFVRRMPTFFETFPVVLVDGEGVVRADVPFRRAESKYSVEQVGVTVE
FFGGELDGASFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALIFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PSTRRQAV
>NC_014674@CamoC_p048@psbb@78568@80094@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAIFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGIAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_014675@IsflC_p018@psbb@12399@13925@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGPPWYRVHTVVSNDPGRSIAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITKSWGGWSITGETVTNAGIWSYEGVAAAH
IVLSGLLFLSAIWHWVYWDLEIFTDERTGALTIDLPKVFGVHLFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGEAQPVAPVWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFYLSVRPPQRLYKGLRMGNVETVLSSSIAAVFFAAF
VAAGTMWYGSATTPIELFGPTRYQWDQGFFQQEIDRRIRSSRAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFRDKE
GHELFVRRMPTFFETFPVVLVDGEGIARADVPFRRAESKYSIEQVGVTVE
FYGGELDGVSFSDPATVKKYARRAQLGEISEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_014676@ThcaC_p047@psbb@77440@78966@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKIGD
PTTRRQVV
>NC_014697@PrpeC_p048@psbb@74124@75650@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_014699@EvarC_p018@psbb@11827@13353@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGITKSWGGWSITGETVTDAGIWSYEGVAAAH
IILSGLLFLSAIWHWVYWDLELFRDERTGKPSLDLPKIFGVHLFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGNVRPVDPAWGADGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKALRMGNIETVLSSSIAAVFFAAF
VVSGTMWYGSAATPIELYGPTRYQWDQGYFQQEIDRRIRVSLADNSSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFRDKE
GHDLFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVD
FYGGELNGVSFSDPATVKKYARRSQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLESQIEFGAFEKLGD
PSTEKRAV
>NC_014807@ColaC_p048@psbb@77004@78530@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIINSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_014808@THAOCp052@psbb@44806@46335@D@1@510 photosystem_II_CP47_chlorophyll_apoprotein
MALPWYRVHTVVLNDPGRLISVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGITDSWGGWSITGESVSNPGLWSFEGVALSH
IVLSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLSGLLC
FGFGAFHVTGLFGPGIWVSDAYGITGKVQPVAPSWGADGFNPFNPGGIAA
HHIAAGIFGILAGIFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFAAF
VTSGTMWYGAAATPIELFGPTRYQWDSGYFQQEIERQVEASVTEGLSESQ
AWSRIPDKLAFYDYIGNNPAKGGLFRSGPMDKGDGIAEAWLGHPIFRDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVD
FYGGKLNGQTFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGGRTIFRDVFTGIGAEVTEQVEFGAFQKLGD
KTTKKQGAV
>NC_015083@ErcaC_p047@psbb@71566@73092@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSIAGGAVTNPGIWSYEGVAGAH
IVFSGLCFLASIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FSFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVDGFDPFVAGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GSELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVVYSDPATVKKYARRAQLGEIFELDRAALKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_015084@CospP_p057@psbb@108961@111917@D@2@507 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGITQSWGNWTISGETATSPGIWTYEGVATAH
ILLSGALFMASIWHWVYWDLELFRDPRTGDPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGITGSVQPVSPAWGADGFDPYNPGGIAS
MAAGILGVLAGLFHLCVRPSQRLYNGLRMGNIETVLSSSIAAVFWAAFVV
AGTMWYGSAATPIELYGPTRYQWDLGFFQQEIERRVQGSLAEGKSSSQAW
SEIPEKLAFYDYIGNNPAKGGLFRAGAMNSGDGIAVGWLGHAVFKDKDGN
ELFVRRMPTFFETFPVLLIDKDGVVRADVPFRRAESKYSIEQVGVSVAFY
GGELNGVTFTDPATVKKYARRAQLGEVFEFDRATLQSDGVFRSSPRGWFT
FGHLCFALLFFFGHIWHGARTIFRDVFAGIDSDIDDQVEFGAFQKLGDPS
TRRQSV
>NC_015113@AnceC_p048@psbb@73151@74677@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITSSWGGWSITGGATPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENKSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQTV
>NC_015204@GothC_p048@psbb@76746@78272@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_015206@FvH4_C0069@psbb@73676@75202@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLAIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_015308@HebrCp068@psbb@77025@78551@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_015359@ChvaP_p036@psbb@65915@67363@D@1@483 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTSLVSGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGINQSWGGWTISGETASNPGIWSYEGVAAAH
IVLSGLLFAASIWHWVYWDLELFRDPRTSNPALDLPKIFGIHLFLSGVLC
FGFGAFHVTGIFGPGIWVSDPYGITGTVQAVAPSWDATGFDPYNPGGISA
HHIAAGILGVLAGLFHLCVRPPQRLYNGLRMGNIETVLSSSIAAVFWAAF
VVSGTMWYGSAATPIELFGPTRYQWDLGFFQQEIERRVQTSLSEGKSSSQ
AWAEIPEKLAFYDYIGNNPAKGGLFRAGAMNSGDGIAVGWLGHAVFKDKQ
GNELFVRRMPTFFETFPVFLVDKDGVVRADVPFRRSESKYSIEQVGVSVT
FYGGELNGVTFSDPATVKKYARRAQLGEIFEFDRATLQSDGVFRTSPRGW
FTFAHLCFALLFFFGHIWHGARTIFRDVFGRY
>NC_015401@OleuseuP_p046@psbb@75092@76618@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_015402@PtpuC_p054@psbb@68793@70310@D@1@506 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITKSWGGWSITGETVTNAGIWSYEGVAVVH
IVLSGLLFLAAIWHWVFWDLELFRDERTGKPSLDLPKIFGIHLFLSGVLC
FAFGAFHVTGLFGPGIWVSDPYGLTGKIQPVVPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNVETVLSSSIAAVFFAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIDRRIRSAKAENLNLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFRDKQ
GHQLFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFDDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQLEFGAFQKLGD
LTTKR
>NC_015403@FispC_p121@psbb@116424@117953@R@1@510 photosystem_II_chlorophyll_A_core_antenna_apoprotein
MALPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGITDSWGGWSITGESVSNPGIWSFEGVALSH
IVLSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDAYGIAGKVQPVAPSWGPDGFNPFNPGGIAA
HHIAAGLFGILAGVFHLTVRPPQRLYRALRMGNIETVLSSSIAAVFFAAF
VTSGTMWYGAAATPIELFGPTRYQWDSGYFQQEIERQVEASVSEGLSESQ
AWSRIPDKLAFYDYIGNNPAKGGLFRAGAMTKGDGIAEAWLGHPVFRDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVD
FYGGKLNGQTFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALLFFFGHLWHGGRTIFRDVFTGIGAEVTEQVEFGAFQKLGD
RSTKKQGAV
>NC_015543@JavuC_p047@psbb@71114@72640@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPLWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVNYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_015604@OleuscuC_p046@psbb@75088@76614@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_015605@NeluCp048@psbb@79923@81449@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTKRQVV
>NC_015608@OlwoswoC_p046@psbb@75180@76706@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_015610@NenuCp048@psbb@80003@81529@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTKRQVV
>NC_015621@AradC_p048@psbb@72059@73576@D@1@506 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEVFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRR
>NC_015623@OleusmaC_p046@psbb@75102@76628@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_015645@ScleC_p023@psbb@46894@48420@D@1@509 CP47_chlorophyll_apoprotein_of_photosystem_II
MGLPWYRVHTVVLNDPGRLIAVHLMHTSLVSGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGITKSWGGWTISGETVTTGFEWTYEAVAAAH
IILSGALFLAAIWHWIYWDLDLFRDPREGKPALDLPKIFGIHLFLAGLLC
FGFGAFHVTGLYGPGIWVSDPYGLTGSVQPVAPSWGADGFDPYNPGGIAS
HHIAAGILGVLAGLFHLCVRPSLRLYLGLSMGSIESVLSSSIAAVFWAAF
VVAGTMWYGSAATPVELFGPTRYQWDQGFFQQEIEKRVATSVANGASVSD
AWAQIPEKLAFYDYIGNNPAKGGLFRSGAMNSGDGIAVGWLGHAVFKDSE
GRELSVRRMPTFFETFPVILLDKDGIVRADVPFRRAESKYSIEQVGVSVS
FYGGELDGVTFSDPATVKKYARRAQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHLCFALIFFFGHIWHGARTLARDRFAGIDDDLNDQVEFGKFQKIGD
PSSFRQAV
>NC_015803@InloC_p046@psbb@71431@72957@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_015817@PhedC_p046@psbb@71384@72910@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_015820@AcpuC_p046@psbb@71426@72952@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_015826@PhnivhC_p046@psbb@71392@72918@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_015830@BaemC_p046@psbb@71159@72685@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_015831@FeriP_p046@psbb@71169@72695@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_015891@SppoC_p045@psbb@78907@80433@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAIGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTKRQAV
>NC_015892@MakwC_p048@psbb@76260@77786@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSVTGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_015894@WoliC_p046@psbb@79666@81192@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSTGLSENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAIGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHVSFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTKRQAV
>NC_015899@WoauC_p047@psbb@79172@80698@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAIGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTKRQAV
>NC_015983@CumesmeC_p048@psbb@74395@75915@D@1@507 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLGC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSTGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRV
>NC_015990@PVIS_g047@psbb@69991@71517@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAA
>NC_015996@PypyC_p047@psbb@75933@77459@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016058@LadeC_p013@psbb@21548@23074@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKNSWSGWSINGETVINPGIWSYEGVALAH
IFFSGLCFLAAIWHWVYWDLELFFDERTGKLCLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGSRTLFRDVFAGIDPDLDSRVEFGAFQKLGD
PTTKRQVV
>NC_016063@CewiC_p008@psbb@5661@7187@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDDRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLADNLSLSE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_016064@Pssivw_p039@psbb@53661@55187@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWSITGETVINPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDLFCDDRTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYIGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDARVEFGAFQKLGD
PTTKRQVV
>NC_016065@TacrC_p057@psbb@93765@95291@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDSRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_016068@NiunC_p056@psbb@74901@76427@D@1@509 PSII_47kD_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_016069@PimoC_p038@psbb@69410@70936@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWTGWNITGETVINPGIWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLEIFCDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDARIEFGAFQKLGD
PTTKRQVV
>NC_016430@ESH0743@psbb@74978@76504@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSVTGGAIPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDSDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016433@SIC0743@psbb@73634@75160@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQAV
>NC_016668@GoraCp048@psbb@76732@78258@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016670@GodaCp048@psbb@76892@78418@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016677@LetiP_p047@psbb@70225@71751@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQPV
>NC_016690@GotoCp048@psbb@76913@78439@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016692@GoheCp048@psbb@76770@78296@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016699@PhprC_p047@psbb@71390@72916@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_016703@Phant_p059@psbb@58034@59563@D@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSDPGIWSFEGVALTH
IILSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLASLLC
FGFGAFHVTGTFGPGIWVSDAYGVTGRVQAVAPAWGAEGFNPFNPGGIAS
HHIAAGILGILAGVFHLTIRPPQRLYRALRMGNIETVLSSSISAVFFAAF
ITSGTMWYGAATTPIELFGPTRYQWDSGYFQQEIERRVESSLGEGLSLSQ
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPVFQDKE
GRELTVRRMPAFFETFPVILVDKDGIVRADIPFRRAESKYSIEQVGVSTN
FYGGKLNGQVFTDAPTVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGGRTLFRDVFAGIGSEVLEQVEFGAFQKLGD
KTTKKQGVV
>NC_016708@MipiCp048@psbb@71228@72754@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLGIFCDERTGKPSLDLPKIFGIHLFLAGVVC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWSVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GCEFFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016711@GomuCp048@psbb@76807@78333@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016712@GoarCp048@psbb@76707@78233@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016718@RhsuP_p047@psbb@70303@71829@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQPV
>NC_016727@PHSUFM_p047@psbb@70830@72356@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITDPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLSENQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLIDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQGV
>NC_016728@SinoC_p047@psbb@67983@69509@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITDPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLSENQSLSE
TWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLIDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PSTRRQGV
>NC_016729@SicoC_p047@psbb@67918@69444@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITDPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLSENQSLSE
AWAKIPEKLVFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLIDGNGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATIKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQGV
>NC_016730@SilaC_p047@psbb@71270@72796@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITDPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLSENQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLIDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQGV
>NC_016731@PHSUFM_p030@psbb@18433@19962@R@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGITDSWGGWSITGESVSNPGIWSFEGVALSH
IVLSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDAYGITGKVQPVAPAWGADGFNPFNPGGIAS
HHIAAGIFGILAGIFHLTVRPSQRLYRALRMGNIETVLSSSISAVFFAAF
VTSGTMWYGAAATPIELFGPTRYQWDSGYFQQEIERQVETSVSEGLSESQ
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMDKGDGIAEAWLGHPIFRDKE
GRELTVRRMPAFFETFPVILIDKDGIIRADIPFRRAESKYSIEQVGVTVD
FYGGKLNGQTFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGGRTIFRDVFTGIGAEVTEQVEFGVFQKLGD
KTTKKQGAV
>NC_016732@DUSAC_p065@psbb@185271@186797@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVINDPGRLISVHLMHTALVAGWAGAMTLFEIAVFDPSDP
VLNPMWRQGMFVLPFLTRLGVTQSWGGWTISGETSSNPGIWSYEGAAASH
IVLSGLLFLASVWHWVYWDLELFRDPRTGKTALDLPKIFGIHLFLAGLLC
FGFGAFHVTGVFGPGIWVSDPYGLTGSVQPVAPSWGAEGFDPYNPGGVPA
HHIAAGILGVLAGLFHLCVRPSIRLYFGLSMGSIESVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIQKRVAQSTSEGLSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRTGAMNSGDGIAVGWLGHASFKDQE
GRELFVRRMPTFFETFPVVLIDKDGVVRADVPFRKAESKYSIEQVGVSVT
FYGGELNGLTFTDPLTVKKYARKAQLGEIFEFDRSTLQSDGVFRSSPRGW
FTFGHLSFALLFFFGHIWHGSRTIFRDVFAGIDEDINDQLEFGKYKKLGD
TSSVREAF
>NC_016733@PrmiC_p010@psbb@15310@16836@D@1@509 CP47_chlorophyll_apoprotein_of_photosystem_II
MGLPWYRVHTVVLNDPGRLISVHLMHTALVAGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGVTQSWGGWSISGETATNPGVWSYEGVATSH
IGLSGLLILASIWHWVYWDLELFRDPRTGNPALDLPKIFGIHLFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGSVQPVAPSWGADGFDPYNPGGVPA
HHIAAGILGILAGLFHLCVRPPQRLYNALRMGNIETVLASSIAAVFWAAF
VVAGTMWYGSAATPIELYGPTRYQWDLGFFQQEIEKRVQTSLAEGKSLSE
AWAQIPEKLAFYDYIGNNPAKGGLFRAGAMNSGDGIAVGWLGHSVFRDKD
GNELFVRRMPTFFETFPVLLIDKDGIVRADVPFRRAESKYSIEQVGVTVT
FYGGELDGVTFNDPSTVKKYARRAQLGEVFEFDRATLQSDGVFRSSPRGW
FTFGHLCFALLFFFGHIWHGSRTIFRDVFAGIDPDLDDQVEFGAFQKLGD
VSTRRQSV
>NC_016734@BRNAC_p048@psbb@71245@72729@D@1@495 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGYEGVAAAHIVF
SGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVACFGF
GAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPALGILAGL
FHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAFIVAGTMWYGSATTP
IELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSVSEAWSKIPEKLAFYDY
IGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKEGRELFVRRMPTFFE
TFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVEFYGGELNGVSYSDP
ATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGWFTFGHASFALLFFF
GHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGDPTTKRQAV
>NC_016735@FuveC_p104@psbb@104875@106407@D@1@511 photosystem_II_chlorophyll_A_core_antenna_apoprotein
MALPWYRVHTVVLNDPGRLIAVHIMHTGLVAGWAGSMALYELSVFDFSDP
ILNPMWRQGMFVMPFMTRLGVSDSWTGWDIAGEKTEPIASLWCYEGVAYT
HIILSGLCFLAAVWHWVYWDLELFRDPRTGEPSLDLPKIFGIHLFLSGLL
CFGFGAFHVTGFFGPGIWVSDAYGLTGQVQPVAPSWGPNGFNPFNPGGIA
AHHIAAGSFGVLAGGFHLTLRPPQRLYRALRMGNIETVLSSSIAAVFFAA
FITSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVEISLNDGLSET
EAWSSLPDKLAFYDYIGNNPAKGGLFRSGPMNKGDGIAEAWLGHPIFRDR
EGRELTVRRMPAFFETFPVILIDKDGIIRADIPFRRAESKYSIEQVGVNV
SFYGGKLNGQSFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRG
WYTFGHLNLALFFFLGHLWHGSRTIFRDVFTGIGSEVTEQVEFGAFQKLG
DETTRRQGVV
>NC_016736@RCOM_ORF00070@psbb@77996@79522@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTIE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDVQVEFGAFQKIGD
PTTRRQVV
>NC_016753@COESC_p048@psbb@77705@79231@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKIGD
PTTRRQTV
>NC_016921@PeruC_p048@psbb@73177@74703@D@1@509 PS_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_016927@OrmeC_p044@psbb@68811@70337@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQPV
>NC_016986@GinbiCp049@psbb@77317@78843@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQSMFVIPFMTRLGIKDSWGGWSITGETVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDIFCDERTGKPSPDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGPFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENRSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGRLGHPIFKDKE
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_017006@MACHC_p058@psbb@92236@93762@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPSDP
ALDPMWRQGMFVIPFMTRIGITKSWGGWSITGDTVTDAGIWSYEGVAAAH
IILSGLLFLSAIWHWVYWDLDLFRDERTGKPSLDLPKIFGIHLFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGKVQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRSYKALRMGNVETVLSSSIAAVFFVAF
VVSGTMWYGSATTPIELFGPTHYQWDQGYFQQEIDRRIRTNRSEGLSLSE
AWSKIPEKLAFYDYIGNNPAKCGLFRVGSMDNGDGRGVGWLGHAVFKDKE
GHELFVRRMSIFFETFPVVSVEEEGIVRADVPFRRAESKYSVEQVGVTIE
FYGGELDGASFSDPAMVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTERRAI
>NC_017602@ElguCp067@psbb@73416@74942@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKIGD
PTTRRQVV
>NC_017609@PHEQC_p048@psbb@73952@75478@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGIAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDADGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAV
>NC_017754@EUGYP_p54@psbb@45049@46575@R@1@509 photosystem_II_47_kDa_protein,_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAIFDPSDP
VLNPMWRQGMFVLPFMTRLGVTKSWGAWSISGENAANPGFWSYEGVAAAH
IVLSGLLFLAAIWHWVYWDLQLFRDPRTGDPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLYGPGIWVSDPYGITGSVQPVTPAWGAEGFDPYNPGGIAS
HHIAAGILGIIAGLFHLTVRPPQRLYKVLRMGNIETVLSSSIAAVFWSAF
VVAGTMWYGSAATPIELFGPTRYQWDQSFFQVETQRRVQNSLSEGNTLSQ
AWSKIPEKLAFYDYVGNNPAKGGLFRSGPMDNGDGIAAGWLGHSVFTDKS
GRELTVRRMPTFFETFPVLLLDQDGIVRADVPFRRAESKYSIEQVGVTVS
FYGGELDGVNFSDPATVKKYARRAQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHLCFALLFFFGHIWHGARTIFRDVFAGIDPDLEEQIEFGAFQKLGD
ATTRKQTV
>NC_017835@OrruC_p044@psbb@68801@70327@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPVWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQPV
>NC_017894@GogoCp048@psbb@76808@78334@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGGGYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_018109@GoinCp048@psbb@75933@77459@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_018110@GosoCp048@psbb@76174@77700@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_018111@GocaCp048@psbb@76089@77615@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_018112@GoarCp048@psbb@76206@77732@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_018113@GoroCp048@psbb@76452@77978@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_018114@PHSUFM_p037@psbb@72121@73647@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNISGGTITNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGIAC
FGFGAFHVTGLYGPGIWVSDPYGLTGNVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRTGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDTQVEFGTFQKLGD
PTTRRQVV
>NC_018117@Dast_Cp048@psbb@74625@76151@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_018357@MagndeCp046@psbb@76351@77877@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_018523@LJCPDNA_115@psbb@106214@107746@R@1@511 photosystem_II_chlorophyll_A_core_antenna_apoprotein
MALPWYRVHTVVLNDPGRLIAVHLMHTGLVAGWAGSMALYELSIFDFSDP
ILNPMWRQGMFVMPFMTRLGVSDSWTGWDIAGERSEPIVSLWCYEGVAYS
HIILSGLCFLAAVWHWVYWDLELFRDPRTGEPSLDLPKIFGIHLFLSGLL
CFGFGAFHVTGFFGPGIWVSDAYGLTGQVQPVAPSWGASGFNPFNPGGIA
SHHMAAGSFGVLAGGFHLTLRPPQRLYRALRMGNIETVLSSSIAAVFFAA
FITSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVEVSLNEGLSES
EAWSSLPDKLAFYDYIGNNPAKGGLFRSGPMNKGDGIAEAWLGHPIFRDR
EGRELAVRRMPAFFETFPVILIDKDGIIRADIPFRRAESKYSIEQVGVNV
SFYGGKLNGQSFKDAPTVKKFARKAQLGEVFEFDRTSLESDGVFRSSPRG
WYTFGHLNLALLFFLGHLWHGSRTIFRDVFTGIGSEVTEQVEFGAFQKLG
DETTRKQGVV
>NC_018541@C305_p038@psbb@73923@75449@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTKRQAV
>NC_018552@C329_p043@psbb@75670@77196@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAA
>NC_018565@C330_p037@psbb@72095@73621@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAIGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_018569@C311c_p073@psbb@25961@27487@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMAFYELAVFDPSDP
VLNPMWRQGMFVLPFMTRLGITQSWGNWTISGETSANPGIWTYEGVATAH
ILLSGALFMASIWHWVYWDLELFRDPRTGDPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGITGSVQPVSPAWGADGFDPYNPGGIAS
HHMAAGILGVLAGLFHLCVRPSQRLYNGLRMGNIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELYGPTRYQWDLGFFQQEIERRVQGSLAEGKSPSQ
AWAEIPEKLAFYDYIGNNPAKGGLFRAGAMNSGDGIAVGWLGHAVFTDKD
GNELFVRRMPTFFETFPVLLIDKDGVVRADVPFRRAESKYSIEQVGVSVT
FYGGELNGVTFTDPTTVKKYARRAQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHLCFALLFFFGHIWHGARTIFRDVFAGIDSDLDDQVEFGAFQKIGD
PSTRRQSV
>NC_018766@D207_p031@psbb@73726@75252@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLAIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_018767@D229_p032@psbb@73730@75256@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLAIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_019601@F653_p038@psbb@73633@75159@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLAIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_019602@F654_p038@psbb@73671@75197@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLAIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_019616@F713_p078@psbb@39399@40925@D@1@509 no_product_string_in_file
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAELAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDIE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTLE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_019628@F728_p038@psbb@70270@71787@D@1@506 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELAVFDPTDP
VLDPMWRQGMFVIPFMTRLGITKSWGGWSITGETVTNAGLWSYEGVAAVH
IVLSGLLFLAAIWHWVFWDLELFRDERTGKPSLDLPKIFGIHLFLSGVLC
FAFGAFHVTGLFGPGIWVSDPYGLTGKVQPVAPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNVETVLSSSIAAVFFAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIDRRIRAGKAENLNLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAIFKDKE
GHELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFDDPAAVKKYARRAQLGEIFEFDRAILKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQLEFGAFQKLGD
STTKR
>NC_019648@FealCp068@psbb@68310@69836@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_019649@FeovCp068@psbb@66694@68220@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGTH
IVFSGLCFLAAIWHWVYWDLAIFEDDRTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAIGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_019650@FeprCp068@psbb@68405@69931@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_019651@LomuCp068@psbb@68348@69874@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_020018@G259_p48@psbb@25654@27283@D@2@509 photosystem_II_47_kDa_protein
MGLPWFRVHTVVLNDPGRLIAVHLMHTALVSGWAGSMALYELTVFDPSDL
VLNPMWRQGMFVLPFMTRLGVTKSWGAWSMTGESSANPGIWSYEGVAAAH
IVLSGLLFLAAIWHWVYWDLQLFRDPRTGDPALDLPKIFGIHLFLSGLLC
FSFGAFHVTGLFGPGIWVSDPYGITGSIQSVVPSWGAEGFDPYNVGGIAS
HHIAAGILGIIAGLFHLTVRPPQRLYKVLRMGNIETVLSSSIAAVFWSAF
VVSGTMWYGSAATPIELFGPTRYQWDKGFFQEEIQRRVQTSLNSGSSLSE
SWSKIPEKLAFYDYIGNNPAKGGLFRSGAMNNGDGIAIGWLGHSIFTDKE
GNELFVRRMPTFFETFPVLLIDKDGIVRADIPFRRAESKYSIEQVGVSVG
FFGGELDGLSFNDPTTVKKYARRSQLGEIFEFDRATLESDGVFRSSPRGW
FTFGHLSFALLFFFGHIWHGARTIFRDVFAGVDPDLEEQIEFGAFQKLGD
VTTRKQLV
>NC_020019@CSC0743@psbb@74928@76454@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_020092@DenmoCp048@psbb@71117@72643@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVTYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_020098@BN828_cpI0690@psbb@73750@75276@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAV
>NC_020146@H086_p037@psbb@80018@81544@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGITKSWGGWSITGETVTDAGIWSYEGVAAAH
IILSGLLFLAAIWHWVYWDLDLFRDERTGKPSLDLPKIFGVHLFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGNVRPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKALRMGNIETVLSSSIAAVFFAAF
VVSGTMWYGSAATPIELYGPTRYQWDQGYFQQEIDRRIRVSLADNSSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFRDKE
GHDLFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVD
FYGGELNGVSFSDPATVKKYARRSQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLESQIEFGAFEKLGD
PSTEKRAV
>NC_020147@H081_p037@psbb@85167@86693@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPRYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAVFDPSDP
ALDPMWRQGMFVIPFMTRIGVTKSWGGWSVTGDTVTDAGVWSYEGVAASH
IILSGLLFLSAIWHWVYWDLDLFRDERTGKPSLDLPKIFGIHSFLSGVLC
FGFGAFHVTGLFGPGIWVSDPYGLTGKVQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKALRMGNVETVLSSSIAAVSSAAF
VVSGTMWYGSATTPIESFGPTRYQWDQGYFQQEIDRRIRTGRAEGLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDKGDGIAVGWLGHAISRDKE
GHELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGANFNDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQIEFGAFQKLGD
PTTERRAV
>NC_020316@MagofCp046@psbb@76434@77960@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_020317@MagofCp046@psbb@76430@77956@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_020318@Maggra_Cp046@psbb@76000@77526@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_020319@Cycre_Cp030@psbb@37222@38748@R@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSITGETVTNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGSGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATAPVELFGPTRYQWDQGYFQQEIDRRVRAGLSENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQIV
>NC_020320@Denin_Cp036@psbb@71076@72602@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVTYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_020321@Taxchi_Cp042@psbb@62850@64376@R@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDDRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGNIQPVSPAWGAEGFDPFVPGGIAA
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPTIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_020341@ArgiCp047@psbb@70786@72312@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_020361@H870_p49@psbb@49485@51011@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAIFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVTNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDERTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQPVNPAWGAEGFDPFVPGGIAA
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKD
GRELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_020362@H882_p041@psbb@78006@79532@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
ALDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKIGD
PTTRRQVV
>NC_020363@H892_p041@psbb@73982@75508@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
ALDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLDENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKIGD
PTTRRQVV
>NC_020364@H889_p042@psbb@74172@75698@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYGDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKIGD
PTTRRQVV
>NC_020365@H894_p042@psbb@73751@75277@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENPSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYGDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_020366@H912_p042@psbb@74743@76269@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYGDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_020367@H858_p042@psbb@74445@75971@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_020371@H907_p089@psbb@16993@18522@D@1@510 photosystem_II_CP47_chlorophyll_apoprotein
MALPWFRVHTVVLNDPGRLLSVHLMHTSLVSGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARIGVTDSWAGWSITGESVSNPGIWSFEGVALTH
IILSGLCFLAAIWHWVYWDLELFRDDRTGEPALDLPKIFGIHLFLAGTLC
FGFGAFHCTGLFGPGIWVSDAFGVSGKVQPVIPAWGPEGFNPFNPGGVAS
HHIAAGAIGFLAGVFHLTVRPPQRLYRALRMGNIETVLSSSISAVFWAAF
VTSGTMWYGSATTPVELFGPTRYQWDSGYFQQEIERRVETSLSEGKSLTE
AWSGIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHSVFQDKD
GRELTVRRMPAFFETFPVILVDKDGVVRADIPFRRAESKYSIEQVGVTAS
FYGGKLNGQVFKDAPTVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
YTFGHANFALIFFLGHLWHGGRALFRDVFAGIGAEVVEQVEFGAFQKLGD
KTTKKQGIV
>NC_020372@H865_p057@psbb@72717@74243@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSIAGGTLTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDIEIFFDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPTWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVNAALAENRSFSE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLLDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELAGVSYNDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHANFGLLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKEAV
>NC_020431@Salmi_Cp047@psbb@71214@72740@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQPVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAV
>NC_020438@I506_p040@psbb@190287@191813@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVINDPGRLISVHLMHTALVSGWAGSMALFEISVFDPSDP
VLNPMWRQGMFVLPFMTRLGITQSWGGWTISGETATNPGIWSYEGVAAAH
IILSGALFLASVWHWTYWDLELFRDPRTGKTALDLPKIFGIHLFLSGLLC
FGFGAFHVTGVFGPGIWVSDPYGLTGSVQPVAPSWGADGFDPFNPGGIAS
HHIAAGILGVLAGLFHLCVRPSIRLYFGLSMGSIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIQKRVQASLAEGASLSE
AWSRIPEKLAFYDYIGNNPAKGGLFRTGAMNSGDGIAVGWLGHAVFKDQE
GRDLFVRRMPTFFETFPVILLDKDGIVRADVPFRKAESKYSIEQVGVSVT
FYGGELDGLTFTDPATVKKYARKSQLGEIFEFDRSTLQSDGVFRSSPRGW
FTFGHVCFALLFFFGHIWHGARTIFRDVFAGIDDDINDQVEFGKYKKLGD
TSSLREAF
>NC_020460@I642_p023@psbb@70520@72499@R@3@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAIFDPSDL
VLNPMWRQGMFVLPFMTRLGVTKSWGAWSIAGDASSNPGIWSYEGVAAAH
IVLSGLLFLAAIWHWVYWDLQLFRDPRTGDPALDLPKIFGIHLFLSGLLC
FGFGAFHVTGLFGPGIWVSDPYGITGNIQPVVPSWGADGFDPYNAGGIAS
HHIAAGILGIIAGLFHLTVRPPQRLYKVLRMGNIETVLSSSIAAVFWSAF
VVSGTMWYGSAATPIELFGPTRYQWDKGYFQEEIQNRVQTSLVSGSSLSE
AWTKIPEKLAFYDYIGNNPAKGGLFRSGPMNNGDGIAIGWLGHAVFTDKE
GNELFVRRMPTFFETFPVLLIDQDGIVRADIPFRRAESKYSIEQVGVTVN
FFGGELDGLNFSDPSTVKKYARRSQLGEIFEFDRATLQSDGVFRSSPRGW
FTFGHLSFALLFFFGHIWHGARTIFRDVFAGVDPDLEEQIEFGAFQKLGD
VTTRKQLV
>NC_020607@ArfrCp048@psbb@71071@72597@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVTYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_020795@CHC_440@psbb@64284@65813@R@1@510 photosystem_II_CP47_protein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMSRLGVTDSWGGWSITGESVSNPGLWSFEGVAITH
IVLSGMLFLASIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLSSLLC
FGFGAFHATGLFGPGIWISDAYGVTGKVQPVAPAWGPDGFNPFNPGGVAS
HHIAAGTVGILAGLFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFSAF
ITCGTMWYGSATTPLELFGPTRYQWDSGYFQQEIERRIENSLNEGSTPEE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGPMDKGDGIAEAWLGHPIFQDKD
GRELTVRRMPAFFETFPVILIDKDGIIRADIPFRRAESKYSIEQVGVTVN
FYGGKLNGKVFTDAPSVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
FTFGHANFALIFFFGHLWHGSRTIFRDVFAGIGAEVTEQVEFGAFQKLGD
RSSKKQGAV
>NC_021075@K937_p141@psbb@61056@62585@R@1@510 photosystem_II_CP47_protein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSNPGLWSFEGVAITH
IVLSGMLFLASIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLASLLC
FGFGAFHATGLFGPGIWISDGYGVTGKVQPVAPAWGPDGFNPFNPGGIAS
HHIAAGTVGILAGIFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFSAF
ITCGTMWYGSATTPLELFGPTRYQWDSGYFQQEIEQRVENALNEGSTPAE
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMDKGDGIAEAWLGHPIFQDKE
NRELIVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVS
FYGGKLNNKVFTDAPSVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
FTFGHANFALIFFFGHLWHGSRTIFRDVFAGIGAEVTEQVEFGAFQKLGD
KSSKKQGAV
>NC_021091@L076_p050@psbb@72860@74386@D@1@509 photosystem_II_CP47_chloropholl_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGAITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQNLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRPVV
>NC_021101@L036_p038@psbb@74157@75683@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLDENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPAFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_021102@L053_p037@psbb@71710@73236@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_021109@L079_p026@psbb@187946@189472@D@1@509 CP47_chlorophyll_apoprotein_of_photosystem_II
MGLPWYRVHTVVINDPGRLISVHLMHTALVSGWAGSMALFEISVFDPSDP
VLNPMWRQGMFVLPFMTRLGITQSWGGWTISGETATNPGIWSYEGVAAAH
IILSGALFLASVWHWTYWDLELFRDPRTGKTALDLPKIFGIHLFLSGLLC
FGFGAFHVTGVFGPGIWVSDPYGLTGSVQPVAPSWGADGFDPFNPGGIAS
HHIAAGILGVLAGLFHLCVRPSIRLYFGLSMGSIETVLSSSIAAVFWAAF
VVAGTMWYGSAATPIELFGPTRYQWDQGFFQQEIQKRVQASLAEGASLSE
AWSRIPEKLAFYDYIGNNPAKGGLFRTGAMNSGDGIAVGWLGHAVFKDQE
GRDLFVRRMPTFFETFPVILLDKDGIVRADVPFRKAESKYSIEQVGVSVT
FYGGELDGLTFTDPATVKKYARKAQLGEIFEFDRSTLQSDGVFRSSPRGW
FTFGHVCFALLFFFGHIWHGARTIFRDVFAGIDDDINDQVEFGKYKKLGD
TSSLREAF
>NC_021110@L046_p004@psbb@5563@7089@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDDRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLADNLSLSE
AWAKIPDKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGVFQKLGD
PTTKRQVV
>NC_021121@ApCp048@psbb@74136@75662@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTGTNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFRDERTGKPVLDLPKIFGIHLFLAGLAC
FGFGVFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYNDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_021189@PyhaCp138@psbb@113211@114740@D@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSNPGLWSFEGVALTH
IVLSGMLFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLSSLLC
FGFGAFHVTGLFGPGMWVSDGYGVTGKVLPVAPAWGPEGFNPFNPGGVAS
HHIAAGTVGILAGVFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFSAF
VTCGTMWYGSATTPIELFGPTRYQWDSGYFQQEIEKRVENAIADGAAPSE
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGVAEAWLGHPVFQDKE
GRELSVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTAS
FYGGKLNGQVFNDAPSVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
FTFGHANFALIFFFGHLWHGSRTIFRDVFAGIGAEVTEQVEFGAFQKLGD
RSSKKQGAV
>NC_021372@PhlaCp039@psbb@71469@72995@D@1@509 photosystem_II_protein_B
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVASAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALIFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQVV
>NC_021423@CrCp048@psbb@74120@75646@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHLMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAV
>NC_021425@TesiCp048@psbb@76902@78428@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGTGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_021426@TrarCp048@psbb@77832@79358@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGTGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGNGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_021429@M372_p076@psbb@73733@75259@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNISGGTIMNPGIWSYEGVAGAH
ILFSGLCFLSAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FCGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRKQVV
>NC_021430@M371_p077@psbb@73061@74587@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNISGGTIMNPGIWSYEGVAGAH
ILFSGLCFLSAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FCGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_021431@M314_p076@psbb@73107@74633@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNISGGTIMNPGIWSYEGVAGAH
ILFSGLCFLSAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FCGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_021432@M315_p076@psbb@73143@74669@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNISGGTIMNPGIWSYEGVAGAH
ILFSGLCFLSAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQYVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FCGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_021433@M353_p077@psbb@73345@74871@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNISGGTIMNPGIWSYEGVAGAH
ILFSGLCFLSAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDEDGIVRADVPFRRAESKYSVEQVGVTVE
FCGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_021437@M2888_p040@psbb@81825@83351@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDSRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_021438@M344_p026@psbb@54127@55653@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFILPFMTRLGIKESWGGWSITGESAVNPGLWSYEGVAGAH
IVFSGLCFLSAIWHWVYWDLEIFSDPRTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPFGLTGRIQPVSPAWGAEGFDPFVPGGIAS
HHIAAGLLGIIAGLFHLSVRPPQRLYRGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLTEKLSLSE
AWSRIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFRDKE
GNELFVRRMPTFFETFPVVLVNKEGIVKADVPFRRSESKYSVEQVGVTVE
FYGGELNGVSFSDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDIFAGIDPELDAQVEFGAFQKLGD
PTTKRQVV
>NC_021439@M319_p038@psbb@52363@53889@D@1@509 photosystem_II_CP47_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWNITGETVINPGIWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLDIFCDERTGKRCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGARTLFRDVFAGIDSDLDARIEFGAFQKLGD
PTTKRQVV
>NC_021440@M345_p038@psbb@53087@54613@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWSGWNITGETVINPGIWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLDIFCDERTGKRCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGSRTLFRDVFAGIDSDLDARIEFGAFQKLGD
PTTKRQVV
>NC_021441@M348_p057@psbb@92790@94316@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVSNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDSRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_021449@M316_p041@psbb@70258@71784@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGAVTNPGIWSYEGVAGAH
IVFSGLCFLASIWHWVYWDLELFRDERTGKPALDLPKIFGIHLFLAGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSGGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGISYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKVGD
PTTLRQGV
>NC_021455@M356_p042@psbb@73478@75004@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_021456@PACH01_0060@psbb@54252@55778@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMTLYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWTGWNITGETVINPGIWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLEIFCDERTGKLCLDLPKVFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVDPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYVGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPVELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GNELFVRRMPTFFETFPVVLVDKEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGGLDRVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFSGHIWHGARTLFRDVFAGIDPDLDARIEFGAFQKLGD
PTTKRQVV
>NC_021618@M829_p118@psbb@109042@110571@R@1@510 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVAGWAGSMALYELSVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSNPGLWSFEGVAITH
IVLSGMLFLASIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLSSLLC
FGFGAFHATGLFGPGIWVSDGYGVTGKVQPVAPAWGPDGFNPFNPSGIAS
HHIAAGTVGILAGLFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFSAF
VTCGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSLNEGASPEE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGPMDKGDGIAEAWLGHPIFQDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTAN
FYGGKLNGKVFTDAPSVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
FTFGHANFALIFFFGHLWHGSRTIFRDVFAGIGAEVTEQVEFGAFQKLGD
RSSKKQGAV
>NC_021636@M909_p037@psbb@71685@73211@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGISYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_021637@M912_p046@psbb@59312@60841@D@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSDPGIWSFEGVALTH
IILSGMCFLAAIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLFLASLLC
FGFGAFHVTGTFGPGIWVSDAYGVTGRVQAVAPAWGAEGFNPFNPGGIAS
HHIAAGILGLLAGVFHLTIRPPQRLYRALRMGNIETVLSSSISAVFFAAF
ITSGTMWYGAATTPIELFGPTRYQWDSGYFQQEIERRVESSLGEGLSLSQ
AWSRIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPVFQDKE
GRELTVRRMPAFFETFPVILVDKDGIVRADIPFRRAESKYSIEQVGVSTN
FYGGKLNGQVFTDAPTVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
YTFGHANFALLFFLGHLWHGGRTLFRDVFAGIGSEVLEQVEFGAFQKLGD
KTTKKQGVV
>NC_021645@M939_p038@psbb@71488@73014@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVIVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_021646@M931_p037@psbb@71801@73327@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVIVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_021647@M938_p037@psbb@71495@73021@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGISYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_021648@M932_p037@psbb@71727@73253@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGISYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_021649@M935_p037@psbb@71898@73424@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_021650@M933_p037@psbb@71742@73268@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQRLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGISYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_021760@N248_p035@psbb@69274@70800@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGTH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_021761@N250_p034@psbb@69063@70589@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGTH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_021762@N245_p28@psbb@68953@70479@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGTH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_021936@D176_069@psbb@76788@78314@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGETITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPMWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVNAGLAENRSLSE
AWSTIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GSELFVRRMPTFFETFPVVLVDGEGVVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTKRQTV
>NC_022133@P217_p035@psbb@68059@69585@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGTH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_022136@P228_p056@psbb@70804@72330@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGITKSWGGWGITGDTVTDAGIWSYEGVAAAH
IVLSGLLFLASIWHWVYWDLDLFRDDRTGKPSLDLPKIFGIHLFLSGVLC
FAFGAFHVTGLFGPGIWVSDPYGLTGKVQPVDPSWGAEGFDAFVPGGIAS
HHIAAGVLGILAGLFHLSVRPPQRLYKALRMGNVETVLSSSIAAVFFAAF
VVSGTMWYGSAATPIELFGPTRYQWDQGYFQQEIDRRIRASRSENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHASFKDRE
GHELFVRRMPTFFETFPVVLVDGEGVVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGATFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALIFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQIV
>NC_022137@P213_p054@psbb@73566@75092@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRIGITKSWGGWSITGDTVSDAGIWSYEGVAASH
IILSGLLFLAAIWHWVYWDLDLFRDDRTGKPSLDLPKIFGIHLFLSGLLC
FSFGAFHVTGLFGPGIWVSDPYGLTGKVEPVDPAWGAEGFDPFVPGGIAS
HHIAAGVLGILAGLFHLSVRPPQRLYKALRMGNVETVLSSSIAAVFFAAF
VVSGTMWYGSAATPIELFGPTRYQWDQGYFQQEIDRRIRSSRAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHAVFKDKE
GHELFVRRMPTFFETFPVVLVDADGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGASFSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_022259@P417_p107@psbb@14474@16003@R@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAIFDPSDP
ILNPMWRQGMFVMPFMTRLGVTDSWGGWSVTGESGLNPGLWSYEGVALTH
IVLSGLLFLAAIWHWVYWDLDIFNIQRSDEISLDLPKVFGIHLFLSGILC
LGFGAFHVTGFFGPGIWLSDAYGLTGKVQGVAPSWGPDGFNPFNPGGVAA
HHIAAGTIGILAGFFHIIVRPPQRLYRGLRMGNIETVLSSSIAAVFFAAF
VTSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSVAEGLSKSQ
AWARIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFTDRE
GRELTVRRMPAFFETFPVLLLDKDGIIRADIPFRRAESKYSIEQVGVNVN
FYGGKLNGQTFKDAPTVKKYARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALIFFLGHLWHGARTLYRDVFTGIDASITDQIEFGVLQKLGD
ESTRRQGFI
>NC_022260@P412_p108@psbb@14472@16001@R@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAIFDPSDP
ILNPMWRQGMFVMPFMTRLGVTDSWAGWSVTGESGLNPGLWSYEGVALTH
IVLSGLLFLAAIWHWVYWDLDIFNIQRSDEISLDLPKVFGIHLFLSGILC
LGFGAFHVTGFFGPGIWLSDAYGLTGKVQGVAPSWGPDGFNPFNPGGVAA
HHIAAGTIGILAGFFHIIVRPPQRLYRGLRMGNIETVLSSSIAAVFFAAF
VTSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSVAEGLSKSQ
AWARIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFTDRE
GRELTVRRMPAFFETFPVLLLDKDGIIRADIPFRRAESKYSIEQVGVNVN
FYGGKLNGQTFKDAPTVKKYARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALIFFLGHLWHGARTLYRDVFTGIDASITDQIEFGVLQKLGD
ESTRRQGFI
>NC_022261@P414_p105@psbb@14499@16028@R@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAIFDPSDP
ILNPMWRQGMFVMPFMTRLGVTDSWGGWSVTGESGLNPGLWSYEGVALTH
IVLSGLLFLAAIWHWVYWDLDIFNIQRSDEISLDLPKVFGIHLFLSGILC
LGFGAFHVTGFFGPGIWLSDAYGLTGKVQGVAPSWGPDGFNPFNPGGVAA
HHIAAGTFGILAGFFHIIVRPPQRLYRGLRMGNIETVLSSSIAAVFFAAF
VTSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSVAEGLSKSQ
AWARIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFTDRE
GRELTVRRMPAFFETFPVLLLDKDGIIRADIPFRRAESKYSIEQVGVNVN
FYGGKLNGQTFKDAPTVKKYARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALIFFLGHLWHGARTLYRDVFTGIDASISDQIEFGVLQKLGD
ESTRRQGFI
>NC_022262@P416_p106@psbb@14500@16029@R@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAIFDPSDP
ILNPMWRQGMFVMPFMTRLGVTDSWGGWSVTGENGLNPGLWSYEGVALTH
IVLSGLLFLAAIWHWVYWDLDIFNIQRSDEISLDLPKVFGIHLFLSGILC
LGFGAFHVTGFFGPGIWLSDAYGLTGKVQGVAPSWGPDGFNPFNPGSVAA
HHIAAGTIGILAGFFHIIVRPPQRLYRALRMGNIETVLSSSIAAVFFAAF
VTSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSVAEGLSKSQ
AWARIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFTDRE
GRELTVRRMPAFFETFPVLLLDKDGIIRADIPFRRAESKYSIEQVGVNVN
FYGGKLNGQTFKDAPTVKKYARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALIFFLGHLWHGARTLYRDVFTGIDASITDQIEFGVLQKLGD
ESTRRQGFI
>NC_022263@P418_p108@psbb@14472@16001@R@1@510 photosystem_II_47_kDa_protein
MALPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAIFDPSDP
ILNPMWRQGMFVMPFMTRLGVTDSWGGWSVTGESGINPGLWSYEGVALTH
IVLSGLLFLAAIWHWVYWDLDIFNIQRSDEISLDLPKVFGIHLFLSGILC
LGFGAFHVTGFFGPGIWLSDAYGLTGKVQGVAPSWGPDGFNPFNPGGVAA
HHIAAGTIGILAGFFHIIVRPPQRLYRGLRMGNIETVLSSSIAAVFFAAF
VTSGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSVAESLSKSQ
AWARIPDKLAFYDYIGNNPAKGGLFRAGPMNKGDGIAEAWLGHPIFTDRE
GRELTVRRMPAFFETFPVLLLDKDGIIRADIPFRRAESKYSIEQVGVNVN
FYGGKLNGQTFKDAPTVKKYARKAQLGEVFEFDRTSLESDGVFRSSPRGW
YTFGHANFALIFFLGHLWHGARTLYRDVFTGIDASITDQIEFGVLQKLGD
ESTRRQGFI
>NC_022264@P413_p073@psbb@74962@76488@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein_CP-47
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDSDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022378@EOBL_CP_p048@psbb@76470@77996@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022379@ERD2_CP_p048@psbb@76471@77997@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022380@EDEL_CP_p048@psbb@76646@78172@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022381@EVER_CP_p048@psbb@77061@78587@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022382@EBAX_CP_p048@psbb@77089@78615@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022383@EDIF_CP_p048@psbb@77074@78600@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022384@ESIE_CP_p048@psbb@77014@78540@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022385@EELA_CP_p048@psbb@76928@78454@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022386@EREG_CP_p048@psbb@77026@78552@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022387@EUMB_CP_p048@psbb@77015@78541@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022388@ECLO_CP_p048@psbb@77021@78547@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022389@EPAT_CP_p048@psbb@77099@78625@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022390@EMAR_CP_p048@psbb@77029@78555@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVAVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022391@ECUR_CP_p048@psbb@76996@78522@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022392@EMEL_CP_p048@psbb@77273@78799@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022393@EPOL_CP_p048@psbb@77146@78672@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022394@ECLA_CP_p048@psbb@77245@78771@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022395@ENIT_CP_p048@psbb@77210@78736@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022396@EARO_CP_p048@psbb@77106@78632@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022397@ESLI_CP_p048@psbb@77243@78769@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022398@ECAM_CP_p048@psbb@77072@78598@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022399@EDEG_CP_p048@psbb@77137@78663@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022400@ESPA_CP_p048@psbb@76935@78461@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022401@ETOR_CP_p048@psbb@77222@78748@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGADLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022402@EDIC_CP_p048@psbb@77218@78744@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022403@ESAL_CP_p048@psbb@77367@78893@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022404@EMIC_CP_p048@psbb@77211@78737@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022405@EGUI_CP_p048@psbb@77209@78735@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022406@EERY_CP_p048@psbb@76864@78390@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLSKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSYSDPATVKKYARRAQLGEIFEFDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022407@CGUM_CP_p048@psbb@76489@78015@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKADGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022408@CMAC_CP_p048@psbb@76755@78281@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKADGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022409@CEXI_CP_p048@psbb@76722@78248@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFEFDRATLKADGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022410@CTES_CP_p048@psbb@76814@78340@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKADGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022411@AFLO_CP_p048@psbb@76906@78432@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKADGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022412@ACOS_CP_p048@psbb@76960@78486@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKADGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022413@ALLO_CP_p048@psbb@76481@78007@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFGAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVVAGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQMGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022414@SQUA_CP_p048@psbb@76502@78028@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGVGLAKNQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022417@Q438_p044@psbb@72158@73684@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein_(CP-47)
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKIGD
PTTRRQVV
>NC_022431@Ascsyr_cp-57@psbb@79995@81521@D@1@509 photosystem_II_CP47_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWSGWSITGGAVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVDPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDSQVEFGTFQKVGD
PTTRRPAV
>NC_022432@Q663_p039@psbb@77304@78830@D@1@509 photosystem_II_CP47_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWSGWSITGGAVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVDPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDSQVEFGTFQKVGD
PTTRRPAV
>NC_022451@Q730_p041@psbb@70867@72393@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPLWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSVGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVTYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKIGD
PTTRRQAV
>NC_022457@Q738_p057@psbb@73155@74681@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFRDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVI
>NC_022457@Q738_p001@psbb@163191@164717@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFRDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVI
>NC_022459@Q710_p073@psbb@74576@76102@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein_CP-47
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022460@Q737_p071@psbb@74503@76029@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein_CP-47
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022461@Q731_p042@psbb@74863@76389@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein_CP-47
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022462@Q707_p074@psbb@74511@76037@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein_CP-47
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022463@Q725_p073@psbb@74519@76045@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein_CP-47
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022668@U806_p064@psbb@68810@70336@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQPV
>NC_022715@U848_p047@psbb@71656@73182@D@1@509 photosystem_II_p680_chlorophyll_A_apoprotein_(CP-47)
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWTISGGTITNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FAFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPTWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDHGYFQQEIYRRVGAGLAGNLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022810@W872_p044@psbb@74279@75805@D@1@509 photosystem_II_protein_47KD
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSVTGGAIPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022811@W886_p044@psbb@74809@76335@D@1@509 photosystem_II_47KD_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSVTGGAIPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAA
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRISAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDSDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022812@W879_p044@psbb@74577@76103@D@1@509 photosystem_II_47KD_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSVTGGAIPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDSDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022813@W869_p044@psbb@74286@75812@D@1@509 photosystem_II_protein_47KD
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSVTGGDIPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDSDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022814@W871_p044@psbb@74812@76338@D@1@509 photosystem_II_47KD_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSVTGGAIPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDSDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022850@W841_p038@psbb@68110@69636@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTKRQAA
>NC_022859@W829_p052@psbb@74033@75559@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAA
>NC_022868@W848_p039@psbb@71018@72544@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQSVNPAWGVEGFDPFVPGGVAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVIVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_022926@X609_p042@psbb@76260@77786@D@1@509 photosystem_II_protein_B
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
ALDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAQNLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_022927@X587_p042@psbb@80403@81929@D@1@509 photosystem_II_protein_B
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
ALDPMWRQGMFVIPFMTRLGITNSWGGWSISGETVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFREKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_022928@X606_p041@psbb@75320@76846@D@1@509 photosystem_II_protein_B
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
ALDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLDENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKIGD
PTTRRQVV
>NC_022958@X588_p042@psbb@70680@72206@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVSPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQTV
>NC_023084@Y726_p045@psbb@74753@76279@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023085@Y754_p040@psbb@70440@71966@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IMFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGVFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLTE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDSQVEFGAFQKLGD
PTTRKQAV
>NC_023090@Y718_p037@psbb@70284@71813@D@1@510 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDS
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENKSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFKDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYNDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVVG
>NC_023092@Y765_p040@psbb@77133@78659@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023096@Y745_p033@psbb@68046@69572@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGTH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_023097@Y742_p035@psbb@67841@69367@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGTH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_023102@Y720_p038@psbb@70395@71921@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQPV
>NC_023107@Y758_p040@psbb@71856@73382@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_023108@Y763_p039@psbb@71836@73362@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_023109@Y759_p039@psbb@71862@73388@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_023110@Y764_p039@psbb@71858@73384@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_023111@Y747_p039@psbb@71854@73380@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_023112@Y761_p039@psbb@71857@73383@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_023113@Y719_p039@psbb@71844@73370@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_023114@Y756_p039@psbb@71860@73386@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
VWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGSRTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAI
>NC_023115@Y757_p036@psbb@73198@74724@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDDRTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLPE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQAV
>NC_023119@Y769_p036@psbb@77531@79057@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDIFVDERTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKE
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSIEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_023120@Y725_p020@psbb@81791@83317@R@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAIFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVTNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDERTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQPVNPAWGAEGFDPFVPGGIAA
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKD
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPTIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_023121@Y766_p028@psbb@98908@100434@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETISNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDSRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_023130@Y732_p038@psbb@75765@77291@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023133@Y721_p046@psbb@155366@156895@R@1@510 photosystem_II_chlorophyll_A_core_antenna_apoprotein_CP47
MGLPWYRVHTVVLNDPGRLIAVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMTRLGVTDSWGGWSITGESVSNPGIWSFEGVALTH
IVLSGLLFLAAIWHWIYWDLELFRDPRTGEPALDLPKIFGIHLLLASILC
FGFGAFHVTGLFGPGIWVSDAYGITGKVQPVAPAWGPEGFNPFNPGGVAS
HHIAAGTVGILAGVFHLSIRPPQRLYRALRMGNIETVLSSSIAAVFFAAF
ITSGTMWYGCATTPIELFGPTRYQWDSGYFQQEIERQVENSLSEGLSLSD
AWSRIPDKLAFYDYIGNNPAKGGLFRSGPMDKGDGIAEAWLGHPVFKDKE
GRELTVRRMPAFFETFPVILVDQDGIIRADIPFRRAESKYSIEQVGVTID
FYGGKLNGQSFTDAPTVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
YTFGHANFALLFFFGHLWHGSRTLFRDVFAGIGAEVTEQVEFGAFAKLGD
RTTKKQGIV
>NC_023213@Z075_p041@psbb@76130@77656@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023214@Z068_p041@psbb@76089@77615@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRIPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023215@Z081_p041@psbb@76729@78255@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023216@Z077_p041@psbb@76667@78193@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023217@Z064_p040@psbb@75893@77419@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023218@Z083_p040@psbb@76250@77776@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023245@PhlapCp047@psbb@71302@72828@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVASAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALIFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQVV
>NC_023247@FritaCp046@psbb@69537@71063@D@1@509 PSII_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTIPNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVSGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGTGLAENLSFSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDSQVEFGAFQKLGD
PTTRKQVV
>NC_023256@Z072_p038@psbb@74100@75626@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPTFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023259@Z092_p046@psbb@70090@71616@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGIINSWGGWSITGGTVTNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPVWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVRLGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDSGDGIAVGWLGHPVFSDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVIIE
FYGGELNGVSYNDPSTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023260@Z104_p060@psbb@36144@37670@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAESQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDSSTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_023261@Z067_p051@psbb@85475@87001@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNSGIWSYEGVAGAH
IVLSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVGGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GCELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRAALKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_023357@AT74_p035@psbb@72317@73843@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITDPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVFWDLEIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPAWGVEGFDPFVAGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLSENQSLSE
AWAKIPDKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLIDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQGV
>NC_023358@AT78_p035@psbb@68694@70220@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITDPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLSENQSLSE
AWAKIPEKLVFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLIDGNGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQGV
>NC_023359@AT60_p034@psbb@70628@72154@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITDPGFWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLSENQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLIDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQGV
>NC_023360@AT96_p035@psbb@70782@72308@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITDPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPISPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLSENQSLSE
AWAKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKD
GRELFVRRMPTFFETFPVVLIDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
LTTRRQGV
>NC_023367@BN845_0670@psbb@70551@72077@D@1@509 psbB_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGLWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSVSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRNKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQAV
>NC_023449@PuolCp047@psbb@70232@71758@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQVV
>NC_023463@BF67_p037@psbb@70234@71760@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLASIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPSWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSFSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTIRQVV
>NC_023533@DeanCp049@psbb@68294@69820@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLAVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITDSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSNGLSENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRKQAV
>NC_023544@CD82_p041@psbb@74569@76089@D@1@507 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGLGC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSTGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDTQVEFGAFQKLGD
PTTKRV
>NC_023785@CP76_p137@psbb@63972@65501@R@1@510 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLISVHLMHTALVAGWAGSMALYELAVFDPSDP
VLNPMWRQGMFVMPFMARLGVTDSWGGWSITGESVSNPGLWSFEGVAITH
IVLSGMLFLASIWHWVYWDLELFRDPRTGEPALDLPKIFGIHLLLSSLLC
FGFGAFHTTGLFGPGIWISDGYGITGKVQPVAPAWGPDGFNPFNPGGIAS
HHIAAGTVGILAGLFHLTVRPPQRLYRALRMGNIETVLSSSISAVFFSAF
VTCGTMWYGSATTPIELFGPTRYQWDSGYFQQEIERRVENSLNEGATPEE
AWSKIPDKLAFYDYIGNNPAKGGLFRAGPMDKGDGIAEAWLGHPIFQDKE
GRELTVRRMPAFFETFPVILVDKDGIIRADIPFRRAESKYSIEQVGVTVS
FYGGKLNGKVFTDAPSVKKYARKAQLGEVFEFDRTTLESDGVFRSSPRGW
FTFGHANFALIFFFGHLWHGSRTIFRDVFAGIGAEVTEQVEFGAFQKLGD
RSSKKQGAV
>NC_023790@CP92_p038@psbb@77318@78844@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQPVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAANQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQIV
>NC_023792@CP89_p039@psbb@76746@78272@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFGDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPVTVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023798@CP95_p040@psbb@74078@75604@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023800@CP56_p038@psbb@71296@72822@D@1@509 photosystem_II_protein_B
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAA
>NC_023801@CP80_p038@psbb@78444@79973@D@1@510 PsbB
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFCPTRYQWDQGYFQQEIYRRVSAGIAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFSRAGSMDNGDGIAVGWLGHPIFRDK
EGRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTV
EFYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRG
WFTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLG
DPTTRRQVV
>NC_023805@CP88_p026@psbb@71975@73501@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAIFDPSDP
VLDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETVTNPGLWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDERTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRIQPVNPAWGAEGFDPFVPGGIAA
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKD
GRELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGVFQKLGD
PTTKKQVV
>NC_023934@ArapCp047@psbb@71388@72914@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_023935@ArteCp047@psbb@71323@72849@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQAVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSDGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPVFRDKE
GRELFVRRMPTFFETFPVVLVDEEGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRSQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKVGD
PTTRRQAV
>NC_023956@DO26_p039@psbb@74012@75538@D@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFTDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRIGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_023959@DN99_p035@psbb@76987@78513@D@1@509 photosystem_II_P680_chlorophyll_A_apoprotein
MGLPWYRVHTVVLNDPGRLISVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFSDERTGKPSLDLPKIFGIHLFLSGLAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVSAGIAENPSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDGGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGTFQKLGD
PTTRRQVV
>NC_024019@DEOF_Cp046@psbb@72988@74514@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSISGGTITNPGIWSYEGVAGAH
ILFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVIYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_024021@ED49_p020@psbb@17249@18775@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETISNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDSRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_024022@ED58_p020@psbb@17306@18832@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETISNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDSRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_024023@ED53_p020@psbb@17283@18809@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETISNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDSRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_024024@ED55_p020@psbb@17295@18821@R@1@509 photosystem_II_CP47_chlorophyll_apoprotein
MGLPWYRVHTVVLNDPGRLIAVHIMHTALVSGWAGSMALYELAVFDPSDP
ILDPMWRQGMFVIPFMTRLGIKDSWGGWSITGETISNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLDVFCDSRTGKPSLDLPKIFGIHLFLSGAAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKIQPVNPAWGAEGFDPFVPGGIAS
HHIAAGILGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
IVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIDRRVRAGLAENLCLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGAMDNGDGIAVGWLGHPIFKDKK
GHELFVRRMPTFFETFPVVLVDEEGIVKADVPFRRAESKYSVEQVGVTVE
FYGGELDGVSFGDPAIVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_024027@ED56_p039@psbb@76392@77918@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVSGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGINNSWGGWSITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGKVQSVNPAWGAEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENLSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GHELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHATFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_024034@EJ83_p018@psbb@100327@101853@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVGC
FGFGAFHVTGLFGPGIWVSDPYGLTGRVQSVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLVFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_024035@EJ79_p018@psbb@101627@103153@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVGC
FGFGAFHVTGLFGPGIWVSDPYGLTGRVQSVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLVFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_024036@EJ75_p016@psbb@94878@96404@R@1@509 no_product_string_in_file
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAAAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVGC
FGFGAFHVTGLFGPGIWVSDPYGLTGRVQSVNPAWGVDGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLVFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKKQVV
>NC_024038@EJ78_p031@psbb@72405@73931@D@1@509 PsbB
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWNITGGTITNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLAGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVNPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTKRQVV
>NC_024060@EN55_p039@psbb@76946@78472@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYNDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_024061@EN56_p039@psbb@76976@78502@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_024062@EN53_p039@psbb@76977@78503@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_024064@EN63_p039@psbb@76676@78202@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV
>NC_024065@EN60_p039@psbb@76610@78136@D@1@509 photosystem_II_47_kDa_protein
MGLPWYRVHTVVLNDPGRLLSVHIMHTALVAGWAGSMALYELAVFDPSDP
VLDPMWRQGMFVIPFMTRLGITNSWGGWSITGGTVTNPGIWSYEGVAGAH
IVFSGLCFLAAIWHWVYWDLEIFCDERTGKPSLDLPKIFGIHLFLSGVAC
FGFGAFHVTGLYGPGIWVSDPYGLTGRVQSVSPAWGVEGFDPFVPGGIAS
HHIAAGTLGILAGLFHLSVRPPQRLYKGLRMGNIETVLSSSIAAVFFAAF
VVAGTMWYGSATTPIELFGPTRYQWDQGYFQQEIYRRVGAGLAENQSLSE
AWSKIPEKLAFYDYIGNNPAKGGLFRAGSMDNGDGIAVGWLGHPIFRDKE
GRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVE
FYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGW
FTFGHASFALLFFFGHIWHGARTLFRDVFAGIDPDLDAQVEFGAFQKLGD
PTTRRQVV