From e4d6a8484da5a00bbbbbce0d27957f2fb9ba0ed9 Mon Sep 17 00:00:00 2001 From: alain viari Date: Fri, 13 Nov 2015 17:41:18 +0100 Subject: [PATCH] cds/tools/chlorodb added Former-commit-id: 0579e878a69b7c285ca71870e9ca5730649a2fda Former-commit-id: 7cced5b488441d87bf070a9a444317db0e048880 --- TODO | 6 +- data/cds/chlorodb/fasta/AC_000188.fst.gz | Bin 48693 -> 48693 bytes data/cds/chlorodb/fasta/NC_000925.fst.gz | Bin 59421 -> 59421 bytes data/cds/chlorodb/fasta/NC_000926.fst.gz | Bin 37910 -> 37910 bytes data/cds/chlorodb/fasta/NC_000927.fst.gz | Bin 63086 -> 63086 bytes data/cds/chlorodb/fasta/NC_000932.fst.gz | Bin 48304 -> 48304 bytes data/cds/chlorodb/fasta/NC_001319.fst.gz | Bin 36998 -> 36998 bytes data/cds/chlorodb/fasta/NC_001320.fst.gz | Bin 42298 -> 42298 bytes data/cds/chlorodb/fasta/NC_001568.fst.gz | Bin 22069 -> 22069 bytes data/cds/chlorodb/fasta/NC_001603.fst.gz | Bin 40492 -> 40492 bytes data/cds/chlorodb/fasta/NC_001631.fst.gz | Bin 37642 -> 37642 bytes data/cds/chlorodb/fasta/NC_001666.fst.gz | Bin 44061 -> 44061 bytes data/cds/chlorodb/fasta/NC_001675.fst.gz | Bin 41609 -> 41609 bytes data/cds/chlorodb/fasta/NC_001713.fst.gz | Bin 37239 -> 37239 bytes data/cds/chlorodb/fasta/NC_001840.fst.gz | Bin 51212 -> 51212 bytes data/cds/chlorodb/fasta/NC_001865.fst.gz | Bin 45850 -> 45850 bytes data/cds/chlorodb/fasta/NC_001879.fst.gz | Bin 48873 -> 48873 bytes data/cds/chlorodb/fasta/NC_002186.fst.gz | Bin 36388 -> 36388 bytes data/cds/chlorodb/fasta/NC_002202.fst.gz | Bin 47121 -> 47121 bytes data/cds/chlorodb/fasta/NC_002652.fst.gz | Bin 19694 -> 19694 bytes data/cds/chlorodb/fasta/NC_002693.fst.gz | Bin 51208 -> 51208 bytes data/cds/chlorodb/fasta/NC_002694.fst.gz | Bin 46923 -> 46923 bytes data/cds/chlorodb/fasta/NC_002762.fst.gz | Bin 42255 -> 42255 bytes data/cds/chlorodb/fasta/NC_003119.fst.gz | Bin 38309 -> 38309 bytes data/cds/chlorodb/fasta/NC_003386.fst.gz | Bin 43338 -> 43338 bytes data/cds/chlorodb/fasta/NC_004115.fst.gz | Bin 40186 -> 40186 bytes data/cds/chlorodb/fasta/NC_004543.fst.gz | Bin 49972 -> 49972 bytes data/cds/chlorodb/fasta/NC_004561.fst.gz | Bin 49094 -> 49094 bytes data/cds/chlorodb/fasta/NC_004677.fst.gz | Bin 36735 -> 36735 bytes data/cds/chlorodb/fasta/NC_004766.fst.gz | Bin 47333 -> 47333 bytes data/cds/chlorodb/fasta/NC_004799.fst.gz | Bin 46544 -> 46544 bytes data/cds/chlorodb/fasta/NC_004993.fst.gz | Bin 48143 -> 48143 bytes data/cds/chlorodb/fasta/NC_005086.fst.gz | Bin 50896 -> 50896 bytes data/cds/chlorodb/fasta/NC_005087.fst.gz | Bin 37451 -> 37451 bytes data/cds/chlorodb/fasta/NC_005353.fst.gz | Bin 60583 -> 60583 bytes data/cds/chlorodb/fasta/NC_005878.fst.gz | Bin 44266 -> 44266 bytes data/cds/chlorodb/fasta/NC_005973.fst.gz | Bin 42277 -> 42277 bytes data/cds/chlorodb/fasta/NC_006050.fst.gz | Bin 50208 -> 50208 bytes data/cds/chlorodb/fasta/NC_006084.fst.gz | Bin 44282 -> 44282 bytes data/cds/chlorodb/fasta/NC_006137.fst.gz | Bin 56557 -> 56557 bytes data/cds/chlorodb/fasta/NC_006290.fst.gz | Bin 48925 -> 48925 bytes data/cds/chlorodb/fasta/NC_006861.fst.gz | Bin 48104 -> 48104 bytes data/cds/chlorodb/fasta/NC_007144.fst.gz | Bin 48496 -> 48496 bytes data/cds/chlorodb/fasta/NC_007288.fst.gz | Bin 33136 -> 33136 bytes data/cds/chlorodb/fasta/NC_007407.fst.gz | Bin 48191 -> 48191 bytes data/cds/chlorodb/fasta/NC_007499.fst.gz | Bin 46396 -> 46396 bytes data/cds/chlorodb/fasta/NC_007500.fst.gz | Bin 48843 -> 48843 bytes data/cds/chlorodb/fasta/NC_007578.fst.gz | Bin 47807 -> 47807 bytes data/cds/chlorodb/fasta/NC_007602.fst.gz | Bin 48771 -> 48771 bytes data/cds/chlorodb/fasta/NC_007898.fst.gz | Bin 48688 -> 48688 bytes data/cds/chlorodb/fasta/NC_007932.fst.gz | Bin 59731 -> 59731 bytes data/cds/chlorodb/fasta/NC_007942.fst.gz | Bin 47401 -> 47401 bytes data/cds/chlorodb/fasta/NC_007943.fst.gz | Bin 48678 -> 48678 bytes data/cds/chlorodb/fasta/NC_007944.fst.gz | Bin 50038 -> 50038 bytes data/cds/chlorodb/fasta/NC_007957.fst.gz | Bin 50333 -> 50333 bytes data/cds/chlorodb/fasta/NC_007977.fst.gz | Bin 47259 -> 47259 bytes data/cds/chlorodb/fasta/NC_008096.fst.gz | Bin 48668 -> 48668 bytes data/cds/chlorodb/fasta/NC_008097.fst.gz | Bin 55543 -> 55543 bytes data/cds/chlorodb/fasta/NC_008099.fst.gz | Bin 46413 -> 46413 bytes data/cds/chlorodb/fasta/NC_008100.fst.gz | Bin 11582 -> 11582 bytes data/cds/chlorodb/fasta/NC_008101.fst.gz | Bin 47319 -> 47319 bytes data/cds/chlorodb/fasta/NC_008114.fst.gz | Bin 59698 -> 59698 bytes data/cds/chlorodb/fasta/NC_008115.fst.gz | Bin 50071 -> 50071 bytes data/cds/chlorodb/fasta/NC_008116.fst.gz | Bin 48680 -> 48680 bytes data/cds/chlorodb/fasta/NC_008117.fst.gz | Bin 50966 -> 50966 bytes data/cds/chlorodb/fasta/NC_008155.fst.gz | Bin 42276 -> 42276 bytes data/cds/chlorodb/fasta/NC_008235.fst.gz | Bin 48857 -> 48857 bytes data/cds/chlorodb/fasta/NC_008289.fst.gz | Bin 22663 -> 22663 bytes data/cds/chlorodb/fasta/NC_008325.fst.gz | Bin 48883 -> 48883 bytes data/cds/chlorodb/fasta/NC_008326.fst.gz | Bin 50082 -> 50082 bytes data/cds/chlorodb/fasta/NC_008334.fst.gz | Bin 50200 -> 50200 bytes data/cds/chlorodb/fasta/NC_008335.fst.gz | Bin 50551 -> 50551 bytes data/cds/chlorodb/fasta/NC_008336.fst.gz | Bin 49106 -> 49106 bytes data/cds/chlorodb/fasta/NC_008359.fst.gz | Bin 49555 -> 49555 bytes data/cds/chlorodb/fasta/NC_008372.fst.gz | Bin 65929 -> 65929 bytes data/cds/chlorodb/fasta/NC_008407.fst.gz | Bin 50941 -> 50941 bytes data/cds/chlorodb/fasta/NC_008408.fst.gz | Bin 21315 -> 21315 bytes data/cds/chlorodb/fasta/NC_008454.fst.gz | Bin 67780 -> 67780 bytes data/cds/chlorodb/fasta/NC_008456.fst.gz | Bin 50250 -> 50250 bytes data/cds/chlorodb/fasta/NC_008457.fst.gz | Bin 50126 -> 50126 bytes data/cds/chlorodb/fasta/NC_008535.fst.gz | Bin 48515 -> 48515 bytes data/cds/chlorodb/fasta/NC_008588.fst.gz | Bin 36527 -> 36527 bytes data/cds/chlorodb/fasta/NC_008589.fst.gz | Bin 39723 -> 39723 bytes data/cds/chlorodb/fasta/NC_008590.fst.gz | Bin 42862 -> 42862 bytes data/cds/chlorodb/fasta/NC_008591.fst.gz | Bin 42976 -> 42976 bytes data/cds/chlorodb/fasta/NC_008602.fst.gz | Bin 44176 -> 44176 bytes data/cds/chlorodb/fasta/NC_008641.fst.gz | Bin 50132 -> 50132 bytes data/cds/chlorodb/fasta/NC_008788.fst.gz | Bin 50462 -> 50462 bytes data/cds/chlorodb/fasta/NC_008796.fst.gz | Bin 48563 -> 48563 bytes data/cds/chlorodb/fasta/NC_008822.fst.gz | Bin 47567 -> 47567 bytes data/cds/chlorodb/fasta/NC_008829.fst.gz | Bin 47396 -> 47396 bytes data/cds/chlorodb/fasta/NC_009143.fst.gz | Bin 48999 -> 48999 bytes data/cds/chlorodb/fasta/NC_009259.fst.gz | Bin 46780 -> 46780 bytes data/cds/chlorodb/fasta/NC_009265.fst.gz | Bin 48158 -> 48158 bytes data/cds/chlorodb/fasta/NC_009266.fst.gz | Bin 48186 -> 48186 bytes data/cds/chlorodb/fasta/NC_009267.fst.gz | Bin 48403 -> 48403 bytes data/cds/chlorodb/fasta/NC_009268.fst.gz | Bin 48050 -> 48050 bytes data/cds/chlorodb/fasta/NC_009269.fst.gz | Bin 48326 -> 48326 bytes data/cds/chlorodb/fasta/NC_009270.fst.gz | Bin 48322 -> 48322 bytes data/cds/chlorodb/fasta/NC_009271.fst.gz | Bin 48470 -> 48470 bytes data/cds/chlorodb/fasta/NC_009272.fst.gz | Bin 47960 -> 47960 bytes data/cds/chlorodb/fasta/NC_009273.fst.gz | Bin 48373 -> 48373 bytes data/cds/chlorodb/fasta/NC_009274.fst.gz | Bin 47622 -> 47622 bytes data/cds/chlorodb/fasta/NC_009275.fst.gz | Bin 48458 -> 48458 bytes data/cds/chlorodb/fasta/NC_009573.fst.gz | Bin 42448 -> 42448 bytes data/cds/chlorodb/fasta/NC_009598.fst.gz | Bin 49354 -> 49354 bytes data/cds/chlorodb/fasta/NC_009599.fst.gz | Bin 49804 -> 49804 bytes data/cds/chlorodb/fasta/NC_009600.fst.gz | Bin 46521 -> 46521 bytes data/cds/chlorodb/fasta/NC_009601.fst.gz | Bin 47753 -> 47753 bytes data/cds/chlorodb/fasta/NC_009618.fst.gz | Bin 51143 -> 51143 bytes data/cds/chlorodb/fasta/NC_009681.fst.gz | Bin 58782 -> 58782 bytes data/cds/chlorodb/fasta/NC_009765.fst.gz | Bin 27368 -> 27368 bytes data/cds/chlorodb/fasta/NC_009766.fst.gz | Bin 38162 -> 38162 bytes data/cds/chlorodb/fasta/NC_009808.fst.gz | Bin 50372 -> 50372 bytes data/cds/chlorodb/fasta/NC_009949.fst.gz | Bin 26941 -> 26941 bytes data/cds/chlorodb/fasta/NC_009950.fst.gz | Bin 42491 -> 42491 bytes data/cds/chlorodb/fasta/NC_009962.fst.gz | Bin 48871 -> 48871 bytes data/cds/chlorodb/fasta/NC_009963.fst.gz | Bin 39375 -> 39375 bytes data/cds/chlorodb/fasta/NC_010093.fst.gz | Bin 48194 -> 48194 bytes data/cds/chlorodb/fasta/NC_010109.fst.gz | Bin 51755 -> 51755 bytes data/cds/chlorodb/fasta/NC_010323.fst.gz | Bin 49998 -> 49998 bytes data/cds/chlorodb/fasta/NC_010358.fst.gz | Bin 51010 -> 51010 bytes data/cds/chlorodb/fasta/NC_010359.fst.gz | Bin 34140 -> 34140 bytes data/cds/chlorodb/fasta/NC_010360.fst.gz | Bin 51089 -> 51089 bytes data/cds/chlorodb/fasta/NC_010361.fst.gz | Bin 51076 -> 51076 bytes data/cds/chlorodb/fasta/NC_010362.fst.gz | Bin 50762 -> 50762 bytes data/cds/chlorodb/fasta/NC_010433.fst.gz | Bin 50128 -> 50128 bytes data/cds/chlorodb/fasta/NC_010442.fst.gz | Bin 50277 -> 50277 bytes data/cds/chlorodb/fasta/NC_010548.fst.gz | Bin 41076 -> 41076 bytes data/cds/chlorodb/fasta/NC_010601.fst.gz | Bin 47550 -> 47550 bytes data/cds/chlorodb/fasta/NC_010654.fst.gz | Bin 37218 -> 37218 bytes data/cds/chlorodb/fasta/NC_010772.fst.gz | Bin 49157 -> 49157 bytes data/cds/chlorodb/fasta/NC_010776.fst.gz | Bin 50088 -> 50088 bytes data/cds/chlorodb/fasta/NC_011031.fst.gz | Bin 59663 -> 59663 bytes data/cds/chlorodb/fasta/NC_011032.fst.gz | Bin 42401 -> 42401 bytes data/cds/chlorodb/fasta/NC_011152.fst.gz | Bin 36086 -> 36086 bytes data/cds/chlorodb/fasta/NC_011153.fst.gz | Bin 36720 -> 36720 bytes data/cds/chlorodb/fasta/NC_011154.fst.gz | Bin 36692 -> 36692 bytes data/cds/chlorodb/fasta/NC_011155.fst.gz | Bin 36290 -> 36290 bytes data/cds/chlorodb/fasta/NC_011156.fst.gz | Bin 36554 -> 36554 bytes data/cds/chlorodb/fasta/NC_011158.fst.gz | Bin 36148 -> 36148 bytes data/cds/chlorodb/fasta/NC_011159.fst.gz | Bin 36028 -> 36028 bytes data/cds/chlorodb/fasta/NC_011163.fst.gz | Bin 38927 -> 38927 bytes data/cds/chlorodb/fasta/NC_011600.fst.gz | Bin 35035 -> 35035 bytes data/cds/chlorodb/fasta/NC_011713.fst.gz | Bin 42631 -> 42631 bytes data/cds/chlorodb/fasta/NC_011828.fst.gz | Bin 44406 -> 44406 bytes data/cds/chlorodb/fasta/NC_011930.fst.gz | Bin 36888 -> 36888 bytes data/cds/chlorodb/fasta/NC_011942.fst.gz | Bin 35962 -> 35962 bytes data/cds/chlorodb/fasta/NC_011954.fst.gz | Bin 34295 -> 34295 bytes data/cds/chlorodb/fasta/NC_012052.fst.gz | Bin 37374 -> 37374 bytes data/cds/chlorodb/fasta/NC_012097.fst.gz | Bin 25348 -> 25348 bytes data/cds/chlorodb/fasta/NC_012099.fst.gz | Bin 31622 -> 31622 bytes data/cds/chlorodb/fasta/NC_012101.fst.gz | Bin 34438 -> 34438 bytes data/cds/chlorodb/fasta/NC_012224.fst.gz | Bin 50755 -> 50755 bytes data/cds/chlorodb/fasta/NC_012568.fst.gz | Bin 13020 -> 13020 bytes data/cds/chlorodb/fasta/NC_012575.fst.gz | Bin 22846 -> 22846 bytes data/cds/chlorodb/fasta/NC_012615.fst.gz | Bin 50070 -> 50070 bytes data/cds/chlorodb/fasta/NC_012818.fst.gz | Bin 49143 -> 49143 bytes data/cds/chlorodb/fasta/NC_012898.fst.gz | Bin 28217 -> 28217 bytes data/cds/chlorodb/fasta/NC_012903.fst.gz | Bin 29452 -> 29452 bytes data/cds/chlorodb/fasta/NC_012927.fst.gz | Bin 43760 -> 43760 bytes data/cds/chlorodb/fasta/NC_012978.fst.gz | Bin 37563 -> 37563 bytes data/cds/chlorodb/fasta/NC_013086.fst.gz | Bin 45297 -> 45297 bytes data/cds/chlorodb/fasta/NC_013088.fst.gz | Bin 43800 -> 43800 bytes data/cds/chlorodb/fasta/NC_013273.fst.gz | Bin 44170 -> 44170 bytes data/cds/chlorodb/fasta/NC_013359.fst.gz | Bin 45624 -> 45624 bytes data/cds/chlorodb/fasta/NC_013498.fst.gz | Bin 43302 -> 43302 bytes data/cds/chlorodb/fasta/NC_013553.fst.gz | Bin 47641 -> 47641 bytes data/cds/chlorodb/fasta/NC_013703.fst.gz | Bin 24545 -> 24545 bytes data/cds/chlorodb/fasta/NC_013707.fst.gz | Bin 48821 -> 48821 bytes data/cds/chlorodb/fasta/NC_013823.fst.gz | Bin 50341 -> 50341 bytes data/cds/chlorodb/fasta/NC_013843.fst.gz | Bin 46985 -> 46985 bytes data/cds/chlorodb/fasta/NC_013991.fst.gz | Bin 49428 -> 49428 bytes data/cds/chlorodb/fasta/NC_014056.fst.gz | Bin 45744 -> 45744 bytes data/cds/chlorodb/fasta/NC_014057.fst.gz | Bin 38043 -> 38043 bytes data/cds/chlorodb/fasta/NC_014062.fst.gz | Bin 43435 -> 43435 bytes data/cds/chlorodb/fasta/NC_014063.fst.gz | Bin 37736 -> 37736 bytes data/cds/chlorodb/fasta/NC_014267.fst.gz | Bin 43526 -> 43526 bytes data/cds/chlorodb/fasta/NC_014287.fst.gz | Bin 36077 -> 36077 bytes data/cds/chlorodb/fasta/NC_014340.fst.gz | Bin 37849 -> 37849 bytes data/cds/chlorodb/fasta/NC_014345.fst.gz | Bin 27304 -> 27304 bytes data/cds/chlorodb/fasta/NC_014346.fst.gz | Bin 140781 -> 140781 bytes data/cds/chlorodb/fasta/NC_014348.fst.gz | Bin 48064 -> 48064 bytes data/cds/chlorodb/fasta/NC_014569.fst.gz | Bin 40980 -> 40980 bytes data/cds/chlorodb/fasta/NC_014570.fst.gz | Bin 49981 -> 49981 bytes data/cds/chlorodb/fasta/NC_014573.fst.gz | Bin 48399 -> 48399 bytes data/cds/chlorodb/fasta/NC_014575.fst.gz | Bin 37431 -> 37431 bytes data/cds/chlorodb/fasta/NC_014582.fst.gz | Bin 40343 -> 40343 bytes data/cds/chlorodb/fasta/NC_014589.fst.gz | Bin 33680 -> 33680 bytes data/cds/chlorodb/fasta/NC_014592.fst.gz | Bin 49129 -> 49129 bytes data/cds/chlorodb/fasta/NC_014674.fst.gz | Bin 50318 -> 50318 bytes data/cds/chlorodb/fasta/NC_014675.fst.gz | Bin 45621 -> 45621 bytes data/cds/chlorodb/fasta/NC_014676.fst.gz | Bin 50127 -> 50127 bytes data/cds/chlorodb/fasta/NC_014697.fst.gz | Bin 49353 -> 49353 bytes data/cds/chlorodb/fasta/NC_014699.fst.gz | Bin 41222 -> 41222 bytes data/cds/chlorodb/fasta/NC_014807.fst.gz | Bin 49684 -> 49684 bytes data/cds/chlorodb/fasta/NC_014808.fst.gz | Bin 43733 -> 43733 bytes data/cds/chlorodb/fasta/NC_014874.fst.gz | Bin 18628 -> 18628 bytes data/cds/chlorodb/fasta/NC_015083.fst.gz | Bin 36723 -> 36723 bytes data/cds/chlorodb/fasta/NC_015084.fst.gz | Bin 54431 -> 54431 bytes data/cds/chlorodb/fasta/NC_015113.fst.gz | Bin 48490 -> 48490 bytes data/cds/chlorodb/fasta/NC_015204.fst.gz | Bin 50060 -> 50060 bytes data/cds/chlorodb/fasta/NC_015206.fst.gz | Bin 48793 -> 48793 bytes data/cds/chlorodb/fasta/NC_015308.fst.gz | Bin 50164 -> 50164 bytes data/cds/chlorodb/fasta/NC_015359.fst.gz | Bin 38593 -> 38593 bytes data/cds/chlorodb/fasta/NC_015401.fst.gz | Bin 48766 -> 48766 bytes data/cds/chlorodb/fasta/NC_015402.fst.gz | Bin 37147 -> 37147 bytes data/cds/chlorodb/fasta/NC_015403.fst.gz | Bin 42055 -> 42055 bytes data/cds/chlorodb/fasta/NC_015543.fst.gz | Bin 47230 -> 47230 bytes data/cds/chlorodb/fasta/NC_015604.fst.gz | Bin 48772 -> 48772 bytes data/cds/chlorodb/fasta/NC_015605.fst.gz | Bin 50927 -> 50927 bytes data/cds/chlorodb/fasta/NC_015608.fst.gz | Bin 48852 -> 48852 bytes data/cds/chlorodb/fasta/NC_015610.fst.gz | Bin 51001 -> 51001 bytes data/cds/chlorodb/fasta/NC_015621.fst.gz | Bin 47048 -> 47048 bytes data/cds/chlorodb/fasta/NC_015623.fst.gz | Bin 48825 -> 48825 bytes data/cds/chlorodb/fasta/NC_015645.fst.gz | Bin 55064 -> 55064 bytes data/cds/chlorodb/fasta/NC_015803.fst.gz | Bin 43802 -> 43802 bytes data/cds/chlorodb/fasta/NC_015817.fst.gz | Bin 43863 -> 43863 bytes data/cds/chlorodb/fasta/NC_015820.fst.gz | Bin 43829 -> 43829 bytes data/cds/chlorodb/fasta/NC_015826.fst.gz | Bin 43884 -> 43884 bytes data/cds/chlorodb/fasta/NC_015830.fst.gz | Bin 43781 -> 43781 bytes data/cds/chlorodb/fasta/NC_015831.fst.gz | Bin 43805 -> 43805 bytes data/cds/chlorodb/fasta/NC_015891.fst.gz | Bin 52611 -> 52611 bytes data/cds/chlorodb/fasta/NC_015892.fst.gz | Bin 50029 -> 50029 bytes data/cds/chlorodb/fasta/NC_015894.fst.gz | Bin 52897 -> 52897 bytes data/cds/chlorodb/fasta/NC_015899.fst.gz | Bin 52718 -> 52718 bytes data/cds/chlorodb/fasta/NC_015983.fst.gz | Bin 48791 -> 48791 bytes data/cds/chlorodb/fasta/NC_015990.fst.gz | Bin 43869 -> 43869 bytes data/cds/chlorodb/fasta/NC_015996.fst.gz | Bin 49956 -> 49956 bytes data/cds/chlorodb/fasta/NC_016058.fst.gz | Bin 38285 -> 38285 bytes data/cds/chlorodb/fasta/NC_016063.fst.gz | Bin 42233 -> 42233 bytes data/cds/chlorodb/fasta/NC_016064.fst.gz | Bin 38256 -> 38256 bytes data/cds/chlorodb/fasta/NC_016065.fst.gz | Bin 41096 -> 41096 bytes data/cds/chlorodb/fasta/NC_016068.fst.gz | Bin 48867 -> 48867 bytes data/cds/chlorodb/fasta/NC_016069.fst.gz | Bin 38901 -> 38901 bytes data/cds/chlorodb/fasta/NC_016430.fst.gz | Bin 49143 -> 49143 bytes data/cds/chlorodb/fasta/NC_016433.fst.gz | Bin 48026 -> 48026 bytes data/cds/chlorodb/fasta/NC_016468.fst.gz | Bin 48066 -> 48066 bytes data/cds/chlorodb/fasta/NC_016471.fst.gz | Bin 28838 -> 28838 bytes data/cds/chlorodb/fasta/NC_016668.fst.gz | Bin 50038 -> 50038 bytes data/cds/chlorodb/fasta/NC_016670.fst.gz | Bin 50117 -> 50117 bytes data/cds/chlorodb/fasta/NC_016677.fst.gz | Bin 42886 -> 42886 bytes data/cds/chlorodb/fasta/NC_016690.fst.gz | Bin 50198 -> 50198 bytes data/cds/chlorodb/fasta/NC_016692.fst.gz | Bin 50063 -> 50063 bytes data/cds/chlorodb/fasta/NC_016699.fst.gz | Bin 43862 -> 43862 bytes data/cds/chlorodb/fasta/NC_016703.fst.gz | Bin 33150 -> 33150 bytes data/cds/chlorodb/fasta/NC_016708.fst.gz | Bin 47486 -> 47486 bytes data/cds/chlorodb/fasta/NC_016711.fst.gz | Bin 50103 -> 50103 bytes data/cds/chlorodb/fasta/NC_016712.fst.gz | Bin 50051 -> 50051 bytes data/cds/chlorodb/fasta/NC_016718.fst.gz | Bin 42813 -> 42813 bytes data/cds/chlorodb/fasta/NC_016727.fst.gz | Bin 47333 -> 47333 bytes data/cds/chlorodb/fasta/NC_016728.fst.gz | Bin 47281 -> 47281 bytes data/cds/chlorodb/fasta/NC_016729.fst.gz | Bin 45974 -> 45974 bytes data/cds/chlorodb/fasta/NC_016730.fst.gz | Bin 47406 -> 47406 bytes data/cds/chlorodb/fasta/NC_016731.fst.gz | Bin 35915 -> 35915 bytes data/cds/chlorodb/fasta/NC_016732.fst.gz | Bin 80968 -> 80968 bytes data/cds/chlorodb/fasta/NC_016733.fst.gz | Bin 30552 -> 30552 bytes data/cds/chlorodb/fasta/NC_016734.fst.gz | Bin 47763 -> 47763 bytes data/cds/chlorodb/fasta/NC_016735.fst.gz | Bin 38413 -> 38413 bytes data/cds/chlorodb/fasta/NC_016736.fst.gz | Bin 50694 -> 50694 bytes data/cds/chlorodb/fasta/NC_016753.fst.gz | Bin 50686 -> 50686 bytes data/cds/chlorodb/fasta/NC_016921.fst.gz | Bin 48982 -> 48982 bytes data/cds/chlorodb/fasta/NC_016927.fst.gz | Bin 42274 -> 42274 bytes data/cds/chlorodb/fasta/NC_016986.fst.gz | Bin 49073 -> 49073 bytes data/cds/chlorodb/fasta/NC_017006.fst.gz | Bin 45772 -> 45772 bytes data/cds/chlorodb/fasta/NC_017602.fst.gz | Bin 49049 -> 49049 bytes data/cds/chlorodb/fasta/NC_017609.fst.gz | Bin 46461 -> 46461 bytes data/cds/chlorodb/fasta/NC_017754.fst.gz | Bin 21109 -> 21109 bytes data/cds/chlorodb/fasta/NC_017835.fst.gz | Bin 42218 -> 42218 bytes data/cds/chlorodb/fasta/NC_017894.fst.gz | Bin 49930 -> 49930 bytes data/cds/chlorodb/fasta/NC_018051.fst.gz | Bin 47265 -> 47265 bytes data/cds/chlorodb/fasta/NC_018109.fst.gz | Bin 49752 -> 49752 bytes data/cds/chlorodb/fasta/NC_018110.fst.gz | Bin 49857 -> 49857 bytes data/cds/chlorodb/fasta/NC_018111.fst.gz | Bin 49925 -> 49925 bytes data/cds/chlorodb/fasta/NC_018112.fst.gz | Bin 49881 -> 49881 bytes data/cds/chlorodb/fasta/NC_018113.fst.gz | Bin 49980 -> 49980 bytes data/cds/chlorodb/fasta/NC_018114.fst.gz | Bin 44651 -> 44651 bytes data/cds/chlorodb/fasta/NC_018117.fst.gz | Bin 48915 -> 48915 bytes data/cds/chlorodb/fasta/NC_018357.fst.gz | Bin 50148 -> 50148 bytes data/cds/chlorodb/fasta/NC_018523.fst.gz | Bin 40473 -> 40473 bytes data/cds/chlorodb/fasta/NC_018541.fst.gz | Bin 49087 -> 49087 bytes data/cds/chlorodb/fasta/NC_018552.fst.gz | Bin 49076 -> 49076 bytes data/cds/chlorodb/fasta/NC_018565.fst.gz | Bin 48440 -> 48440 bytes data/cds/chlorodb/fasta/NC_018569.fst.gz | Bin 46936 -> 46936 bytes data/cds/chlorodb/fasta/NC_018766.fst.gz | Bin 40640 -> 40640 bytes data/cds/chlorodb/fasta/NC_018767.fst.gz | Bin 40697 -> 40697 bytes data/cds/chlorodb/fasta/NC_019601.fst.gz | Bin 48694 -> 48694 bytes data/cds/chlorodb/fasta/NC_019602.fst.gz | Bin 48748 -> 48748 bytes data/cds/chlorodb/fasta/NC_019616.fst.gz | Bin 53636 -> 53636 bytes data/cds/chlorodb/fasta/NC_019628.fst.gz | Bin 37864 -> 37864 bytes data/cds/chlorodb/fasta/NC_019648.fst.gz | Bin 42482 -> 42482 bytes data/cds/chlorodb/fasta/NC_019649.fst.gz | Bin 41793 -> 41793 bytes data/cds/chlorodb/fasta/NC_019650.fst.gz | Bin 42429 -> 42429 bytes data/cds/chlorodb/fasta/NC_019651.fst.gz | Bin 42422 -> 42422 bytes data/cds/chlorodb/fasta/NC_020014.fst.gz | Bin 35763 -> 35763 bytes data/cds/chlorodb/fasta/NC_020018.fst.gz | Bin 22942 -> 22942 bytes data/cds/chlorodb/fasta/NC_020019.fst.gz | Bin 49124 -> 49124 bytes data/cds/chlorodb/fasta/NC_020092.fst.gz | Bin 47280 -> 47280 bytes data/cds/chlorodb/fasta/NC_020098.fst.gz | Bin 48218 -> 48218 bytes data/cds/chlorodb/fasta/NC_020146.fst.gz | Bin 40761 -> 40761 bytes data/cds/chlorodb/fasta/NC_020147.fst.gz | Bin 43522 -> 43522 bytes data/cds/chlorodb/fasta/NC_020152.fst.gz | Bin 50473 -> 50473 bytes data/cds/chlorodb/fasta/NC_020316.fst.gz | Bin 50167 -> 50167 bytes data/cds/chlorodb/fasta/NC_020317.fst.gz | Bin 50155 -> 50155 bytes data/cds/chlorodb/fasta/NC_020318.fst.gz | Bin 50005 -> 50005 bytes data/cds/chlorodb/fasta/NC_020319.fst.gz | Bin 50856 -> 50856 bytes data/cds/chlorodb/fasta/NC_020320.fst.gz | Bin 47262 -> 47262 bytes data/cds/chlorodb/fasta/NC_020321.fst.gz | Bin 39771 -> 39771 bytes data/cds/chlorodb/fasta/NC_020341.fst.gz | Bin 43604 -> 43604 bytes data/cds/chlorodb/fasta/NC_020361.fst.gz | Bin 41745 -> 41745 bytes data/cds/chlorodb/fasta/NC_020362.fst.gz | Bin 50593 -> 50593 bytes data/cds/chlorodb/fasta/NC_020363.fst.gz | Bin 48690 -> 48690 bytes data/cds/chlorodb/fasta/NC_020364.fst.gz | Bin 49378 -> 49378 bytes data/cds/chlorodb/fasta/NC_020365.fst.gz | Bin 49194 -> 49194 bytes data/cds/chlorodb/fasta/NC_020366.fst.gz | Bin 49487 -> 49487 bytes data/cds/chlorodb/fasta/NC_020367.fst.gz | Bin 49339 -> 49339 bytes data/cds/chlorodb/fasta/NC_020371.fst.gz | Bin 29960 -> 29960 bytes data/cds/chlorodb/fasta/NC_020372.fst.gz | Bin 51745 -> 51745 bytes data/cds/chlorodb/fasta/NC_020431.fst.gz | Bin 47436 -> 47436 bytes data/cds/chlorodb/fasta/NC_020438.fst.gz | Bin 65577 -> 65577 bytes data/cds/chlorodb/fasta/NC_020460.fst.gz | Bin 27657 -> 27657 bytes data/cds/chlorodb/fasta/NC_020607.fst.gz | Bin 47290 -> 47290 bytes data/cds/chlorodb/fasta/NC_020795.fst.gz | Bin 55203 -> 55203 bytes data/cds/chlorodb/fasta/NC_021075.fst.gz | Bin 54841 -> 54841 bytes data/cds/chlorodb/fasta/NC_021091.fst.gz | Bin 47122 -> 47122 bytes data/cds/chlorodb/fasta/NC_021101.fst.gz | Bin 49219 -> 49219 bytes data/cds/chlorodb/fasta/NC_021102.fst.gz | Bin 48253 -> 48253 bytes data/cds/chlorodb/fasta/NC_021109.fst.gz | Bin 83656 -> 83656 bytes data/cds/chlorodb/fasta/NC_021110.fst.gz | Bin 41896 -> 41896 bytes data/cds/chlorodb/fasta/NC_021111.fst.gz | Bin 32194 -> 32194 bytes data/cds/chlorodb/fasta/NC_021121.fst.gz | Bin 48988 -> 48988 bytes data/cds/chlorodb/fasta/NC_021189.fst.gz | Bin 60859 -> 60859 bytes data/cds/chlorodb/fasta/NC_021372.fst.gz | Bin 44489 -> 44489 bytes data/cds/chlorodb/fasta/NC_021423.fst.gz | Bin 48535 -> 48535 bytes data/cds/chlorodb/fasta/NC_021425.fst.gz | Bin 51498 -> 51498 bytes data/cds/chlorodb/fasta/NC_021426.fst.gz | Bin 51820 -> 51820 bytes data/cds/chlorodb/fasta/NC_021429.fst.gz | Bin 48976 -> 48976 bytes data/cds/chlorodb/fasta/NC_021430.fst.gz | Bin 48565 -> 48565 bytes data/cds/chlorodb/fasta/NC_021431.fst.gz | Bin 48627 -> 48627 bytes data/cds/chlorodb/fasta/NC_021432.fst.gz | Bin 48735 -> 48735 bytes data/cds/chlorodb/fasta/NC_021433.fst.gz | Bin 48488 -> 48488 bytes data/cds/chlorodb/fasta/NC_021437.fst.gz | Bin 42133 -> 42133 bytes data/cds/chlorodb/fasta/NC_021438.fst.gz | Bin 36000 -> 36000 bytes data/cds/chlorodb/fasta/NC_021439.fst.gz | Bin 37588 -> 37588 bytes data/cds/chlorodb/fasta/NC_021440.fst.gz | Bin 37938 -> 37938 bytes data/cds/chlorodb/fasta/NC_021441.fst.gz | Bin 40901 -> 40901 bytes data/cds/chlorodb/fasta/NC_021449.fst.gz | Bin 47642 -> 47642 bytes data/cds/chlorodb/fasta/NC_021455.fst.gz | Bin 48927 -> 48927 bytes data/cds/chlorodb/fasta/NC_021456.fst.gz | Bin 38850 -> 38850 bytes data/cds/chlorodb/fasta/NC_021618.fst.gz | Bin 59093 -> 59093 bytes data/cds/chlorodb/fasta/NC_021636.fst.gz | Bin 47511 -> 47511 bytes data/cds/chlorodb/fasta/NC_021637.fst.gz | Bin 33827 -> 33827 bytes data/cds/chlorodb/fasta/NC_021645.fst.gz | Bin 47405 -> 47405 bytes data/cds/chlorodb/fasta/NC_021646.fst.gz | Bin 47494 -> 47494 bytes data/cds/chlorodb/fasta/NC_021647.fst.gz | Bin 47440 -> 47440 bytes data/cds/chlorodb/fasta/NC_021648.fst.gz | Bin 47541 -> 47541 bytes data/cds/chlorodb/fasta/NC_021649.fst.gz | Bin 47599 -> 47599 bytes data/cds/chlorodb/fasta/NC_021650.fst.gz | Bin 47521 -> 47521 bytes data/cds/chlorodb/fasta/NC_021760.fst.gz | Bin 36515 -> 36515 bytes data/cds/chlorodb/fasta/NC_021761.fst.gz | Bin 36012 -> 36012 bytes data/cds/chlorodb/fasta/NC_021762.fst.gz | Bin 36344 -> 36344 bytes data/cds/chlorodb/fasta/NC_021936.fst.gz | Bin 48785 -> 48785 bytes data/cds/chlorodb/fasta/NC_022133.fst.gz | Bin 35855 -> 35855 bytes data/cds/chlorodb/fasta/NC_022135.fst.gz | Bin 35610 -> 35610 bytes data/cds/chlorodb/fasta/NC_022136.fst.gz | Bin 49449 -> 49449 bytes data/cds/chlorodb/fasta/NC_022137.fst.gz | Bin 47876 -> 47876 bytes data/cds/chlorodb/fasta/NC_022259.fst.gz | Bin 36749 -> 36749 bytes data/cds/chlorodb/fasta/NC_022260.fst.gz | Bin 36593 -> 36593 bytes data/cds/chlorodb/fasta/NC_022261.fst.gz | Bin 35830 -> 35830 bytes data/cds/chlorodb/fasta/NC_022262.fst.gz | Bin 36730 -> 36730 bytes data/cds/chlorodb/fasta/NC_022263.fst.gz | Bin 36719 -> 36719 bytes data/cds/chlorodb/fasta/NC_022264.fst.gz | Bin 49126 -> 49126 bytes data/cds/chlorodb/fasta/NC_022378.fst.gz | Bin 49784 -> 49784 bytes data/cds/chlorodb/fasta/NC_022379.fst.gz | Bin 49767 -> 49767 bytes data/cds/chlorodb/fasta/NC_022380.fst.gz | Bin 49893 -> 49893 bytes data/cds/chlorodb/fasta/NC_022381.fst.gz | Bin 49997 -> 49997 bytes data/cds/chlorodb/fasta/NC_022382.fst.gz | Bin 50001 -> 50001 bytes data/cds/chlorodb/fasta/NC_022383.fst.gz | Bin 49881 -> 49881 bytes data/cds/chlorodb/fasta/NC_022384.fst.gz | Bin 49892 -> 49892 bytes data/cds/chlorodb/fasta/NC_022385.fst.gz | Bin 49928 -> 49928 bytes data/cds/chlorodb/fasta/NC_022386.fst.gz | Bin 49963 -> 49963 bytes data/cds/chlorodb/fasta/NC_022387.fst.gz | Bin 49769 -> 49769 bytes data/cds/chlorodb/fasta/NC_022388.fst.gz | Bin 49941 -> 49941 bytes data/cds/chlorodb/fasta/NC_022389.fst.gz | Bin 49963 -> 49963 bytes data/cds/chlorodb/fasta/NC_022390.fst.gz | Bin 49962 -> 49962 bytes data/cds/chlorodb/fasta/NC_022391.fst.gz | Bin 50041 -> 50041 bytes data/cds/chlorodb/fasta/NC_022392.fst.gz | Bin 50016 -> 50016 bytes data/cds/chlorodb/fasta/NC_022393.fst.gz | Bin 50019 -> 50019 bytes data/cds/chlorodb/fasta/NC_022394.fst.gz | Bin 50016 -> 50016 bytes data/cds/chlorodb/fasta/NC_022395.fst.gz | Bin 50025 -> 50025 bytes data/cds/chlorodb/fasta/NC_022396.fst.gz | Bin 50061 -> 50061 bytes data/cds/chlorodb/fasta/NC_022397.fst.gz | Bin 49871 -> 49871 bytes data/cds/chlorodb/fasta/NC_022398.fst.gz | Bin 50031 -> 50031 bytes data/cds/chlorodb/fasta/NC_022399.fst.gz | Bin 50045 -> 50045 bytes data/cds/chlorodb/fasta/NC_022400.fst.gz | Bin 50287 -> 50287 bytes data/cds/chlorodb/fasta/NC_022401.fst.gz | Bin 50058 -> 50058 bytes data/cds/chlorodb/fasta/NC_022402.fst.gz | Bin 49992 -> 49992 bytes data/cds/chlorodb/fasta/NC_022403.fst.gz | Bin 50075 -> 50075 bytes data/cds/chlorodb/fasta/NC_022404.fst.gz | Bin 49932 -> 49932 bytes data/cds/chlorodb/fasta/NC_022405.fst.gz | Bin 50062 -> 50062 bytes data/cds/chlorodb/fasta/NC_022406.fst.gz | Bin 49852 -> 49852 bytes data/cds/chlorodb/fasta/NC_022407.fst.gz | Bin 50172 -> 50172 bytes data/cds/chlorodb/fasta/NC_022408.fst.gz | Bin 50004 -> 50004 bytes data/cds/chlorodb/fasta/NC_022409.fst.gz | Bin 49951 -> 49951 bytes data/cds/chlorodb/fasta/NC_022410.fst.gz | Bin 49996 -> 49996 bytes data/cds/chlorodb/fasta/NC_022411.fst.gz | Bin 49954 -> 49954 bytes data/cds/chlorodb/fasta/NC_022412.fst.gz | Bin 50059 -> 50059 bytes data/cds/chlorodb/fasta/NC_022413.fst.gz | Bin 49831 -> 49831 bytes data/cds/chlorodb/fasta/NC_022414.fst.gz | Bin 49830 -> 49830 bytes data/cds/chlorodb/fasta/NC_022417.fst.gz | Bin 48325 -> 48325 bytes data/cds/chlorodb/fasta/NC_022431.fst.gz | Bin 50341 -> 50341 bytes data/cds/chlorodb/fasta/NC_022432.fst.gz | Bin 49405 -> 49405 bytes data/cds/chlorodb/fasta/NC_022451.fst.gz | Bin 47157 -> 47157 bytes data/cds/chlorodb/fasta/NC_022457.fst.gz | Bin 51611 -> 51611 bytes data/cds/chlorodb/fasta/NC_022459.fst.gz | Bin 48944 -> 48944 bytes data/cds/chlorodb/fasta/NC_022460.fst.gz | Bin 48979 -> 48979 bytes data/cds/chlorodb/fasta/NC_022461.fst.gz | Bin 49089 -> 49089 bytes data/cds/chlorodb/fasta/NC_022462.fst.gz | Bin 48967 -> 48967 bytes data/cds/chlorodb/fasta/NC_022463.fst.gz | Bin 48972 -> 48972 bytes data/cds/chlorodb/fasta/NC_022668.fst.gz | Bin 42229 -> 42229 bytes data/cds/chlorodb/fasta/NC_022715.fst.gz | Bin 48080 -> 48080 bytes data/cds/chlorodb/fasta/NC_022810.fst.gz | Bin 48909 -> 48909 bytes data/cds/chlorodb/fasta/NC_022811.fst.gz | Bin 49095 -> 49095 bytes data/cds/chlorodb/fasta/NC_022812.fst.gz | Bin 49030 -> 49030 bytes data/cds/chlorodb/fasta/NC_022813.fst.gz | Bin 48889 -> 48889 bytes data/cds/chlorodb/fasta/NC_022814.fst.gz | Bin 48977 -> 48977 bytes data/cds/chlorodb/fasta/NC_022850.fst.gz | Bin 42654 -> 42654 bytes data/cds/chlorodb/fasta/NC_022859.fst.gz | Bin 48514 -> 48514 bytes data/cds/chlorodb/fasta/NC_022868.fst.gz | Bin 47385 -> 47385 bytes data/cds/chlorodb/fasta/NC_022926.fst.gz | Bin 50219 -> 50219 bytes data/cds/chlorodb/fasta/NC_022927.fst.gz | Bin 51670 -> 51670 bytes data/cds/chlorodb/fasta/NC_022928.fst.gz | Bin 49774 -> 49774 bytes data/cds/chlorodb/fasta/NC_022958.fst.gz | Bin 43149 -> 43149 bytes data/cds/chlorodb/fasta/NC_023084.fst.gz | Bin 49049 -> 49049 bytes data/cds/chlorodb/fasta/NC_023085.fst.gz | Bin 47036 -> 47036 bytes data/cds/chlorodb/fasta/NC_023086.fst.gz | Bin 49071 -> 49071 bytes data/cds/chlorodb/fasta/NC_023090.fst.gz | Bin 47377 -> 47377 bytes data/cds/chlorodb/fasta/NC_023092.fst.gz | Bin 50201 -> 50201 bytes data/cds/chlorodb/fasta/NC_023096.fst.gz | Bin 35632 -> 35632 bytes data/cds/chlorodb/fasta/NC_023097.fst.gz | Bin 35755 -> 35755 bytes data/cds/chlorodb/fasta/NC_023102.fst.gz | Bin 46994 -> 46994 bytes data/cds/chlorodb/fasta/NC_023107.fst.gz | Bin 47266 -> 47266 bytes data/cds/chlorodb/fasta/NC_023108.fst.gz | Bin 47226 -> 47226 bytes data/cds/chlorodb/fasta/NC_023109.fst.gz | Bin 47267 -> 47267 bytes data/cds/chlorodb/fasta/NC_023110.fst.gz | Bin 47303 -> 47303 bytes data/cds/chlorodb/fasta/NC_023111.fst.gz | Bin 47244 -> 47244 bytes data/cds/chlorodb/fasta/NC_023112.fst.gz | Bin 47294 -> 47294 bytes data/cds/chlorodb/fasta/NC_023113.fst.gz | Bin 47259 -> 47259 bytes data/cds/chlorodb/fasta/NC_023114.fst.gz | Bin 47268 -> 47268 bytes data/cds/chlorodb/fasta/NC_023115.fst.gz | Bin 50288 -> 50288 bytes data/cds/chlorodb/fasta/NC_023119.fst.gz | Bin 45315 -> 45315 bytes data/cds/chlorodb/fasta/NC_023120.fst.gz | Bin 41861 -> 41861 bytes data/cds/chlorodb/fasta/NC_023121.fst.gz | Bin 39639 -> 39639 bytes data/cds/chlorodb/fasta/NC_023130.fst.gz | Bin 49729 -> 49729 bytes data/cds/chlorodb/fasta/NC_023131.fst.gz | Bin 14409 -> 14409 bytes data/cds/chlorodb/fasta/NC_023132.fst.gz | Bin 19693 -> 19693 bytes data/cds/chlorodb/fasta/NC_023133.fst.gz | Bin 67322 -> 67322 bytes data/cds/chlorodb/fasta/NC_023213.fst.gz | Bin 49847 -> 49847 bytes data/cds/chlorodb/fasta/NC_023214.fst.gz | Bin 49826 -> 49826 bytes data/cds/chlorodb/fasta/NC_023215.fst.gz | Bin 50047 -> 50047 bytes data/cds/chlorodb/fasta/NC_023216.fst.gz | Bin 50036 -> 50036 bytes data/cds/chlorodb/fasta/NC_023217.fst.gz | Bin 49717 -> 49717 bytes data/cds/chlorodb/fasta/NC_023218.fst.gz | Bin 49936 -> 49936 bytes data/cds/chlorodb/fasta/NC_023245.fst.gz | Bin 44462 -> 44462 bytes data/cds/chlorodb/fasta/NC_023247.fst.gz | Bin 47428 -> 47428 bytes data/cds/chlorodb/fasta/NC_023256.fst.gz | Bin 49008 -> 49008 bytes data/cds/chlorodb/fasta/NC_023259.fst.gz | Bin 49131 -> 49131 bytes data/cds/chlorodb/fasta/NC_023260.fst.gz | Bin 51465 -> 51465 bytes data/cds/chlorodb/fasta/NC_023261.fst.gz | Bin 53627 -> 53627 bytes data/cds/chlorodb/fasta/NC_023356.fst.gz | Bin 32605 -> 32605 bytes data/cds/chlorodb/fasta/NC_023357.fst.gz | Bin 47544 -> 47544 bytes data/cds/chlorodb/fasta/NC_023358.fst.gz | Bin 46098 -> 46098 bytes data/cds/chlorodb/fasta/NC_023359.fst.gz | Bin 46093 -> 46093 bytes data/cds/chlorodb/fasta/NC_023360.fst.gz | Bin 47235 -> 47235 bytes data/cds/chlorodb/fasta/NC_023367.fst.gz | Bin 47855 -> 47855 bytes data/cds/chlorodb/fasta/NC_023449.fst.gz | Bin 44027 -> 44027 bytes data/cds/chlorodb/fasta/NC_023463.fst.gz | Bin 46151 -> 46151 bytes data/cds/chlorodb/fasta/NC_023464.fst.gz | Bin 20612 -> 20612 bytes data/cds/chlorodb/fasta/NC_023465.fst.gz | Bin 19290 -> 19290 bytes data/cds/chlorodb/fasta/NC_023533.fst.gz | Bin 42471 -> 42471 bytes data/cds/chlorodb/fasta/NC_023544.fst.gz | Bin 48498 -> 48498 bytes data/cds/chlorodb/fasta/NC_023775.fst.gz | Bin 26201 -> 26201 bytes data/cds/chlorodb/fasta/NC_023785.fst.gz | Bin 55092 -> 55092 bytes data/cds/chlorodb/fasta/NC_023790.fst.gz | Bin 50261 -> 50261 bytes data/cds/chlorodb/fasta/NC_023792.fst.gz | Bin 50264 -> 50264 bytes data/cds/chlorodb/fasta/NC_023798.fst.gz | Bin 49352 -> 49352 bytes data/cds/chlorodb/fasta/NC_023800.fst.gz | Bin 44158 -> 44158 bytes data/cds/chlorodb/fasta/NC_023801.fst.gz | Bin 50171 -> 50171 bytes data/cds/chlorodb/fasta/NC_023805.fst.gz | Bin 41910 -> 41910 bytes data/cds/chlorodb/fasta/NC_023833.fst.gz | Bin 47230 -> 47230 bytes data/cds/chlorodb/fasta/NC_023835.fst.gz | Bin 34093 -> 34093 bytes data/cds/chlorodb/fasta/NC_023934.fst.gz | Bin 43789 -> 43789 bytes data/cds/chlorodb/fasta/NC_023935.fst.gz | Bin 43784 -> 43784 bytes data/cds/chlorodb/fasta/NC_023956.fst.gz | Bin 49317 -> 49317 bytes data/cds/chlorodb/fasta/NC_023959.fst.gz | Bin 49998 -> 49998 bytes data/cds/chlorodb/fasta/NC_024019.fst.gz | Bin 47509 -> 47509 bytes data/cds/chlorodb/fasta/NC_024021.fst.gz | Bin 39756 -> 39756 bytes data/cds/chlorodb/fasta/NC_024022.fst.gz | Bin 39714 -> 39714 bytes data/cds/chlorodb/fasta/NC_024023.fst.gz | Bin 39783 -> 39783 bytes data/cds/chlorodb/fasta/NC_024024.fst.gz | Bin 39761 -> 39761 bytes data/cds/chlorodb/fasta/NC_024027.fst.gz | Bin 50122 -> 50122 bytes data/cds/chlorodb/fasta/NC_024034.fst.gz | Bin 39115 -> 39115 bytes data/cds/chlorodb/fasta/NC_024035.fst.gz | Bin 39524 -> 39524 bytes data/cds/chlorodb/fasta/NC_024036.fst.gz | Bin 41045 -> 41045 bytes data/cds/chlorodb/fasta/NC_024038.fst.gz | Bin 39713 -> 39713 bytes data/cds/chlorodb/fasta/NC_024050.fst.gz | Bin 59005 -> 59005 bytes data/cds/chlorodb/fasta/NC_024060.fst.gz | Bin 50642 -> 50642 bytes data/cds/chlorodb/fasta/NC_024061.fst.gz | Bin 50745 -> 50745 bytes data/cds/chlorodb/fasta/NC_024062.fst.gz | Bin 50726 -> 50726 bytes data/cds/chlorodb/fasta/NC_024064.fst.gz | Bin 50626 -> 50626 bytes data/cds/chlorodb/fasta/NC_024065.fst.gz | Bin 50499 -> 50499 bytes data/cds/chlorodb/models/blosum62.mat | 29 ++ data/cds/chlorodb/models/splice.none.frq | 6 + data/cds/chlorodb/models/splice3.default.frq | 13 + data/cds/chlorodb/models/splice3.ndha.frq | 13 + data/cds/chlorodb/models/splice3.psba.frq | 13 + data/cds/chlorodb/models/splice5.default.frq | 13 + data/cds/chlorodb/models/splice5.ndha.frq | 13 + data/cds/chlorodb/models/splice5.psba.frq | 13 + data/cds/chlorodb/models/start.default.frq | 8 + data/cds/chlorodb/models/start.ndhd.frq | 7 + data/cds/chlorodb/models/start.rps19.frq | 3 + data/cds/chlorodb/models/stop.default.frq | 4 + data/cds/chlorodb/parameters.sh | 28 ++ .../cds/bin/{go_pass1.sh => do_exonerate.sh} | 27 +- .../bin/{go_filterbx.sh => do_filterbx.sh} | 2 +- detectors/cds/bin/go_cds.sh | 20 +- detectors/cds/test/go_test.sh | 8 +- detectors/cds/test/test.db/Annot.lst | 18 + detectors/cds/test/test.db/atpf.fst | 50 ++ detectors/cds/test/test.db/ccsa.fst | 78 +++ detectors/cds/test/test.db/ndha.fst | 90 ++++ detectors/cds/test/test.db/ndhb.fst | 120 +++++ detectors/cds/test/test.db/ndhd.fst | 113 +++++ detectors/cds/test/test.db/ndhe.fst | 39 ++ detectors/cds/test/test.db/ndhf.fst | 157 ++++++ detectors/cds/test/test.db/ndhg.fst | 50 ++ detectors/cds/test/test.db/ndhh.fst | 90 ++++ detectors/cds/test/test.db/ndhi.fst | 50 ++ detectors/cds/test/test.db/psac.fst | 30 ++ detectors/cds/test/test.db/rpl2.fst | 70 +++ detectors/cds/test/test.db/rpl23.fst | 30 ++ detectors/cds/test/test.db/rpl32.fst | 30 ++ detectors/cds/test/test.db/rps15.fst | 30 ++ detectors/cds/test/test.db/rps7.fst | 50 ++ detectors/cds/test/test.db/ycf1.fst | 353 +++++++++++++ detectors/cds/test/test.db/ycf2.fst | 466 ++++++++++++++++++ detectors/cds/test/test.ref | 31 +- detectors/cds/tools/chlorodb/go_chlorodb.sh | 254 ++++++++++ .../cds/tools/chlorodb/matrices/blosum62.mat | 29 ++ .../cds/tools/chlorodb/subdb/go_subdb.sh | 195 ++++++++ .../cds/tools/chlorodb/subdb/lib/db.annot.awk | 39 ++ .../tools/chlorodb/subdb/lib/db.blastlink.awk | 48 ++ .../cds/tools/chlorodb/subdb/lib/db.cc.r | 18 + .../tools/chlorodb/subdb/lib/db.filter.len.r | 19 + .../chlorodb/subdb/lib/db.filter.pat.awk | 10 + .../chlorodb/subdb/lib/db.filter.sym.awk | 30 ++ .../tools/chlorodb/subdb/lib/db.getlen.awk | 10 + .../tools/chlorodb/subdb/lib/db.reportcc.awk | 15 + .../cds/tools/chlorodb/subdb/lib/db.selcc.awk | 19 + .../cds/tools/chlorodb/subdb/lib/db.subdb.awk | 17 + .../cds/tools/chlorodb/subdb/lib/db.todl.awk | 21 + detectors/cds/tools/compare/go_compare.sh | 4 +- detectors/cds/tools/compare/go_summarize.sh | 2 + detectors/cds/tools/lib/cds2fasta.awk | 19 + .../lib/{compareCds.awk => compare.cds.awk} | 0 detectors/cds/tools/lib/embl.cds_long.awk | 97 ++++ detectors/cds/tools/lib/embl.info.awk | 97 ++++ detectors/cds/tools/lib/embl.intron.awk | 97 ++++ detectors/cds/tools/lib/embl.tofasta.awk | 36 ++ detectors/cds/tools/lib/gbk.cds_long.awk | 99 ++++ detectors/cds/tools/lib/gbk.info.awk | 97 ++++ detectors/cds/tools/lib/gbk.intron.awk | 96 ++++ detectors/cds/tools/lib/gbk.tofasta.awk | 32 ++ detectors/cds/tools/lib/install.rpackages.r | 31 ++ detectors/cds/tools/lib/make.models.r | 224 +++++++++ detectors/cds/tools/lib/plot.models.r | 424 ++++++++++++++++ detectors/cds/tools/lib/summarize_cmp.r | 71 +++ detectors/cds/tools/lib/summary.cmp.awk | 54 ++ detectors/cds/tools/lib/util.base.r | 12 + detectors/cds/tools/lib/util.cons.r | 109 ++++ detectors/cds/tools/lib/util.grid.r | 93 ++++ detectors/cds/tools/lib/util.modelio.r | 90 ++++ detectors/cds/tools/lib/util.plot.r | 105 ++++ scripts/csh_init.sh | 16 +- 585 files changed, 4750 insertions(+), 50 deletions(-) create mode 100644 data/cds/chlorodb/models/blosum62.mat create mode 100644 data/cds/chlorodb/models/splice.none.frq create mode 100644 data/cds/chlorodb/models/splice3.default.frq create mode 100644 data/cds/chlorodb/models/splice3.ndha.frq create mode 100644 data/cds/chlorodb/models/splice3.psba.frq create mode 100644 data/cds/chlorodb/models/splice5.default.frq create mode 100644 data/cds/chlorodb/models/splice5.ndha.frq create mode 100644 data/cds/chlorodb/models/splice5.psba.frq create mode 100644 data/cds/chlorodb/models/start.default.frq create mode 100644 data/cds/chlorodb/models/start.ndhd.frq create mode 100644 data/cds/chlorodb/models/start.rps19.frq create mode 100644 data/cds/chlorodb/models/stop.default.frq create mode 100644 data/cds/chlorodb/parameters.sh rename detectors/cds/bin/{go_pass1.sh => do_exonerate.sh} (85%) rename detectors/cds/bin/{go_filterbx.sh => do_filterbx.sh} (94%) create mode 100644 detectors/cds/test/test.db/Annot.lst create mode 100644 detectors/cds/test/test.db/atpf.fst create mode 100644 detectors/cds/test/test.db/ccsa.fst create mode 100644 detectors/cds/test/test.db/ndha.fst create mode 100644 detectors/cds/test/test.db/ndhb.fst create mode 100644 detectors/cds/test/test.db/ndhd.fst create mode 100644 detectors/cds/test/test.db/ndhe.fst create mode 100644 detectors/cds/test/test.db/ndhf.fst create mode 100644 detectors/cds/test/test.db/ndhg.fst create mode 100644 detectors/cds/test/test.db/ndhh.fst create mode 100644 detectors/cds/test/test.db/ndhi.fst create mode 100644 detectors/cds/test/test.db/psac.fst create mode 100644 detectors/cds/test/test.db/rpl2.fst create mode 100644 detectors/cds/test/test.db/rpl23.fst create mode 100644 detectors/cds/test/test.db/rpl32.fst create mode 100644 detectors/cds/test/test.db/rps15.fst create mode 100644 detectors/cds/test/test.db/rps7.fst create mode 100644 detectors/cds/test/test.db/ycf1.fst create mode 100644 detectors/cds/test/test.db/ycf2.fst create mode 100755 detectors/cds/tools/chlorodb/go_chlorodb.sh create mode 100644 detectors/cds/tools/chlorodb/matrices/blosum62.mat create mode 100755 detectors/cds/tools/chlorodb/subdb/go_subdb.sh create mode 100644 detectors/cds/tools/chlorodb/subdb/lib/db.annot.awk create mode 100644 detectors/cds/tools/chlorodb/subdb/lib/db.blastlink.awk create mode 100755 detectors/cds/tools/chlorodb/subdb/lib/db.cc.r create mode 100755 detectors/cds/tools/chlorodb/subdb/lib/db.filter.len.r create mode 100644 detectors/cds/tools/chlorodb/subdb/lib/db.filter.pat.awk create mode 100644 detectors/cds/tools/chlorodb/subdb/lib/db.filter.sym.awk create mode 100644 detectors/cds/tools/chlorodb/subdb/lib/db.getlen.awk create mode 100644 detectors/cds/tools/chlorodb/subdb/lib/db.reportcc.awk create mode 100644 detectors/cds/tools/chlorodb/subdb/lib/db.selcc.awk create mode 100644 detectors/cds/tools/chlorodb/subdb/lib/db.subdb.awk create mode 100644 detectors/cds/tools/chlorodb/subdb/lib/db.todl.awk create mode 100644 detectors/cds/tools/lib/cds2fasta.awk rename detectors/cds/tools/lib/{compareCds.awk => compare.cds.awk} (100%) create mode 100644 detectors/cds/tools/lib/embl.cds_long.awk create mode 100644 detectors/cds/tools/lib/embl.info.awk create mode 100644 detectors/cds/tools/lib/embl.intron.awk create mode 100644 detectors/cds/tools/lib/embl.tofasta.awk create mode 100644 detectors/cds/tools/lib/gbk.cds_long.awk create mode 100644 detectors/cds/tools/lib/gbk.info.awk create mode 100644 detectors/cds/tools/lib/gbk.intron.awk create mode 100644 detectors/cds/tools/lib/gbk.tofasta.awk create mode 100755 detectors/cds/tools/lib/install.rpackages.r create mode 100755 detectors/cds/tools/lib/make.models.r create mode 100755 detectors/cds/tools/lib/plot.models.r create mode 100755 detectors/cds/tools/lib/summarize_cmp.r create mode 100644 detectors/cds/tools/lib/summary.cmp.awk create mode 100644 detectors/cds/tools/lib/util.base.r create mode 100644 detectors/cds/tools/lib/util.cons.r create mode 100644 detectors/cds/tools/lib/util.grid.r create mode 100644 detectors/cds/tools/lib/util.modelio.r create mode 100644 detectors/cds/tools/lib/util.plot.r diff --git a/TODO b/TODO index 062a3fa..66e715a 100644 --- a/TODO +++ b/TODO @@ -12,5 +12,9 @@ o CDS speedup à tester o CDS ajouter tools/dbchloro et tools/compare -o $red +o concurency issue in formatdb + +o parameters in go_subdb.sh + +o models in DB_DIR diff --git a/data/cds/chlorodb/fasta/AC_000188.fst.gz b/data/cds/chlorodb/fasta/AC_000188.fst.gz index f4842c3b064c42d01c06de171b802bcb02dfe24a..b52e08f97067ce56b5bae1b98e1dc0e70932bc81 100644 GIT binary patch delta 18 acmdn`hiU5{CU*I54vvy5&KueF_5lD(DhF2p delta 18 Zcmdn`hiU5{CU*I54i5cHr;Y4-`v6A32BrW2 diff --git a/data/cds/chlorodb/fasta/NC_000925.fst.gz b/data/cds/chlorodb/fasta/NC_000925.fst.gz index e44f5b5a948316c72bbe32de6802b826ea85865e..e0321cb47f5c72c222b745f6e6d98e9c68152401 100644 GIT binary patch delta 18 acmbPxfqCu)W_I~*4vvy5&KudqUH||>)du4L delta 18 ZcmbPxfqCu)W_I~*4i5cHr;Y4lF91Gk1~LEu diff --git a/data/cds/chlorodb/fasta/NC_000926.fst.gz b/data/cds/chlorodb/fasta/NC_000926.fst.gz index 4b9501f5b67d1f1caedef70147f16685b01f440a..63d7a7db2f7b83ef6aa5d58bfebabae66c9441c8 100644 GIT binary patch delta 18 acmbQXf@#_cCU*I54vvy5&KueJrvLyvmj);R delta 18 ZcmbQXf@#_cCU*I54i5cHr;Y6VQvf(E1$O`d diff --git a/data/cds/chlorodb/fasta/NC_000927.fst.gz b/data/cds/chlorodb/fasta/NC_000927.fst.gz index 1bfc1c8d2582c9c94e5ab3df4acf64624d075381..10566415e3a54551d00f46073da9054891be52f1 100644 GIT binary patch delta 18 acmaF&hWXtaW_I~*4vvy5&Kud&zX1SIS_m8f delta 18 ZcmaF&hWXtaW_I~*4i5cHr;Y6C-vCVT2WtQT diff --git a/data/cds/chlorodb/fasta/NC_000932.fst.gz b/data/cds/chlorodb/fasta/NC_000932.fst.gz index 584fead3aa6484da1093ffac852a30938a7b3066..6fbda8b26c7d5d25552ad13defb72e21c9990862 100644 GIT binary patch delta 18 acmdn+lWD_GCU*I54vvy5&KucR?g0Qx90$Mv delta 18 acmdn+lWD_GCU*I54i5cHr;Y3@_W%G!vIh?U diff --git a/data/cds/chlorodb/fasta/NC_001319.fst.gz b/data/cds/chlorodb/fasta/NC_001319.fst.gz index af37fb4be5fe457ffb4ab8f7afce623e1e284dbe..810b8db312cc42dba775648e6546e3e683077e1a 100644 GIT binary patch delta 18 ZcmZo$$keuwiCw;%gQMh%^G5di2>?2Z24(;N delta 18 ZcmZo$$keuwiCw;%gF`>lX(N061OPT51+@SG diff --git a/data/cds/chlorodb/fasta/NC_001320.fst.gz b/data/cds/chlorodb/fasta/NC_001320.fst.gz index feae685e996cd1011aa80ad27e44976584898854..4c048fd7c07aeb31acdb0a8f8493d25b20df8f2a 100644 GIT binary patch delta 18 acmdmWifPv=CU*I54vvy5&Kuc{mjVDqvIgk@ delta 18 ZcmdmWifPv=CU*I54i1A%r;Y5!O94So1~~u# diff --git a/data/cds/chlorodb/fasta/NC_001568.fst.gz b/data/cds/chlorodb/fasta/NC_001568.fst.gz index 44e3caa3c9075d6a332ca5f0738e2f617c864b04..907e292132007e8286b33097d6a78fa16478c7f8 100644 GIT binary patch delta 18 ZcmdnGhH>i}Mt1pb4vvy5&KueF!T><^22B6} delta 18 ZcmdnGhH>i}Mt1pb4i1A%r;Y4-VE{am1)Tr@ diff --git a/data/cds/chlorodb/fasta/NC_001603.fst.gz b/data/cds/chlorodb/fasta/NC_001603.fst.gz index 6f9a8d19bab52eb890b50b54d4d12f0d4cde8df2..d1c0b811c75489b0f212b4af1de98c7b85eb2bca 100644 GIT binary patch delta 18 acmZ3phiT0oCU*I54vvy5&KucP=K%mh4+fk7 delta 18 ZcmZ3phiT0oCU*I54i1A%r;Y5Y^8h`p1?&I- diff --git a/data/cds/chlorodb/fasta/NC_001631.fst.gz b/data/cds/chlorodb/fasta/NC_001631.fst.gz index 90533e2eed641a3609e31493496e2648a03a585d..ac33655083ac41aea1c27962e3490fc6892f51fc 100644 GIT binary patch delta 18 ZcmeBL#?-ZpiCw;%gQMh%^G0^&$pAXE1^)m5 delta 18 ZcmeBL#?-ZpiCw;%gTo-xX(K!HWB@i%1y29~ diff --git a/data/cds/chlorodb/fasta/NC_001666.fst.gz b/data/cds/chlorodb/fasta/NC_001666.fst.gz index a64bc3c8ccb4647afd1ae9bda25c3f4889dbb577..f3a9ae98ab4359402b82b028fd6cd22974d28d33 100644 GIT binary patch delta 18 acmbPxgK6#!CU*I54vvy5&Kudq)&KxQbOyBm delta 18 ZcmbPxgK6#!CU*I54i1A%r;Y4lYXCnH1_b~B diff --git a/data/cds/chlorodb/fasta/NC_001675.fst.gz b/data/cds/chlorodb/fasta/NC_001675.fst.gz index 76b6c7f5abe24324f13514170715045e7dafb3f4..131d11261b5bee6179ba227becacd73b9eca92b7 100644 GIT binary patch delta 18 ZcmeA?%G7z3iCw;%gQMh%^G5cjMF2lx2FU;b delta 18 ZcmeA?%G7z3iCw;%gTo-xX(M~nA^>)d1z-RG diff --git a/data/cds/chlorodb/fasta/NC_001865.fst.gz b/data/cds/chlorodb/fasta/NC_001865.fst.gz index 0ffbd6c2bf9e68cfc8b5b6e4a1c04de82e1b3500..10a1bfe711c4acba614355eec213759705a4c1e1 100644 GIT binary patch delta 18 acmbRBjA_<0CU*I54vvy5&KucM51%vrS2ABW< diff --git a/data/cds/chlorodb/fasta/NC_002693.fst.gz b/data/cds/chlorodb/fasta/NC_002693.fst.gz index a02a4348e7af27269590562221c8f304c011e138..22ac1f2b1537f16c65abb7561aab1362aa650d96 100644 GIT binary patch delta 18 ZcmeB}z}zu`nO(k{gQMh%^G0^Y6970C1_S^A delta 18 ZcmeB}z}zu`nO(k{gTo-xX(K!12>>&*1yle4 diff --git a/data/cds/chlorodb/fasta/NC_002694.fst.gz b/data/cds/chlorodb/fasta/NC_002694.fst.gz index fe10b0a9c5b45ccc84d7a450be046d705615faa5..b75dc302ce2e75fe1ed1d227ed4259e5b0a1bf34 100644 GIT binary patch delta 18 acmX^8j_LF}CU*I54vvy5&KucXwgUi6a|d<+ delta 18 ZcmX^8j_LF}CU*I54i1A%r;Y3`+W|-r2F3sY diff --git a/data/cds/chlorodb/fasta/NC_002762.fst.gz b/data/cds/chlorodb/fasta/NC_002762.fst.gz index fcac93cb9968088ca6083d6f092e0a37feb568ea..f391cb5676079fb29b995fa91a520a3db4f912f4 100644 GIT binary patch delta 18 ZcmeA_#ngX_iCw;%gQMh%^G0@#r2s$C250~P delta 18 ZcmeA_#ngX_iCw;%gTo-xX(KzwQUE({1-JkJ diff --git a/data/cds/chlorodb/fasta/NC_003119.fst.gz b/data/cds/chlorodb/fasta/NC_003119.fst.gz index cd4cfb51b9a7a4198f3397717f7144dcd8e466dc..70cbde2c5dc77c0c188b2950238a883399843c43 100644 GIT binary patch delta 18 acmZ3wnrZ23CU*I54vvy5&Kue1O$7iz0tVaw delta 18 acmZ3wnrZ23CU*I54i1A%r;Y6MrUC#vp9U-d diff --git a/data/cds/chlorodb/fasta/NC_003386.fst.gz b/data/cds/chlorodb/fasta/NC_003386.fst.gz index 1aa50f1d82b71dc04e9e2fa0b1d1071c9d1241ac..857a5a0386a1eda44d3d476354a0504d54a92fcf 100644 GIT binary patch delta 18 acmX?giRsiOCU*I54vvy5&KudCR{{V?-UlrJ delta 18 ZcmX?giRsiOCU*I54i1A%r;Y5+D*;4%27Lek diff --git a/data/cds/chlorodb/fasta/NC_004115.fst.gz b/data/cds/chlorodb/fasta/NC_004115.fst.gz index 88d5d660f10df17d62d10342df679d43e04b9a5f..793905d0e0a557b6363a4416833dfd0ef7ac428f 100644 GIT binary patch delta 18 acmeyhlj+w^CU*I54vvy5&Kuc3&jA2US_l3B delta 18 acmeyhlj+w^CU*I54i1A%r;Y5N=Kugm_Xkb@ diff --git a/data/cds/chlorodb/fasta/NC_004543.fst.gz b/data/cds/chlorodb/fasta/NC_004543.fst.gz index 74684ba43b37c365c9f36f2b252ea8bb37562687..11dca985303e437664e3e721e63973afd57813f5 100644 GIT binary patch delta 18 Zcmdne#=NDCnO(k{gQMh%^G0^v!vH+r25$fW delta 18 Zcmdne#=NDCnO(k{gTo-xX(PMtVE{OM1-}3Q diff --git a/data/cds/chlorodb/fasta/NC_004561.fst.gz b/data/cds/chlorodb/fasta/NC_004561.fst.gz index 1082a524c30db31b6dbaa2842263acec16921a37..cacd7293a4e6bb2b983db36bff96fced81cfa0d1 100644 GIT binary patch delta 18 acmX^1pXu0tCU*I54vx|*&KueH?*{-*;s_D| delta 18 acmX^1pXu0tCU*I54i1A%r;Y6U_X7Y*cn4ts diff --git a/data/cds/chlorodb/fasta/NC_004677.fst.gz b/data/cds/chlorodb/fasta/NC_004677.fst.gz index 809e6b7d70b4ed90885b81f577a7e255b6a51c91..20d33e0ecf425c61b9f9e52fd1111d0ec1deefbc 100644 GIT binary patch delta 18 ZcmexAkLmwBCU*I54vx|*&Kub)`T diff --git a/data/cds/chlorodb/fasta/NC_004766.fst.gz b/data/cds/chlorodb/fasta/NC_004766.fst.gz index c13006a2b4ebffbdd407b79cfdea2434ddccbabb..b4bc8271fb2f7564faa0875973241ae15705b203 100644 GIT binary patch delta 18 acmaF*k?HA2CU*I54vx|*&Kue9?EnB#W(Z6G delta 18 acmaF*k?HA2CU*I54i1A%r;Y6Qb^riO{0Ex= diff --git a/data/cds/chlorodb/fasta/NC_004799.fst.gz b/data/cds/chlorodb/fasta/NC_004799.fst.gz index 4bdb5289a9ace99f4ef0c70ee32986276c813ca6..6068441231557c3c958b968dc5f092854f81e224 100644 GIT binary patch delta 18 acmcccn(4x8CU*I54vx|*&KucJZUq2M$_M@c delta 18 acmcccn(4x8CU*I54i1A%r;Y32UP$7 delta 18 Zcmcc6%Y31inO(k{gTo-xX(Ri|V*oxZ2BZK0 diff --git a/data/cds/chlorodb/fasta/NC_005087.fst.gz b/data/cds/chlorodb/fasta/NC_005087.fst.gz index c547133934b2e999c44e355a2b591476cb7805c8..db1b3bb6ba98f1b8d665f6d3c380fecbbd06ffad 100644 GIT binary patch delta 18 acmX@Tgz5AWCU*I54vx|*&KucXCIJ9LUk1Ja delta 18 ZcmX@Tgz5AWCU*I54i1A%r;Y3`lK?*T1`PlJ diff --git a/data/cds/chlorodb/fasta/NC_005353.fst.gz b/data/cds/chlorodb/fasta/NC_005353.fst.gz index 8d70fe3623f53dc2bc0c8ae095e2a2cac6e4a533..aa91114bc087876455152e67730c2aab8c36a393 100644 GIT binary patch delta 18 acmZ2}lX>|~W_I~*4vx|*&Kubmya514RR@>= delta 18 acmZ2}lX>|~W_I~*4i1A%r;Y3j-T(kW>jvil diff --git a/data/cds/chlorodb/fasta/NC_005878.fst.gz b/data/cds/chlorodb/fasta/NC_005878.fst.gz index 8659698cbcf2b157d11387ce41d08cee029bb147..5e77ec14823f4733dafc4d7f1cc159ff2059f7e2 100644 GIT binary patch delta 18 acmaELlj+q>CU*I54vx|*&KubuuK@s0AqXD; delta 18 acmaELlj+q>CU*I54i1A%r;Y57*8l)Yw+C(j diff --git a/data/cds/chlorodb/fasta/NC_005973.fst.gz b/data/cds/chlorodb/fasta/NC_005973.fst.gz index 3bd7e1fe79220c798daaa62762b9bbd0608a2808..c0d61046fa0c21f8d5097f80cc8e3f58354a7434 100644 GIT binary patch delta 18 acmZ2_ifQR7CU*I54vx|*&Kud~mI44m+6Jot delta 18 ZcmZ2_ifQR7CU*I54i1A%r;Y4#O94J`1^NI0 diff --git a/data/cds/chlorodb/fasta/NC_006050.fst.gz b/data/cds/chlorodb/fasta/NC_006050.fst.gz index cf05aa0980c9f2d39819819c94d2636f04d83701..1c2a90f467349dd281f91cd09fc7558e321e38f5 100644 GIT binary patch delta 18 ZcmZ3`!Mvb@nO(k{gQN6{^G0^bBLF&S1~~u# delta 18 ZcmZ3`!Mvb@nO(k{gTo-xX(PMj5dby+1&9Cu diff --git a/data/cds/chlorodb/fasta/NC_006084.fst.gz b/data/cds/chlorodb/fasta/NC_006084.fst.gz index 825c3c70b9d518928f9516140ce60bbdf8fec53e..72f66214657a2ef8e47a747468665205947a2e0e 100644 GIT binary patch delta 18 acmex$lj+w@CU*I54vx|*&Kuc3uK@s2Q3y`} delta 18 acmex$lj+w@CU*I54i1A%r;Y5N*8l)a=Lenu diff --git a/data/cds/chlorodb/fasta/NC_006137.fst.gz b/data/cds/chlorodb/fasta/NC_006137.fst.gz index 19a088ab8fdc464b1dcd5a11db75128d462c38de..a77a31c94e9bebfbceba69647219630bc206e244 100644 GIT binary patch delta 18 acmaF6llkpVW_I~*4vx|*&KudE-2nhg_XrvQ delta 18 acmaF6llkpVW_I~*4i1A%r;Y5-?f?KsjR$D} diff --git a/data/cds/chlorodb/fasta/NC_006290.fst.gz b/data/cds/chlorodb/fasta/NC_006290.fst.gz index 059ae338dc07183469b4b526dc8b6339ca988dc5..e8d74e369d601b2a3748d9dfe6bab1a9d91dcb2f 100644 GIT binary patch delta 18 acmbRHk7@2dCU*I54vx|*&Kudq_5%P&C;nK#QV1LX delta 18 acmX^8m+AChCU*I54i1A%r;Y4K_5lD&=m%>6 diff --git a/data/cds/chlorodb/fasta/NC_007578.fst.gz b/data/cds/chlorodb/fasta/NC_007578.fst.gz index dc35d20ee65ccf4f87d0983e123503eb4deb5157..18254b11ceea848ad993c139a4042791f40d3dc3 100644 GIT binary patch delta 18 acmdo0m1+N1CU*I54vx|*&Kucx>;eExvIpb< delta 18 acmdo0m1+N1CU*I54i1A%r;Y48b^!oLNCz_j diff --git a/data/cds/chlorodb/fasta/NC_007602.fst.gz b/data/cds/chlorodb/fasta/NC_007602.fst.gz index 318a4891a2a8b3a5fdc942145ac3d7b8fb0f5834..febcf2b5cd0dffdcf6d744d0648048cb3f6d63cf 100644 GIT binary patch delta 18 ZcmZqv%hddriCw;%gQN6{^G5cXeE>yz2Sfk> delta 18 ZcmZqv%hddriCw;%gTo-xX(M~hJ^(=w29p2) diff --git a/data/cds/chlorodb/fasta/NC_007898.fst.gz b/data/cds/chlorodb/fasta/NC_007898.fst.gz index dc02a6b150c0c6daca952a7900c364d2f89a0dd0..ff0236ce3c58a02132785906ad102b21c48ca255 100644 GIT binary patch delta 18 acmdn+hiStfCU*I54vx|*&Kub^_W=M(f(J2Q~lz delta 18 Zcmey?#{8{~nO(k{gTpY>X(N07VE{pi28I9t diff --git a/data/cds/chlorodb/fasta/NC_007957.fst.gz b/data/cds/chlorodb/fasta/NC_007957.fst.gz index 3426db7eadbd0547ebef610e8fee184b0f37a879..34a4a152db5cde6ef65229fbe984a9f0c6a9d848 100644 GIT binary patch delta 18 ZcmbQ+$vn4{nO(k{gQN6{^G5b*M*uq?2C@JE delta 18 ZcmbQ+$vn4{nO(k{gTpY>X(RizBLFtM1_A&8 diff --git a/data/cds/chlorodb/fasta/NC_007977.fst.gz b/data/cds/chlorodb/fasta/NC_007977.fst.gz index 050f99ea1ae19cd68cc2e8f03c5be269f8004461..2df2fd9f134ca4e68a9ed4eb62a3a0ec981bd300 100644 GIT binary patch delta 18 acmbRJk!kivCU*I54vx|*&KudM>;M2qNC$2J delta 18 acmbRJk!kivCU*I54i3Xir;Y4Wb^riE`m delta 18 ZcmbR9hiT3qCU*I54i3Xir;Y5Q`v5~@23-IE diff --git a/data/cds/chlorodb/fasta/NC_008097.fst.gz b/data/cds/chlorodb/fasta/NC_008097.fst.gz index d55e79426f381757f0017ff9079e9a92074d4294..9c4c037caa71de1410ec13b9f9e436dfcf77aceb 100644 GIT binary patch delta 18 acmeyqk@@>ZW_I~*4vx|*&Kuc3+yDSfSqLNm delta 18 acmeyqk@@>ZW_I~*4i3Xir;Y3%ZU6vB_6KwT diff --git a/data/cds/chlorodb/fasta/NC_008099.fst.gz b/data/cds/chlorodb/fasta/NC_008099.fst.gz index 79f1308256dc63bcce9b89fdb56c626a27b54caa..9eed1a0ed14261ffc0eb070b5f8dd459bf64c781 100644 GIT binary patch delta 18 acmX^6is|etCU*I54vx|*&Kud?wgLc5LI-mI delta 18 ZcmX^6is|etCU*I54i3Xir;Y4xTLDMk2EzaV diff --git a/data/cds/chlorodb/fasta/NC_008100.fst.gz b/data/cds/chlorodb/fasta/NC_008100.fst.gz index 702ad815515517012dfefaca9bb848abce51e950..ddd585007999772d7a43a813e98f67d5685777b2 100644 GIT binary patch delta 16 XcmdlNwJ(ZYzMF%i^osLFc5__-G`R(u delta 16 XcmdlNwJ(ZYzMF%?Fw;M2ydX(RiD!vHm_1?vC+ diff --git a/data/cds/chlorodb/fasta/NC_008116.fst.gz b/data/cds/chlorodb/fasta/NC_008116.fst.gz index 96d29e47dd1964d0c014c1c190964957ee14c9d9..32f1c9858c730d89b72ce853d6a92d62a657bace 100644 GIT binary patch delta 18 acmZ4ShiSzhCU*I54vx|*&Kubk_W=M&Y6md@ delta 18 ZcmZ4ShiSzhCU*I54i3Xir;Y52`v64;27v$o diff --git a/data/cds/chlorodb/fasta/NC_008117.fst.gz b/data/cds/chlorodb/fasta/NC_008117.fst.gz index aacc0949c120e8822ad7e3f201fd5a791e781636..153eda2dbd9a889fcc13bc6f98a7fcd885b0aacb 100644 GIT binary patch delta 18 ZcmbQ%$2_f%nO(k{gQN6{^G0_5;{Z9x1}Xpm delta 18 ZcmbQ%$2_f%nO(k{gTpY>X(K!TaR4=C1$qDg diff --git a/data/cds/chlorodb/fasta/NC_008155.fst.gz b/data/cds/chlorodb/fasta/NC_008155.fst.gz index 560ef24728aefbe1e1e7052e8a7a57ab940f0d88..a781ff87e698e97ae413e10d067084c88f8b5d35 100644 GIT binary patch delta 18 acmZ2-ifPFyCU*I54vx|*&KucfmjVDnw+5&H delta 18 ZcmZ2-ifPFyCU*I54i3Xir;Y5gO94Jq1^55} diff --git a/data/cds/chlorodb/fasta/NC_008235.fst.gz b/data/cds/chlorodb/fasta/NC_008235.fst.gz index 8f5b5a28461f04dfb7fd4cc19273697eba6f52c5..d80a3f3be013b391ed14dc70292c926aeef9ef66 100644 GIT binary patch delta 18 acmcclm+9tTCU*I54vx|*&Kub;?E?T&JP1Yr delta 18 acmcclm+9tTCU*I54i3Xir;Y5F_5lD)*$0*Y diff --git a/data/cds/chlorodb/fasta/NC_008289.fst.gz b/data/cds/chlorodb/fasta/NC_008289.fst.gz index 25041ee50cea973ae33bd64ca5a91f8bae8b76e6..a3253a7e82ccb7b2f9d54b289cc6d00a38d1b073 100644 GIT binary patch delta 18 ZcmZqQ$k@J-kzKxX(M|>1OPYe1)u-` diff --git a/data/cds/chlorodb/fasta/NC_008325.fst.gz b/data/cds/chlorodb/fasta/NC_008325.fst.gz index cf5bc52388e2cd207666189fa9d0445ba0af3889..849ee385713dbc40bc2c6fa89bbd4b854a85bb81 100644 GIT binary patch delta 18 acmezTm+A9gCU*I54vw-b&Kud^>;nK)(Fm0Q delta 18 acmezTm+A9gCU*I54i3Xir;Y4y_5lD;X9wf} diff --git a/data/cds/chlorodb/fasta/NC_008326.fst.gz b/data/cds/chlorodb/fasta/NC_008326.fst.gz index 9ceff078c5c414699f817df8759bb319c128875a..3f737608f889800d61a0a2a3da53505a8ce06bbf 100644 GIT binary patch delta 18 ZcmZ3~&b+9dnO(k{gQM(<^G5dBhXFg52E70P delta 18 ZcmZ3~&b+9dnO(k{gTpY>X(RjW!vHrd1`GfI diff --git a/data/cds/chlorodb/fasta/NC_008334.fst.gz b/data/cds/chlorodb/fasta/NC_008334.fst.gz index af729dbc3c834563829ff83211037fa576922f3b..aa49af000336e93a8c1490797137b8478f0c1f13 100644 GIT binary patch delta 18 ZcmbQy!91gbnO(k{gQM(<^G0^TBLF#A1|k3e delta 18 ZcmbQy!91gbnO(k{gTpY>X(PMf5dbvq1#tiX diff --git a/data/cds/chlorodb/fasta/NC_008335.fst.gz b/data/cds/chlorodb/fasta/NC_008335.fst.gz index 745f83242c4442126050659e5a250a0d71d01119..3e899a98b827be9f51a53b123842c48f097aa7e0 100644 GIT binary patch delta 18 Zcmey~#r(aCnO(k{gQM(<^G5c9qX0&f2Sfk> delta 18 Zcmey~#r(aCnO(k{gTpY>X(M~VQ2;_J29p2) diff --git a/data/cds/chlorodb/fasta/NC_008336.fst.gz b/data/cds/chlorodb/fasta/NC_008336.fst.gz index 2dfbec1e4de665c8d20acf44a14c66440d1f33d7..e4c7d9afa087f580c5b428a81b3e27b9698b4557 100644 GIT binary patch delta 18 acmccgpXt(nCU*I54vw-b&KucJ?*{--jR-dY delta 18 acmccgpXt(nCU*I54i3Xir;Y5V_X7Y-BL{{6 diff --git a/data/cds/chlorodb/fasta/NC_008359.fst.gz b/data/cds/chlorodb/fasta/NC_008359.fst.gz index 98b893c1b077d6a86e59f50fc94457f8ba55a129..478888bac89dfdc15988f9a52603cfc560d5b5f7 100644 GIT binary patch delta 18 ZcmbQ-%sjc7nO(k{gQM(<^G5cbg8(@T28I9t delta 18 ZcmbQ-%sjc7nO(k{gTpY>X(M~jK>#$N1=Rom diff --git a/data/cds/chlorodb/fasta/NC_008372.fst.gz b/data/cds/chlorodb/fasta/NC_008372.fst.gz index 78249524e0e9803e8b0e993180406adba6b7bfc5..47c3a8ab4743aa7a4d93ce33d251d17b0b35ecd1 100644 GIT binary patch delta 21 ccmeBdX6bBZVVCdb;3&J|+{nI_ow11#07%ycHvj+t delta 21 ccmeBdX6bBZVVCdb;4sW|YGmKa&e+5V076;?h5!Hn diff --git a/data/cds/chlorodb/fasta/NC_008407.fst.gz b/data/cds/chlorodb/fasta/NC_008407.fst.gz index 22801352e77b1866490d2badb92675cc6eddffaf..ad3fb8d210eb5bb5840d6fea12deac67b6fadcab 100644 GIT binary patch delta 18 Zcmey{%lx;OnO(k{gQM(<^G5b>#{fvg2i*Vw delta 18 Zcmey{%lx;OnO(k{gTpY>X(Ri$V*o^22P^;p diff --git a/data/cds/chlorodb/fasta/NC_008408.fst.gz b/data/cds/chlorodb/fasta/NC_008408.fst.gz index 4b45f6b1d57d2a724219f5444d2117d7e6b5bcf5..5910a74236d0e060f84eb8a85a30c38e6effc31f 100644 GIT binary patch delta 18 ZcmX@SjPdX?Mt1pb4vw-b&Kucnf&oG>25JBR delta 18 ZcmX@SjPdX?Mt1pb4i3Xir;Y43!2mtR1-SqK diff --git a/data/cds/chlorodb/fasta/NC_008454.fst.gz b/data/cds/chlorodb/fasta/NC_008454.fst.gz index 07e443cbdb75533e73cb019cf0d1b17fba9fb1ca..e59d3037aa4dde324166e24270e79f0007b355e3 100644 GIT binary patch delta 21 dcmX>yk>$ul7Iyh=4vw-b&W-F_*%|k8002~12MYiI delta 21 ccmX>yk>$ul7Iyh=4i3Xir$+Xz?2LOk08QEkS^xk5 diff --git a/data/cds/chlorodb/fasta/NC_008456.fst.gz b/data/cds/chlorodb/fasta/NC_008456.fst.gz index bf1e179437ee7efacf90985dce9b2d499dc28940..55f00ab0a74d83926a7b17c2c8176aa5a424ae4f 100644 GIT binary patch delta 18 ZcmX@r!F;NNnO(k{gQM(<^G0^(BLF}y2DktK delta 18 ZcmX@r!F;NNnO(k{gTpY>X(PMy5db^H1_uBD diff --git a/data/cds/chlorodb/fasta/NC_008457.fst.gz b/data/cds/chlorodb/fasta/NC_008457.fst.gz index 123a1431a822bedfacdf3258aa32a80fad10e6d5..461e47f88fa5978510f3102549bb36a06a3b7eae 100644 GIT binary patch delta 18 ZcmX@t&U~(&nO(k{gQM(<^G5dLhXFyF2SES; delta 18 ZcmX@t&U~(&nO(k{gTpY>X(Rjb!vH-n29N*% diff --git a/data/cds/chlorodb/fasta/NC_008535.fst.gz b/data/cds/chlorodb/fasta/NC_008535.fst.gz index 0fbd7fbb3afdc65a1b5dc8977da7cdf1fda36772..9979d79f3ff914ce49dd51fac0eb24c23b45f262 100644 GIT binary patch delta 18 ZcmZqv&D8vxiCw;%gQM(<^G5cXy#Pf*2S5M- delta 18 ZcmZqv&D8vxiCw;%gTpY>X(M~hUI0MY29E#$ diff --git a/data/cds/chlorodb/fasta/NC_008588.fst.gz b/data/cds/chlorodb/fasta/NC_008588.fst.gz index bc8fdcafa5766e445fef9222fc3e0337a3ecede0..3572a6ecaed5a06e906c899aef6b44bbea207ce5 100644 GIT binary patch delta 18 acmZ2KmudZ6CU*I54vw-b&KucR^Z@`rwFcP$ delta 18 ZcmZ2KmudZ6CU*I54i3Xir;Y3@`T#pi1}Fdk diff --git a/data/cds/chlorodb/fasta/NC_008589.fst.gz b/data/cds/chlorodb/fasta/NC_008589.fst.gz index bb5bbd0dc5c39cf146def6417143afe5cba13766..f30fb4ccb6c67f98098c95a08a267b9072739114 100644 GIT binary patch delta 18 acmZ3zjcN5ZCU*I54vw-b&KucPW&;30JqC;b delta 18 ZcmZ3zjcN5ZCU*I54i3Xir;Y3?vjIHQ1=|1s diff --git a/data/cds/chlorodb/fasta/NC_008590.fst.gz b/data/cds/chlorodb/fasta/NC_008590.fst.gz index 8a4b33ca0252b2d3fba62512a0b13b17ed0cc1cd..116ff312deef8c8efab55aa33ffbd10061a2d637 100644 GIT binary patch delta 18 acmaENj_KVwCU*I54vw-b&Kud&mjeJzS_hE; delta 18 ZcmaENj_KVwCU*I54i3Xir;Y6C%K=F62H*ey diff --git a/data/cds/chlorodb/fasta/NC_008591.fst.gz b/data/cds/chlorodb/fasta/NC_008591.fst.gz index 3368d94bc54ec464de7e9459581ffbd90db17c6c..53d86492c2c98c58349f0bf19a7ed2166eb4fd3a 100644 GIT binary patch delta 18 acmaEGp6S7PCU*I54vw-b&KucpE(ZWij|b@h delta 18 acmaEGp6S7PCU*I54i3Xir;Y44mjeJuB?mYF diff --git a/data/cds/chlorodb/fasta/NC_008602.fst.gz b/data/cds/chlorodb/fasta/NC_008602.fst.gz index 431e4347be217d7622244a7191adb9081ddd3dcf..0853868442e548e9cc9b013ddabd0e82c00e0b2a 100644 GIT binary patch delta 18 acmbPmlWD?DCU*I54vw-b&Kub~*8l)Q+6NK< delta 18 ZcmbPmlWD?DCU*I54i3Xir;Y5LYXClQ24MgI diff --git a/data/cds/chlorodb/fasta/NC_008641.fst.gz b/data/cds/chlorodb/fasta/NC_008641.fst.gz index ddbd83374ab4c5318f9a3fd4c1d8b8becde971cd..f5c440a12ab6c8f08d07f4f1d1982c0252964bd4 100644 GIT binary patch delta 18 Zcmcc8&U~evnO(k{gQM(<^G5cwhXF!t2U7q5 delta 18 Zcmcc8&U~evnO(k{gTpY>X(RjD!vH=42BH7} diff --git a/data/cds/chlorodb/fasta/NC_008788.fst.gz b/data/cds/chlorodb/fasta/NC_008788.fst.gz index 57acf428a2367a7d9220bf5b8c6fdcdb3cfc8b4b..8fdf4526a086e188780de4a2aedd1855a3e0bea0 100644 GIT binary patch delta 18 ZcmbQ&#XPTznO(k{gQM(<^G0^@qX0T-1~~u# delta 18 ZcmbQ&#XPTznO(k{gTpY>X(PM%Q2;gn1&9Cu diff --git a/data/cds/chlorodb/fasta/NC_008796.fst.gz b/data/cds/chlorodb/fasta/NC_008796.fst.gz index e59c87a1c34a05cf5e00e204888a38f14ff6f1c5..70357485c73fa39638c94b40eb6f0eb53a89a499 100644 GIT binary patch delta 18 acmdn|n`!fJCU*I54vw-b&Kud+>;(Wz(g)B0 delta 18 acmdn|n`!fJCU*I54i3Xir;Y4u_5uJ$Xa^qv diff --git a/data/cds/chlorodb/fasta/NC_008822.fst.gz b/data/cds/chlorodb/fasta/NC_008822.fst.gz index b68566473d913b2b9f60026afeb76486c9c55498..afab3bdcafcdb1c7cac3b55db8ce00148dd9db0d 100644 GIT binary patch delta 18 acmX^And$szCU*I54vw-b&KucJ>;wQ#st6DO delta 18 acmX^And$szCU*I54i3Xir;Y3 diff --git a/data/cds/chlorodb/fasta/NC_009259.fst.gz b/data/cds/chlorodb/fasta/NC_009259.fst.gz index d4b3622822b7a53f061eba0a95de8371753c6146..83932a219551a44991978e550e6c21aee647eea2 100644 GIT binary patch delta 18 acmdnIR0qfa delta 18 acmdngK5_fCU*I54vw-b&Kuc{_W%G(X$M{a delta 18 Zcmdn>gK5_fCU*I54i2MCr;Y5!djLlU2Ce`A diff --git a/data/cds/chlorodb/fasta/NC_009267.fst.gz b/data/cds/chlorodb/fasta/NC_009267.fst.gz index e3235b346a2e974a7d65f60a04e34c2a22f429e2..093a7f819652717a1dc668681bb6f9e619aa3463 100644 GIT binary patch delta 18 acmbRIi)r#NCU*I54vw-b&Kucz_5uJ#QwHt; delta 18 ZcmbRIi)r#NCU*I54i2MCr;Y49djUc420j1) diff --git a/data/cds/chlorodb/fasta/NC_009268.fst.gz b/data/cds/chlorodb/fasta/NC_009268.fst.gz index ccdf24615a55cd690c8a50ae68db116853fa5087..5e4731fc0ac0a63366f734faaa11da299ea218c2 100644 GIT binary patch delta 18 acmdn=ooUl|CU*I54vw-b&KucR?*;%%F$co{ delta 18 acmdn=ooUl|CU*I54i2MCr;Y5ZcLM-M&Ic0! diff --git a/data/cds/chlorodb/fasta/NC_009269.fst.gz b/data/cds/chlorodb/fasta/NC_009269.fst.gz index f32b48984e5d203f193f62126cc71e7deaa550ee..b2418ef09a0325eeeb224e3a5fa2eb541fff54ac 100644 GIT binary patch delta 18 acmX^1lj+z`CU*I54vw-b&KueH?*RZ#EC>Vu delta 18 acmX^1lj+z`CU*I54i2MCr;Y6U_W%G%$p=&b diff --git a/data/cds/chlorodb/fasta/NC_009270.fst.gz b/data/cds/chlorodb/fasta/NC_009270.fst.gz index edfdceffeba2f858ce3ac3fa5ff19c21962ac328..a5d1566b8f25ed752af47dd8e6dfd17595e52f82 100644 GIT binary patch delta 18 acmX@~lj+b;CU*I54vw-b&Kucx?*RZ!pa=K> delta 18 acmX@~lj+b;CU*I54i2MCr;Y5p_W%G%JqJht diff --git a/data/cds/chlorodb/fasta/NC_009271.fst.gz b/data/cds/chlorodb/fasta/NC_009271.fst.gz index b45c20befd892084739e2042bb52433ba4fbf72d..0e101a57bb4eb8f0c0aa0e4473f1fbddd04257bd 100644 GIT binary patch delta 18 acmccii|N`gCU*I54vw-b&KueN_W}S delta 18 acmca`n(4x6CU*I54i2MCr;Y3wR12Sfk> delta 18 ZcmeDD%GCLliCw;%gTpA(X(M~nE&xFE29p2) diff --git a/data/cds/chlorodb/fasta/NC_009618.fst.gz b/data/cds/chlorodb/fasta/NC_009618.fst.gz index 9004afe9ab70a45aa3f74206af02e0fc9558b880..30d2f2415af35b999d81de10e8fda82ef50a7729 100644 GIT binary patch delta 18 ZcmX@!&wRX}nO(k{gQNV4^G5aq#{og82SES; delta 18 ZcmX@!&wRX}nO(k{gTpA(X(RiA;{ZKA29N*% diff --git a/data/cds/chlorodb/fasta/NC_009681.fst.gz b/data/cds/chlorodb/fasta/NC_009681.fst.gz index 84c4bae0907636463e6982331cf166fd6e486e26..f149b20cf42d20cde62db331f9a44185a74e4cad 100644 GIT binary patch delta 18 acmbPtnt9%7W_I~*4vz9G&KudMKLr3oZwFie delta 18 acmbPtnt9%7W_I~*4i2MCr;Y5>p8^0s1qQ1C diff --git a/data/cds/chlorodb/fasta/NC_009765.fst.gz b/data/cds/chlorodb/fasta/NC_009765.fst.gz index a0fde90317ea8cd48071e0774514ac1d237ece8d..48213251ed39c8bec294842ce33b36d9fdd5c48e 100644 GIT binary patch delta 18 acmaEHmGQ+@Mt1pb4vz9G&KubuW&r?B4hPQw delta 18 ZcmaEHmGQ+@Mt1pb4i2MCr;Y3nvj9n?2Oa;nK(GzfA4 delta 18 acmaFk1?~U< diff --git a/data/cds/chlorodb/fasta/NC_010361.fst.gz b/data/cds/chlorodb/fasta/NC_010361.fst.gz index 5e1d051a053e62dedbcb92ddc11763d44a288c9e..cd12d0f97017dd069f54482e169f4abd2bb530a0 100644 GIT binary patch delta 18 ZcmZqaXKv|dW|!~g;3&W1ypg^3H~=_*26zAf delta 18 ZcmZqaXKv|dW|!~g;4sQ`+Q?pe8~`*G1;+pY diff --git a/data/cds/chlorodb/fasta/NC_010362.fst.gz b/data/cds/chlorodb/fasta/NC_010362.fst.gz index a122408a84afbde127ec650ffa9c8178167f21d2..6b202aaa63768822e28dcc601fb9d5cca327a3b8 100644 GIT binary patch delta 18 ZcmX@r!+ffTnO(k{gQNV4^G0^(V*o(22EzaV delta 18 ZcmX@r!+ffTnO(k{gTpA(X(PMyF#tSC1`+@O diff --git a/data/cds/chlorodb/fasta/NC_010433.fst.gz b/data/cds/chlorodb/fasta/NC_010433.fst.gz index bc0cd8e5ff4fac6bf6c05a08757b1d73cdc25d31..4d3045b38bd87a3ffa42a33ddb1d1a31228627ef 100644 GIT binary patch delta 18 Zcmcc6&U~SrnO(k{gQNV4^G5cQhXFz72S@+_ delta 18 Zcmcc6&U~SrnO(k{gTpA(X(Ri|!vH;f2A2Q; diff --git a/data/cds/chlorodb/fasta/NC_010442.fst.gz b/data/cds/chlorodb/fasta/NC_010442.fst.gz index 1f7932eea11d7e0374069e6f44d36c462d01125d..06f9575eea5a8d626caf6cb79eef85b6c707159c 100644 GIT binary patch delta 18 ZcmaFb!Thv?nO(k{gQNV4^G5c#BLG9@2MPcH delta 18 ZcmaFb!Thv?nO(k{gTpA(X(M~w5dc4Y23Y_A diff --git a/data/cds/chlorodb/fasta/NC_010548.fst.gz b/data/cds/chlorodb/fasta/NC_010548.fst.gz index 38c30be49d3fcf81657f5f611230277c70258bf3..4779c4ef7a01408be86de9a5b3c26f2ae7c7108d 100644 GIT binary patch delta 18 acmexzfa%KtCU*I54vz9G&Kuct7XScEdIy03 delta 18 Zcmexzfa%KtCU*I54i2MCr;Y5n3jjzE2G9Ti diff --git a/data/cds/chlorodb/fasta/NC_010601.fst.gz b/data/cds/chlorodb/fasta/NC_010601.fst.gz index a74d0e34fbac561cb0714d0f5779e1337150c673..95ebb70efc51227537de9ee744c0ff275249d8a8 100644 GIT binary patch delta 18 acmdn@nQ7l=CU*I54vz9G&Kudc?*sr$UI*R) delta 18 acmdn@nQ7l=CU*I54i2MCr;Y5}cLD%M^am{f diff --git a/data/cds/chlorodb/fasta/NC_010654.fst.gz b/data/cds/chlorodb/fasta/NC_010654.fst.gz index 5851ea856938f8356d49591d19d89849688e7d5c..a87ba749c1dea7c51a5edebc3585a40902ac646c 100644 GIT binary patch delta 18 acmaE~i0RQHCU*I54vz9G&KudICjtOQQwIP5 delta 18 ZcmaE~i0RQHCU*I54i2MCr;Y5<69GZ#22TJ0 diff --git a/data/cds/chlorodb/fasta/NC_010772.fst.gz b/data/cds/chlorodb/fasta/NC_010772.fst.gz index d18fb56f6f3651d8463ca930e6b8267b0c7fb92e..8f6da795aa8f1185dca539519b983e18adcc631e 100644 GIT binary patch delta 18 ZcmZo|U~X+-W|!~g;3&W1ypjFiegHSg2Gsxn delta 18 ZcmZo|U~X+-W|!~g;4sQ`+Q|NIKL9gd1|$Fg diff --git a/data/cds/chlorodb/fasta/NC_010776.fst.gz b/data/cds/chlorodb/fasta/NC_010776.fst.gz index a847f1b0c24a6af3d92edc43586ff5fc9c99ea9f..e8873b358e9d0787c93f239f2606d2843aceb6c4 100644 GIT binary patch delta 18 ZcmZ3{&b*?XnO(k{gQNV4^G5cChXFiq2G9Ti delta 18 ZcmZ3{&b*?XnO(k{gTpw}X(Ri>!vHu81|R?c diff --git a/data/cds/chlorodb/fasta/NC_011031.fst.gz b/data/cds/chlorodb/fasta/NC_011031.fst.gz index becd7edb308cff843f16abf6f4c777745dfc34a6..9f91a6b49bc0e919d8885693dc43a287b56d1917 100644 GIT binary patch delta 18 ZcmeCb#N2<0nO(k{gQNV4^G0@#mjFRO2EhOT delta 18 ZcmeCb#N2<0nO(k{gTpw}X(KzwO8`9F1`z-N diff --git a/data/cds/chlorodb/fasta/NC_011032.fst.gz b/data/cds/chlorodb/fasta/NC_011032.fst.gz index e558e7c9caac7de3359982e22b03619abd58998e..a88aa22e1683646e903df2926045805e493a16c6 100644 GIT binary patch delta 18 acmZ2@nrY!_CU*I54vvZ|&KuchEd>BWf(Il3 delta 18 acmZ2@nrY!_CU*I54i4i?r;Y5hmI44j7zT3y diff --git a/data/cds/chlorodb/fasta/NC_011152.fst.gz b/data/cds/chlorodb/fasta/NC_011152.fst.gz index 25c96326294d70dc3e50c97eefff7d475ac8a3ad..8bb995273c5f32fa593b3e7dd3df7daa2b2771c3 100644 GIT binary patch delta 18 acmex1lj++`CU*I54vvZ|&Kud^_W%G$`Uj=} delta 18 Zcmex1lj++`CU*I54i4i?r;Y6IdjLd`2K4{{ diff --git a/data/cds/chlorodb/fasta/NC_011153.fst.gz b/data/cds/chlorodb/fasta/NC_011153.fst.gz index 25d860aff5842f6217030c8f8b7ed0f7f840806d..0787f72c0f06d10c078c41ddc41ad0605babf40f 100644 GIT binary patch delta 18 Zcmew`kLklaCU*I54vvZ|&Kub?`vFJB2O$6e delta 18 Zcmew`kLklaCU*I54i4i?r;Y5H{QyH;25!o9WPOCU*I54vvZ|&Kucx_W}Sy9S08p delta 18 ZcmX>!o9WPOCU*I54i4i?r;Y5pdjUPO23`OF diff --git a/data/cds/chlorodb/fasta/NC_011156.fst.gz b/data/cds/chlorodb/fasta/NC_011156.fst.gz index f270fa960f2c496dd50ee8472a30f15c87acafcf..551db98f1a891132d4431743da10873281ba455d 100644 GIT binary patch delta 18 acmX>#m+918CU*I54vvZ|&Kube_W=MybO$T| delta 18 ZcmX>#m+918CU*I54i4i?r;Y4~`v5-*273Si diff --git a/data/cds/chlorodb/fasta/NC_011158.fst.gz b/data/cds/chlorodb/fasta/NC_011158.fst.gz index bfda1f5719efdfa6a9eea60f78a97bc7fc5cc534..d1024048017def0c03af847962c113ea72a4b513 100644 GIT binary patch delta 18 Zcmdloi)qU&CU*I54vvZ|&KucvdjUTb24esK delta 18 Zcmdloi)qU&CU*I54i4i?r;Y5oy#P9@1+oAD diff --git a/data/cds/chlorodb/fasta/NC_011159.fst.gz b/data/cds/chlorodb/fasta/NC_011159.fst.gz index 5f2b7ea03471bad7afbb01f088ef5840fc10576e..6bd8937f14f5dba52b45a3a6b200c520bfa1172a 100644 GIT binary patch delta 18 acmdlplWEUPCU*I54vvZ|&Kudc_5c7u3o! delta 18 ZcmZqcWoqkXVwdmc;4sc~+Q?qt1^_e01&06t diff --git a/data/cds/chlorodb/fasta/NC_012224.fst.gz b/data/cds/chlorodb/fasta/NC_012224.fst.gz index 253a5b391b2cbc8076a3ac5f242d38217c96d316..6b1792c0f1f0311db972327b15d9f030002bed33 100644 GIT binary patch delta 18 ZcmX@y!+f}hnO(k{gQMb#^G0@?V*o$J2Co1B delta 18 ZcmX@y!+f}hnO(k{gTpw}X(PMMF#tPT1^xg4 diff --git a/data/cds/chlorodb/fasta/NC_012568.fst.gz b/data/cds/chlorodb/fasta/NC_012568.fst.gz index f014f7179bd4766cb9d69ba9ab7a5bb7e6707523..9ec8d140f4f89983cad9ae07bb2b0b6c0b8f4ebc 100644 GIT binary patch delta 16 XcmcbUdMA}#zMF%i;)?S|_Nzt!I>!c* delta 16 XcmcbUdMA}#zMF%?IMZn(`&A<0iKnM2# diff --git a/data/cds/chlorodb/fasta/NC_012898.fst.gz b/data/cds/chlorodb/fasta/NC_012898.fst.gz index a23aa4c2d12645de7fb9963f6d556788331a8ca2..df67baacb1ba0eb14de9aef4e179eb040aaa8bb5 100644 GIT binary patch delta 18 ZcmdmahjHf}Mt1pb4vvZ|&Kuc{@&HGL2Gsxn delta 18 ZcmdmahjHf}Mt1pb4i4i?r;Y4Jc>qHj1|$Fg diff --git a/data/cds/chlorodb/fasta/NC_012903.fst.gz b/data/cds/chlorodb/fasta/NC_012903.fst.gz index bfc4b24e58b1b0babd0f70a836b9132ca7be83ff..fb1581234b8491ce941187cb78305c471c9a48bb 100644 GIT binary patch delta 18 ZcmeBq#@O?WkzKx diff --git a/data/cds/chlorodb/fasta/NC_012978.fst.gz b/data/cds/chlorodb/fasta/NC_012978.fst.gz index bde9aa6bf7ef098f52d0500e20b3fc25548a2884..85aef45db7314157e501bb32e99f7acfa2c4c90d 100644 GIT binary patch delta 18 acmdnJlxg=;CU*I54vvZ|&KudcOacHxV+Rue delta 18 acmdnJlxg=;CU*I54i4i?r;Y4eCIJ9F`37PD diff --git a/data/cds/chlorodb/fasta/NC_013086.fst.gz b/data/cds/chlorodb/fasta/NC_013086.fst.gz index 874ab3b86e63398049652203c624b716195e2d52..be644eb01245aabb5d971edac65d35997c65e871 100644 GIT binary patch delta 18 acmezPkm=(?CU*I54vvZ|&KucZZ2$mKCkRUb delta 18 acmezPkm=(?CU*I54i4i?r;Y5dHUI!jy$6~A diff --git a/data/cds/chlorodb/fasta/NC_013088.fst.gz b/data/cds/chlorodb/fasta/NC_013088.fst.gz index 7a810f29adeef9287db31094d1be5d284d66d7e9..12c957ea01db861e26212845dd194f6694953f7c 100644 GIT binary patch delta 18 acmbPnjcLX;CU*I54vvZ|&KubUR|5b-q6Vb^ delta 18 ZcmbPnjcLX;CU*I54i4i?r;Y4_s{uYZ1@r&_ diff --git a/data/cds/chlorodb/fasta/NC_013273.fst.gz b/data/cds/chlorodb/fasta/NC_013273.fst.gz index b46cc42d2bed9443d31554e523d7f710c1862833..bc08757a5275956196ef3027ce5588af2d5eb4a0 100644 GIT binary patch delta 18 ZcmeCW$<%d|iCw;%gQMb#^G5dOH2^{u2Lb>9 delta 18 ZcmeCW$<%d|iCw;%gTpw}X(M~{8UQ`422lV2 diff --git a/data/cds/chlorodb/fasta/NC_013359.fst.gz b/data/cds/chlorodb/fasta/NC_013359.fst.gz index d3bf37b1bd214e2ac383c7ea7b47a6b395664d64..413e37cc64d487465586ebce5943616d57d59470 100644 GIT binary patch delta 18 acmdn-glWeUCU*I54vvZ|&KubcHvs@hy9X!$ delta 18 Zcmdn-glWeUCU*I54i4i?r;Y4}n*c;n26q4e diff --git a/data/cds/chlorodb/fasta/NC_013498.fst.gz b/data/cds/chlorodb/fasta/NC_013498.fst.gz index ea72b6a2a6929602e93d34a123605bd0778b1295..450ebb271560a8c028e8a07a5c160db69fc55fd4 100644 GIT binary patch delta 18 acmZ2>iD}s-CU*I54vvZ|&Kud~R{{V;4hF>l delta 18 ZcmZ2>iD}s-CU*I54i4i?r;Y6LD*->G1{44Q diff --git a/data/cds/chlorodb/fasta/NC_013553.fst.gz b/data/cds/chlorodb/fasta/NC_013553.fst.gz index 5e2628d65218c803d94abd62cec20530b9279400..cb131e22f74cec9f66e524413c3b7f4afec5a294 100644 GIT binary patch delta 18 acmbRFg=yv&CU*I54vvZ|&Kuc-Mt1pb4vxwz&Kucp#RC9JatDO~ delta 18 ZcmaF3pYh>-Mt1pb4i4i?r;Y5l;sHhh2Gall diff --git a/data/cds/chlorodb/fasta/NC_013707.fst.gz b/data/cds/chlorodb/fasta/NC_013707.fst.gz index 88229f069ee81ae73b8f091eb9fe360056cbbcff..f207e8e5776ee10d1290580b62a3a8e0aaa3d1ce 100644 GIT binary patch delta 18 acmdn`muc%?CU*I54vxwz&Kud+?E?TzYzN)| delta 18 acmdn`muc%?CU*I54i4i?r;Y6E_5lD#`v)ul diff --git a/data/cds/chlorodb/fasta/NC_013823.fst.gz b/data/cds/chlorodb/fasta/NC_013823.fst.gz index 490710265d21fa4ceb86d7a725df8ce6abfd02e7..49c46a494369755d3a12a54c8512b675957d3ea3 100644 GIT binary patch delta 18 ZcmZ45$-K0anO(k{gQN0_^G5c0M*uui2F?Hg delta 18 ZcmZ45$-K0anO(k{gTpw}X(Ri*BLFwz1{?qY diff --git a/data/cds/chlorodb/fasta/NC_013843.fst.gz b/data/cds/chlorodb/fasta/NC_013843.fst.gz index 854ad658604f687b6596bcd41849ac7dbfb46c1b..a1cd691de1d3ceda367c5883bd558c3162bf8492 100644 GIT binary patch delta 18 ZcmeBt&(!&ziCw;%gQN0_^G5cj?Eplt2R8r! delta 18 ZcmeBt&(!&ziCw;%gTpw}X(M~nb^t&=2893s diff --git a/data/cds/chlorodb/fasta/NC_013991.fst.gz b/data/cds/chlorodb/fasta/NC_013991.fst.gz index 9e101c1bcdd1d5efa5de70120be1ea6a59088e12..33d29bd6f18ff1787505e56981def48029187af9 100644 GIT binary patch delta 18 ZcmbQz#5|>mnO(k{gQN0_^G0^wg8(=r1_}TG delta 18 ZcmbQz#5|>mnO(k{gTpw}X(K!DK>#ze1y}$8 diff --git a/data/cds/chlorodb/fasta/NC_014056.fst.gz b/data/cds/chlorodb/fasta/NC_014056.fst.gz index 77ab8c241163ad83d381409bf2b995ff79e22b91..dcdeedc421509ad8dcbbf2e948797a779f65b6b5 100644 GIT binary patch delta 18 acmdn+lxf3LCU*I54vxwz&KucRZUO*E$p@1F delta 18 acmdn+lxf3LCU*I54i4i?r;Y3@Hvs@dSO(z$ diff --git a/data/cds/chlorodb/fasta/NC_014057.fst.gz b/data/cds/chlorodb/fasta/NC_014057.fst.gz index be137eff6016cef4ec1469c2dd98a588fa70ed39..c864b60c3adcd76e5c54cf1d3920c57b7c646c61 100644 GIT binary patch delta 18 acmbQel4;|Es& delta 18 acmZ2|nQ8T9CU*I54i4i?r;Y4ORssM)at5UU diff --git a/data/cds/chlorodb/fasta/NC_014063.fst.gz b/data/cds/chlorodb/fasta/NC_014063.fst.gz index 25911e967648c6ed70456188c16874bf4cb1f525..0f0eeefb065229c3a029896248be2fcab00e5708 100644 GIT binary patch delta 18 acmaE{jOoQPCU*I54vxwz&KubiCj$USu?HRi delta 18 ZcmaE{jOoQPCU*I54i4i?r;Y51lL13O25bNT diff --git a/data/cds/chlorodb/fasta/NC_014267.fst.gz b/data/cds/chlorodb/fasta/NC_014267.fst.gz index 057d20b1d29278fdb88df5510a3a2eb6973dca1e..93b2426223cf90fa8d9cf988af02d8a12df6352e 100644 GIT binary patch delta 18 ZcmZp>!qj$!iCw;%gQN0_^G5dnD*-|C2WkKS delta 18 ZcmZp>!qj$!iCw;%gTpw}X(Rjpl>j}02DktK diff --git a/data/cds/chlorodb/fasta/NC_014287.fst.gz b/data/cds/chlorodb/fasta/NC_014287.fst.gz index 6756bef7be2c0f6e9569434eff89c6afdfa6633f..638d600c44eb4c0458e5b296e9e51e1756297ef3 100644 GIT binary patch delta 18 acmaDmlj-eDCU*I54vxwz&KudE^#A}z#s`c5 delta 18 ZcmaDmlj-eDCU*I54i1w{r;Y5-dH_RQ2HOAt diff --git a/data/cds/chlorodb/fasta/NC_014340.fst.gz b/data/cds/chlorodb/fasta/NC_014340.fst.gz index afc31991e68b9882e1087a11304b06b5fa8b1fb2..ff3feffb5c86f13e206e45251d44e9fad43f1552 100644 GIT binary patch delta 18 acmcb)oayFrCU*I54vxwz&Kub;O$Go)!v}K! delta 18 acmcb)oayFrCU*I54i1w{r;Y5FCIbLMSq8!Y diff --git a/data/cds/chlorodb/fasta/NC_014345.fst.gz b/data/cds/chlorodb/fasta/NC_014345.fst.gz index 92eacc6f23dea0615c12c23e505e68cb928092df..abbd8c74905c84c2eb0c19bb1889b61ab3e58b3d 100644 GIT binary patch delta 18 acmZ2+m2t&YMt1pb4vxwz&KubmW&r?2Tn7;V delta 18 ZcmZ2+m2t&YMt1pb4i1w{r;Y3jvj9Ny24DaH diff --git a/data/cds/chlorodb/fasta/NC_014346.fst.gz b/data/cds/chlorodb/fasta/NC_014346.fst.gz index 3decacf895da5927c57c41ea59b972fac940e191..b572e5865ddfd84adc8bd58451788a1713cd39d8 100644 GIT binary patch delta 24 gcmaERn&a(h4tDu&4vxwz&W-G??2KF4nVzWv0DFN5umAu6 delta 24 fcmaERn&a(h4tDu&4i1w{r$+WxcE+vjOwUvSa`6ZM diff --git a/data/cds/chlorodb/fasta/NC_014348.fst.gz b/data/cds/chlorodb/fasta/NC_014348.fst.gz index 24b57c609049440714b62beb5a9b954d8afe4a16..0cf5cd6efd5e0c40f0ececcdbc760333cbd698be 100644 GIT binary patch delta 18 acmX@`o$0`LCU*I54vxwz&Kucx?gju&FbD7e delta 18 acmX@`o$0`LCU*I54i1w{r;Y48cLM-O#s@zD diff --git a/data/cds/chlorodb/fasta/NC_014569.fst.gz b/data/cds/chlorodb/fasta/NC_014569.fst.gz index 6a24f3bfb2a3aef5b818447b2d1a691b4b765c58..f11e8243f59a2b83ea21cc6b55e34999cf8f50e0 100644 GIT binary patch delta 18 acmbPofN9DBCU*I54vxwz&Kucz7XSc1Xa-{d delta 18 ZcmbPofN9DBCU*I54i1w{r;Y5q3jjL)1+oAD diff --git a/data/cds/chlorodb/fasta/NC_014570.fst.gz b/data/cds/chlorodb/fasta/NC_014570.fst.gz index f9339e1a5f6f37b6227eb3c30ea25e57f88b1431..232e0ff7edda7f072c0cd63df47dcb352643510f 100644 GIT binary patch delta 18 Zcmdnn#=N(UnO(k{gQN0_^G0^F!vH=#29E#$ delta 18 Zcmdnn#=N(UnO(k{gTo}#X(PMYVE{SP1>OJv diff --git a/data/cds/chlorodb/fasta/NC_014573.fst.gz b/data/cds/chlorodb/fasta/NC_014573.fst.gz index c5ba218af6c21f2f288b8661aa294dcf192df953..d7152b469aecdd8c4bbb3a44dd63f54d90b9bd5c 100644 GIT binary patch delta 18 ZcmeDG#nk_ciCw;%gQN0_^G0@#y#Phr2IT+% delta 18 ZcmeDG#nk_ciCw;%gTo}#X(KzwUI0OI1~dQw diff --git a/data/cds/chlorodb/fasta/NC_014575.fst.gz b/data/cds/chlorodb/fasta/NC_014575.fst.gz index 00d98cd255aea442d64137ba993918e4892b9314..29d89cd47de52ada4960e5fffc91afca174ce421 100644 GIT binary patch delta 18 acmdnKglYQ{CU*I54vxwz&KubcCIJ9IzXpZ? delta 18 ZcmdnKglYQ{CU*I54i1w{r;Y3elK?zb1=Rom diff --git a/data/cds/chlorodb/fasta/NC_014582.fst.gz b/data/cds/chlorodb/fasta/NC_014582.fst.gz index 1555ee58f2c55f76316dc835bcaafd0a7a0dc808..bc29e6af807cc131059c53107a8e8f2c11e7a6f3 100644 GIT binary patch delta 18 acmbQfn`!!PCU*I54vxwz&Kub$%mn~IGX~!P delta 18 acmbQfn`!!PCU*I54i1w{r;Y3r<^lja$p$U} diff --git a/data/cds/chlorodb/fasta/NC_014589.fst.gz b/data/cds/chlorodb/fasta/NC_014589.fst.gz index e687cafcb964c3f1fee93e250b404875882df3f9..bad4103f0f72d2d017b3bc0d8720703397607e0a 100644 GIT binary patch delta 18 ZcmbQx&NQK&iCw;%gQN0_^G5d0W&k+Y21oz^ delta 18 ZcmbQx&NQK&iCw;%gTo}#X(M}QGXOMh1(yH- diff --git a/data/cds/chlorodb/fasta/NC_014592.fst.gz b/data/cds/chlorodb/fasta/NC_014592.fst.gz index ce3d5eeff8a7500502a46f8a17262936f1b635e4..39dca79f751de29430960ced680bde13015bd1c0 100644 GIT binary patch delta 18 acmaF)pXud)CU*I54vxwz&Kubu?FRr;#|VD_ delta 18 acmaF)pXud)CU*I54i1w{r;Y57_5%Pyk@3hxMt1pb4vxwz&KueHdH?`G(gwQ# delta 18 ZcmX>yk@3hxMt1pb4i1w{r;Y4;Jpept1_}TG diff --git a/data/cds/chlorodb/fasta/NC_015083.fst.gz b/data/cds/chlorodb/fasta/NC_015083.fst.gz index 6392c932282d10ee997006fd8e1f9caa9c1bcd03..c4b0ae728c1007f6a49332ef957018ac87e148f9 100644 GIT binary patch delta 18 Zcmex7kLmL~CU*I54vxwz&Kuct`T delta 18 ZcmaF$i|N%bCU*I54i1w{r;Y5%djU=32Soq? diff --git a/data/cds/chlorodb/fasta/NC_015204.fst.gz b/data/cds/chlorodb/fasta/NC_015204.fst.gz index 64842091818217a4614e465bcc4c444f1fd60b8c..08844fb6fb439e44e879554c9ebc57e0b4aefcbb 100644 GIT binary patch delta 18 ZcmeBaXYOfdW|!~g;HbRfypg^2FaS8I27Ukl delta 18 ZcmeBaXYOfdW|!~g;4sN_+Q{B|7yvXs1zk2TT9} delta 18 ZcmZqq%hd9hiCw;%gTo}#X(M~>J^(>a2ATi> diff --git a/data/cds/chlorodb/fasta/NC_015605.fst.gz b/data/cds/chlorodb/fasta/NC_015605.fst.gz index d2d24631d19093adcac290c34f45fef0307f522f..75d0f03721f94bb0b0ea667b415e3ca05b49d614 100644 GIT binary patch delta 18 ZcmaFg%ly8VnO(k{gQMz-^G5a;#{fq52e$wK delta 18 ZcmaFg%ly8VnO(k{gTo}#X(RiKV*o;h2L%8C diff --git a/data/cds/chlorodb/fasta/NC_015608.fst.gz b/data/cds/chlorodb/fasta/NC_015608.fst.gz index c71ea5dd57e0803bba10708e520f60d612b346ee..55db8b8d2ed080ad067a61406fa549991dcafc8d 100644 GIT binary patch delta 18 acmccem+8u1CU*I54vwlT&Kud!?gIc&un0T= delta 18 acmccem+8u1CU*I54i1w{r;Y4q_W=M*KL?5c diff --git a/data/cds/chlorodb/fasta/NC_015610.fst.gz b/data/cds/chlorodb/fasta/NC_015610.fst.gz index 042e4b44fb2b0b176baafdb6382898fa1e7baac4..a3fc93cd932d6e44e9cbc65c4feb590e8a5d06b6 100644 GIT binary patch delta 18 Zcmdnl$Go$TnO(k{gQMz-^G0@~;{ZOi2ABW< delta 18 Zcmdnl$Go$TnO(k{gTo}#X(PMQaR53)1?B(% diff --git a/data/cds/chlorodb/fasta/NC_015621.fst.gz b/data/cds/chlorodb/fasta/NC_015621.fst.gz index bd12cfe7e62871222dcc216240ca6562edcd0aba..ffc930932a3c145f1ebd0d7119412ab9697511b2 100644 GIT binary patch delta 18 acmX@{p6SGUCU*I54vwlT&KubeZU+EOQwQ|` delta 18 acmX@{p6SGUCU*I54i1w{r;Y3fw*vr3;s-+j diff --git a/data/cds/chlorodb/fasta/NC_015623.fst.gz b/data/cds/chlorodb/fasta/NC_015623.fst.gz index e60d3a14558a6161b4a8e240f98b69d1edbdf216..9e0d2b80d5e953294dc9bb0b09e027c9239dfdf7 100644 GIT binary patch delta 18 acmdn_mucr;CU*I54vwlT&Kub`?E?Tz{|D;; delta 18 acmdn_mucr;CU*I54i1w{r;Y5J_5lD$jt4ma diff --git a/data/cds/chlorodb/fasta/NC_015645.fst.gz b/data/cds/chlorodb/fasta/NC_015645.fst.gz index b7d8ba64248f35c27f71b86a2f6f9448db1a8870..b825810fae9c9ba8348a3f3e863ca4280b8789a2 100644 GIT binary patch delta 18 acmbQSj(Ns9W_I~*4vwlT&KubUuLA%+AqIs2 delta 18 ZcmbQSj(Ns9W_I~*4i1w{r;Y4_*8w@O1=9ck diff --git a/data/cds/chlorodb/fasta/NC_015803.fst.gz b/data/cds/chlorodb/fasta/NC_015803.fst.gz index 958329825f53251f252f01f02b5bacdef1d6af49..4d78922eb0059a1d8db82327f22baae782b9060a 100644 GIT binary patch delta 18 acmbPrjcL|3CU*I54vwlT&KucrW_I~*4vwlT&KudEp9KI&j0e{M delta 18 acmaDioB7>rW_I~*4i3{yr;Y5-&jJ8MA_pb_ diff --git a/data/cds/chlorodb/fasta/NC_015983.fst.gz b/data/cds/chlorodb/fasta/NC_015983.fst.gz index bbcaca17d31c4b6f973ef57ea3fba98f0becc141..31d19ba2b0bfbed76162d2234d4956ef1eaab935 100644 GIT binary patch delta 18 acmbRKmudQ6CU*I54vwlT&Kub$>;nKuSqFsx delta 18 acmbRKmudQ6CU*I54i3{yr;Y3r_5lDx?*`NW diff --git a/data/cds/chlorodb/fasta/NC_015990.fst.gz b/data/cds/chlorodb/fasta/NC_015990.fst.gz index 3abb0318ec2b414de6704baf17b86503d461ab7d..37839db5c82bb3ccb29dc2f7514e9be364dbe4d0 100644 GIT binary patch delta 18 acmcb6jp^<+CU*I54vwlT&KudoRs#S`9|v{- delta 18 Zcmcb6jp^<+CU*I54i3{yr;Y4ks{u!~2E_mX diff --git a/data/cds/chlorodb/fasta/NC_015996.fst.gz b/data/cds/chlorodb/fasta/NC_015996.fst.gz index a590465c80ad360fd2fe5fd0bafbbe2e6697824c..257bf52106c088975f06540c9d91e7eb851fdd0f 100644 GIT binary patch delta 18 ZcmZ3|#=NABnO(k{gQMz-^G0^r!vH$j21Nh> delta 18 ZcmZ3|#=NABnO(k{gTpk_X(PMrVE{I71(W~) diff --git a/data/cds/chlorodb/fasta/NC_016058.fst.gz b/data/cds/chlorodb/fasta/NC_016058.fst.gz index f473af77b15da18a5e2e184efee0f443f719b4ea..894164a40cbf9a22f6da3c3bc0120ef714d1bb2a 100644 GIT binary patch delta 18 ZcmeBO&D6V^iCw;%gQMz-^G5czsQ^6W2ATi> delta 18 ZcmeBO&D6V^iCw;%gTpk_X(M~vQ~)@71?d0) diff --git a/data/cds/chlorodb/fasta/NC_016063.fst.gz b/data/cds/chlorodb/fasta/NC_016063.fst.gz index 14cbc1d052459ce39c9786369bdaa30623165bb6..ec7c2fe91bb89107ae775286cde44fd0d4a1734a 100644 GIT binary patch delta 18 acmex)lIiD3CU*I54vwlT&Kuc3Edc;eSqLcr delta 18 acmex)lIiD3CU*I54i3{yr;Y5NmH+@s?+17Q diff --git a/data/cds/chlorodb/fasta/NC_016064.fst.gz b/data/cds/chlorodb/fasta/NC_016064.fst.gz index b4da2d106256e109f5fe1c231c90a7238ed1331a..57200ff5fa76cf6e1675e73d2a5054df3ed7b78d 100644 GIT binary patch delta 18 acmeycis{2DCU*I54vwlT&Kub?rvd;;P6t5% delta 18 Zcmeycis{2DCU*I54i3{yr;Y5HQvpQe29N*% diff --git a/data/cds/chlorodb/fasta/NC_016065.fst.gz b/data/cds/chlorodb/fasta/NC_016065.fst.gz index f40e3713358d29f8863521a19e7f6d95f6a798a0..920e16b03ac9083477b9c0b9ac12fbf08a1b99ba 100644 GIT binary patch delta 18 ZcmeA;$kcI=iCw;%gQMz-^G5c@1pq$k2EqUU delta 18 ZcmeA;$kcI=iCw;%gTpk_X(M~%0suOI1`z-N diff --git a/data/cds/chlorodb/fasta/NC_016068.fst.gz b/data/cds/chlorodb/fasta/NC_016068.fst.gz index 2588566bfd93e4a0ddd4ad3def90650d2424ae4f..e18a7175d1abaa7be8e1f56a511b53556b2da9e6 100644 GIT binary patch delta 18 acmaF-m+A3eCU*I54vwlT&Kue9>;nK&y$ERl delta 18 acmaF-m+A3eCU*I54i3{yr;Y4)_5lD+QwO*J diff --git a/data/cds/chlorodb/fasta/NC_016069.fst.gz b/data/cds/chlorodb/fasta/NC_016069.fst.gz index 5f1be6fe738deb2f8884ad8690c4e998f8f45cd4..81dd880d927e09dfe5a4a1f3d99e430b71e77411 100644 GIT binary patch delta 18 acmeymp6Tm)CU*I54vwlT&Kud^O$Pu=ng`qf delta 18 acmeymp6Tm)CU*I54i3{yr;Y6IrUL*+Fb69D diff --git a/data/cds/chlorodb/fasta/NC_016430.fst.gz b/data/cds/chlorodb/fasta/NC_016430.fst.gz index 57cb6824894bba8ca191b02e9efbe2677879d07f..ff82880c5107f92db321d8bdec263c62e780c74d 100644 GIT binary patch delta 18 acmezVpXvL5CU*I54vwlT&Kuc3><0iP6zn_ diff --git a/data/cds/chlorodb/fasta/NC_016433.fst.gz b/data/cds/chlorodb/fasta/NC_016433.fst.gz index 168a7aa7fc7edd9ec70fdfc183e391051507b52b..3990dafe9f61a84f83f8f4a0d94bc54b5f233ea4 100644 GIT binary patch delta 18 acmbRBooUv0CU*I54vwlT&Kub$?*;%!1qXis delta 18 acmbRBooUv0CU*I54i3{yr;Y5BcLM-Jn+DDR diff --git a/data/cds/chlorodb/fasta/NC_016468.fst.gz b/data/cds/chlorodb/fasta/NC_016468.fst.gz index e01c807d7c6f38ac255a70e3fed4120a04963f20..a600feacb6c8c8a5a2666b648d6a6f784813fc7d 100644 GIT binary patch delta 18 acmX@~o$1hbCU*I54vwlT&Kucx?*;%(eFygd delta 18 acmX@~o$1hbCU*I54i3{yr;Y5pcLM-P69+~B diff --git a/data/cds/chlorodb/fasta/NC_016471.fst.gz b/data/cds/chlorodb/fasta/NC_016471.fst.gz index 25d7498d5d1c7cdd6f1ab8065267dfba898be82b..14144583bc47828a1e6d4d5b696c3a7fdf345015 100644 GIT binary patch delta 18 acmZ4Xka5{VMt1pb4vwlT&Kue17XSc8mj@~U delta 18 ZcmZ4Xka5{VMt1pb4i3{yr;Y6M3jjhb26+Gg diff --git a/data/cds/chlorodb/fasta/NC_016668.fst.gz b/data/cds/chlorodb/fasta/NC_016668.fst.gz index 13490c0aca77d02c9d4a3b0ad7e67ea9da25ff43..9273a19874c143e37ff2111c47aa5b1451737fd5 100644 GIT binary patch delta 18 Zcmey?#{8{~nO(k{gQMz-^G5dk!vIDP2Ri@& delta 18 Zcmey?#{8{~nO(k{gTpk_X(N07VE{p;28sXx diff --git a/data/cds/chlorodb/fasta/NC_016670.fst.gz b/data/cds/chlorodb/fasta/NC_016670.fst.gz index dc551537abfa9a1fc5b2d983bd8e667573f1ae0c..6f8f8c345ed3e9065447a642b77698efe0a8245a 100644 GIT binary patch delta 18 ZcmX@w&V00;nO(k{gQMz-^G5c4hXFu)2Pyyn delta 18 ZcmX@w&V00;nO(k{gTpk_X(Ri-!vH)H26+Gg diff --git a/data/cds/chlorodb/fasta/NC_016677.fst.gz b/data/cds/chlorodb/fasta/NC_016677.fst.gz index 99ae2c31bec446ab03167c1513b30ebf3f417f67..1a260ee2f98744f9d14e7a6956e8e802d10cac04 100644 GIT binary patch delta 18 ZcmZoW&(wCFiCw;%gQMz-^G5diq diff --git a/data/cds/chlorodb/fasta/NC_016690.fst.gz b/data/cds/chlorodb/fasta/NC_016690.fst.gz index f9061bbd678bd637c686e0a4a7a79cabf66af2ef..cc441694110e1d5a2a4dcef40eb5c7d9dbf89972 100644 GIT binary patch delta 18 ZcmbQ%!91;lnO(k{gQMz-^G0_5BLF!r1|R?c delta 18 ZcmbQ%!91;lnO(k{gTpk_X(K!T5dbvA1#bWV diff --git a/data/cds/chlorodb/fasta/NC_016692.fst.gz b/data/cds/chlorodb/fasta/NC_016692.fst.gz index 6418a779878e0b5e1f3ff1b968a895a03260ac7e..5b486c90f2695f7cf533382675ef088e30b32c62 100644 GIT binary patch delta 18 ZcmeBgXYOxjW|!~g;HbLdypg@*FaS9j28aLv delta 18 ZcmeBgXYOxjW|!~g;4sZ}+Q{B<7yvY{1=j!o diff --git a/data/cds/chlorodb/fasta/NC_016699.fst.gz b/data/cds/chlorodb/fasta/NC_016699.fst.gz index daecf239e4c66e346edf7055054848f2c545cbe0..01f4255cdc1e7b7d6d729f8ab1516da5c0805857 100644 GIT binary patch delta 18 acmcb1jp^DoCU*I54vy+8&KueNR|5b`F$ZD* delta 18 Zcmcb1jp^DoCU*I54i3{yr;Y6Xs{uy92Cx7C diff --git a/data/cds/chlorodb/fasta/NC_016703.fst.gz b/data/cds/chlorodb/fasta/NC_016703.fst.gz index 883d75afe6d0c098b4d90cf2aa99d99b61c0a1d1..6175b55f830f9a3c9334832910022b3ddf5f9dc6 100644 GIT binary patch delta 18 Zcmey@#PqL;iCw;%gQNP2^G5daMgT@r2M7QF delta 18 Zcmey@#PqL;iCw;%gTpk_X(M}iBLG3-237z7 diff --git a/data/cds/chlorodb/fasta/NC_016708.fst.gz b/data/cds/chlorodb/fasta/NC_016708.fst.gz index a8739ada9ae79984c6653bf5c7f871014eab66b9..d000599c6a0fad89438b5ebc76d50e17e7de5b5d 100644 GIT binary patch delta 18 acmezOiRs@bCU*I54vy+8&KudwcLD%Z8wel( delta 18 ZcmezOiRs@bCU*I54i3{yr;Y68I{{Cs2W|iW diff --git a/data/cds/chlorodb/fasta/NC_016711.fst.gz b/data/cds/chlorodb/fasta/NC_016711.fst.gz index b01db8ef44fb9deff7b28d3e47df642b4d9ff0f9..2d5929b8df7220088792c2a5214c263d28c8aa6c 100644 GIT binary patch delta 18 Zcmdnq&b+;ynO(k{gQNP2^G5a!hXFpA2LS*8 delta 18 Zcmdnq&b+;ynO(k{gTpk_X(RiF!vH!b22TJ0 diff --git a/data/cds/chlorodb/fasta/NC_016712.fst.gz b/data/cds/chlorodb/fasta/NC_016712.fst.gz index 015548fc57db07e18e7b0cc9522f6b8d9a203751..b9b2f0ad59b827a372413907038cddf46384da53 100644 GIT binary patch delta 18 ZcmZo}XKrq1W|!~g;HbXhypg@;FaS4v24w&M delta 18 ZcmZo}XKrq1W|!~g;4sZ}+Q?pW7yvU11+xGE diff --git a/data/cds/chlorodb/fasta/NC_016718.fst.gz b/data/cds/chlorodb/fasta/NC_016718.fst.gz index d6cd0aa221016984e25eef5549a0cabb6c611eb3..38ccc1300e57611d9cc14df27daba342919f8f22 100644 GIT binary patch delta 18 acmdmcj%n{XCU*I54vy+8&KudymIDAr$_E1g delta 18 Zcmdmcj%n{XCU*I54i3{yr;Y4p%K<`J22lV2 diff --git a/data/cds/chlorodb/fasta/NC_016727.fst.gz b/data/cds/chlorodb/fasta/NC_016727.fst.gz index 5e4bee50bcec728e59022ea28e331aff42b86e65..c2bd97720b7bf24e8d8c7ded6ff49efd339ba46d 100644 GIT binary patch delta 18 acmaF*k?HA2CU*I54vy+8&Kue9?EnB#kO)!$ delta 18 acmaF*k?HA2CU*I54i3{yr;Y6Qb^riP9|xcS diff --git a/data/cds/chlorodb/fasta/NC_016728.fst.gz b/data/cds/chlorodb/fasta/NC_016728.fst.gz index 91a8e25bbb3160d668381cbcca4b96cc602cfe50..b52dbd08dd09e8a3f1187431baae79ea97fa9a2e 100644 GIT binary patch delta 18 acmdn^k!j;cCU*I54vy+8&KucR?EnBubO*Ko delta 18 acmdn^k!j;cCU*I54i3{yr;Y5Zb^riI0|x{E diff --git a/data/cds/chlorodb/fasta/NC_016729.fst.gz b/data/cds/chlorodb/fasta/NC_016729.fst.gz index 9eecb634c87492cfa1d7720bf00d767811abdfd7..4de853d257119c06d0d2f0d26263635f9d649a5e 100644 GIT binary patch delta 18 acmbRCoN3x~CU*I54vy+8&KueLHv<4ghzCpn delta 18 ZcmbRCoN3x~CU*I54i3{yr;Y6Wn*l)=2ATi> diff --git a/data/cds/chlorodb/fasta/NC_016730.fst.gz b/data/cds/chlorodb/fasta/NC_016730.fst.gz index fae19b52f5b5fe9c930aa06fc1ccfc0e103cd8a3..0e8135b0596972df6d6c92750b43445901b674ac 100644 GIT binary patch delta 18 acmZ4YiD}&@CU*I54vy+8&Kud)cLD%OD+e$D delta 18 ZcmZ4YiD}&@CU*I54i3{yr;Y6DI{`$x27Ukl diff --git a/data/cds/chlorodb/fasta/NC_016731.fst.gz b/data/cds/chlorodb/fasta/NC_016731.fst.gz index e76c8546129083d685bf728d1855ad546de3efbc..32d17e5750a1c66baa397ef2ecafeb76bfb4bada 100644 GIT binary patch delta 18 ZcmX>-gX#1PCU*I54vy+8&KucXdH_NX2BrW2 delta 18 ZcmX>-gX#1PCU*I54i3{yr;Y3`JpetP1@r&_ diff --git a/data/cds/chlorodb/fasta/NC_016732.fst.gz b/data/cds/chlorodb/fasta/NC_016732.fst.gz index a63c06d88af09d4bfa0effa28e186115c55f6cfd..477ca94f7db1ec421b0a539ce15583c6c2dbdfdc 100644 GIT binary patch delta 21 ccmX@{gXP2z7Iyh=4vy+8&W-F_*%=*e0AoZ4o&W#< delta 21 ccmX@{gXP2z7Iyh=4i3{yr$+Xz?2L{!09?HW>;M1& diff --git a/data/cds/chlorodb/fasta/NC_016733.fst.gz b/data/cds/chlorodb/fasta/NC_016733.fst.gz index e248521e55aa40e383cf5aef0f7d684ad5f25f45..aac6f099acfa4fdfd401f895e2fcb39d827126ac 100644 GIT binary patch delta 18 Zcmccdj`7AjMt1pb4vy+8&KubS%K=Uf2VwvK delta 18 Zcmccdj`7AjMt1pb4i3{yr;Y4^Y2Cx7C diff --git a/data/cds/chlorodb/fasta/NC_016734.fst.gz b/data/cds/chlorodb/fasta/NC_016734.fst.gz index 12301fc8d7a2178f29a47d75834c5bd903c04747..c15a5673ed22981e2074dab2a1f791a7f8a4bb83 100644 GIT binary patch delta 18 acmbRIm1*)QmiCw;%gQNP2^G0^IX#hM61|9$a delta 18 ZcmeBO!_>QmiCw;%gTpk_X(Kz^Gypf61#AES diff --git a/data/cds/chlorodb/fasta/NC_016736.fst.gz b/data/cds/chlorodb/fasta/NC_016736.fst.gz index 41868b0c7f13b9ba271e7bf764226ec6fe0b1f4a..6680f0f85478c52434c122e5783fa35df08b56b7 100644 GIT binary patch delta 18 ZcmZqcVQ%YTW|!~g;HbXhypjF?Q2;rD2KoR1 delta 18 ZcmZqcVQ%YTW|!~g;4sZ}+Q|O@C;&AP21oz^ diff --git a/data/cds/chlorodb/fasta/NC_016753.fst.gz b/data/cds/chlorodb/fasta/NC_016753.fst.gz index cb760fb93d6e6e9d3fee4d5a751175cba93fee14..ae79f9f71dfe2d6b138b4cee60eee3a4843055fb 100644 GIT binary patch delta 18 Zcmey@&HS&MnO(k{gQNP2^G5dXM*&F72jBnz delta 18 Zcmey@&HS&MnO(k{gTpk_X(RjhqX0x&2QB~r diff --git a/data/cds/chlorodb/fasta/NC_016921.fst.gz b/data/cds/chlorodb/fasta/NC_016921.fst.gz index f211f2ab488ab2726b4cc2b6171d9d4dd7f4dc57..020a0568c0d8a8350f04bc000fde3dd1fe112a41 100644 GIT binary patch delta 18 acmccikLlV!CU*I54vy+8&KueN_X7Y>9S6n$ delta 18 ZcmccikLlV!CU*I54i3{yr;Y6X`vFU=2NVDR diff --git a/data/cds/chlorodb/fasta/NC_016927.fst.gz b/data/cds/chlorodb/fasta/NC_016927.fst.gz index 8d4097273eeb2addbda913b04a22eecb70ff4e7d..10edb8aad98f76ee762d801dd56a39e5167cfb3c 100644 GIT binary patch delta 18 acmZ2$R622TJ0 diff --git a/data/cds/chlorodb/fasta/NC_017835.fst.gz b/data/cds/chlorodb/fasta/NC_017835.fst.gz index 76c018c36bbace8487197deea89c328309451f8b..e7de7830ce4e3966db0265dfc16399205be97cd4 100644 GIT binary patch delta 18 acmaELlIhh+CU*I54vy+8&KubuF985eQwRM3 delta 18 acmaELlIhh+CU*I54i2+Sr;Y57mjD1r=?6>z diff --git a/data/cds/chlorodb/fasta/NC_017894.fst.gz b/data/cds/chlorodb/fasta/NC_017894.fst.gz index 1e279da08858931d5cca9aa2a55a5a232b479047..3621d4f85b62bcfec6ef465ee64ad314a19c489f 100644 GIT binary patch delta 18 ZcmeBbWA18WW|!~g;HbXhypf&xFaS4F1^55} delta 18 ZcmeBbWA18WW|!~g;4sT{+Q`m)7yvTp1xEk? diff --git a/data/cds/chlorodb/fasta/NC_018051.fst.gz b/data/cds/chlorodb/fasta/NC_018051.fst.gz index 8df7f0dd552887fbda3926b74d30881aa8fc84e5..b234edc4ab1849e4ee7493ded402002da75005bd 100644 GIT binary patch delta 18 acmZ4Zk!j&aCU*I54vy+8&Kuch?EnBsLFDu diff --git a/data/cds/chlorodb/fasta/NC_018114.fst.gz b/data/cds/chlorodb/fasta/NC_018114.fst.gz index 082cf519db72daf16780f955e1ce95644d06c2dc..52b5165a4c67d58d9fc1fd85a5b51b09b04061a4 100644 GIT binary patch delta 18 acmaEThw1elCU*I54vy+8&KucN)&T%c%?Gdm delta 18 ZcmaEThw1elCU*I54i2+Sr;Y3>>i|k)2LAv6 diff --git a/data/cds/chlorodb/fasta/NC_018117.fst.gz b/data/cds/chlorodb/fasta/NC_018117.fst.gz index 4f7e40a0b165ed08dfc46e0d2dd2643d47444c54..594833a046c7968e4b6eaeb55f371a5fd828df63 100644 GIT binary patch delta 18 acmbRIk7@EhCU*I54vy+8&Kucz_5%P$^alL^ delta 18 ZcmbRIk7@EhCU*I54i2+Sr;Y49`vF3V2220| diff --git a/data/cds/chlorodb/fasta/NC_018357.fst.gz b/data/cds/chlorodb/fasta/NC_018357.fst.gz index 244459a74961c9ebba25931594f2bfdd9996ecab..5999931acff4a2da0c52fb7639de9dc3c0a41500 100644 GIT binary patch delta 18 ZcmaFT&itgEnO(k{gQNP2^G5c&hXF*t2Z#Uw delta 18 ZcmaFT&itgEnO(k{gTpM-X(RjH!vH{42G;-p diff --git a/data/cds/chlorodb/fasta/NC_018523.fst.gz b/data/cds/chlorodb/fasta/NC_018523.fst.gz index 408a708d488835063de56d9b94991234c6ca7bf2..6f27dd34488b8dbc40d40f9daa9e6b8c2ede80ef 100644 GIT binary patch delta 18 acmbQahiT>>CU*I54vy+8&Kuc<<^cddrv_>O delta 18 ZcmbQahiT>>CU*I54i2+Sr;Y4F^8h<0i&7YG9Y delta 18 acmdo0pK1SpCU*I54i2+Sr;Y48_5%P(tp`#7 diff --git a/data/cds/chlorodb/fasta/NC_018552.fst.gz b/data/cds/chlorodb/fasta/NC_018552.fst.gz index fdd40e140efd37b55536d542e862697059b91975..81a645301f2d2803e572f65e5f42bad764ce6898 100644 GIT binary patch delta 18 acmdn;pJ~f~CU*I54vy+8&Kud+?gs!&mIvYh delta 18 acmdn;pJ~f~CU*I54i2+Sr;Y4u_X7Y(EC(?F diff --git a/data/cds/chlorodb/fasta/NC_018565.fst.gz b/data/cds/chlorodb/fasta/NC_018565.fst.gz index 28cec75159f112a2d642ddb4f7d2828afbc7e59b..3931b82f85f92575a408c6545cfe5b1fb1fee9ab 100644 GIT binary patch delta 18 acmdn-i)qI%CU*I54vy+8&Kubc_W}S*g$H5) delta 18 Zcmdn-i)qI%CU*I54i2+Sr;Y4}djUrq2C)DD diff --git a/data/cds/chlorodb/fasta/NC_018569.fst.gz b/data/cds/chlorodb/fasta/NC_018569.fst.gz index f05100f970ac41c04bf3e151252396f3dabf692e..e95629fe5e47593c41df90c6dc3dfc2f31f4ba63 100644 GIT binary patch delta 18 acmccdj_JlbCU*I54vy+8&KubSw*vr9YX_tN delta 18 Zcmccdj_JlbCU*I54i2+Sr;Y4^+W|@e2J-*_ diff --git a/data/cds/chlorodb/fasta/NC_018766.fst.gz b/data/cds/chlorodb/fasta/NC_018766.fst.gz index 9f254e6ca2d549a4bd3e71e14d5feca4c1c802dd..eb49801f354d25efcc03e9c3c9c3d554aea83329 100644 GIT binary patch delta 18 acmX@Gm+8P>CU*I54vv~D&Kucx&I15OA_rms delta 18 acmX@Gm+8P>CU*I54i2+Sr;Y48=K%mgu?DaJ diff --git a/data/cds/chlorodb/fasta/NC_018767.fst.gz b/data/cds/chlorodb/fasta/NC_018767.fst.gz index 04d279bed9b756ffbbf2bf425c4a5e0e7907217a..fbb3083003ca423989eb7e87698c06308cfc99d3 100644 GIT binary patch delta 18 acmeylm+9wTCU*I54vv~D&Kuc3%>w{U?FbD3 delta 18 acmeylm+9wTCU*I54i2+Sr;Y5N<^cdnd=LiG< delta 18 ZcmaF!hw059CU*I54i2+Sr;Y5X`v6XM2T}k4 diff --git a/data/cds/chlorodb/fasta/NC_019616.fst.gz b/data/cds/chlorodb/fasta/NC_019616.fst.gz index 7402933ad51b6addab2ee3ead6896a62b47e36e0..3509363cbe33ae0fd48ce5f3c7b3b2673719a404 100644 GIT binary patch delta 18 ZcmZo!%-ph=nO(k{gQMn(^G5dCivT+q2Co1B delta 18 ZcmZo!%-ph=nO(k{gTpM-X(M~>MF2LZ1^oa3 diff --git a/data/cds/chlorodb/fasta/NC_019628.fst.gz b/data/cds/chlorodb/fasta/NC_019628.fst.gz index 443eae5d18070714ad07cc9087f8857db23080b4..b2f7e95db78573ececb9b8a3779d0a51e144076f 100644 GIT binary patch delta 18 acmaE{oax1KCU*I54vv~D&KubuP6hx-BaatC|> delta 18 acmdmcnrZK8CU*I54i2+Sr;Y5}mI44n0S3wd diff --git a/data/cds/chlorodb/fasta/NC_019651.fst.gz b/data/cds/chlorodb/fasta/NC_019651.fst.gz index c270958ab04ea5c72243b2f38e6ae1698667d8be..1a565091716f2f260236a5790f1e33f703373ddb 100644 GIT binary patch delta 18 acmdmXnrYiq1}Xpm diff --git a/data/cds/chlorodb/fasta/NC_020018.fst.gz b/data/cds/chlorodb/fasta/NC_020018.fst.gz index f41028146d3ac98bee0f712906154b0c6e79cce0..7acb44f9e1badda8d7f69703c62570f277c111ad 100644 GIT binary patch delta 18 acmbQYnQ`7`Mt1pb4vv~D&KudMM*;vpBLO>e1@8a= diff --git a/data/cds/chlorodb/fasta/NC_020019.fst.gz b/data/cds/chlorodb/fasta/NC_020019.fst.gz index c915f8c9d9af848757eebd5b63d89defba9d889e..ace246543604e2ecff5de4532b15a924cf1a7783 100644 GIT binary patch delta 18 acmaFzpXteeCU*I54vv~D&Kue9?gs!HK delta 18 acmdn+k!iz6CU*I54i2+Sr;Y3@cK`rI=LZ4+ diff --git a/data/cds/chlorodb/fasta/NC_020098.fst.gz b/data/cds/chlorodb/fasta/NC_020098.fst.gz index 30d16771112d22a3a7eb2f6d3e02913f78433f3d..13430049ab3868a8f70abb0803d7ca9eb2a76830 100644 GIT binary patch delta 18 acmcchgXz`}CU*I54vv~D&Kuc-_W%G-^9RHL delta 18 ZcmcchgXz`}CU*I54i2+Sr;Y5vdjLy<2ND1P diff --git a/data/cds/chlorodb/fasta/NC_020146.fst.gz b/data/cds/chlorodb/fasta/NC_020146.fst.gz index 7ab271a06a4210c8464ffc18757ae262eddff0db..a7e366ef15e801b27322bc9d39a028fc4d0d22cc 100644 GIT binary patch delta 18 acmdnFk7?&VCU*I54vv~D&Kuc{<^upkO$N{a delta 18 ZcmdnFk7?&VCU*I54i2+Sr;Y4J^8r8H1|9$a diff --git a/data/cds/chlorodb/fasta/NC_020147.fst.gz b/data/cds/chlorodb/fasta/NC_020147.fst.gz index 672b27972189ca8b1d7a520d2f60a1d70c791da0..d44e929caa1714299cd58c44dd84ee1a88f46ab7 100644 GIT binary patch delta 18 ZcmZp=!qjwyiCw;%gQMn(^G5dHD*-`#2VnpJ delta 18 ZcmZp=!qjwyiCw;%gTpM-X(RjZl>j{p2Co1B diff --git a/data/cds/chlorodb/fasta/NC_020152.fst.gz b/data/cds/chlorodb/fasta/NC_020152.fst.gz index 9a0c67b1eb98c626a71317322e114fcab3d1df96..1416c9a7edb99597fc6867e44d5b96d19a701b87 100644 GIT binary patch delta 18 ZcmZ44#k{hMnO(k{gQMn(^G0^1qX0Y<24DaH delta 18 ZcmZ44#k{hMnO(k{gTpM-X(PMRQ2;li1+D-9 diff --git a/data/cds/chlorodb/fasta/NC_020316.fst.gz b/data/cds/chlorodb/fasta/NC_020316.fst.gz index 29b780495a983bfb3258aafe58ebe5dc4336e343..4ecf9fe6708bd4ff7a7d47fe4016fef546241493 100644 GIT binary patch delta 18 Zcmey~&iuWdnO(k{gQMn(^G5a$hXF@l2f_dV delta 18 Zcmey~&iuWdnO(k{gTpM-X(RiG!vI3=2M_=N diff --git a/data/cds/chlorodb/fasta/NC_020317.fst.gz b/data/cds/chlorodb/fasta/NC_020317.fst.gz index d671c27791c0666c78075c69e1b04ee529616664..fa9d9930ad2d00bad3013c422f81a7f1be72e259 100644 GIT binary patch delta 18 ZcmaFe&iuNanO(k{gQMn(^G5b3hXF;q2c7@` delta 18 ZcmaFe&iuNanO(k{gTp-2X(RiS!vH~12JHX< diff --git a/data/cds/chlorodb/fasta/NC_020318.fst.gz b/data/cds/chlorodb/fasta/NC_020318.fst.gz index aeddde616df9ef2ee82cac4fa7a4a85be6819b58..472f556a471e531fc4eb1b0928226aabbc9fcebc 100644 GIT binary patch delta 18 ZcmccG#(cGnnO(k{gQMn(^G0^R!vH~=2HF4s delta 18 ZcmccG#(cGnnO(k{gTp-2X(PMeVE{ca1}Ojl diff --git a/data/cds/chlorodb/fasta/NC_020319.fst.gz b/data/cds/chlorodb/fasta/NC_020319.fst.gz index a48165569a9c49c67f18fa27633dd2ed6ccb493d..55c075aa2d5eda99012fe2bec1354bcbfd2ea35d 100644 GIT binary patch delta 18 ZcmZ3{%eV*ohi1~UKv diff --git a/data/cds/chlorodb/fasta/NC_020320.fst.gz b/data/cds/chlorodb/fasta/NC_020320.fst.gz index 434ec0b7008673d2aa5e951a8c159583e27d09fa..c807002634b59cb04c5872da48da130e3cf7f923 100644 GIT binary patch delta 18 acmbRDk!jvXCU*I54vv~D&KudM?*ITt;s<^J delta 18 acmbRDk!jvXCU*I54i587r;Y5>cK`rGcm~Y? diff --git a/data/cds/chlorodb/fasta/NC_020321.fst.gz b/data/cds/chlorodb/fasta/NC_020321.fst.gz index 63a2ab47de1d27e60c8bbc0b492b75baa841c20c..9bb3d80cfb59a178382eac5548b820be035c3112 100644 GIT binary patch delta 18 acmcb;jp_C_CU*I54vv~D&Kuc7W&;36_Xi>X delta 18 Zcmcb;jp_C_CU*I54i587r;Y3(vjIbm25|rY diff --git a/data/cds/chlorodb/fasta/NC_020341.fst.gz b/data/cds/chlorodb/fasta/NC_020341.fst.gz index b8a22913fcdce7b6a547307c89079a79dccd5ae3..612e4592a025d4fb3ba64992bcfdae5382f50b32 100644 GIT binary patch delta 18 acmca|h3U!_CU*I54vv~D&Kuc%R{;P@vj$181`PlJ diff --git a/data/cds/chlorodb/fasta/NC_020367.fst.gz b/data/cds/chlorodb/fasta/NC_020367.fst.gz index 762d388f4b60279cc091129995eb2ab358cd7b3c..c4a95a75631e947c08005360798eaf034b935c17 100644 GIT binary patch delta 18 Zcmdnp$h^CenO(k{gQMn(^G5b92LL{92LAv6 delta 18 Zcmdnp$h^CenO(k{gTp-2X(RiV0{}V%22KC~ diff --git a/data/cds/chlorodb/fasta/NC_020371.fst.gz b/data/cds/chlorodb/fasta/NC_020371.fst.gz index 7afc86daea02677031999ce7e625e64f4fdeaed5..bab2dfa71a5e74d6974085d3abcaee7ad7876e61 100644 GIT binary patch delta 18 ZcmeBp#n|zRkzKxk!jaQCU*I54vv~D&Kub`?*ITxwg=Jx delta 18 acmdn>k!jaQCU*I54i587r;Y5JcK`rKOa~zV diff --git a/data/cds/chlorodb/fasta/NC_020795.fst.gz b/data/cds/chlorodb/fasta/NC_020795.fst.gz index badcd7383d525fb2fa373c4c75f27a9c99674811..b40753e170d46154bf7af10fc85cc2ad86ce9be6 100644 GIT binary patch delta 18 acmZ3yo_X^t# diff --git a/data/cds/chlorodb/fasta/NC_021102.fst.gz b/data/cds/chlorodb/fasta/NC_021102.fst.gz index c3c43076c157eacd75fe94dd6f3c424d2c80321a..1fc949dae0522762ce5f237a21cc154b9cc5d803 100644 GIT binary patch delta 18 acmezSgX!-NCU*I54vyL@&Kudw_5c7>!w4<_ delta 18 ZcmezSgX!-NCU*I54i587r;Y4odjL>U2Ydhk diff --git a/data/cds/chlorodb/fasta/NC_021109.fst.gz b/data/cds/chlorodb/fasta/NC_021109.fst.gz index 484a54b4d16791d50c692c6ef2d0f5f7ca959454..af6c7f7e66579f5bc91d4b019e9ee67b3a7ccbf9 100644 GIT binary patch delta 21 ccmX@n%X*@hm0iA@gQNC}b0hm!cE*El096hLRsaA1 delta 21 ccmX@n%X*@hm0iA@gTp-2sgZpvJL5q&08WPnqyPW_ diff --git a/data/cds/chlorodb/fasta/NC_021110.fst.gz b/data/cds/chlorodb/fasta/NC_021110.fst.gz index b7816b700d8e49d05a790d96d8487f3249866a7d..2a517def689d775c406b2a9c08d46c90cc92eaaa 100644 GIT binary patch delta 18 acmZ2+oN2{zCU*I54vyL@&KubmE(QQZ90xQ2 delta 18 acmZ2+oN2{zCU*I54i587r;Y3j7Xtu4s|JDq diff --git a/data/cds/chlorodb/fasta/NC_021111.fst.gz b/data/cds/chlorodb/fasta/NC_021111.fst.gz index 843593a67c0f3285a464e5e1f21d5ec7177a9627..993992060fc8240c99699caeb1591c114186f1a3 100644 GIT binary patch delta 18 acmX@~oAJ{Ri3r delta 18 ZcmccfkLk`oCU*I54i587r;Y5P`vFXh2Pgml diff --git a/data/cds/chlorodb/fasta/NC_021189.fst.gz b/data/cds/chlorodb/fasta/NC_021189.fst.gz index 04ed1e19c05b76c19cb5b36e15e9dcb00c84faf2..dcf2ce06b959e5c0fc1526dfbf13be670ecd83d9 100644 GIT binary patch delta 18 acmdmen|b$bW_I~*4vyL@&KudcyafPBhzH>S delta 18 acmdmen|b$bW_I~*4i587r;Y4e-U0wc7Y8o@ diff --git a/data/cds/chlorodb/fasta/NC_021372.fst.gz b/data/cds/chlorodb/fasta/NC_021372.fst.gz index 26b541779acabe13741be5daad03d8d5520b3e80..056f394e16ea31b61b61de91f51fe8d438fb29c9 100644 GIT binary patch delta 18 acmX?ko9X0jCU*I54vyL@&Kubetpxx}6$i-x delta 18 acmX?ko9X0jCU*I54i587r;Y4~)&c-Vqz4xO diff --git a/data/cds/chlorodb/fasta/NC_021423.fst.gz b/data/cds/chlorodb/fasta/NC_021423.fst.gz index 09fb051d1567f7cc0397f42d3491a706fc9d0269..3c3e3250b68c27f4904048d47bd981882919cbd7 100644 GIT binary patch delta 18 acmbRKn`!!QCU*I54vyL@&Kub$>;(WwF9(AF delta 18 acmbRKn`!!QCU*I54i587r;Y3r_5uJyz6Q|% diff --git a/data/cds/chlorodb/fasta/NC_021425.fst.gz b/data/cds/chlorodb/fasta/NC_021425.fst.gz index 061be635f8551142149412637636d84e060c3dd8..30ac4f46ae2dea6f7f5420d5ea76da5bc5287302 100644 GIT binary patch delta 18 acmZ2AiFwr|W_I~*4vyL@&Kud4PXYivItF+E delta 18 ZcmZ2AiFwr|W_I~*4i587r;Y5&CjmIg1;zjX diff --git a/data/cds/chlorodb/fasta/NC_021426.fst.gz b/data/cds/chlorodb/fasta/NC_021426.fst.gz index b1301826ca44975413c4d25bdb2c78e7141875aa..dd71e265d0efdee575b69c5502f06d2b813dc308 100644 GIT binary patch delta 18 acmaDeh55}CW_I~*4vyL@&KucNPXPc%e+NSV delta 18 ZcmaDeh55}CW_I~*4i587r;Y5XrvO3@29W>& diff --git a/data/cds/chlorodb/fasta/NC_021429.fst.gz b/data/cds/chlorodb/fasta/NC_021429.fst.gz index c2e1f68a721e446fcd70efca7091c7ec9f97ffa1..3fedc550aaa95270df9c117c8aab99ed7e0e98e3 100644 GIT binary patch delta 18 acmccckLkicCU*I54vyL@&Kuc1_X7Y=SqHWN delta 18 ZcmccckLkicCU*I54i587r;Y5M`vFSm2Lu2B diff --git a/data/cds/chlorodb/fasta/NC_021430.fst.gz b/data/cds/chlorodb/fasta/NC_021430.fst.gz index 7ee6176d67cf209082fcd0d519a1b7b3c2f06108..52ca2f554273360204f7e8a97ef1ed793e362113 100644 GIT binary patch delta 18 acmdn`n`!HBCU*I54vyL@&Kud+?F9f#NeA5k delta 18 acmdn`n`!HBCU*I54i587r;Y6E_5uJ$*as^B diff --git a/data/cds/chlorodb/fasta/NC_021431.fst.gz b/data/cds/chlorodb/fasta/NC_021431.fst.gz index 6ac58fda46ddb37166cc86e9e6927ad9d3f94bef..3a188e2fdf61a3202d5c9c677ecc451061d80167 100644 GIT binary patch delta 18 acmezTo9Xj!CU*I54vyL@&Kud^>;(W+!w8oE delta 18 acmezTo9Xj!CU*I54i1Y&b diff --git a/data/cds/chlorodb/fasta/NC_021449.fst.gz b/data/cds/chlorodb/fasta/NC_021449.fst.gz index e3797633311d06b0aecb6998dcb7c2e7fc37b814..f95a709e86514e8434b19926b85fd465554ad080 100644 GIT binary patch delta 18 acmbRBg=y9oCU*I54vyL@&Kuc;wQuGY4+~ delta 18 acmbRKnQ8iGCU*I54i1Y8CU*I54vyL@&Kuc1cLD%S-v^ig delta 18 ZcmccciRr>8CU*I54i1Y;wQ)I|z3G delta 18 acmaF=nd$v!CU*I54i1Y1{?qY diff --git a/data/cds/chlorodb/fasta/NC_021762.fst.gz b/data/cds/chlorodb/fasta/NC_021762.fst.gz index 7bb99d3a171b1c6ae970a877a2ed3e7c52876ca3..d9fd3c7c425a4f365d0e8d622a3af86a70b2a990 100644 GIT binary patch delta 18 acmew{o9V}FCU*I54vyL@&Kuc3_5uJ&q6fAB delta 18 Zcmew{o9V}FCU*I54i1Y#+j1)Kl? diff --git a/data/cds/chlorodb/fasta/NC_022137.fst.gz b/data/cds/chlorodb/fasta/NC_022137.fst.gz index 2c7e267c2c7869e505c3edb6305ea8899c0cdba8..d15aa1b0676ca9f36a05436695bb5c27dfa9f67b 100644 GIT binary patch delta 18 ZcmZqq#?wFj2MhoJ diff --git a/data/cds/chlorodb/fasta/NC_022259.fst.gz b/data/cds/chlorodb/fasta/NC_022259.fst.gz index b9580606162f0e0fa7957fa9eb26a18ee0a33b9d..d6536b586ee14e142b1da4433a679fc9d624f182 100644 GIT binary patch delta 18 ZcmeC3&(u4giCw;%gQM<>^G5czegHd$27mwn delta 18 ZcmeC3&(u4giCw;%gTo@zX(M}EKL9rs1^G5c^G5cBLjXhH2MquK delta 18 ZcmaFf!u-62nO(k{gTo@zX(M~WApk#a23r6C diff --git a/data/cds/chlorodb/fasta/NC_022380.fst.gz b/data/cds/chlorodb/fasta/NC_022380.fst.gz index 3b2301f5d25cdeb1e34d6c68692d8165ed2c1b31..b654599f3ad7db37c377aad352c94d725579ac0b 100644 GIT binary patch delta 18 ZcmaFb%KWsInO(k{gQM<>^G5c2hX6#l2Z;ax delta 18 ZcmaFb%KWsInO(k{gTo@zX(Ri+LjXWW2G;-p diff --git a/data/cds/chlorodb/fasta/NC_022381.fst.gz b/data/cds/chlorodb/fasta/NC_022381.fst.gz index f64ead7e32d1ba15f8dd0481492c3935fead64fe..02b528b8dd6e8bbb3399d62e33f2d8020a7a605d 100644 GIT binary patch delta 18 ZcmX@x#(cJonO(k{gQM<>^G0^J!vH{#2E+gW delta 18 ZcmX@x#(cJonO(k{gTo@zX(PMaVE{ZI1`+@O diff --git a/data/cds/chlorodb/fasta/NC_022382.fst.gz b/data/cds/chlorodb/fasta/NC_022382.fst.gz index 9f825aaf5c99d33d8ee41fc0de162782b171ca57..590262773d668becbbe50b76677ef2b910dfa373 100644 GIT binary patch delta 18 ZcmccE#(c4jnO(k{gQM<>^G0^B!vH}X2G9Ti delta 18 ZcmccE#(c4jnO(k{gTo@zX(PMWVE{a<1|9$a diff --git a/data/cds/chlorodb/fasta/NC_022383.fst.gz b/data/cds/chlorodb/fasta/NC_022383.fst.gz index 51ec8f8864690f599e441cba7e57e8c4fb0796a9..63b66e4097218edab3cbbc42e209f6e10dfeac72 100644 GIT binary patch delta 18 ZcmccF%6zkxnO(k{gQM<>^G5bdhX6wq2W0>N delta 18 ZcmccF%6zkxnO(k{gTo@zX(RikLjXRb2D1PF diff --git a/data/cds/chlorodb/fasta/NC_022384.fst.gz b/data/cds/chlorodb/fasta/NC_022384.fst.gz index 1a78b59f39a4c98aad3563ddb51fc62fdef36a2b..0d19974c7d91749f443efa44ca673f9920534731 100644 GIT binary patch delta 18 ZcmaFT%KW62nO(k{gQM<>^G5c&hX6#C2ZjIu delta 18 ZcmaFT%KW62nO(k{gTpe@X(RjHLjXW42Gsxn diff --git a/data/cds/chlorodb/fasta/NC_022385.fst.gz b/data/cds/chlorodb/fasta/NC_022385.fst.gz index 80a575c6761db07a8ae4e108f0fa2d8c8dacc478..ed12fbf68dbce75a4d9411b2545c1f7537b5543f 100644 GIT binary patch delta 18 ZcmeBZWA12UW|!~g;HbOeypf&pFaS3p1@!;` delta 18 ZcmeBZWA12UW|!~g;IPbe+Q`m$7yvT21w;S< diff --git a/data/cds/chlorodb/fasta/NC_022386.fst.gz b/data/cds/chlorodb/fasta/NC_022386.fst.gz index 985a727919de7032a79dfb36eb1f863fed6fe4fb..f09f24559e0734804a257deb97bef57fa6d2f216 100644 GIT binary patch delta 18 ZcmZ48#=N?XnO(k{gQM<>^G0@+!vH(#23`OF delta 18 ZcmZ48#=N?XnO(k{gTpe@X(PMJVE{LP1+4%8 diff --git a/data/cds/chlorodb/fasta/NC_022387.fst.gz b/data/cds/chlorodb/fasta/NC_022387.fst.gz index 5b5db0289479910afdf472c849252e4999865549..9f060c2296c779ec329b31f98e28b27107d49f6d 100644 GIT binary patch delta 18 ZcmaFa!u+y@nO(k{gQM<>^G5chLjXi22NM7Q delta 18 ZcmaFa!u+y@nO(k{gTpe@X(M~mApk$S24VmJ diff --git a/data/cds/chlorodb/fasta/NC_022388.fst.gz b/data/cds/chlorodb/fasta/NC_022388.fst.gz index 655d129a09ab675e499513b30af195b8ef080017..b1949dc08ca100f0d65cfaf3fadb1b2cbc39f68e 100644 GIT binary patch delta 18 ZcmbQ*#yqu+nO(k{gQM<>^G0^Q!vHww1{?qY delta 18 ZcmbQ*#yqu+nO(k{gTpe@X(Kz|VE{CK1#18R diff --git a/data/cds/chlorodb/fasta/NC_022389.fst.gz b/data/cds/chlorodb/fasta/NC_022389.fst.gz index 4067297ebf75f998d93edad263e77d03736cd397..d0c503382923f6328063809297fe0a66d899f99a 100644 GIT binary patch delta 18 ZcmZ48#=N?XnO(k{gQM<>^G0@+!vH(#23`OF delta 18 ZcmZ48#=N?XnO(k{gTpe@X(PMJVE{LP1+4%8 diff --git a/data/cds/chlorodb/fasta/NC_022390.fst.gz b/data/cds/chlorodb/fasta/NC_022390.fst.gz index 6d4c8215fbf898a639fe214ffb268a43e9e515e3..909daee8c90e401acfaae0a884201f30db9b8c4b 100644 GIT binary patch delta 18 ZcmZ40#=NSHnO(k{gQM<>^G0^%!vH(S23r6C delta 18 ZcmZ40#=NSHnO(k{gTpe@X(PMxVE{K>1*!l5 diff --git a/data/cds/chlorodb/fasta/NC_022391.fst.gz b/data/cds/chlorodb/fasta/NC_022391.fst.gz index 7a8195b213e28a0cd0d4197e06c265f3cbfbad01..7b1e3937f1cbbdc1c2e0c5c34e758b598c2c3dc0 100644 GIT binary patch delta 18 Zcmey_#{9F5nO(k{gQM<>^G5cf!vIE<2S@+_ delta 18 Zcmey_#{9F5nO(k{gTpe@X(M~lVE{rZ2A2Q; diff --git a/data/cds/chlorodb/fasta/NC_022392.fst.gz b/data/cds/chlorodb/fasta/NC_022392.fst.gz index 44c0f5260c7d824b707c824d2555583764d1d184..794bbe0e4ec96c2ac8df4a558ab40e863d9ad9de 100644 GIT binary patch delta 18 ZcmaFR#{8g-nO(k{gQM<>^G5c_!vI4m2K@j4 delta 18 ZcmaFR#{8g-nO(k{gTpe@X(M~&VE{hA2220| diff --git a/data/cds/chlorodb/fasta/NC_022393.fst.gz b/data/cds/chlorodb/fasta/NC_022393.fst.gz index 4910a558792a2345c88631c7f3fa2bf0d963307c..99e6500729689ac0ec23af12971e50899516f6f2 100644 GIT binary patch delta 18 ZcmaFd#{9UAnO(k{gQM<>^G5cV!vI5)2L=ED delta 18 ZcmaFd#{9UAnO(k{gTpe@X(M~gVE{iU22}t6 diff --git a/data/cds/chlorodb/fasta/NC_022394.fst.gz b/data/cds/chlorodb/fasta/NC_022394.fst.gz index 185aaa2b9a6acade89929980dd305785bdc385fb..a91c425d5611e312cd64d61c8f3b26ce5cdab88c 100644 GIT binary patch delta 18 ZcmaFR#{8g-nO(k{gQM<>^G5c_!vI4m2K@j4 delta 18 ZcmaFR#{8g-nO(k{gTpe@X(M~&VE{hA2220| diff --git a/data/cds/chlorodb/fasta/NC_022395.fst.gz b/data/cds/chlorodb/fasta/NC_022395.fst.gz index 2c01f189115aff8adea15c261276599d0774640f..19311796c0346e51b2e2e800737366b990abd2da 100644 GIT binary patch delta 18 ZcmaFa#{9C4nO(k{gQM<>^G5ch!vI8N2N(bV delta 18 ZcmaFa#{9C4nO(k{gTpe@X(M~mVE{k+24?^O diff --git a/data/cds/chlorodb/fasta/NC_022396.fst.gz b/data/cds/chlorodb/fasta/NC_022396.fst.gz index b81bbefc7bdac638badbf775757da4ed35ff86ae..e2a71fe5afb9c38b4c89d9efa7139e505f55b33d 100644 GIT binary patch delta 18 ZcmeBeXYOrhW|!~g;HbOeypg@_FaS9328I9t delta 18 ZcmeBeXYOrhW|!~g;IPbe+Q{B^7yvYd1=Rom diff --git a/data/cds/chlorodb/fasta/NC_022397.fst.gz b/data/cds/chlorodb/fasta/NC_022397.fst.gz index 41ae84b2e80fba855ebb31894235b73293302cf4..30e9d7a5b0b477d1cc9f626bb36caf0bd9e9e6cf 100644 GIT binary patch delta 18 ZcmX@#%6z_+nO(k{gQM<>^G5a)hX6sg2S)$^ delta 18 ZcmX@#%6z_+nO(k{gTpe@X(RiILjXNY29^K- diff --git a/data/cds/chlorodb/fasta/NC_022398.fst.gz b/data/cds/chlorodb/fasta/NC_022398.fst.gz index 01c449a907283060eefcd5dbab2fe3f81c51ceb3..c63c321a3b879cefe75f360ef29f1a2091743f96 100644 GIT binary patch delta 18 ZcmaFg#{9mGnO(k{gQM<>^G5cJ!vIA#2Pyyn delta 18 ZcmaFg#{9mGnO(k{gTpe@X(M~aVE{nP26+Gg diff --git a/data/cds/chlorodb/fasta/NC_022399.fst.gz b/data/cds/chlorodb/fasta/NC_022399.fst.gz index f0e1c2d350387e8138c70bbfd3ab321fa9c1c440..dd94d6ccf97251516461ddbf67caa84c3f343c64 100644 GIT binary patch delta 18 Zcmey{#{9R9nO(k{gQM<>^G5cv!vIGh2UGw6 delta 18 Zcmey{#{9R9nO(k{gTpe@X(M~tVE{t52BQD~ diff --git a/data/cds/chlorodb/fasta/NC_022400.fst.gz b/data/cds/chlorodb/fasta/NC_022400.fst.gz index d62c740654e522464a85c744b9d8a9a6d2a04a4f..9e4fa1826458fe5167f9f67fc68939f8bee70dce 100644 GIT binary patch delta 18 ZcmaFg!Ti31nO(k{gQM<>^G5cJBLGEp2QL5s delta 18 ZcmaFg!Ti31nO(k{gTpe@X(M~a5dc9827Ukl diff --git a/data/cds/chlorodb/fasta/NC_022401.fst.gz b/data/cds/chlorodb/fasta/NC_022401.fst.gz index 5140ee927dab28dda0c09c066c102ffe4e453e50..98d036588165cc660644e53d83f8618ec06e8053 100644 GIT binary patch delta 18 ZcmeBbXYOieW|!~g;HbOeypg^6FaS7)27Lek delta 18 ZcmeBbXYOieW|!~g;IPbe+Q{B~7yvXJ1^G0^Z!vH_w2DJbH delta 18 ZcmX@n#(biUnO(k{gTpe@X(PMiVE{XK1_S^A diff --git a/data/cds/chlorodb/fasta/NC_022403.fst.gz b/data/cds/chlorodb/fasta/NC_022403.fst.gz index 6d05ebfdffa7a85e3a8db656afc59802cc68196e..45f267db14ae8ac941be6851940be8ceceded64f 100644 GIT binary patch delta 18 ZcmbQ;&OE!FnO(k{gQM<>^G5b5hXFd-2Cx7C delta 18 ZcmbQ;&OE!FnO(k{gTpe@X(RiT!vHpK1^)m5 diff --git a/data/cds/chlorodb/fasta/NC_022404.fst.gz b/data/cds/chlorodb/fasta/NC_022404.fst.gz index 9b291b00d6a8924586e36a6448f95dcafed23ec9..83541ad475b91390720acaac7a387736639dcbdc 100644 GIT binary patch delta 18 ZcmeBaWA15VW|!~g;HbOeypf&tFaS5L1_1y7 delta 18 ZcmeBaWA15VW|!~g;IPbe+Q`m&7yvUv1yBG0 diff --git a/data/cds/chlorodb/fasta/NC_022405.fst.gz b/data/cds/chlorodb/fasta/NC_022405.fst.gz index 78503b1a46c402427ae0437d03c937577521246a..37ce68c9a72621124cae0eb7968c0d72e240cc08 100644 GIT binary patch delta 18 ZcmeBcXYOlfW|!~g;HbOeypg^AFaS9c28jRw delta 18 ZcmeBcXYOlfW|!~g;IPVc+Q{C17yvY{1=#=q diff --git a/data/cds/chlorodb/fasta/NC_022406.fst.gz b/data/cds/chlorodb/fasta/NC_022406.fst.gz index f641bf82cfa84d0d10cca17b6ea49aef574bbedc..0afd032ab200a7d1dc4a551c6c93638b05827cfd 100644 GIT binary patch delta 18 Zcmdnf%DktQnO(k{gQM<>^G5cqhX6kv2Mz!L delta 18 Zcmdnf%DktQnO(k{gTpG*X(RjALjXFu23`OF diff --git a/data/cds/chlorodb/fasta/NC_022407.fst.gz b/data/cds/chlorodb/fasta/NC_022407.fst.gz index 051db74f38b7532a50b0622f5ae911b7ab8ec2a9..0672aad5b99ae05a8d50043562a62fa5467db4c7 100644 GIT binary patch delta 18 Zcmey<&itpHnO(k{gQM<>^G5cshXF_&2h#um delta 18 Zcmey<&itpHnO(k{gTpG*X(RjB!vI6M2O|Ig diff --git a/data/cds/chlorodb/fasta/NC_022408.fst.gz b/data/cds/chlorodb/fasta/NC_022408.fst.gz index 687c59fbd71ef506910074050eab9579161ebbf5..a91c20b755455b7624ea7cf317e93c6d7a721513 100644 GIT binary patch delta 18 Zcmcc8#(brXnO(k{gQM<>^G0^x!vH~r2H5}r delta 18 Zcmcc8#(brXnO(k{gTpG*X(PMuVE{cM1}Ojl diff --git a/data/cds/chlorodb/fasta/NC_022409.fst.gz b/data/cds/chlorodb/fasta/NC_022409.fst.gz index 9ffbb2a9a0ec374fa4894b8aa8c5de51a21dfa23..2aa312a514feee577d1a135e02197cdb6423153e 100644 GIT binary patch delta 18 ZcmbQ=#yr1`nO(k{gQM<>^G0@w!vH!)208!$ delta 18 ZcmbQ=#yr1`nO(k{gTpG*X(PMDVE{Gb1&ROw diff --git a/data/cds/chlorodb/fasta/NC_022410.fst.gz b/data/cds/chlorodb/fasta/NC_022410.fst.gz index 86c58fec3dce34cae4ddc98905e0a462d3213171..515f18040c9f9a315cc80fcdb3a8f236e41d6ecd 100644 GIT binary patch delta 18 ZcmX@p#(buYnO(k{gQM<>^G0^p!vH{S2EhOT delta 18 ZcmX@p#(buYnO(k{gTpG*X(PMqVE{Y|1`z-N diff --git a/data/cds/chlorodb/fasta/NC_022411.fst.gz b/data/cds/chlorodb/fasta/NC_022411.fst.gz index 2ab37a34cd51e157497c4a100f9f08edc93a0965..3cfaf3e331c62b0adc543c93dbd2da2acbbf2ac4 100644 GIT binary patch delta 18 ZcmZ3~#=NMFnO(k{gQNb6^G0^*!vH$A21Eb= delta 18 ZcmZ3~#=NMFnO(k{gTpG*X(PMzVE{Hv1(N^( diff --git a/data/cds/chlorodb/fasta/NC_022412.fst.gz b/data/cds/chlorodb/fasta/NC_022412.fst.gz index 5b9a175694e608566b00d7c447b067d59c412551..0d2470b1bfad93d36bf9901836683bf9a8499ab8 100644 GIT binary patch delta 18 ZcmeBfXYOuiW|!~g;Hbaiypg@-FaS8P27v$o delta 18 ZcmeBfXYOuiW|!~g;IPVc+Q{B=7yvXz1<(Kh diff --git a/data/cds/chlorodb/fasta/NC_022413.fst.gz b/data/cds/chlorodb/fasta/NC_022413.fst.gz index f62b8a7d9267636d9f3923564a399b1b9394d2b2..b6cfb221b4c6df78b77cc525e6230f7cff7013f1 100644 GIT binary patch delta 18 ZcmZ49%DlXlnO(k{gQNb6^G5ashX6c92G9Ti delta 18 ZcmZ49%DlXlnO(k{gTpG*X(RiBLjX711|I+b diff --git a/data/cds/chlorodb/fasta/NC_022414.fst.gz b/data/cds/chlorodb/fasta/NC_022414.fst.gz index 6f3574d91776ea436b561db22e2137d342584794..2d9068b5ab245d11d4606af9783a303687740af0 100644 GIT binary patch delta 18 ZcmZ41%Dk+VnO(k{gQNb6^G5dhhX6bx2F(Bf delta 18 ZcmZ41%Dk+VnO(k{gTpG*X(RjmLjX6p1{?qY diff --git a/data/cds/chlorodb/fasta/NC_022417.fst.gz b/data/cds/chlorodb/fasta/NC_022417.fst.gz index 8099d2e73b8a70c8f39473bcaa10d8260e4a8d91..e8c3b4f6266f6f4dc0a026b6d9fc458d288dbd03 100644 GIT binary patch delta 18 acmX^5lj-PBCU*I54vzXO&KueH?EwHzNC*l5 delta 18 acmX^5lj-PBCU*I54i2kKr;Y6U_5c7$-UnF# diff --git a/data/cds/chlorodb/fasta/NC_022431.fst.gz b/data/cds/chlorodb/fasta/NC_022431.fst.gz index 1e6afa8978cf617d7680a3fc6490f8e1e9e317ab..6c243570aaed8aa472950aeed4f0c7c022d1d096 100644 GIT binary patch delta 18 ZcmZ45$-K0anO(k{gQNb6^G5c0M*uv12Gjrm delta 18 ZcmZ45$-K0anO(k{gTpG*X(Ri*BLFxP1|t9f diff --git a/data/cds/chlorodb/fasta/NC_022432.fst.gz b/data/cds/chlorodb/fasta/NC_022432.fst.gz index fb75bf7a49c5c4dd5b1480775e01ed1aefac7f05..eea5a6ac9e22bab4765d439a5dbffa7128515b4b 100644 GIT binary patch delta 18 Zcmey{$o#jFnO(k{gQNb6^G5b>2LMNj2gm>b delta 18 Zcmey{$o#jFnO(k{gTpG*X(Ri$0{}xG2NwVU diff --git a/data/cds/chlorodb/fasta/NC_022451.fst.gz b/data/cds/chlorodb/fasta/NC_022451.fst.gz index 69fbac34056fe7c6a04eeb7be11425b2d38295f9..8737b76ff7c501dbd8b8ae877dd912246d966c8f 100644 GIT binary patch delta 18 acmdn`fobapCU*I54vzXO&KueFb^riL{Rcz< delta 18 Zcmdn`fobapCU*I54i2kKr;Y4-I{-zK29p2) diff --git a/data/cds/chlorodb/fasta/NC_022457.fst.gz b/data/cds/chlorodb/fasta/NC_022457.fst.gz index 0b410f8cfd08484f839e7f4c1ff11427e86991a1..bb4055098e03ce3e6f241b672e70223e4d0ba716 100644 GIT binary patch delta 18 acmbO|nR)hPW_I~*4vzXO&KudMoCE+oS_aPm delta 18 acmbO|nR)hPW_I~*4i2kKr;Y4WP67Zo@CF_L diff --git a/data/cds/chlorodb/fasta/NC_022459.fst.gz b/data/cds/chlorodb/fasta/NC_022459.fst.gz index 431553ebf48f66086434d4308595866c03b2c6e1..7601113d42f9317a9bca989ea0f70434fdd992ea 100644 GIT binary patch delta 18 acmdn+k7>g{CU*I54vzXO&Kub^_X7Y+2M1UH delta 18 Zcmdn+k7>g{CU*I54i2kKr;Y5I`vFFs2B!c3 diff --git a/data/cds/chlorodb/fasta/NC_022460.fst.gz b/data/cds/chlorodb/fasta/NC_022460.fst.gz index 86e681604d0efaddd123b37be2eff1d11a16efdc..2bbd1d39ec94e2e512538c45ef8b6e001a05cf8a 100644 GIT binary patch delta 18 acmccokLmJ1CU*I54vzXO&Kuc%_5%P<& delta 18 ZcmeDE$JG0eiCw;%gTpG*X(Kz^egHw#20j1) diff --git a/data/cds/chlorodb/fasta/NC_022811.fst.gz b/data/cds/chlorodb/fasta/NC_022811.fst.gz index de3b2020863814c7b0722181956c9801e14a2946..afcb33ec9ddfb14cf07b50b3ba61e86e8f9d72ea 100644 GIT binary patch delta 18 acmX^9pXvC2CU*I54vzXO&Kube><0i(O9&qT delta 18 acmX^9pXvC2CU*I54i2kKr;Y3f_5%P);RkL2 diff --git a/data/cds/chlorodb/fasta/NC_022812.fst.gz b/data/cds/chlorodb/fasta/NC_022812.fst.gz index 2f56d44c5b013d736f4a06cf52d7e8e075bd069e..5de6edd3d345e1a7156af335d429611245d8cf70 100644 GIT binary patch delta 18 ZcmZqs&(!vxiCw;%gQNb6^G5di{QyR22V4LE delta 18 ZcmZqs&(!vxiCw;%gTpG*X(N06egHxK2CD!7 diff --git a/data/cds/chlorodb/fasta/NC_022813.fst.gz b/data/cds/chlorodb/fasta/NC_022813.fst.gz index 8630fb96e255896b4a5648f57af08fccb3b3f829..5e0caeab10fe005de466ea37656f39170794ba97 100644 GIT binary patch delta 18 acmezQm+9wUCU*I54vzXO&Kuc3?E?T+;s~$+ delta 18 acmezQm+9wUCU*I54i2kKr;Y5N_5lDmjM7j9|m>+ diff --git a/data/cds/chlorodb/fasta/NC_022859.fst.gz b/data/cds/chlorodb/fasta/NC_022859.fst.gz index 25dbf639e74bc4581e41a2ca2e5d027adb78f43e..ed0469e2dae24c85c076d4db557f664de64ba64a 100644 GIT binary patch delta 18 ZcmZqr&D8XpiCw;%gQNb6^G5dSy#PgC2Sxw@ delta 18 ZcmZqr&D8XpiCw;%gTpG*X(M~}UI0M!29*E+ diff --git a/data/cds/chlorodb/fasta/NC_022868.fst.gz b/data/cds/chlorodb/fasta/NC_022868.fst.gz index ce1f67047efde1de8e3b4ed4330d33c977a0e808..bd06f3746354e8f0929a4f2964d4567dc9aab293 100644 GIT binary patch delta 18 acmbRFiD~91CU*I54vzXO&Kuchj diff --git a/data/cds/chlorodb/fasta/NC_023085.fst.gz b/data/cds/chlorodb/fasta/NC_023085.fst.gz index 28f13ab4e0cde671c39b604106787312dda73770..cd31af6f34a10cd0eef41e56aa15bb2e9e02bf96 100644 GIT binary patch delta 18 acmdn<0i$0|(at delta 18 acmZ4gpK1MnCU*I54i2kKr;Y3@_5%P%nFl5S diff --git a/data/cds/chlorodb/fasta/NC_023090.fst.gz b/data/cds/chlorodb/fasta/NC_023090.fst.gz index fe225c16dc197da86b440f2236babfac3a927a90..b7de5ef769954c5777d3427c54e6a1af173749b6 100644 GIT binary patch delta 18 acmbREiD}{|CU*I54vzXO&Kudeb^-uJPzK!q delta 18 ZcmbREiD}{|CU*I54i2kKr;Y4fI{`rE1}p#o diff --git a/data/cds/chlorodb/fasta/NC_023092.fst.gz b/data/cds/chlorodb/fasta/NC_023092.fst.gz index 58da494b293e6c40df8ffa82b6351a157bea21e8..b65077e62636093be6c069d346542f2504e6d19a 100644 GIT binary patch delta 18 ZcmbQ)!925rnO(k{gQNb6^G0@|BLF$N1}*>q delta 18 ZcmbQ)!925rnO(k{gTpG*X(PMP5dbw%1$_Vj diff --git a/data/cds/chlorodb/fasta/NC_023096.fst.gz b/data/cds/chlorodb/fasta/NC_023096.fst.gz index 26c1d021bce64307ccad255a3a212e653d87c643..f7d4474288aa9a1dffeba57cb97928fd6417bb01 100644 GIT binary patch delta 18 ZcmdlmjcLO)CU*I54vzXO&Kub^y8%8s22=n5 delta 18 ZcmdlmjcLO)CU*I54i2kKr;Y5I-2ge!1)~4} diff --git a/data/cds/chlorodb/fasta/NC_023097.fst.gz b/data/cds/chlorodb/fasta/NC_023097.fst.gz index ff23caf55dae44948f0e4292d044d1863c1261ad..68d9dfb170b15944fad25be5cc1f9862525946ae 100644 GIT binary patch delta 18 acmZ2IooV%SCU*I54vzXO&Kud6bOQiBs|Lpa delta 18 ZcmZ2IooV%SCU*I54i4)~r;Y4Ox&b;!1{VMT diff --git a/data/cds/chlorodb/fasta/NC_023102.fst.gz b/data/cds/chlorodb/fasta/NC_023102.fst.gz index ec4ae59bb8e2585aa7cc17fef7a6ee2a1fd9bc95..cb0e4af0d86219e6ed69d6db00d23856ad195b6c 100644 GIT binary patch delta 18 acmbRAo@vs1CU*I54vzXO&Kudgw*vr16bD!U delta 18 ZcmbRAo@vs1CU*I54i4)~r;Y60+W|qb2B-i4 diff --git a/data/cds/chlorodb/fasta/NC_023107.fst.gz b/data/cds/chlorodb/fasta/NC_023107.fst.gz index d441ae52a64d7289ad5fd2e4219a171a64c18c84..9016bec3a61980d2dda6562c57786f1ed5f92176 100644 GIT binary patch delta 18 acmZ4Vk!jIKCU*I54vzXO&Kuch?*ITug9nWO delta 18 acmZ4Vk!jIKCU*I54i4)~r;Y5hcK`rHAO_t4 diff --git a/data/cds/chlorodb/fasta/NC_023108.fst.gz b/data/cds/chlorodb/fasta/NC_023108.fst.gz index 87cb10fc1893cd6a6fdeddba9cb9d05195f63799..afdaa24e80f26691a1cf72be665b98260c905ef8 100644 GIT binary patch delta 18 acmezMf$7%=CU*I54vzXO&Kuc_cK`rWYzPwo delta 18 ZcmezMf$7%=CU*I54i4)~r;Y5zI{;4!2V(#L diff --git a/data/cds/chlorodb/fasta/NC_023109.fst.gz b/data/cds/chlorodb/fasta/NC_023109.fst.gz index 73f714a163b0c5201e73377bd464b89b4f70100c..abc16100c9068ef27bbb6a99505ee843d07fc806 100644 GIT binary patch delta 18 acmZ4dk!kTqCU*I54vzXO&Kue1>;M2rrU#G! delta 18 acmZ4dk!kTqCU*I54i4)~r;Y4$b^riGLk8dg diff --git a/data/cds/chlorodb/fasta/NC_023110.fst.gz b/data/cds/chlorodb/fasta/NC_023110.fst.gz index a0765814197c8d2b24d629fbb5bd724572757e5e..4e525776bfe31188134911be8d511a7e56250071 100644 GIT binary patch delta 18 acmX^9k?HtHCU*I54vzXO&Kube>;M2wk_Y?% delta 18 acmX^9k?HtHCU*I54i4)~r;Y3fb^riLF9%Ej diff --git a/data/cds/chlorodb/fasta/NC_023111.fst.gz b/data/cds/chlorodb/fasta/NC_023111.fst.gz index 63fa2960e8abaa5291a83f9db91c99c81ce75292..55caa6b8f976c48c8595dc70e4238f634a556c28 100644 GIT binary patch delta 18 ZcmeDA$kg+ZiCw;%gQNb6^G5d89RNjv2TK3| delta 18 ZcmeDA$kg+ZiCw;%gTp%0X(M~<4gf(O2Aco? diff --git a/data/cds/chlorodb/fasta/NC_023112.fst.gz b/data/cds/chlorodb/fasta/NC_023112.fst.gz index 81635946adb0b7b1b07f18fa43645395fe9cb98a..12c0e719cd5bdfa2e035a4065d65d74c5c6aa389 100644 GIT binary patch delta 18 acmdn@k!jyYCU*I54vvN^&Kudc?*ITyUI*d; delta 18 acmdn@k!jyYCU*I54i4)~r;Y5}cK`rK^an8j diff --git a/data/cds/chlorodb/fasta/NC_023113.fst.gz b/data/cds/chlorodb/fasta/NC_023113.fst.gz index d55e548e45b74b4984829ddd1598b879094b3ab9..c9bdfcb03668316ca7b55e2efe17da9fb1339919 100644 GIT binary patch delta 18 acmbRJk!kivCU*I54vvN^&KudM>;M2ql?QnM delta 18 acmbRJk!kivCU*I54i4)~r;Y4Wb^riFD+b5_ diff --git a/data/cds/chlorodb/fasta/NC_023114.fst.gz b/data/cds/chlorodb/fasta/NC_023114.fst.gz index 893c60eb2dbe0858d4face19acde66ccae41532b..2f94183ae797db3955341db7213224a726b136f9 100644 GIT binary patch delta 18 acmZ4Tk!i_CCU*I54vvN^&Kue1?f?Kt&?q diff --git a/data/cds/chlorodb/fasta/NC_023119.fst.gz b/data/cds/chlorodb/fasta/NC_023119.fst.gz index 578e3eb2ef92c4040d76ad95f55a9f1239643eb1..019d35709526a8d317232440f5fa56086d892ff1 100644 GIT binary patch delta 18 ZcmZpE#MJzViCw;%gQMY!^G5bR8vsLe2a5mz delta 18 ZcmZpE#MJzViCw;%gTp%0X(Rie4FEq12HF4s diff --git a/data/cds/chlorodb/fasta/NC_023120.fst.gz b/data/cds/chlorodb/fasta/NC_023120.fst.gz index 91a522e4da77268b65a9e3e89d55ea36cc3dfdbf..0d36ba228cc73b7dc3bd9516270b595c46c52d38 100644 GIT binary patch delta 18 ZcmZoY&eVFGiCw;%gQMY!^G5c%#Q;BO2F?Hg delta 18 ZcmZoY&eVFGiCw;%gTp%0X(M~xVgNe+1|0wZ diff --git a/data/cds/chlorodb/fasta/NC_023121.fst.gz b/data/cds/chlorodb/fasta/NC_023121.fst.gz index 9d991d1144e3d9e125045c5fe405089eb3b25c03..e14a6ee53aa4b851db74745034602cbb5ddfa4e4 100644 GIT binary patch delta 18 acmcbw; delta 18 ZcmaDmlkx3LMt1pb4i4)~r;Y5-d;mi*2A}`{ diff --git a/data/cds/chlorodb/fasta/NC_023133.fst.gz b/data/cds/chlorodb/fasta/NC_023133.fst.gz index e8913660a81574bd7e46cac65de2353a8823c075..737b2cf862f4ab6aa5a87fea711f002bb1a84a30 100644 GIT binary patch delta 21 ccmey>%krz2g%krz2g<0i;J_w8e delta 18 acmaF;pXv2~CU*I54i1}4r;Y4S_5%P<+XvhL diff --git a/data/cds/chlorodb/fasta/NC_023260.fst.gz b/data/cds/chlorodb/fasta/NC_023260.fst.gz index e21ff76eb8347aa11e95c683cb0193fd926c6f90..9a1046a5f6cc0bf4b538483b21ba0a10486217b8 100644 GIT binary patch delta 18 ZcmeC2#N0WFnO(k{gQMY!^G0^2lK?o(1{eSU delta 18 ZcmeC2#N0WFnO(k{gTp4%X(Kz+NdPoy1!w>O diff --git a/data/cds/chlorodb/fasta/NC_023261.fst.gz b/data/cds/chlorodb/fasta/NC_023261.fst.gz index 3da52d94feb22859012f1331903db39325c2a18e..a8aae66db34d879f6a6f2b265930139b442e2945 100644 GIT binary patch delta 18 acmeypi23&-W_I~*4vvN^&KucFE&>2bS_hT@ delta 18 Zcmeypi23&-W_I~*4i1}4r;Y3-7Xd~02Ic?& diff --git a/data/cds/chlorodb/fasta/NC_023356.fst.gz b/data/cds/chlorodb/fasta/NC_023356.fst.gz index e7e6ca5eec92d19f9ed60e61b74488dbd9924e41..ab0563eb8dde2adfb56a70a258a776eda73127e0 100644 GIT binary patch delta 18 ZcmccnkMZt5Mt1pb4vvN^&Kudo>H$#L2c7@` delta 18 ZcmccnkMZt5Mt1pb4i1}4r;Y4k^#DwD2JQd= diff --git a/data/cds/chlorodb/fasta/NC_023357.fst.gz b/data/cds/chlorodb/fasta/NC_023357.fst.gz index 945eb1201a5b8c778c969e73a9b11bab0beb044c..297fc4df294745d3694f4e3291ee56133813f502 100644 GIT binary patch delta 18 acmdn-nQ6yoCU*I54vvN^&Kub`?gRi!%Lml} delta 18 acmdn-nQ6yoCU*I54i1}4r;Y3zcLD%MXa^+# diff --git a/data/cds/chlorodb/fasta/NC_023358.fst.gz b/data/cds/chlorodb/fasta/NC_023358.fst.gz index 4952521818c2ed98e64e121f7268e4510644af51..a6a026c5084035bcdeea073603a152d36a4f3fcb 100644 GIT binary patch delta 18 acmbRAf@#tVCU*I54vvN^&Kudew*UY{KL*GE delta 18 ZcmbRAf@#tVCU*I54i1}4r;Y5~TL3@Y1{eSU diff --git a/data/cds/chlorodb/fasta/NC_023359.fst.gz b/data/cds/chlorodb/fasta/NC_023359.fst.gz index 0b5340c203a338f509121a51c39b64c6f499cba5..7082e25543302336aaa42808ad26b0d6ea6c042e 100644 GIT binary patch delta 18 ZcmeBu!PNVLiCw;%gQMY!^G0^IEdWE12DtzL delta 18 ZcmeBu!PNVLiCw;%gTp4%X(Kz^763mj1_=NF diff --git a/data/cds/chlorodb/fasta/NC_023360.fst.gz b/data/cds/chlorodb/fasta/NC_023360.fst.gz index cd23b216cc01f3e28715ad1a74059c8935c8dd22..4131bae3818d14e267ad14aabb89bba60d2c7d0a 100644 GIT binary patch delta 18 ZcmZqv$khCiiCw;%gQMY!^G5cX9RNg42QdHu delta 18 ZcmZqv$khCiiCw;%gTp4%X(M~h4gf#u27v$o diff --git a/data/cds/chlorodb/fasta/NC_023367.fst.gz b/data/cds/chlorodb/fasta/NC_023367.fst.gz index db8bdba31d4c5302add9273b67339aee1da089d1..d9d7f246c1ff58b8cdb38398e13453bd869f510b 100644 GIT binary patch delta 18 acmaF=mFfLgCU*I54vvN^&KucZ>;eE&j|hJN delta 18 acmaF=mFfLgCU*I54i1}4r;Y3{b^!oSEC=CU*I54vvN^&KudktOfv4f(Tdu delta 18 acmex;o$2>=CU*I54i1}4r;Y4iRs#S{9|x!a diff --git a/data/cds/chlorodb/fasta/NC_023463.fst.gz b/data/cds/chlorodb/fasta/NC_023463.fst.gz index a42e58d04d3ae4cfbef7540d294a1954d21ffeab..194372f2de1a5a9d05b401fa3f0ef9c509a6f371 100644 GIT binary patch delta 18 acmX^9g6a4RCU*I54vvN^&Kubswg3Q2eg|g& delta 18 ZcmX^9g6a4RCU*I54i1}4r;Y3mTL4EJ2DbnJ diff --git a/data/cds/chlorodb/fasta/NC_023464.fst.gz b/data/cds/chlorodb/fasta/NC_023464.fst.gz index 3012d9cb7a455f8efd802f7f43ec71b87fde6944..aa6a5308cd56de5089a882e675bab5422577ee5b 100644 GIT binary patch delta 18 ZcmZo!$k?)wkzKx& delta 18 ZcmcaLjq%nrMt1pb4i1}4r;Y5v-T*&91>pby diff --git a/data/cds/chlorodb/fasta/NC_023533.fst.gz b/data/cds/chlorodb/fasta/NC_023533.fst.gz index 2993d815bbb4308804e3677ba75bfd52ec84f8cd..b23be5d90b8cfcc09ed8a50da2712c0f6d1d783d 100644 GIT binary patch delta 18 acmaEUn(6szCU*I54vvN^&KubuECm2fOb7k| delta 18 acmaEUn(6szCU*I54i1}4r;Y3nmI44s=?6{# diff --git a/data/cds/chlorodb/fasta/NC_023544.fst.gz b/data/cds/chlorodb/fasta/NC_023544.fst.gz index e8a821f86125df39677baac88ce8343dd06580ca..d726e0fcd2ec7cb3d3496a4e7ca9eb458652522a 100644 GIT binary patch delta 18 acmezLi|NxZCU*I54vvN^&KudY_W}S@mIxI9 delta 18 ZcmezLi|NxZCU*I54i1}4r;Y5{djU@~2W0>N diff --git a/data/cds/chlorodb/fasta/NC_023775.fst.gz b/data/cds/chlorodb/fasta/NC_023775.fst.gz index 387974e46f41e6898dc55ae4d12f03329ca3d61f..5874dc759b2358617773c9223db482ff61f57ba0 100644 GIT binary patch delta 18 Zcmcb4hVkYZMt1pb4vvN^&Kuc-(f~>&2NeJS delta 18 Zcmcb4hVkYZMt1pb4i1}4r;Y4EX#hpS24w&M diff --git a/data/cds/chlorodb/fasta/NC_023785.fst.gz b/data/cds/chlorodb/fasta/NC_023785.fst.gz index e06219b78759aa96b7dd19dd1f672ceb047c0377..659c89497920b7cd15f85b6ca3d7537edc0a44a8 100644 GIT binary patch delta 18 acmdn8j(N*EW_I~*4vvN^&KucvuLA%=9|qq5 delta 18 Zcmdn8j(N*EW_I~*4i1}4r;Y5o*8x4e1}^{r diff --git a/data/cds/chlorodb/fasta/NC_023790.fst.gz b/data/cds/chlorodb/fasta/NC_023790.fst.gz index d272ebf2e24c5bc43b2fdf1f031b2f6da11b2e44..788a9365c87c0e0d39d6bc402ca62f22ecd1080c 100644 GIT binary patch delta 18 ZcmccG!F;uYnO(k{gQMY!^G0^RBLG452IBw# delta 18 ZcmccG!F;uYnO(k{gTp4%X(PMe5db}s1~UKv diff --git a/data/cds/chlorodb/fasta/NC_023792.fst.gz b/data/cds/chlorodb/fasta/NC_023792.fst.gz index 021b8079fff8702e26c305050dab8cba23ebdf36..422d175bd791648aa1a8fbcd8915e16321079771 100644 GIT binary patch delta 18 Zcmcc7!F;2GnO(k{gQMY!^G5c-BLG5P2J8R; delta 18 Zcmcc7!F;2GnO(k{gTp4%X(M~!5db~=20Q=& diff --git a/data/cds/chlorodb/fasta/NC_023798.fst.gz b/data/cds/chlorodb/fasta/NC_023798.fst.gz index ecc98fa8b8215d5686f3c595b4e057ab163d930d..1914d907771319a2c389404f8b64b1d03a01e902 100644 GIT binary patch delta 18 ZcmX@n$b6!anO(k{gQMY!^G5cA2LM1(2Pyyn delta 18 ZcmX@n$b6!anO(k{gTp4%X(Ri=0{}bj26_Mh diff --git a/data/cds/chlorodb/fasta/NC_023800.fst.gz b/data/cds/chlorodb/fasta/NC_023800.fst.gz index fd4c0e52893b776fe6a160072c1ddb7ae9da986f..1cf62bbbb1c8425c5f5e6eee81a6468708630854 100644 GIT binary patch delta 18 acmex&gX!N5CU*I54vxkv&Kudw*8l)f5(nh~ delta 18 Zcmex&gX!N5CU*I54i1}4r;Y68YXD5B2Q&Zx diff --git a/data/cds/chlorodb/fasta/NC_023801.fst.gz b/data/cds/chlorodb/fasta/NC_023801.fst.gz index 0bdf9fd117710c2d664c55601ef67ed1a9e08751..260fc2ef4a2018f4508268b91fb2b01b2f50bf7a 100644 GIT binary patch delta 18 Zcmey}&iuQbnO(k{gQM|^^G5bBhXF_q2h#um delta 18 Zcmey}&iuQbnO(k{gTp4%X(RiW!vI612OFDu diff --git a/data/cds/chlorodb/fasta/NC_023935.fst.gz b/data/cds/chlorodb/fasta/NC_023935.fst.gz index f4c887d5110977d56844bc1b6312360d0c9f99c6..6547c1d6d8baa5c2024b37a24dcd5d1b22609e65 100644 GIT binary patch delta 18 ZcmeCU#?*0*iCw;%gQM|^^G0^Y)c`=T27Ukl delta 18 ZcmeCU#?*0*iCw;%gTpq{X(K!1Y5+V=1uE delta 18 ZcmX@Jjp@ubCU*I54i4K)r;Y5cvjIV>21)<` diff --git a/data/cds/chlorodb/fasta/NC_024022.fst.gz b/data/cds/chlorodb/fasta/NC_024022.fst.gz index 2b0d96c68062ef51feef4e17b788c00460ff6bec..a99b2a5b7eb9c8b55978e82d6669e523cda0ba4d 100644 GIT binary patch delta 18 acmZ3qjcL&~CU*I54vxkv&KudKX9EC0PX>Gd delta 18 ZcmZ3qjcL&~CU*I54i4K)r;Y5=vjIEo13jjnQ27Ukl diff --git a/data/cds/chlorodb/fasta/NC_024038.fst.gz b/data/cds/chlorodb/fasta/NC_024038.fst.gz index a9ae660f2211479f5749f2c161cefc84652d2fb5..4862bd4c81c8e0f14a037c3b5d4234c8a16a543b 100644 GIT binary patch delta 18 acmZ3ujcMUFCU*I54vxkv&KudKW&;2~ECzW1 delta 18 ZcmZ3ujcMUFCU*I54i4K)r;Y4VvjIEF1<3#a diff --git a/data/cds/chlorodb/fasta/NC_024050.fst.gz b/data/cds/chlorodb/fasta/NC_024050.fst.gz index f817b27ac18ca97bb805cf48f3dc711610937c9f..ec11c385fb6c85fc28a488c5dab8bae165f8712c 100644 GIT binary patch delta 18 acmex+hWYOqW_I~*4vxkv&Kudwo&f+)(g+3s delta 18 Zcmex+hWYOqW_I~*4i4K)r;Y4o&j3qr2UY+8 diff --git a/data/cds/chlorodb/fasta/NC_024060.fst.gz b/data/cds/chlorodb/fasta/NC_024060.fst.gz index 13f644099a7f9e8c7e36937156f6bb2fc34e0254..064f3caba7c7e6cb1cf2ea2b96c867b6caa068d8 100644 GIT binary patch delta 18 ZcmccA&3vhwnO(k{gQM|^^G5d5M*%|d2VwvK delta 18 ZcmccA&3vhwnO(k{gTpq{X(RjTqX0gR2C@JE diff --git a/data/cds/chlorodb/fasta/NC_024061.fst.gz b/data/cds/chlorodb/fasta/NC_024061.fst.gz index e15d15f3ebfc03a672dd44506fc0728ebc346dd2..b7ecf3c896381cff6ce6344ffe836a8ba2e23788 100644 GIT binary patch delta 18 Zcmdnl!@RSHnO(k{gQM|^^G0@~V*oy;2ATi> delta 18 Zcmdnl!@RSHnO(k{gTpq{X(PMQF#tM41?m6* diff --git a/data/cds/chlorodb/fasta/NC_024062.fst.gz b/data/cds/chlorodb/fasta/NC_024062.fst.gz index 56dffffacdd49281aac3d9149e323c0a779c6ad7..412e1e496b718a65234665dcc60d1a4addfd3e65 100644 GIT binary patch delta 18 ZcmZ41!@R7AnO(k{gQM|^^G0_0V*or224MgI delta 18 ZcmZ41!@R7AnO(k{gTpq{X(PM*F#tEJ1+f4C diff --git a/data/cds/chlorodb/fasta/NC_024064.fst.gz b/data/cds/chlorodb/fasta/NC_024064.fst.gz index 2560ae11cd8245bcc97eb4738f2e86a1bd6c8f90..3a483f2ca1f34a8f0474fabdc133b9c3cb35de8e 100644 GIT binary patch delta 18 ZcmX@q&3vevnO(k{gQM|^^G5dFM*%>=2QmNv delta 18 ZcmX@q&3vevnO(k{gTpq{X(RjYqX0Z!27&+p diff --git a/data/cds/chlorodb/fasta/NC_024065.fst.gz b/data/cds/chlorodb/fasta/NC_024065.fst.gz index a8bb2f697410cf41d9b68ac20e6ffb3255756527..1cc6dba7fc64759fe260b25ad04f7de8cd5efeaa 100644 GIT binary patch delta 18 ZcmX@y#eBGnnO(k{gQMw+^G0@?qX0k52DAVG delta 18 ZcmX@y#eBGnnO(k{gTpq{X(PMMQ2;w)1_J;9 diff --git a/data/cds/chlorodb/models/blosum62.mat b/data/cds/chlorodb/models/blosum62.mat new file mode 100644 index 0000000..37f3f29 --- /dev/null +++ b/data/cds/chlorodb/models/blosum62.mat @@ -0,0 +1,29 @@ +# +# blosum62 substitution matrix +# with larger penalty for stops +# + A R N D C Q E G H I L K M F P S T W Y V B Z X * +A 4 -1 -2 -2 0 -1 -1 0 -2 -1 -1 -1 -1 -2 -1 1 0 -3 -2 0 -2 -1 0 -50 +R -1 5 0 -2 -3 1 0 -2 0 -3 -2 2 -1 -3 -2 -1 -1 -3 -2 -3 -1 0 -1 -50 +N -2 0 6 1 -3 0 0 0 1 -3 -3 0 -2 -3 -2 1 0 -4 -2 -3 3 0 -1 -50 +D -2 -2 1 6 -3 0 2 -1 -1 -3 -4 -1 -3 -3 -1 0 -1 -4 -3 -3 4 1 -1 -50 +C 0 -3 -3 -3 9 -3 -4 -3 -3 -1 -1 -3 -1 -2 -3 -1 -1 -2 -2 -1 -3 -3 -2 -50 +Q -1 1 0 0 -3 5 2 -2 0 -3 -2 1 0 -3 -1 0 -1 -2 -1 -2 0 3 -1 -50 +E -1 0 0 2 -4 2 5 -2 0 -3 -3 1 -2 -3 -1 0 -1 -3 -2 -2 1 4 -1 -50 +G 0 -2 0 -1 -3 -2 -2 6 -2 -4 -4 -2 -3 -3 -2 0 -2 -2 -3 -3 -1 -2 -1 -50 +H -2 0 1 -1 -3 0 0 -2 8 -3 -3 -1 -2 -1 -2 -1 -2 -2 2 -3 0 0 -1 -50 +I -1 -3 -3 -3 -1 -3 -3 -4 -3 4 2 -3 1 0 -3 -2 -1 -3 -1 3 -3 -3 -1 -50 +L -1 -2 -3 -4 -1 -2 -3 -4 -3 2 4 -2 2 0 -3 -2 -1 -2 -1 1 -4 -3 -1 -50 +K -1 2 0 -1 -3 1 1 -2 -1 -3 -2 5 -1 -3 -1 0 -1 -3 -2 -2 0 1 -1 -50 +M -1 -1 -2 -3 -1 0 -2 -3 -2 1 2 -1 5 0 -2 -1 -1 -1 -1 1 -3 -1 -1 -50 +F -2 -3 -3 -3 -2 -3 -3 -3 -1 0 0 -3 0 6 -4 -2 -2 1 3 -1 -3 -3 -1 -50 +P -1 -2 -2 -1 -3 -1 -1 -2 -2 -3 -3 -1 -2 -4 7 -1 -1 -4 -3 -2 -2 -1 -2 -50 +S 1 -1 1 0 -1 0 0 0 -1 -2 -2 0 -1 -2 -1 4 1 -3 -2 -2 0 0 0 -50 +T 0 -1 0 -1 -1 -1 -1 -2 -2 -1 -1 -1 -1 -2 -1 1 5 -2 -2 0 -1 -1 0 -50 +W -3 -3 -4 -4 -2 -2 -3 -2 -2 -3 -2 -3 -1 1 -4 -3 -2 11 2 -3 -4 -3 -2 -50 +Y -2 -2 -2 -3 -2 -1 -2 -3 2 -1 -1 -2 -1 3 -3 -2 -2 2 7 -1 -3 -2 -1 -50 +V 0 -3 -3 -3 -1 -2 -2 -3 -3 3 1 -2 1 -1 -2 -2 0 -3 -1 4 -3 -2 -1 -50 +B -2 -1 3 4 -3 0 1 -1 0 -3 -4 0 -3 -3 -2 0 -1 -4 -3 -3 4 1 -1 -50 +Z -1 0 0 1 -3 3 4 -2 0 -3 -3 1 -1 -3 -1 0 -1 -3 -2 -2 1 4 -1 -50 +X 0 -1 -1 -1 -2 -1 -1 -1 -1 -1 -1 -1 -1 -1 -2 0 0 -2 -1 -1 -1 -1 -1 -50 +* -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 1 diff --git a/data/cds/chlorodb/models/splice.none.frq b/data/cds/chlorodb/models/splice.none.frq new file mode 100644 index 0000000..3a1626c --- /dev/null +++ b/data/cds/chlorodb/models/splice.none.frq @@ -0,0 +1,6 @@ +# 3'/5' splice null model +# A C G T +25 25 25 25 +splice +25 25 25 25 +# end of 3'/5' splice null model diff --git a/data/cds/chlorodb/models/splice3.default.frq b/data/cds/chlorodb/models/splice3.default.frq new file mode 100644 index 0000000..4ba2d4c --- /dev/null +++ b/data/cds/chlorodb/models/splice3.default.frq @@ -0,0 +1,13 @@ +# 3' splice model : default +# A C G T +19 18 27 36 +36 5 34 25 +20 7 51 23 +29 13 14 44 +splice +5 2 78 15 +3 7 15 75 +4 1 83 12 +5 51 13 31 +5 7 79 9 +53 10 27 11 diff --git a/data/cds/chlorodb/models/splice3.ndha.frq b/data/cds/chlorodb/models/splice3.ndha.frq new file mode 100644 index 0000000..3584fe3 --- /dev/null +++ b/data/cds/chlorodb/models/splice3.ndha.frq @@ -0,0 +1,13 @@ +# 3' splice model : ndha +# A C G T +1 43 1 56 +0 57 0 42 +41 1 2 56 +57 42 0 1 +splice +1 55 42 2 +0 1 57 42 +1 1 43 56 +2 11 56 31 +1 29 42 28 +41 1 57 1 diff --git a/data/cds/chlorodb/models/splice3.psba.frq b/data/cds/chlorodb/models/splice3.psba.frq new file mode 100644 index 0000000..21a6d8a --- /dev/null +++ b/data/cds/chlorodb/models/splice3.psba.frq @@ -0,0 +1,13 @@ +# 3' splice model : psba +# A C G T +26 14 40 21 +13 44 35 9 +41 3 33 23 +1 13 5 81 +splice +37 5 27 31 +62 5 9 24 +56 13 23 8 +32 28 6 33 +35 21 17 28 +53 12 10 26 diff --git a/data/cds/chlorodb/models/splice5.default.frq b/data/cds/chlorodb/models/splice5.default.frq new file mode 100644 index 0000000..b5cb067 --- /dev/null +++ b/data/cds/chlorodb/models/splice5.default.frq @@ -0,0 +1,13 @@ +# 5' splice model : default +# A C G T +15 42 3 40 +15 46 6 33 +13 32 2 53 +45 17 21 16 +70 13 6 11 +21 39 8 32 +splice +37 27 9 26 +31 35 17 17 +29 23 26 22 +30 25 28 17 diff --git a/data/cds/chlorodb/models/splice5.ndha.frq b/data/cds/chlorodb/models/splice5.ndha.frq new file mode 100644 index 0000000..fdad60d --- /dev/null +++ b/data/cds/chlorodb/models/splice5.ndha.frq @@ -0,0 +1,13 @@ +# 5' splice model : ndha +# A C G T +0 54 2 44 +43 1 1 56 +57 1 7 35 +8 1 39 52 +56 2 40 2 +55 1 0 44 +splice +1 0 2 97 +40 1 1 58 +55 0 1 44 +1 41 1 58 diff --git a/data/cds/chlorodb/models/splice5.psba.frq b/data/cds/chlorodb/models/splice5.psba.frq new file mode 100644 index 0000000..7785836 --- /dev/null +++ b/data/cds/chlorodb/models/splice5.psba.frq @@ -0,0 +1,13 @@ +# 5' splice model : psba +# A C G T +38 15 9 37 +40 5 13 42 +41 15 6 37 +32 9 15 44 +22 8 10 60 +0 9 83 8 +splice +33 15 27 24 +31 6 26 37 +17 28 6 49 +13 15 23 49 diff --git a/data/cds/chlorodb/models/start.default.frq b/data/cds/chlorodb/models/start.default.frq new file mode 100644 index 0000000..aa16582 --- /dev/null +++ b/data/cds/chlorodb/models/start.default.frq @@ -0,0 +1,8 @@ +# start model : default +atg 0.9692592 36165 +acg 0.01173885 438 +gtg 0.007504288 280 +ata 0.003886149 145 +atc 0.00337693 126 +att 0.002840909 106 +ttg 0.001393654 52 diff --git a/data/cds/chlorodb/models/start.ndhd.frq b/data/cds/chlorodb/models/start.ndhd.frq new file mode 100644 index 0000000..893232b --- /dev/null +++ b/data/cds/chlorodb/models/start.ndhd.frq @@ -0,0 +1,7 @@ +# start model : ndhd +acg 0.5066667 190 +atg 0.3493333 131 +atc 0.05066667 19 +ata 0.03466667 13 +acc 0.02933333 11 +gtg 0.02933333 11 diff --git a/data/cds/chlorodb/models/start.rps19.frq b/data/cds/chlorodb/models/start.rps19.frq new file mode 100644 index 0000000..59a3169 --- /dev/null +++ b/data/cds/chlorodb/models/start.rps19.frq @@ -0,0 +1,3 @@ +# start model : rps19 +gtg 0.6261023 355 +atg 0.3738977 212 diff --git a/data/cds/chlorodb/models/stop.default.frq b/data/cds/chlorodb/models/stop.default.frq new file mode 100644 index 0000000..f5f76e5 --- /dev/null +++ b/data/cds/chlorodb/models/stop.default.frq @@ -0,0 +1,4 @@ +# stop model : default (freq. ignored) +taa 0.5742367 21968 +tag 0.2351265 8995 +tga 0.1906368 7293 diff --git a/data/cds/chlorodb/parameters.sh b/data/cds/chlorodb/parameters.sh new file mode 100644 index 0000000..75749a3 --- /dev/null +++ b/data/cds/chlorodb/parameters.sh @@ -0,0 +1,28 @@ +# sourced file + +set CORE_NCDS_CUTOFF = 200 +set CORE_START_ATG_CUTOFF = 50 +set CORE_START_DFT_CUTOFF = 50 +set CORE_START_OTH_CUTOFF = 10 +set CORE_STOP_CUTOFF = 200 +set CORE_SPLICE_CUTOFF = 50 + +set SHEL_NCDS_CUTOFF = 10 + +set CORE_DELTA = Inf +set CORE_COVMIN = 30 +set CORE_PMAX = 1e-6 +set CORE_IDMIN = 30 +set CORE_SIZMIN = 50 + +set SHEL_DELTA = 0.5 +set SHEL_COVMIN = 30 +set SHEL_PMAX = 1e-6 +set SHEL_IDMIN = 30 +set SHEL_SIZMIN = 10 + +set DUST_DELTA = 0.5 +set DUST_COVMIN = 30 +set DUST_PMAX = 1e-6 +set DUST_IDMIN = 30 +set DUST_SIZMIN = 10 diff --git a/detectors/cds/bin/go_pass1.sh b/detectors/cds/bin/do_exonerate.sh similarity index 85% rename from detectors/cds/bin/go_pass1.sh rename to detectors/cds/bin/do_exonerate.sh index 4f911a5..5fbe664 100755 --- a/detectors/cds/bin/go_pass1.sh +++ b/detectors/cds/bin/do_exonerate.sh @@ -1,21 +1,21 @@ #!/bin/csh -f # -# Annotate CDS - Pass1 +# Annotate CDS - Exonerate # #======================================================================================== # -# Annotate CDS of chlorodb/core proteins using exonerate +# Annotate CDS using exonerate # -# pass1.sh [] +# do_exonerate.sh [] # -# - : The fasta file containing the genome to annotate -# - : Name of the protein family (defined in chlorodb/core) +# - : The fasta file containing the genome to annotate +# - : The fasta file containing the protein family # -# Results are in file : `basename :r`..res +# Results are in file : `basename :r`.`basename :r`.res # #======================================================================================== # -# usage: go_pass1.sh fasta family [outdir] +# usage: do_exonerate.sh dna.fasta prot.fasta [outdir] # unsetenv ORG_SOURCED @@ -31,12 +31,14 @@ NeedArg 2 set GenoFile = $Argv[1] set GenoName = `basename $GenoFile:r` -set ProtName = $Argv[2] -set ProtDir = $CDS_DATA_DIR/chlorodb/core -set ProtFile = $ProtDir/$ProtName.fst + +set ProtFile = $Argv[2] +set ProtDir = `dirname $ProtFile` +set ProtName = `basename $ProtFile:r` NeedFile $GenoFile NeedFile $ProtFile +NeedFile $ProtDir/Annot.lst set OutDir = . if ($#Argv >= 3) set OutDir = $3 @@ -101,7 +103,7 @@ endif if ($PASS1_SPEEDUP != 0) then - $PROG_DIR/go_filterbx.sh $GenoFile $ProtFile \ + $PROG_DIR/do_filterbx.sh $GenoFile $ProtFile \ $PASS1_BLASTX_FILTER_IDMIN \ $PASS1_BLASTX_FILTER_NBMIN \ $PASS1_BLASTX_FILTER_NBMAX > D_$$ @@ -159,8 +161,7 @@ $AwkCmd -v MAX_SPAN=$PASS1_MAX_SPAN \ # get annotations # -egrep "^$ProtName " $CDS_DATA_DIR/chlorodb/core/Annot.lst |\ - awk '{print "c annot", $0}' > T_$$ +egrep "^$ProtName " $ProtDir/Annot.lst | awk '{print "c annot", $0}' > T_$$ # # extend start/stop diff --git a/detectors/cds/bin/go_filterbx.sh b/detectors/cds/bin/do_filterbx.sh similarity index 94% rename from detectors/cds/bin/go_filterbx.sh rename to detectors/cds/bin/do_filterbx.sh index 7213fa3..ea51b63 100755 --- a/detectors/cds/bin/go_filterbx.sh +++ b/detectors/cds/bin/do_filterbx.sh @@ -5,7 +5,7 @@ # # output on stdout # -# usage: go_filterbx.sh dna_fasta prot_fasta [idmin nbmin nbmax] +# usage: do_filterbx.sh dna.fasta prot.fasta [idmin nbmin nbmax] # unsetenv ORG_SOURCED diff --git a/detectors/cds/bin/go_cds.sh b/detectors/cds/bin/go_cds.sh index 2dae666..f38e053 100755 --- a/detectors/cds/bin/go_cds.sh +++ b/detectors/cds/bin/go_cds.sh @@ -13,7 +13,7 @@ # Results are printed to the standard output # #======================================================================================== -# usage: go_cds.sh fasta +# usage: go_cds.sh fasta [db_core] # unsetenv ORG_SOURCED @@ -22,13 +22,19 @@ source $ORG_HOME/scripts/csh_init.sh NeedArg 1 -set Fasta = $Argv[1] +set Fasta = $Argv[1]; Shift NeedFile $Fasta set Genome = `basename $Fasta:r` -NeedFile $CDS_DATA_DIR/chlorodb/core +set DbCore = $CDS_DATA_DIR/chlorodb/core + +if ($#Argv > 0) then + set DbCore = $Argv[1]; Shift +endif + +NeedFile $DbCore/Annot.lst # # run everything into temporary place @@ -44,15 +50,15 @@ endif # pass1: run exonerate # -set fams = `ls $CDS_DATA_DIR/chlorodb/core/*.fst` +set fams = `ls $DbCore/*.fst` -Notify "running pass1: exonerate of $Genome" +Notify "running pass1: exonerate of $Genome on $DbCore" foreach f ($fams) - set prot = `basename $f:r` - $PROG_DIR/go_pass1.sh $Fasta $prot $temp + $PROG_DIR/do_exonerate.sh $Fasta $f $temp end + # # pass2: transsplicing # diff --git a/detectors/cds/test/go_test.sh b/detectors/cds/test/go_test.sh index f778c9f..9e62ae4 100755 --- a/detectors/cds/test/go_test.sh +++ b/detectors/cds/test/go_test.sh @@ -1,5 +1,7 @@ #!/bin/csh -f +setenv Verbose 1 + setenv ORG_HOME `dirname $0`/../../.. source $ORG_HOME/scripts/csh_init.sh @@ -8,9 +10,9 @@ echo "+ testing CDS" setenv TMP_CLEANUP 0 setenv PASS1_SPEEDUP 1 setenv PASS1_SLOWDOWN 0 -setenv PASS1_BLASTX_FILTER_NBMAX 10 +setenv PASS1_BLASTX_FILTER_NBMAX 5 -`dirname $0`/../bin/go_cds.sh test.fst > test.bak +`dirname $0`/../bin/go_cds.sh test.fst test.db > test.bak diff -q test.bak test.ref >& /dev/null @@ -18,7 +20,7 @@ set stat = $status if ($stat == 0) then echo "+ $VTC[3]CDS test Ok$VTC[1]" - \rm -r test.bak test.tmp + \rm -r test.bak test.tmp test.db/*.fst.p?? else echo "* $VTC[2]CDS test Failure$VTC[1]" endif diff --git a/detectors/cds/test/test.db/Annot.lst b/detectors/cds/test/test.db/Annot.lst new file mode 100644 index 0000000..b1d9e74 --- /dev/null +++ b/detectors/cds/test/test.db/Annot.lst @@ -0,0 +1,18 @@ +atpf atpF 483 1:80_2:401_3:1_4:1 POLYEX ATP_synthase_CF0_B_subunit +ccsa ccsA 477 1:476_2:1 POLYEX cytochrome_c_biogenesis_protein +ndha ndhA 384 1:9_2:375 POLYEX NADH_dehydrogenase_subunit_1 +ndhb ndhB 699 1:5_2:693_3:1 POLYEX NADH_dehydrogenase_subunit_2 +ndhd ndhD 383 1:383 MONEX NADH_dehydrogenase_subunit_4 +ndhe ndhE 395 1:395 MONEX NADH_dehydrogenase_subunit_4L +ndhf ndhF 384 1:384 MONEX NADH_dehydrogenase_subunit_5 +ndhg ndhG 386 1:386 MONEX NADH_dehydrogenase_subunit_6 +ndhh ndhH 406 1:400_2:6 POLYEX NADH_dehydrogenase_subunit_7 +ndhi ndhI 386 1:386 MONEX NADH_dehydrogenase_subunit_I +psac psaC 498 1:491_2:4_3:3 POLYEX photosystem_I_subunit_VII +rpl2 rpl2 800 1:101_2:698_5:1 POLYEX ribosomal_protein_L2 +rpl23 rpl23 787 1:782_2:2_3:1_4:2 POLYEX ribosomal_protein_L23 +rpl32 rpl32 474 1:474 MONEX ribosomal_protein_L32 +rps15 rps15 480 1:479_2:1 POLYEX ribosomal_protein_S15 +rps7 rps7 853 1:853 MONEX ribosomal_protein_S7 +ycf1 ycf1 408 1:406_2:2 POLYEX hypothetical_chloroplast_RF1 +ycf2 ycf2 654 1:649_2:5 POLYEX Ycf2 diff --git a/detectors/cds/test/test.db/atpf.fst b/detectors/cds/test/test.db/atpf.fst new file mode 100644 index 0000000..350bddd --- /dev/null +++ b/detectors/cds/test/test.db/atpf.fst @@ -0,0 +1,50 @@ +>AC_000188@LyesCp071@atpf@11803@13043@R@2@185 ATP_synthase_CF0_B_chain +MKNVTDSFVSLGHWPSAGSFGFNTDILATNPINLSVVLGVLIFFGKGVLS +DLLDNRKQRILNTIRNSEELRGGAIEQLEKARSRLRKVETEAEQFRVNGY +SEIEREKLNLINSTYKTLEQLENYKNETIQFEQQRAINQVRQRVFQQALR +GALGTLNSCLNNELHLRTISANIGMLGTMKEITD +>NC_000925@PopuCp059@atpf@45392@45943@R@1@184 ATP_synthase_CF0_B_subunit +MNSIVNITPIIIILSEHSSEHTFGFNSDIFEANVINILLLLFGLIYVLKQ +SLGSTLNERQLKVLAAIQESEERLEQASSRLSESEKQLAQTQIIINQIKK +EAQLTAEKVRSSILAQGQIDIERLAITGKSNIETAEKQIRRQIQQQIAFL +ALKKVTLQLENQMSSDIQLRIIDNNIAKLGDQL +>NC_000926@GuthCp075@atpf@65505@66053@R@1@183 ATP_synthase_CF0_B_subunit +MDIISGFYNTINLAELSNAKTFGFNPNILEANVLNIAILLSGVIYLGRNF +LTSALESRQQKVTEAIQEAEERLQQANVKLLDAEKQLTQAQTVIEQIKKE +AEKTARTVKETILAQGKLDIERLTNNGKSSIEKAELQIKKQIQQHITDLA +IKKVSAQMETFMTDNLQVKVIDTNIASLGGKI +>NC_000927@NeolCp025@atpf@19121@19651@R@1@177 ATP_synthase_CF0_B_chain +MFHFLALTPLAHSEGFGLNTNILETNILNLAAVFALLAYVGTDFVSSLLK +TRKESILKSLRDADERYQDAVNQLKQALQELETARTNAAEIRRQSEINAE +AIRQRLELLTQEEMARLEEAKETIIKLEEEKAVAEVCTKVISMALVRAEK +KIISSMDEAMHRRVMDMYLNLLREVY +>NC_000932@ArthCp008@atpf@11529@12798@R@2@185 ATP_synthase_CF0_B_subunit +MKNLTDSFVYLGHWPSAGSFGFNTDILATNPINLSVVFGVLIFFGKGVLN +DLLDNRKQRILNTIRNSEELREGAIQQLENARARLRNVETEADKFRVNGY +SEIEREKLNLINSTYKTLKQLENYKNETILFEQQRTINQVRERVFQQALQ +GAIGTLNSCLSNELHLRTINANIGMFGTMKEITD +>NC_001319@MapoCp012@atpf@18468@19609@D@2@185 ATP_synthase_CF0_B_subunit +MENGTYFIISSNFWTIAGSFGLNTNLLETNLINLGVVLGLLVYFGKGVLS +NLLNNRKLTILNTIQDAEERYKEATDKLNQARTRLQQAKQKADDIRINGL +SQMEKEKQDLINAADEDSKRLEDSKNATIRFEKQRAIEQVRQQVSRLALE +RALETLKSRLNSELHLRMIDYHIGLLRAMESTIE +>NC_001320@OrsajCp021@atpf@32741@34111@D@2@181 ATP_synthase_CF0_B_subunit +MKNVTHSFVFLAHWPSAGSFGLNTDILATNLINLTVVVGVLIYFGKGVLK +DLLDNRKQRILSTIRNSEELRRGTIEQLEKARIRLQKVELEADEYRMNGY +SEIEREKANLINATSISLEQLEKSKNETLYFEKQRAMNQVRQRVFQQAVQ +GALGTLNSCLNTELHFRTIRANISILGAME +>NC_001603@EugrCp038@atpf@64813@66970@D@4@184 ATP_synthase_CF0_B_chain +MVIDNFNIFTIISNAKTFGINTNVFETNIINLAIVVGTLFYYGKLTLSDL +LKTRKKTIIKNILDIDEKIRSSQSSLYLAELEFENAAKKASLIRSNGTTF +CLKSFDIIRSSVNEDIKRLKQSKRLILRTEDKKSVREIFKNLYSQACQKA +KATIIKRLNSKIHKKIILKKMEKMSLKKLKPKY +>NC_001631@PithCp015@atpf@11663@12972@R@2@185 ATP_synthase_CF0_B_subunit +MKNVIDPFISLSYWPSAGGFGSNTNILETNIINSSVVLSVLIYFGKGVLS +NLLDNRKQKILETIRNSEELCKGAIDQLEKARACLRNVEMIADEIQVNGN +SQIEREKEDLLNTASDNLEQLEDPKNETIYSEQQRAFDQIRQQVSRQALR +RAIGTLNSRLNTELHLRTIDHNIGLLRTMMNTND +>NC_001666@ZemaCp019@atpf@35097@36479@D@2@184 ATP_synthase_CF0_B_subunit +MKNVTHSFVFLAHWPFAGSFGLNTDILATNLINLTVVVGVLIFFGKGVLK +DLLDNRKQRILSTIRNSEELRKGTLEQLEKARIRLQKVELEADEYRMNGY +SEIEREKENLINATSISLEQLEKSKNETLYFEKQRAMNQVRQQGFQQAVQ +GALGTLNSCLNTELHFRTIRANIGILGAIEWKR diff --git a/detectors/cds/test/test.db/ccsa.fst b/detectors/cds/test/test.db/ccsa.fst new file mode 100644 index 0000000..3a3b5f2 --- /dev/null +++ b/detectors/cds/test/test.db/ccsa.fst @@ -0,0 +1,78 @@ +>AC_000188@LyesCp084@ccsa@115765@116706@D@1@314 cytochrome_c_biogenesis_protein +MIFSTLEHILTHISFSIVSIVITIHLITFLVDEIVKLYDSSEKGIIVTFF +CITGLLVTRWVSSGHFPLSDLYESLIFLSWSFSLIHIIPYFKKNVLILSK +ITGPSAILTQGFATSGILTEIHQSGILVPALQSEWLIMHVSMMILGYAAL +LCGSLLSVALLVITFRKNRKLFSKSNVFLNESFFLGENVVENTSFFCTKN +YYRSQLIQQLDYWSYRVISLGFTFLTIGILSGAVWANEAWGSYWNWDPKE +TWAFITWIVFAIYLHTRTNRNLRGPNSAIVASIGFLIIWICYFGVNLLGI +GLHSYGSFPSTFN +>NC_000925@PopuCp184@ccsa@160407@161366@D@1@320 cytochrome_c_biogenesis_protein +MNLEMMQNSCVNFAFGGLLTAMLVYWSSLAFPRISGLNKLAALITLLVNI +ALALTLSSRWFANGYFPLSNLYESLLFLAWGLTFVHLFIESKTKSRLIGA +VSIPVAMFVTAFASLALPIEMQKASPLVPALKSNWLMMHVSIMMISYSIL +ILGSLLSILFLIITRGQDINLKGSSVGTGSYTVKSLDSNPSFAFSNPSGI +VQEQSNMLINSTRMNLLESIDNLSYRIIGLGFPLLTIGIVAGAVWANEAW +GSYWSWDPKETWALITWLIFAAYLHCRITKSWQGKRPAILASVGFLVVWI +CYLGVNFLGKGLHSYGWLA +>NC_000926@GuthCp037@ccsa@33657@34562@R@1@302 cytochrome_c_biogenesis_protein +MFNVQFDIFNFSNNITFLTLLISLISYWLGLIFKKIKNVFYIGYGSTILA +CITITIILGTRWIESGYFPLSNLYESLMFLTWGLLFSAIYLEYKTNLYLI +GAIVSPISLFIVSFSTLSLPQDMQKAAPLVPALKSNWLMMHVSVMMLSYS +TLIIGSLLAILYLVLIKAQQKKHSLKDFAFANLEFTFPKSTNSTNFNLLE +TLDNLSYRTIGFGFPLLTIGIIAGAVWANEAWGTYWSWDPKETWALITWL +VFAAYLHARITKSWTGERPAYLAALGFVVVWICYLGVNFLGKGLHSYGWL +N +>NC_000927@NeolCp108@ccsa@128438@129259@D@1@274 cytochrome_c_biogenesis_protein +MSTFSILSLVAFATLFVTMLLYFFQRQPLARQSMWIAHTSLAGLLLLRWV +QSGHFPLSNLYESCLFLSWAVTLGHFVVEKDASRAGFLDLGIFTAPMAFF +VYAFATFSLPPTMQEAGPLVPALRSHWLMMHVTLMILSYAALLFGSVLSL +AFLVITTGPRKNSEKLQSLASTFDTLSYRTLGIGFPLLTVGILSGAVWAN +EAWGSYWSWDPKETWALITWLIFAIYLHSRLTYGWNGQKAALIASVGFFL +IWICYLGVNLLGKGLHSYGWLTS +>NC_000927@NeolCp129@ccsa@163667@164488@R@1@274 cytochrome_c_biogenesis_protein +MSTFSILSLVAFATLFVTMLLYFFQRQPLARQSMWIAHTSLAGLLLLRWV +QSGHFPLSNLYESCLFLSWAVTLGHFVVEKDASRAGFLDLGIFTAPMAFF +VYAFATFSLPPTMQEAGPLVPALRSHWLMMHVTLMILSYAALLFGSVLSL +AFLVITTGPRKNSEKLQSLASTFDTLSYRTLGIGFPLLTVGILSGAVWAN +EAWGSYWSWDPKETWALITWLIFAIYLHSRLTYGWNGQKAALIASVGFFL +IWICYLGVNLLGKGLHSYGWLTS +>NC_000932@ArthCp073@ccsa@114461@115447@D@1@329 cytochrome_c_biogenesis_protein +MIFSILEHILTHISFSVVSIVLTIYFLTLLVNLDEIIGFFDSSDKGIIIT +FFGITGLLLTRWIYSGHFPLSNLYESLIFLSWAFSIIHMVSYFNKKQQNK +LNTITAPSVIFIQGFATSGLLNKMPQSAILVPALQSQWLMMHVSMMILGY +GALLCGSLLSIALLVITFRKVGPTFWKKNIKKNFLLNELFSFDVLYYINE +RNSILLQQNINFSFSRNYYRYQLIQQLDFWSFRIISLGFIFLTVGILSGA +VWANETWGSYWNWDPKETWAFITWTIFAIYLHIKTNRNVRGINSAIVALI +GFILIWICYFGVNLLGIGLHSYGSFTSN +>NC_001319@MapoCp078@ccsa@95482@96444@D@1@321 cytochrome_c_biogenesis_protein +MPFITLERILAHTSFFLLFFVTFIYWGKFLYINIKPITILGEISMKIACF +FITTFLLIRWSSSGHFPLSNLYESSMFLSWSFTLIHLILENKSKNTWLGI +ITAPSAMLTHGFATLSLPKEMQESVFLVPALQSHWLMMHVTMMMLSYSTL +LCGSLLAITILIITLTKQKNLPILTSYFNFPFNSFIFKNLLQPMENEILS +YKTQKVFSFINFRKWQLIKELDNWSYRVISLGFPLLTIGILSGAVWANEA +WGSYWNWDPKETWALITWLIFAIYLHTRMIKGWQGKKPAIIASLGFFIVW +ICYLGVNLLGKGLHSYGWLI +>NC_001320@OrsajCp087@ccsa@105236@106201@D@1@322 cytochrome_c_biogenesis_protein +MLFATLEHILTHISFSTISIVITIHLITLLVRELGGLRDSSEKGMIATFF +CITGFLVSRWASSGHFPLSNLYESLIFLSWALYILHMIPKIQNSKNDLST +ITTPSTILTQGFATSGLLTEMHQSTILVPALQSQWLMMHVSMMLLSYATL +LCGSLLSAALLMIRFRKNLDFFSKKKKNVLSKTFFFNEIEYFYAKRSALK +STFFPLFPNYYKYQLIERLDSWSYRVISLGFTLLTIGILCGAVWANEAWG +SYWNWDPKETWAFITWTIFAIYLHSRTNPNWKGTKSAFVASIGFLIIWIC +YFGINLLGIGLHSYGSFTLPI +>NC_001631@PithCp147@ccsa@104925@105887@R@1@321 cytochrome_c_biogenesis_protein +MIFITLEHILAHISFSLILVVTLIYWGTLVYRIEGLSSSGGKGMIVTFLC +TTGLLINRWLYSGHLPLSNLYESFMFLSWSSSVFHILLEVRSRDDRWLGA +ITAPSAMLTHGFATLGLPEEMQRSGMLVPALQSHWSMMHVSMILFSYATL +LCGSLASIALLVIMSGVNRQVIFGAMDNLFSRAILPNENFYSHEKQKSDL +QYTVYFSSTNYRKCQLIKQLDHWSYRAIGLGFSLSTIGTLSGAIWANEAW +GSYWSWDPKETWALITWTIFAIYLHTRMNKGWQGEEPAIVASLGFFIVWI +RYLGVNLLGIGLHSYGWLEP +>NC_001666@ZemaCp085@ccsa@108995@109960@D@1@322 cytochrome_c_biogenesis_protein +MLFATLEHILTHISFSTISIVITIHLITLLVRELRGLRDSSEKGMIATFF +SITGFLVSRWVSSGHFPLSNLYESLIFLSWTLYILHTIPKIQNSKNDLST +ITTPSTILTQGFATSGLLTEMHQSTILVPALQSQWLMMHVSMMLLSYATL +LCGSLLSAALLIIRFRKNFDFFSLKKNVFLKTFFFSEIEYLYAKRSALKN +TSFPVFPNYYKYQLTERLDSWSYRVISLGFTLLTVGILCGAVWANEAWGS +YWNWDPKETWAFITWTIFAIYLHSRKNPNWKGTNSALVASIGFLIIWICY +FGINLLGIGLHSYGSFTLPSK diff --git a/detectors/cds/test/test.db/ndha.fst b/detectors/cds/test/test.db/ndha.fst new file mode 100644 index 0000000..16cef4f --- /dev/null +++ b/detectors/cds/test/test.db/ndha.fst @@ -0,0 +1,90 @@ +>AC_000188@LyesCp085@ndha@121113@123337@R@2@364 NADH_dehydrogenase_subunit_1 +MIIDTTEIETINSFSKLESLKEVYGIIWMLVPIVTLVLGITIGVLVIVWL +EREISAGIQQRIGPEYAGPLGILQALADGTKLLLKENLIPSTGDTRLFSI +GPSIAVISIFLSYSVIPFGDHLVLADLSIGVFFWIAISSIAPVGLLMSGY +GSNNKYSFLGGLRAAAQSISYEIPLALCVLSISLLSNSLSTVDIVEAQSK +YGFWGWNLWRQPIGFIVFLISSLAECERLPFDLPEAEEELVAGYQTEYSG +IKFGLFYIASYLNLLVSSLFVTVLYLGGWNLSIPYIFVPDIFGINKGGKV +FGTLIGIFITLAKTYLFLFIPIATRWTLPRLRMDQLLNLGWKFLLPISLG +NLLLTTSSQLLSL +>NC_000927@NeolCp116@ndha@144380@145468@D@1@363 NADH_dehydrogenase_subunit_1 +MTYVLDLKRSFLDACTWLIGDNFRDLGSVLWVPLPILSLVIVATLGVLVI +VWLERKISAGVQQRVGPEYGGALGLLQPLADGLKLVFKEDVVPAKSDTWL +FTLGPAVVVIPIFLAYLVVPFGQQLIIADLRIGIFFWIAISSIAPIGLLM +SGYGSNNKYSFLGGLRAAAQSISYELPLAICVLSVCLLADSLSTVDIVES +QSSWGILTWNIWRQPIGFVAFLIAALAECERLPFDLPEAEEELVAGYQTE +YTGMKFGLFYVGSYVNLLVSGCFVTVLYLGGWHGPFAIDGILPDSPPFQV +LDAFLGITWTLLKTFLFLFAAILTRWTLPRVRIDQLLDLGWKFLLPVSLG +NLLLTASLKLLF +>NC_000932@ArthCp079@ndha@119847@122009@R@2@361 NADH_dehydrogenase_subunit_1 +MIIYATAVQTINSFVKLESLKEVYGLIWIFVPIFSLVLGIITGVLVIVWL +EREISAGIQQRIGPEYAGPLGILQALADGTKLLFKENLRPSRGNTPLFSI +GPSIAVISILLSYSVIPFSNHLVLADLNIGIFLWIAISSIAPIGLLMSGY +GSNNKYSFLGGLRAAAQSISYEIPLTLCVLSISLLSNSLSTVDIVEAQSK +YGFWGWNLWRQPIGFIIFLISSLAECERLPFDLPEAEEELIAGYQTEYSG +IKFGLFYVASYLNLLISSLFVTVLYLGGWNISIPYISILELFQRDQIFGT +TIGIFITLAKTYLFLFVSIATRWTLPRLRMDQLLNLGWKFLLPISLGNLL +LTTSFQLFSL +>NC_001319@MapoCp084@ndha@100382@102200@R@2@369 NADH_dehydrogenase_subunit_1 +MISNINLEDKFFSFFFTLGFSKEFFNFLWIIFSILILMLGVTIGVLVLVW +LERKISAAIQQRIGPEYAGPLGIIQALADGIKLFLKEDIVPAQGDVWLFN +IGPILVLIPVFLSYLVIPFEYNVILANFSIGVFFWIAVSSVVPLGLLMAG +YGSNNKYSFLGGLRAAAQSISYEIPLALSVLSIALLSNSLSTVDIVEAQS +KYGFLSWNLWRQPIGFIVFFIASLAECERLPFDLPEAEEELVAGYQTEYS +GMKFAFFYLASYLNLLVSSLFVTILYLGGWHFSIPFFSLFKNFEWNLMSN +GISEVISIIIGIVITLVKSYLFLFISIMTRWTLPRIRIDQLLNLGWKFLL +PIALGNLLLTTSFQLFLL +>NC_001320@OrsajCp093@ndha@110631@112706@R@2@363 NADH_dehydrogenase_subunit_1 +MIIDRVQVEAINSFSNLELLKEVYGLIWILPILTLLLGITIEVLVIVWLE +REISASIQQRIGPEYAGPLGLLQAIADGTKLLFKEDILPSRGDIPLFSIG +PSIAVISILLSFLVIPLGYRFVLADLSIGVFLWIAISSIAPIGLLMAGYS +SNNKYSFSGGLRAAAQSISYEIPLTFCVLAISLLSNSSSTVDIVEAQSKY +GFFGWNLWRQPIGFLVFLISSLAECERLPFDLPEAEEELVAGYQTEYSGI +KYGLFYLVSYLNLLVSSLFVTVLYLGGWNLSIPYISFFGFFQMNKMVGIL +EMTMSIFITLTKAYLFLFISITIRWTLPRMRMDQLLNLGWKFLLPISLGN +LLLTTSSQLVSL +>NC_001666@ZemaCp091@ndha@114343@116454@R@2@363 NADH_dehydrogenase_subunit_1 +MIIDRVEVETINSFSKSELFKEIYGLIWILPIFALLLGITIEVLVIVWLE +REISASIQQRIGPEYAGPLGLLQAIADGTKLLLKEDILPSRGDIPLFSIG +PSIAVISILLSFLVIPLGYRFVLADLSIGVFLWIAISSIAPIGLLMAGYS +SNNKYSFSGGLRAAAQSISYEIPLTFCVLAISLLSNSSSTVDIVEAQSKY +GFFGWNLWRQPIGFLVFLISSLAECERLPFDLPEAEEELVAGYQTEYSGI +KYGLFYLVSYLNLLVSSLFVTVLYLGGWNFSIPYISFFGFFQMNKIIGIL +EMVIGIFITLTKAYLFLFISITIRWTLPRMRMDQLLNLGWKFLLPISLGN +LLLTTSSQLVSL +>NC_001879@NitaCp088@ndha@121696@123935@R@2@364 NADH_dehydrogenase_subunit_1 +MIIDTTEIETINSFSKLESLKEVYGIIWMLFPILTLVLGITIGVLVIVWL +EREISAGIQQRIGPEYAGPLGILQALADGTKLLLKENLIPSTGDTRLFSI +GPSIAVISIFLSYSVIPFGDHLVLADLSIGVFFWIAISSIAPVGLLMSGY +GSNNKYSFLGGLRAAAQSISYEIPLALCVLSISLLSNSLSTVDIVEAQSK +YGFWGWNLWRQPIGFIVFLISSLAECERLPFDLPEAEEELVAGYQTEYSG +IKFGLFYIASYLNLLVSSLFVTVLYLGGWNLSIPYIFVPELFGINKRGKV +FGTLIGIFITLAKTYLFLFIPIATRWTLPRLRMDQLLNLGWKFLLPISLG +NLLLTTSSQLLSL +>NC_002186@MeviCp102@ndha@106489@107592@R@1@368 NADH_dehydrogenase_subunit_1 +MLLTINLKDSFLTFFSNLGFSNEFSKALWIPLPILLLIILAVVGVLVVVW +LERKISAAVQQRIGPEYAGPLGVLQPLADGLKLAFKEDIIPSKGDVLLFT +LGPAIVVIPIFLSYLIVPFGENLIVSNINLGIFFWITVSSVAPLGLLMSG +YGSNNKYSFLGGLRATAQSLSYEIPLALCVLSICLLSDSLSTIDIVQKQS +TYGILGWNIWRQPIGFIAFIIAALAECERLPFDLPEAEEELVAGYQTEYT +GMKFGLFYIGSYVNLLVSALFASVLYLGGWSLPIPIEFLLNKMSLNASDS +EVQVISAFLGIGMTLLKTYLFLFLSILTRWTMPRVRIDQLLDLGWKFLLP +ISLGNLLLTASLKIALL +>NC_002202@SpolCp090@ndha@117598@119774@R@2@366 NADH_dehydrogenase_subunit_1 +MIIDTTTTKVQAINSFSRLEFLKEVYETIWMLFPILILVLGITIGVLVIV +WLEREISASIQQRIGPEYAGPLGILQALADGTKLLFKENLLPSRGDTYLF +SIGPSIAVISILLGYLIIPFGSRLVLADLSIGVFLWIAVSSIAPIGLLMS +GYGSNNKYSFLGGLRAAAQSISYEIPLTLCVLSISLLSNSSSTVDIVEAQ +SKYGFWGWNLWRQPIGFIVFIISSLAECERLPFDLPEAEEELVAGYQTEY +SGIKFGLFYVASYLNLLISSLFVTVLYLGGWNLSIPYIFISEFFEINKID +GVFGTTIGIFITLAKTFLFLFIPITTRWTLPRLRMDQLLNLGWKFLLPIS +LGNLLLTTSSQLFSL +>NC_002693@OeelhCp102@ndha@125123@127258@R@2@364 NADH_dehydrogenase_subunit_1 +MIIDTTAVQDMNSFSRLQSLKEVSGIIWMLVPILSLVLGITLGVLVIVWL +EREISAGIQQRIGPEYAGPMGILQALADGIKLIFKENLLPSRGDTRLFSI +GPSIAVISILLSYSVIPFSSHLVLSDLNIGVFLWIAVSSIAPIGLLMSGY +GSNNKYSFLGGLRAAAQSISYEIPLTLCLLSISLLSNSSSTVDIVEAQSK +YGLWGWNLWRQPIGFLVFLISSLAECERLPFDLPEAEEELVAGYQTEYSG +IKFGLFYVASYLNLLVSSLFVTVLYLGGWNISISYIFVPGLFEITKVGRV +FGTTIGIFTTLAKTYLFLFISITTRWTLPRLRMDQLLNLGWKFLLPISLG +NLLLTTSSQLLSL diff --git a/detectors/cds/test/test.db/ndhb.fst b/detectors/cds/test/test.db/ndhb.fst new file mode 100644 index 0000000..a674c53 --- /dev/null +++ b/detectors/cds/test/test.db/ndhb.fst @@ -0,0 +1,120 @@ +>AC_000188@LyesCp066@ndhb@96224@98435@R@2@511 NADH_dehydrogenase_subunit_2 +MIWHVQNENFILDSTRIFMKAFHLLLFDGSLIFPECILIFGLILLLMIDS +TSDQKDIPWLYFISSTSLVMSITALLFRWREEPMISFSGNFQTNNFNEIF +QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI +TIFVAPECFSLCSYLLSGYTKKDVRSNEATMKYLLMGGASSSILVHGFSW +LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGIGFKLSPAPSH +QWTPDVYEGSPTPVVAFLSVTSKVAASASATRIFNIPFYFSSNEWHLLLE +ILAILSMILGNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS +MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL +CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVLIGLLTSVVSIYYYLKI +IKLLMTGRNQEITPHVRNYRRSPLRSNNSIELSMIVCVIASTIPGISMNP +IIAIAQDSLF +>AC_000188@LyesCp086@ndhb@142909@145120@D@2@511 NADH_dehydrogenase_subunit_2 +MIWHVQNENFILDSTRIFMKAFHLLLFDGSLIFPECILIFGLILLLMIDS +TSDQKDIPWLYFISSTSLVMSITALLFRWREEPMISFSGNFQTNNFNEIF +QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI +TIFVAPECFSLCSYLLSGYTKKDVRSNEATMKYLLMGGASSSILVHGFSW +LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGIGFKLSPAPSH +QWTPDVYEGSPTPVVAFLSVTSKVAASASATRIFNIPFYFSSNEWHLLLE +ILAILSMILGNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS +MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL +CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVLIGLLTSVVSIYYYLKI +IKLLMTGRNQEITPHVRNYRRSPLRSNNSIELSMIVCVIASTIPGISMNP +IIAIAQDSLF +>NC_000927@NeolCp033@ndhb@28430@29950@D@1@507 NADH_dehydrogenase_subunit_2 +MELSDILASFHASNLIPEGIVACTILLVLLLDLVYSRTCHAWLAWVAMAG +LSLASVLLGQQWYQLMNLPTATMTFGGSFQADSLSLVFRAIIAMSCVLCI +LLSIDYVESTGTAPSEFLVLIATASLGGMLVAGSNDLLMMFVSLETLGLA +SYLLTGYMKRDVRSNEASLKYLLVGAASSGLFLYGISWMYGISGGHMELN +SIAHAIVSLDETKTTTCALALVLMTVGVGFKVAAAPFHQWTPDVYQGSPT +PVVAFLSVGSKAAGFILAVRMCTTLFPSFNTEWHLIFTILSILSMIVGNF +IAVTQTSLKRMLGYSSVGQAGVMMIGMLTDSPDGYASLIVYLLIYLFMNL +GAFACVILFGLRTGTDQIQDYSGLLARDPFLALCLSLCLLSLGGIPPLAG +FFGKMYLFLAAWDAGQYSLVWVGLITSVVSIYYYLSVVKIMLVPATQEMS +LAVREYPRRAWSLEPIQPLEVGIFVCVLGSILVGVAGNSMVNLMTITMSQ +APSLGV +>NC_000932@ArthCp068@ndhb@94941@97164@R@2@513 NADH_dehydrogenase_subunit_2 +MIWHVQNENFILDSTRIFMKAFHLLLFDGSFIFPECILIFGLILLLMIDS +TSDQKDIPWLYFISSTSFVMSITALLFRWREEPMISFSGNFQTNNFNEIF +QFLILLCSTLCIPLSVEYIECTEMAITEFLLFILTATLGGMFLCGANDLI +TIFVAPECFSLCSYLLSGYTKKDIRSNEATMKYLLMGGASSSILVHGFSW +LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGIGFKLSLAPSH +QWTPDVYEGSPTPVVAFLSVTSKVAASASATRIFDIPFYFSSNEWHLLLE +ILAILSMIFGNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNGGYAS +MITYMLFYIAMNLGTFACIILFGLRTGTDNIRDYAGLYTKDPFLALSLAL +CLLSLGGLPPLAGFFGKLHLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI +IKLLMTGRNQEITPHMRNYRISPLRSNNSIELSMIVCVIASTIPGISMNP +IIAIAQDTLFSF +>NC_000932@ArthCp086@ndhb@141485@143708@D@2@513 NADH_dehydrogenase_subunit_2 +MIWHVQNENFILDSTRIFMKAFHLLLFDGSFIFPECILIFGLILLLMIDS +TSDQKDIPWLYFISSTSFVMSITALLFRWREEPMISFSGNFQTNNFNEIF +QFLILLCSTLCIPLSVEYIECTEMAITEFLLFILTATLGGMFLCGANDLI +TIFVAPECFSLCSYLLSGYTKKDIRSNEATMKYLLMGGASSSILVHGFSW +LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGIGFKLSLAPSH +QWTPDVYEGSPTPVVAFLSVTSKVAASASATRIFDIPFYFSSNEWHLLLE +ILAILSMIFGNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNGGYAS +MITYMLFYIAMNLGTFACIILFGLRTGTDNIRDYAGLYTKDPFLALSLAL +CLLSLGGLPPLAGFFGKLHLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI +IKLLMTGRNQEITPHMRNYRISPLRSNNSIELSMIVCVIASTIPGISMNP +IIAIAQDTLFSF +>NC_001319@MapoCp003@ndhb@1514@3555@D@2@502 NADH_dehydrogenase_subunit_2 +MKLELDMFFLYGSTILPECILIFSLLIILIIDLTFPKKDTIWLYFISLTS +LLISIIILLFQYKTDPIISFLGSFQTDSFNRIFQSFIVFCSILCIPLSIE +YIKCAKMAIPEFLIFILTATVGGMFLCGANDLVTIFVSLECLSLCSYLLC +GYTKRDIRSNEAAIKYLLIGGTSSSILAYGFSWLYGLSGGETNIQKITNG +LLNAETYNSSGTFIAFICILVGLAFKLSLVPFHQWTPDIYEGSPTPVVAF +LSVTSKIAGLALATRILNILFSFSPNEWKIFLEILAILSMILGNLVAITQ +TSMKRMLAYSSISQIGYILIGLITGDLKGYTSMTIYVFFYIFMNLGTFAC +IILYSLRTGTDNIRDYAGLYIKDPLLSFSLTLCLLSLGGLPPLTGFFGKL +YLFWCGWQSGFYLLVFIALITSVISLYYYLKIIKLILTKKNNEINPYIQA +YIITSPTFFSKNPIEFVMIFCVLGSTFLGIIINPIFSFFQDSLSLSVFFI +K +>NC_001320@OrsajCp075@ndhb@85395@87639@R@2@511 NADH_dehydrogenase_subunit_2 +MIWHVQNENFILDSTRIFMKAFHLLLFQGSFIFPECILIFGLILLLMIDL +TSDQKDRPWFYFISSTSLVISITALLFRWREEPIISFSGNFQTNNFNEIF +QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI +TIFVAPECFSLCSYLLSGYTKRDLRSNEATMKYLLMGGASSSILVHGFSW +LYGSSGGEIELQEIVNGLINTQMYNSPGISIALISITVGLGFKLSPAPFH +QWTPDVYEGSPTPVVAFLSVTSKVAASASATRILDIPFYFSSNEWHLLLE +ILAILSMILGNLLAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS +MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL +CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI +VKLLMTGRNQEITPYVRNYRRSPLRSNNSIELSMTVCVIASTIPGISMNP +ILAIAQDTLF +>NC_001320@OrsajCp104@ndhb@127479@129723@D@2@511 NADH_dehydrogenase_subunit_2 +MIWHVQNENFILDSTRIFMKAFHLLLFQGSFIFPECILIFGLILLLMIDL +TSDQKDRPWFYFISSTSLVISITALLFRWREEPIISFSGNFQTNNFNEIF +QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI +TIFVAPECFSLCSYLLSGYTKRDLRSNEATMKYLLMGGASSSILVHGFSW +LYGSSGGEIELQEIVNGLINTQMYNSPGISIALISITVGLGFKLSPAPFH +QWTPDVYEGSPTPVVAFLSVTSKVAASASATRILDIPFYFSSNEWHLLLE +ILAILSMILGNLLAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS +MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL +CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI +VKLLMTGRNQEITPYVRNYRRSPLRSNNSIELSMTVCVIASTIPGISMNP +ILAIAQDTLF +>NC_001666@ZemaCp075@ndhb@89236@91472@R@2@511 NADH_dehydrogenase_subunit_2 +MIWHVQNENFILDSTRIFMKAFHLLLFHGSFIFPECILIFGLILLLMIDL +TSDQKDRPWFYFISSTSLVISITALLFRWREEPIISFSGNFQTNNFNEIF +QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI +TIFVAPECFSLCSYLLSGYTKRDLRSNEATMKYLLMGGASSSILVHGFSW +LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGLGFKLSPAPFH +QWTPDVYEGSPTPVVAFLSVTSKVAASALATRILDIPFYFSSNEWHLLLE +ILAILSMILGNLLAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS +MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL +CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI +IKLLMTGRNQEITPYVRNYRRSPLRSNNSIELSMTVCVIASTIPGISMNP +ILAIAQDTLF +>NC_001666@ZemaCp101@ndhb@131265@133501@D@2@511 NADH_dehydrogenase_subunit_2 +MIWHVQNENFILDSTRIFMKAFHLLLFHGSFIFPECILIFGLILLLMIDL +TSDQKDRPWFYFISSTSLVISITALLFRWREEPIISFSGNFQTNNFNEIF +QFLILLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLI +TIFVAPECFSLCSYLLSGYTKRDLRSNEATMKYLLMGGASSSILVHGFSW +LYGSSGGEIELQEIVNGLINTQMYNSPGISIALIFITVGLGFKLSPAPFH +QWTPDVYEGSPTPVVAFLSVTSKVAASALATRILDIPFYFSSNEWHLLLE +ILAILSMILGNLLAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYAS +MITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLAL +CLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVSIGLLTSVLSIYYYLKI +IKLLMTGRNQEITPYVRNYRRSPLRSNNSIELSMTVCVIASTIPGISMNP +ILAIAQDTLF diff --git a/detectors/cds/test/test.db/ndhd.fst b/detectors/cds/test/test.db/ndhd.fst new file mode 100644 index 0000000..e4b1b3d --- /dev/null +++ b/detectors/cds/test/test.db/ndhd.fst @@ -0,0 +1,113 @@ +>AC_000188@LyesCp081@ndhd@116944@118446@R@1@501 NADH_dehydrogenase_subunit_4 +MNYFPWLTIIVVFPIFAGSLIFFLPHKGNRVIRWYTICICILELLLTTYA +FCYHFQSDDPLIQLVEDYKWIDFFDFHWRLGIDGLSIGPILLTGFITTLA +TLAAWPVTRDSRLFHFLMLAMYSGQIGLFSSRDLLLFFIMWELELIPVYL +LLAMWGGKKRLYSATKFILYTAGGSVFLLMGVLGVALYGSNEPTLNFETS +VNQSYPVVLEIIFYIGFFIAFAVKSPIIPLHTWLPDTHGEAHYSTCMLLA +GILLKMGAYGLIRINMELLPHAHSIFSPWLMIIGTIQIIYAASTSLGQRN +LKKRIAYSSVSHMGFIIIGISSLTDTGLNGALLQIISHGFIGAALFFLAG +TTYDRIRLVYLDEMGGIAIPMPKMFTMFSSFSMASLALPGMSGFVAELIV +FFGIITGQKYLLMPKLLITFVMAIGIILTPIYSLSMPRQMFYGYKLFNAP +KDSFFDSGPRELFLSISIFLPVIGIGIYPDFVLSLAVDKVEVILSNFFYR +>NC_000927@NeolCp113@ndhd@139299@140801@D@1@501 NADH_dehydrogenase_subunit_4 +MTHFPWLSTIVLFPLLASLAIPWLPDRKGTTVRWYALGVGLIDFSLIAYM +FGRYYDFEQTSLQFVEDITWIDRLHLHWSLGVDGLSMPLVLLTGFITTLA +TLAAWPVTKNPRLFYFLMLAMYTGQLGVFVVQDLLLFFLMWELELIPVYL +LVSCWGGKKRLYAATKFILYTALGSIFILLGALTMPFMGIQGVTFDMSTL +AYREYSLPVEILLYTGFLIAYGVKLPAIPVHTWLPDTHGEAHYSTCMLLA +GILLKMGGYALIRINMNMLPHAHALFSPWLIGVGVVNIIYAALTSFAQRN +LKRKIAYSSVSHMGFVLIGIGSLSEAGLNGAMLQMISHGLIGASLFFLAG +TTYDRTRTLVLEEMGGLATFMPKTFALFTACSLASLALPGMSGFFAELLV +FLGLVTSEAYSPTFRAIMTVFEAIGILLTPIYLLSMLRQLFYGRSIGRPK +ALIDAGPREVFVVSCLLVPILGIGIYPKLATAIYVNTTDHVVQHVLSALR +>NC_000932@ArthCp074@ndhd@115665@117167@R@1@501 NADH_dehydrogenase_subunit_4 +MNDFPWLTIIVVFPISAGSLMLFLPHRGNKVNKWYTICICILELLLTTYA +FCYNFKMDDPLIQLSEDYKWIDFFDFYWRMGIDGLSIGTILLTGFITTLA +TLAAFPVTRDSRFFHFLMLAMYSGQIGSFSSRDLLLFFIMWELELIPVYL +LLSMWGGKKRLYSATKFILYTAGSSIFLLIGVLGISLYGSNEPTLNLELL +ANKSYPVTLEILFYIGFLIAFAVKSPIIPLHTWLPDTHGEAHYSTCMLLA +GILLKMGAYGLVRINMELLPHAHSMFSPWLLVVGTIQIIYAASTSPGQRN +LKKRIAYSSVSHMGFIIIGISSITDPGLNGAILQIISHGFIGAALFFLAG +TSYDRIRLVYLDEMGGMAISIPKIFTMFTILSMASLALPGMSGFIAEFIV +FFGIITSQKYFLISKIFIIFVMAIGMILTPIYLLSMLRQMFYGYKLINIK +NFSFFDSGPRELFLSISILLPIIGIGIYPDFVLSLASDKVESILSNYFYG +>NC_001319@MapoCp079@ndhd@96665@98164@R@1@500 NADH_dehydrogenase_subunit_4 +MNHFPWLTIIVLFPISAGLVIPFLPSTGNKIIRWYTLGVCLLEFLLITYI +FCYHYQFNDHLIQLKEDYNWISFINFHWRLGIDGFSIGLILLTGFITTLA +TLAAWPVTRNPRLFYFLMLAMYSGQIGLFASQDILLFFFMWELELLPVYL +LLAMWGGKRRLYAATKFILYTAAGSLFILIGGLIMAFYNSNEFTFDFQFL +INKKYPLELEIIIYLSFLIAYAVKLPIIPFHTWLPDTHGEAHYSTCMLLA +GILLKMGAYGLIRINMELLPHAHSFFAPWLVIVGAIQIVYAALTSLSQRN +LKRRIAYSSVSHMGFVLIGIGSITNLGLNGAILQMISHGLIGASLFFLAG +ISYDRTRTLVLDQMGGIGNSMPKIFTLFTSCSMASLALPGMSGFIAELMI +FLGVIDNPNYSSLFKIIIIIIQGIGIILTPIYLLSMLRQMFYGYKFSNTL +EPYFMDAGPREIFILICLFFPIISIGIYPNFVLSIWNSKVNFLLSNNFF +>NC_001320@OrsajCp088@ndhd@106398@107900@R@1@501 NADH_dehydrogenase_subunit_4 +MSSFPWLTILVVLPIFAGSLIFFLPHRGNKIVRWYTMSICLLEFLLMTYA +FCYHFQLEDPLIQLKEDSKWIDVFNFHWRLGIDGLSLGSILLTGFMTTLA +TLAAWPVTRNSRLFYFLMLAMYSGQIGLFSSRDLLLFFIMWELELIPVYL +LLSMWGGKRRLYSATKFILYTAGGSIFFLIGVLGMGLYGSNEPRLDLERL +INQSYPATLEILFYFGFLIAYAVKLPIIPLHTWLPDTHGEAHYSTCMLLA +GILLKMGAYGLIRINMELLPHAHYLFSPWLVIIGAMQIIYAASTSLGQRN +FKKRIAYSSVSHMGFIIIGIGSITNIGLNGAILQILSHGFIGATLFFLAG +TACDRMRLVYLEELGGASIPMPKIFTMFSSFSMASLALPGMSGFVAELVV +FFGLITSPKFLLMPKMLITFVMAIGMILTPIYLLSMLRQMFYGYKLFHVP +NENFEDSGPRELFLLICIFLPVIGIGIYPDFVLSLSVDRVEALLSNYYPK +>NC_001666@ZemaCp086@ndhd@110138@111640@R@1@501 NADH_dehydrogenase_subunit_4 +MSYFPWLTILVVLPIFAGSLIFFLPHKGNKIVRWYTIAICLLEFLLMTYA +FCYHFQLEDPLIQLKEDSKWIDVFDFHWRLGIDPLSLGSILLTGFITTLA +TLAAWPVTRNSQLFYFLMLAMYSGQIGLFSSRDLLLFFIMWELELIPVYL +LLSMWGGKRRLYSATKFILYTAGGSIFFLIGVLGMGLYGSNEPGLDLERL +INQSYPTTWEILLYFGFLIAYAVKLPIIPLHTWLPYTHGEAHYSTCMLLA +GILLKMGAYGLIRVNMELLPHAHYLFSPWLVIIGAVQIIYAASTSLGQRN +FKKRIAYSSVSHMGFIIIGIGSITNIGLNGAILQILSHGFIGATLFFLAG +TACDRMRLVYLEELGGISIPMPKIFTMFSSFSMASLALPGMSGFVAELVV +FFGLITSPKFMLMPKMLITFVMAIGMILTPIYLLSMLRQMFYGYKLFHVP +NKNFVDSGPRELFLLICIFLPVIGIGIYPDLVLSLSVDRVEVLLSNYYTK +>NC_001879@NitaCp083@ndhd@117525@119027@R@1@501 NADH_dehydrogenase_subunit_4 +MNYFPWLTIIVVFPIFAGSLIFFLPHKGNRVIRWYTICICILELLLTTYA +FCYHFQSDDPLIQLVEDYKWINFFDFHWRLGIDGLSIGPILLTGFITTLA +TLAAWPVTRDSRLFHFLMLAMYSGQIGSFSSRDLLLFFIMWELELIPVYL +LLCMWGGKKRLYSATKFILYTAGGSVFLLMGVLGLALYGSNEPTLNFETS +VNQSYPVVLEIIFYIGFFIAFAVKSPIIPLHTWLPDTHGEAHYSTCMLLA +GILLKMGAYGLIRINMELLPHAHSIFSPWLMIIGTIQIIYAALTSLGQRN +LKKRIAYSSVSHMGFIIIGISSLTDTGLNGALLQIISHGFIGAALFFLAG +TTYDRIRLVYLDEMGGIAIPMPKMFTMFSSFSMASLALPGMSGFVAELIV +FFGIITGQKYLLIPKILITFVMAIGMILTPIYSLSMSRQMFYGYKLFNAP +KDSFFDSGPRELFLSISIFLPVIGIGIYPDFVLSLAVDKVEVILSNFFYR +>NC_002186@MeviCp085@ndhd@90277@91800@D@1@508 NADH_dehydrogenase_subunit_4 +MNNFPWITSIVMLPILAGLLIPFIPDENGKNVRWYALGIGLLDFLLISYI +FGYKYNIQDTSLQLIDDYEWISSINFHWRLGIDGLSIPLILLTGFITTLA +MLGAWPIQKNAKLFYFLMLAMYSGQLGVFASQDLLLFFLMWELELIPIYI +LLIIWGGKKRLYAATKFILYTALGSIFILIAAFGMAFYGENMSFDMQILG +EKEYPINLEILFYICFLIAYAVKLPAFPVHTWLPDTHGEAHYSTCMLLAG +ILLKMGGYALIRINMNMLPNAHIYFAPYLAIIGVINIIYAALTSFAQRNI +KRKIAYSSISHMGFVLIGISSFTDIGLSGAMLQMVSHGLIGASLFFLAGT +TYDRTRTLILEDMGGIAKYMPKIFAMFTTCSLASLALPGMSGFVAELMVF +LGFANSNAYSIEFRGIITFLEAIGIIVTPIYLLSMLRQVFYGSENLKLLK +VNNLIDASAREIFIISCLLVPVIGIGIYPRILTQIYDLKTNAIIEHLEII +RSNSQIM +>NC_002202@SpolCp085@ndhd@113491@114996@R@1@502 NADH_dehydrogenase_subunit_4 +MTNSFPWLTTIVVLPIFAGSLIFLFPHRGNKVIRWYTICISMIELLLMTY +VFFYHFQPDDPLIQLVEDYKWINFFDFHWRLGIDGLSIGPILLTGFITTL +ATLAAWPVTRNSQLFHFLMLAMYSAQIGLFSSRDLLLFFIMWELELIPVY +LLLSMWGGKKRLYSATKFILYTAGGSIFLLMGVLGVGLYGSNEPTLNLET +LVNQSYPVALEIIFYIGFFIAFAVKLPIIPLHTWLPDTHGEAHYSTCMLL +AGILLKMGAYGLVRINMELLPHAHSIFSPWLMIIGTMQIIYAASTSPGQR +NLKKRIAYSSVSHMGFIIIGISSITDTGLNGAILQIISHGFIGAALFFLA +GTSYDRIRLVYLDEMGGIAIPMPKIFTLFSSFSMASLALPGMSGFIAELI +VFFGLITSQKYLLIPKLLITFGMAIGMILTPIYLLSMSRQMFYGYKLFNI +SNSSFFDSGPRELFVSTSIFLPVIGIGVYPDLVLSLSVEKVEAILSNYFY +R +>NC_002693@OeelhCp097@ndhd@121124@122647@R@1@508 NADH_dehydrogenase_subunit_4 +MNSFPWLTIIVVFPILTGSLIFLLPHRGNKVMKWYTLCICILELLLTTYT +FCYHFQLDDPLTQLTENYKWIHFFDFYWRLGIDGLSIGPILLTGFITTLA +TLAAWPVTRDAQLFHFLMLAMYSGQIGSFSSRDLLLFFLMWEFELIPVYL +LLSMWGGKKRLYSATKFILYTAGGSIFLLIGVLGIGLYGSNEPTLNFETL +ANQSYPVALEVIFYVGFLIAFAVKLPIIPFHTWLPDTHGEAHYSTCMLLA +GILLKMGAYGLVRINMELLPHAHCLFSPGLIIVGAIQIIYAASTSPGQLN +LKKRIAYSSISHMGFIIIGIGSLSDTGLNGAILQIISHGFIGAALFFLAG +TSYDRIRLLYLDEMGGMAIPLPKLFTMLSILSMASLALPGLSGFVAELLV +FFGIITSQKYLLMPKILIAFLMAIGMILTPIYSLSMLRQMFYGYKLFNVP +NYYFFDSGPRELFVSISLLLPIIGIGIYPDFVLSLSVEKVEAIISHFFFS +IVFKKKE diff --git a/detectors/cds/test/test.db/ndhe.fst b/detectors/cds/test/test.db/ndhe.fst new file mode 100644 index 0000000..4c87a47 --- /dev/null +++ b/detectors/cds/test/test.db/ndhe.fst @@ -0,0 +1,39 @@ +>AC_000188@LyesCp080@ndhe@119061@119366@R@1@102 NADH_dehydrogenase_subunit_4 +MILEHVLVLSAYLFSIGIYGLITSRNMVRALMCLELILNAVNINFVTFSD +FFDNRQLKGDIFSIFVIAIAAAEAAIGLAIVSSIYRNRKSTRINQSNLLN +N +>NC_000927@NeolCp119@ndhe@147326@147631@D@1@102 NADH_dehydrogenase_subunit_4L +MIFQSYLLIAASMFCIGLYGLLTSRNVVRVLMSLELLLNAVNLNLLTFSN +FVDSHEMKGQVLALFVIALAAAEAAIGLAIILSIYRNQRTVDPEQFNLLK +W +>NC_000932@ArthCp076@ndhe@117804@118109@R@1@102 NADH_dehydrogenase_subunit_4L +MILEHVLVLSAYLFLIGLYGLITSRNMVRALMCLELILNAVNMNFVTFSD +FFDNSQLKGEIFCIFVIAIAAAEAAIGLAIVSSIYRNRKSIRINQSTLLN +K +>NC_001319@MapoCp081@ndhe@98757@99059@R@1@101 NADH_dehydrogenase_subunit_4L +MLEHILTLSAFLFCIGVFGLITSRNMVRALMCLELIFNAVNINLVAFSNF +LDSSQIKGEIFSIFIIAIAAAEATIGLAIVLAIYRNRKSTRIDQFNLLKW +>NC_001320@OrsajCp090@ndhe@108712@109017@R@1@102 NADH_dehydrogenase_subunit_4L +MMFEHVLFLSVYLFSIGIYGLITSRNMVRALICLELILNSINLNLVTFSD +LFDSRQLKGDIFAIFVIALAAAEAAIGLSILSSIHRNRKSTRINQSNFLN +N +>NC_001666@ZemaCp088@ndhe@112473@112778@R@1@102 NADH_dehydrogenase_subunit_4L +MMFERVLFLSVYLFSIGIYGLITSRNMVRALICLELILNSINLNLVTFSD +LFDSRQLKGDIFAIFVIALAAAEAAIGLSILSSIHRNRKSTRINQSNFLN +N +>NC_001879@NitaCp085@ndhe@119652@119957@R@1@102 NADH_dehydrogenase_subunit_4L +MILEHVLVLSAYLFSIGIYGLITSRNMVRALMCLELILNAVNINFVTFSD +FFDNRQLKGDIFSIFVIAIAAAEAAIGLAIVSSIYRNRKSTRINQSNLLN +N +>NC_002186@MeviCp099@ndhe@104916@105221@R@1@102 NADH_dehydrogenase_subunit_4L +MYIENFLLLASALFCIGIYGLLTSRNIVRVLMCLELCLNAININFIAFSN +FIDYEKINGQVIAIFIMTIAAAEAAIGLALVLTIYRNRETVDIENFDLLK +G +>NC_002202@SpolCp087@ndhe@115663@115968@R@1@102 NADH_dehydrogenase_subunit_4L +MILEHVLVLSAFLFSIGIYGLVTSRNLVRALMCLELILNAVNLNFVTFSD +FFDSRQLKGNIFSIFVIAIAAAEAAIGPAIVSSIYRNRKSIRINQSNLLN +K +>NC_002693@OeelhCp099@ndhe@123298@123603@R@1@102 NADH_dehydrogenase_subunit_4L +MILEHVLVLSAYLFSIGIYGLITSRNMVRALMCLELILNSVNLNFVTFSD +FFDSRQLKGDIFSIFIIAIAAAEAAIGLAIVSSIYRNRKSIRINQSNLLN +K diff --git a/detectors/cds/test/test.db/ndhf.fst b/detectors/cds/test/test.db/ndhf.fst new file mode 100644 index 0000000..9c5b2df --- /dev/null +++ b/detectors/cds/test/test.db/ndhf.fst @@ -0,0 +1,157 @@ +>AC_000188@LyesCp073@ndhf@111508@113721@R@1@738 NADH_dehydrogenase_subunit_5 +MEQTYEYAWIIPFIPLPVPMLIGAGLILFPTATKRFRRMWAFQSVLLLSI +VMIFSIYLSIQQINSSSVYQYVWSWIINNDFSLDFGYLIDPLTSIMSILI +TTVGIMVLIYSDNYMAHDQGYLRFFAYMSFFSTSMLGLVTSSNLIQIYIF +WELVGLCSYLLIGFWFTRPVAANACQKAFVTNRVGDFGLLLGILGFYWIT +GSFEFRDLFEIFNNLIYNNELNFLFVTLCAVLLFAGAVAKSAQFPLHVWL +PDAMEGPTPISALIHAATMVAAGIFLVARLLPLFRVIPYIMYLISVIGII +TVLLGATLALAQKDIKRGLAYSTMSQLGYMMLALGMGSYRSALFHLITHA +YSKALLFLGSGSIIHSMETIVGYSPAKSQNMGLMGGLRKHVPITKITFLL +GTLSLCGIPPLACFWSKDEILNDSWLYSPIFAIIAWATAGLTAFYMFRIY +LLTFEGHLNAHFQNYGGKQKIPFYSISLWGKNGVKKNSCLLTMNNNESTY +FLSKTKYPIAKNGRKMTRPFMTIAHFKHKAVSSYPYESDNTMLFPIFVLG +LFTLFVGAIGIPFNQEGVNLDILSKWLAPSINLLHPKSNNSLDWNEFLKD +AVVSVSIAYFGIFIASFLYKPIYSSLKNLEFINSFVKKGPKRILWDKILN +GIYDWSYNRAYIDAFYTRFFVGGIRGLAEFTHFVDRRVIDGMTNGVGVIS +FIVGEGIKYIGGGRISSYLFLYLAYVSVFLLVYYLLF +>NC_000927@NeolCp114@ndhf@140837@142783@R@1@649 NADH_dehydrogenase_subunit_5 +MEIFHQAIWLIPVLPLSASMLSGIGLLTFRETTSDLRRLHGALAIGAMAL +SFVVSLGVLWNQLHGIAPVRWIIEWMLTDTFRLEIGYWVDPLTSTMLVVV +TSVALLVMIYSDEYMHVDEGYVRFFVYLSIFTTSMLGLVLSPNLVQVYGF +WELVGMCSYLLVGFWFTRPTAAEASQKAFITNRVGDFGLLLGILALYWMT +GSFEFASIADRLGDLLIAIPSLRTIACIACILVFMGPIAKSAQFPLHVWL +PDAMEGPTPISALIHAATMVAAGVFLVARMFPVFDQLPLVMELIAWTGTL +TAFLGATMALTQSDIKKGLAYSTMSQLGYMIMALGTGAYSEALFHLTTHA +YSKALLFLAAGSVIHGMEPVVGFSPMQNQNMHRMGGLRKYMPLTAMTFLL +GTCSICGIPPLACFWSKDAILAEVFATHPTCWLIAWLTAGMTGFYMFRIY +FLTFEGSFRSDLGRAKPKESHLGMVAPLIILAIPTVAIGSLGTPFAPVWE +TFVHAPGQLSSLDEEFDLAEFLEMAGSSVGIGLLGISLSSLMYRNYAIDA +TRISEYFSPLNRLFASKWYIDDLYAQVIVQGTRTIAQTLLIFDQRIIDGA +VNLTAFGTLSAADTLKYWENGRVQFYILSIIFGVLFGSWLLTTHLSSL +>NC_000932@ArthCp071@ndhf@110398@112638@R@1@747 NADH_dehydrogenase_subunit_5 +MEHTYQYSWIIPFIPLPVPILLGVGLLLFPTATKNLRRMWTFLSIFLLSI +VMIFSIYLSIQQIFLSCIHQNVWSWTINNEFSFEFGYFIDPLTSIMSILI +TTVGILVLIYSDNYMSHDQGYLRFFAYMGFFNTSMLGLVTSSNLIQVYFF +WELVGMCSYLLIGFWFTRPIAANACQKAFVTNRVGDFGLLLGILGLYWIT +GSFEFQDLFEIFNNLILNNRVNLLFLTLCAFLLFVGPIAKSAQFPLHVWL +PDAMEGPTPISALIHAATMVAAGIFLVARLLPLFIVIPSIMYIISLIGII +TVLLGATLALAQKDIKRGLAYSTMSQLGYMMLALGMGSYRSALFHLITHA +YSKALLFLGSGSIIHSMEAIVGYSPDKSQNMILMGGLTKHVPITKTAFLI +GTLSLCGIPPLACFWSKDEILNDSLLFSPIFAIIACSTAGLTAFYMFRIY +LLTFEGHLNTYFLNYSGKKSGSFYSLSLWGKEEEKKLNKNFGLVPLLTMN +NTKRASFFCNKTYKISNNVRNQIFITVENFGLNTRTFYYPHESDNTILFP +MLILVLFTLFIGAIGIPFNQEGIDFDILSKFFTPSINLLHKNSQNFVDWY +EFLRNATFSVSIAFFGIFIAYCLYKPFYSSLLNLTLLNSFQKWNSKRIHW +EKLINFVYNWSYNRGYIDSFFKTSLIESIRRLAKQTTFFDKRIIDGITNG +VGITSFFVGEVTKYIGGSRISSYLFLYLSYVLIFLMILFFFYFEKF +>NC_001319@MapoCp074@ndhf@91101@93179@R@1@693 NADH_dehydrogenase_subunit_5 +MELIFQNVWFVPLFPFLASILLGIGLFFFPNSIKKFRRLSSFISIMFLNI +AMLLSFHFFWQQITGSPIHRYLWSWVLYKNFVLEIGYLLDPLTSIMLVLV +TTVAVMVMIYSDSYMFYDEGYIKFFCYLSLFTASMLGLVLSPNLIQVYIF +WELVGMCSYLLIGFWFTRPSAANACQKAFVTNRIGDFGLLLGILGFYWIT +GSFDFQQLSKRFFELLSYNQINLVFATLCALFLFLGPVAKSAQFPLHIWL +PDAMEGPTPISALIHAATMVAAGIFLVARMFPLFQMLPFVMSIISWTGAI +TALLGATIALAQKDLKKGLAYSTMSQLGYMMLALGIGSYKAGLFHLITHA +YSKALLFLGSGSVIHSMEPIVGYHPNKSQNMIFMGGLRQYMPITAITFLF +GTLSLCGIPPFACFWSKDEILVNSWLHFPILGSIAFFTAGLTAFYMFRIY +FLTFEGDFRGHFFDDVKKLSSISIWGSLEFNKEQFKLDKKSTLYPKEANN +IMLFPLIILTIPTVFIGFIGILFDENKMNVDSLSYWLTLSINSFNYSNSE +KFLEFLFNAIPSVSIAFFGILIAFYLYGPNFSFLKKEKKKLQLKSEIDIV +LKSFSNFIYNWSYYRAYIDGFYSSFFIKGLRFLIKIVSFIDRWIIDGIIN +GIGIFSFFGGESLKYIEGGRISSYLFFIIFCMFLFFLYSYII +>NC_001320@OrsajCp085@ndhf@101433@103637@R@1@735 NADH_dehydrogenase_subunit_5 +MEHTYQYAWVIPLLPLPVIMSMGFGLFLVPTATKNLRRIWAFPSVLLLSI +AMVFSVHLSIQQINGSSIYQYLWSWTVNNDFSLEFGYLIDPLTSIMLILI +TTVGILVLIYSDDYMSHDEGYLRFFVYISFFNTSMLGLVTSSNLIQIYFF +WELVGMCSYLLIGFWFTRPIAASACQKAFVTNRVGDFGLLLGILGFFWIT +GSLEFRDLFKIANNWIPNNEINSLLTILCAFLLFLGAVAKSAQFPLHVWL +PDAMEGPTPISALIHATTMVAAGIFLIARLLPLFISLPLIMSFISLIGTL +TLFLGATLALAQRDIKRSLAYSTMSQLGYMMLALGIGSYQAALFHLITHA +YSKALLFLGSGSVIHSMEPLVGYSPDKSQNMVLMGGLRKYIPITRTCFLW +GTLSLCGIPPLACFWSKDEILSNSWLYSPFFGIIASFTAGLTAFYMFRIY +LLTFDGYLRVHFQNYSSTKEDSLYSISLWGKRISKGVNRDFVLSTAKSGV +SFFSQNLSKIHVNTGNRIGSFSTSLGTKNTFVYPHEPGNTMLFPLLILLL +CTLFIGSIGIHFDNEIGELTILSKWLTPSINFFQESSNSSINSYEFITNA +ISSVSLAIFGLFIGIYVLWICLLFFSEFDLINSFVKGGPKKYFFHQLKKK +IYSWSYNRGYIDIFYTRTFTLGIRGLTELTQFFDKGVIDGITNGVGLASF +CIGEEIKYVGGGRISSYLFFFLCYVSVFLFFFLS +>NC_001666@ZemaCp083@ndhf@105072@107288@R@1@739 NADH_dehydrogenase_subunit_5 +MEHTYQYAWVIPLLPLPVIMSMGFGLFLIPTATKNLRRIWAFPSILLLSI +AMVFSLHLSIQQINGSSIYQYLWSWTINNDFSLEFGYLVDPLTSIMLILI +TTVGILVLIYSDDYMSHDEGYLRFFVYISFFNTSMLGLVTSSNLIQIYFF +WELVGMCSYLLIGFWFTRPIAASACQKAFVTNRVGDFGLLLGILGFFWIT +GSLEFRDLFKIANNWIPNNGINSLLTTLCAFLLFLGAVAKSAQFPLHVWL +PDAMEGPTPISALIHAATMVAAGIFLLARLLPLFISLPWIMSFISLIGTI +TLFLGATLALAQRDIKRSLAYSTMSQLGYMMLALGIGSYQAALFHLITHA +YSKALLFLGSGSVIHSMEPLVGYSPDKSQNMVLMGGLRKYVPITRTTFLC +GTLSLCGIPPLACFWSKDEILSNSWLYSPFFGIIASFTAGLTAFYMFRIY +LLTFDGYLRVHFQNYSSTKEGSLYSISLWGKSISKGVNRDFVLSTMKSGV +SFFSQNIPKIPANTRNKIGSFSTPFGAKNTFVYPHETGNTMLFPLLILLL +FTLFIGSIGIHFDNGVKDNRILELTILSKWLTPSINLFQENSNSSINSYE +FLTNAISSVSLAIFGLFIAYIFYGSAYSFFQNLNFQNSLVKKNPKKSFLD +EVKKKIYSWSYNRGYIDFFYTRVFILGIRKLAELTHFFDKGVIDGITNGV +GLAGFCIGEEIKYVGGGRISSYLFFFLCYVSLFLFFIP +>NC_001879@NitaCp080@ndhf@112072@114294@R@1@741 NADH_dehydrogenase_subunit_5 +MEQTYEYAWIIPFIPLPVPMLIGAGLFLFPTATKSFRRMWAFQSVLLLSI +VMVFSIYLSIQQINSSSFYQYVWSWIINNDFSLDFGYLIDPLTSIMSILI +TTVGIMVLIYSDNYMAHDQGYLRFFAYMSFFSTSMLGLVTSSNLIQIYIF +WELVGLCSYLLIGFWFTRPVAANACQKAFVTNRVGDFGLLLGILGFYWIT +GSFEFRDLFEIFNNLIYNNEVDFLFVTLCAVLLFAGAVAKSAQFPLHVWL +PDAMEGPTPISALIHAATMVAAGIFLVARLLPLFRVIPYIMYLISVIGII +TVLLGATLALAQKDIKRGLAYSTMSQLGYMMLALGMGSYRSALFHLITHA +YSKALLFLGSGSIIHSMETIVGYSPAKSQNMGLMGGLRKHVPISKITFLL +GTLSLCGIPPLACFWSKDEILNDSWLYSPIFAIIAWATAGLTAFYMFRIY +LLTFEGHLNAHFPNYGGKQKTPFYSISLWGKNGVKKNSCLLTMNNNESTY +FFAKTKYPIDKNGRKMTRPFMTIAHFEHKAVYSYPYESDNTMLFPIFVLG +LFTLFVGSIGIPFNQEGGNLDILSKWLAPSINLLHQKSNNSMDWNEFLKD +AVLSVSIAYFGIFIASFLYKPIYSSLKNFELINSFVKKGPKRILWDKIIN +GIYDWSYNRAYIDAFYTRFLVGGIRGLAEFTHFFDRRVIDGMTNGVGVIS +FIVGEGIKYIGGGRISSYLFLYLAYVSIFLLVYYLLFSTL +>NC_002186@MeviCp105@ndhf@109803@111761@D@1@653 NADH_dehydrogenase_subunit_5 +MESISQYAWLIPIFPLAGSLLIGIGLISFRRATNILRWRYSFLIIALLGI +SLILSCLILFSQINATPSYQWIFQWIVTNNFLLEIGYFVDPLTAVMLVIV +TTVAILVLIYTDGYMSYDEGYVRFFAYLSLFTTSMLGLVLSPNLLQIYVF +WELVGMCSYLLIGFWFTRPAAADACQKAFVTNRVGDFGLLLGILGFYWMT +GSFEFDVISMKLLQLAEYDNFNTQLAIFFGFLIFLGPVAKSAQFPLHVWL +PDAMEGPTPISALIHAATMVAAGVFLVARMFPIFSQFPFLMDLIAWTGAI +TAIIGATIAVTQVDLKKGLAYSTMSQLGYMIMAMGMGSYTASLFHLMTHA +YSKALLFLSAGSTIHGMEPIVGFNPAKNQNMSLMGGIRKYMPITGNAFLI +GTLSLCGIPPLACFWSKDAILSNAFVHSPLLWFIGWSTAGLTSFYMFRMY +FLVFEGEFRGNSVNQEKIRSNKLPKESNTKMTLPLIILTLFSITIGWIGT +PFNNQFMFLIHTINQEIEPFDINEFLFIAGSSVGIALLGCYTAYLIYIKD +KNTDKFANLLQPFYQLSFNKWYIDDIYEYIFVKGNRQLAQQTLLFDKKII +DGFVNLTGLITLVSSESLRSIENGKIQSYILMIIFTLLTILGISQTYYSL +IL +>NC_002202@SpolCp080@ndhf@107770@109998@R@1@743 NADH_dehydrogenase_subunit_5 +MEHIYQYAWIIPFLPLPVPLLIGAGLLFFPTATKNLRRIWAFSSISLLSI +VMIFSMKLAIQQINSNSIYQYLWSWTINNDFSLEFGYLMDPLTSIMSMLI +TTVAILVLIYSDNYMSHDQGYLRFFAYMSFFNTSMLGLVTSSNLIQIYIF +WELVGMCSYLLIGFWFTRPIAANACQKAFVTNRVGDFGLLLGILGLYWIT +GSFEFRDLFEIFNNLIKNNEVNSLFCILCAFLLFAGAVAKSAQFPLHVWL +PDAMEGPTPISALIHAATMVAAGIFLVARLLPLFVVIPYIMYVISFIGII +TVLLGATLALAQKDIKRSLAYYTMSQLGYMMLALGMGSYRTALFHLITHA +YSKALLFLASGSLIHSMGTIVGYSPDKSQNMVLMGGLTKHVPITKTSFLI +GTLSLCGIPPLACFWSKDEILNDSWVYSPIFAIIAYFTAGLTAFYMFRIY +LLTFEGHLNFFCKNYSGKKSSSFYSISLWGKKELKTINQKISLLNLLTMN +NKERASFFSKKPYEINVKLTKLLRSFITITYFENKNISLYPYESDNTMLF +PLIILIMFTLFVGFIGIPFNQEGMDLDILTKWLTPSINLLHSNSENFVDW +YEFVINAIFSISIAFFGIFIAFFFYKPIYSSLKNFDLINSFDKRGQKRIL +GDNIITIIYNWSANRGYIDAFYSTFLIKGIRSLSELVSFFDRRIIDGIPN +GFGVTSFFVGEGIKYVGGGRISSYLFWYLLYVSIFLFIFTFT +>NC_002693@OeelhCp094@ndhf@115809@118142@R@1@778 NADH_dehydrogenase_subunit_5 +MEYTYQYSWIIPFIPLPVPILIGMGLLLFPTATKNHRRVWSFPSILLLSM +VMLLSVYLSIQQINRSFIYQYVWSWTINNDFSLEFGHLIDPLASIMLILI +TTVGILVLFYSDNYMSHDQGYLRFFAYLSFFNTSMLGLVTSSNLIQIYIF +WELVGMCSYLLIGFWFTRPIAATACQKAFVTNRVGDFGLLLGILGLYWIT +GSFEFRDLFEIVNNLIDNNNQVHFLFVTLCSFLLFAGAVAKSAQFPLHVW +LPDAMEGPTPISALIHAATMVAAGIFLVARLLPLFVITPYIMNLISLIGI +ITVLLGATLALAQKDIKRSLAYSTMSQLGYMMLALGMGSYRAALFHLITH +AYSKALLFLGSGSIIHSMESIVGYSPDKSQNMVLMGGLKKHVPITKTAFL +VGTLSLCGIPPLACFWSKDEILNDSWLYSPIFAIIACSTAGFTAFYMFRV +YLLTFDGHLNVHFQNYSGQKSSSVYSISLWGKQVPKRIQNPFCLLNLLTM +NNNESTSFFWNNKCKLDGNVKKRIRPFITVTHFPNRKTFSYPHESDNTML +FSLFVLVLFTLFVAAIGIPFNQEGSDCDILSKLLNPSINLLHQNSNNFTD +WYEFVTNASFSVSIALLGIFIATFLYKPIYSSLQNFNLLNSFYKRSANRV +MWDKIQNWIYDWSYNRGYIDSFYTISLTGGIRGLAELSHFFDRRVIDGIL +NGFGLTSFFLGESLKYFGGGRISSYLLLYSIFIFIFLLMDSFFTNLPFFV +LCQFLDSSFSMSISGFLLYENFLYENF diff --git a/detectors/cds/test/test.db/ndhg.fst b/detectors/cds/test/test.db/ndhg.fst new file mode 100644 index 0000000..40dc735 --- /dev/null +++ b/detectors/cds/test/test.db/ndhg.fst @@ -0,0 +1,50 @@ +>AC_000188@LyesCp077@ndhg@119590@120120@R@1@177 NADH_degydrogenase_subunit_6 +MDLSEPIHDFLLVFLGSGLILGGLGVVLLPNPIYSAFSLGLVLVCTSLFY +ILSNAYFVAAAQLLIYVGAINVLIIFAVMFMNGSEYYKDFHLWTVGDGIT +SMVCISLFISLITTISDTSWYGIIWTTRSNQIIEQDFLSNSQQIGIHLST +DFFLPFELISIILLVALIGAIAVARQ +>NC_000927@NeolCp118@ndhg@146302@146811@D@1@170 NADH_dehydrogenase_subunit_6 +MEIVQNFSSAALTTGILLGCLGVIFLPSIVYAAFLLGAVFFCLAGIYVLL +HADFVAAAQVLVYVGAINVLILFAIMLVNPQDAPPRALDSPPLIPGIACI +GLLGVLVQMISTTSWLTPPWTPEPNSLPVLGGHLFSDCLLAFEVMSLVLL +VALVGAIVLARREPVERSS +>NC_000932@ArthCp077@ndhg@118377@118907@R@1@177 NADH_dehydrogenase_subunit_6 +MDLPGPIHDFLLVFLGSGLLVGGLGVVLLPNPIFSAFSLGFVLVCISLLY +ILSNSHFVAAAQLLIYVGAINVLIIFAVMFMNDSEYSTDFNLWTIGNGIT +SLVCTTILFLLMSTILDTSWYGVIWTTKLNQILEQDLISNSQQIGIHLST +DFFLPFELISIILLVALIGAISVARQ +>NC_001319@MapoCp082@ndhg@99113@99688@R@1@192 NADH_dehydrogenase_subunit_6 +MKLPESFYETIFLFLESGLILGSLGVILLTNIVYSALFLGFVFVCISLLY +LLLNADFVAAAQILIYVGAVNVLIIFAVMLINKKQYSNFFVYWTIGDGIT +LTLCTSIFLLLNNFISNTSWSKIFLMTKPNLVVKDIILINTVRHIGSELL +TEFLLPFELMSIILLVALIGAITLARREKKIELEKNDFFNF +>NC_001320@OrsajCp091@ndhg@109227@109757@R@1@177 NADH_dehydrogenase_subunit_6 +MDLPGPIHEILVLFGGFVLLLGGLGVVLLTNPTFSAFSLGLVLVCISLFY +ILLNSYFVAVAQLLIYVGAINVLIIFAVMFVNGSEWSKDKNFWTIGDGFT +SLVCITIPFSLMTTIPDTSWYGILWTTRSNQIVEQGLINNVQQIGIHLAT +DFYLPFELISIILLVSLIGAITMARQ +>NC_001666@ZemaCp089@ndhg@112993@113523@R@1@177 NADH_dehydrogenase_subunit_6 +MDLPGPIHEILVLFGGFGLLLGGLGVVLLTNPIYSAFSLGLVLVCISLFY +FLLNSYFVAVAQLLIYVGAINVLIIFAVMFVNGSEWSKDKNYWTIGDGFT +LLLCITIPFSLMTTIPDTSWYGILWTTRSNQIVEQGLINNVQQIGIHLAT +DFYLPFELISLILLVSLIGAITMARQ +>NC_001879@NitaCp086@ndhg@120181@120711@R@1@177 NADH_dehydrogenase_subunit_6 +MDLSEPIHDFLLVFLGSGLILGGLGVVLLPNPIYSAFSLGLVLVCTSLFY +ILSNSYFVAAAQLLIYVGAINVLIIFAVMFMNGSEYYKDFHLWTVGDGIT +SMVCISLFISLITTISDTSWYGIIWTTRSNQIIEQDFISNSQQIGIHLST +DFFLPFELISIILLVALIGAIAVARQ +>NC_002186@MeviCp100@ndhg@105252@105821@R@1@190 NADH_dehydrogenase_subunit_6 +MSFSEQIQNLSLLLLEIGTIIGALGVVLLPNILYSGFLLGGVLICIAGIY +LLLNAEFIAAAQVLIYVGAINVIILFAIMLVNKIENLNPSNNQMMRNGLS +SFICFSFFILLSNMIFDTQWIDTVGVSTKYSISIIGNHIFSDFLLPFEIV +SVLLLVTLVGAVFIARKEDASEIEISKISFLNLPDPSKK +>NC_002202@SpolCp088@ndhg@116164@116694@R@1@177 NADH_dehydrogenase_subunit_6 +MDLPGPIHDFLLVFLGSGLILGALGVVLFTNPIFSAFSLGLVLVCISLFY +ILANSHFVASAQLLIYVGAINVLIIFSVMFMSGPEYDKKFQLWTVGDGVT +SLVCISLFVSLISTILNTSWYGIIWTTKSNQILEQDLINASQQIGIHLST +DFFLPFELISIILLVSLIGAIAVARQ +>NC_002693@OeelhCp100@ndhg@123796@124326@R@1@177 NADH_dehydrogenase_subunit_6 +MDLPGPIHDFLLVFLGSGLIVGGLGVVLLTNPIFSAFSLGLVLVCISLFF +SLSNSYFVAAAQLLIYVGAINVLILFAVMFMNGSEYSKDLTLWTVGDGIT +SLVCTSIFISLITTILDTSWYGIIWTTKSNQIIEQDLIGNSQQIGIHLST +DFFLPFELISIILLVSLIGAIAVARQ diff --git a/detectors/cds/test/test.db/ndhh.fst b/detectors/cds/test/test.db/ndhh.fst new file mode 100644 index 0000000..c195a4a --- /dev/null +++ b/detectors/cds/test/test.db/ndhh.fst @@ -0,0 +1,90 @@ +>AC_000188@LyesCp078@ndhh@123339@124520@R@1@394 NADH_dehydrogenase_subunit_7 +MTAPTTRKDLMIVNMGPQHPSMHGVLRLIVTLDGEDVVDCEPILGYLHRG +MEKIAENRTIIQYLPYVTRWDYLATMFTEAITINGPEQLGNIQVPKRASY +IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYIFRERELIYDLFEAATG +MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLTGVAEYQKLITRNPIFL +ERVEGVGIIGRDEALNWGLSGPMLRASGIEWDLRKVDHYESYDEFDWQVQ +WQREGDSLARYLVRIGEMTESIKIIQQALEGIPGGPYENLEMRRFDRLKD +PEWNDFEYRFISKKPSPTFELSKQELYVRVEAPKGELGIFLIGDQSVFPW +RWKIRPPGFINLQILPQLVKRMKLADIMTILGSIDIIMGEVDR +>NC_000927@NeolCp115@ndhh@143205@144380@D@1@392 NADH_dehydrogenase_subunit_7 +MIEAKTDPMIVSMGPHHPSMHGVLRLIVTLDGENVLDCEPVVGYLHRGME +KIAENRTIVQYLPYVTRWDYLATMFTEAITVNAPERLANIEVPRRASYLR +VIMLELSRIASHLLWLGPFMADLGAQTPFFYILREREMIYDLFEAATGMR +MMHNYFRVGGVAADVPYGWIDKCLDFCEYFLPKVDEYEALITRNPIFLKR +VKGVGTISPQQAINWGLSGPMLRASGVSWDLRKVDRYECYEDFHWSVESE +ETGDCLARYLVRIREMRTSTKIVQQALKSIPGGPTENLEARQLSQGRTSP +WNEFDYQFLGKKASPTFKMPRQEHYVRVEAPKGELGVFLIGDDHVFPWRW +KIRPPGFINVQILPNLVQGMKLADIMTILGSIDIIMGEVDR +>NC_000932@ArthCp080@ndhh@122011@123192@R@1@394 NADH_dehydrogenase_subunit_7 +MKRPVTGKDLMIVNMGPHHPSMHGVLRLIVTLDGEDVVDCEPILGYLHRG +MEKIAENRAIIQYLPYVTRWDYLATMFTEAITVNGPEQLGNIQVPKRASY +IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYIFREREFVYDLFEAATG +MRMMHNFFRIGGIAADLPYGWIDKCLDFCDYFLTEVVEYQKLITRNPIFL +ERVEGVGIIGGEEAINWGLSGPMLRASGIPWDLRKIDRYESYDEFEWEIQ +WQKQGDSLARYLVRLSEMTESIKIIQQALEGLPGGPYENLESRGFDRKRN +PEWNDFEYRFISKKPSPTFELSKQELYVRVEAPKGELGIFLIGDQSGFPW +RWKIRPPGFINLQILPELVKRMKLADIMTILGSIDIIMGEVDR +>NC_001319@MapoCp085@ndhh@102202@103380@R@1@393 NADH_dehydrogenase_subunit_7 +MMILTKNKPMIVSMGPHHPSMHGVLRLIVTLDGEDVLDCEPVLGYLHRGM +EKIAENRTIVQYLPYVTRWDYLATMFTEAITVNAPEKLTNIQVPKRASYI +RIIMLELSRIASHLLWLGPFMADIGAQTPFFYIFREREMIYDLFESATGM +RMMHNYFRIGGVAVDLPYGWIDKCLDFCDYFLPKINEYERLITNNPIFLK +RVEGIGTVTREEAINWGLSGPMLRASGVQWDLRKVDHYECYDELDWKIQW +QKEGDSLARYLVRIGEMKESVKIIQQALKAIPGGPFENLEARRLNQGKNS +EWNLFEYQFISKKPSPTFKLPKQEHYVRVEAPKGELGIFLIGDDSVFPWR +LKIRSPGFINLQILPQLVKGMKLADIMTILGSIDIIMGEVDR +>NC_001320@OrsajCp094@ndhh@112708@113889@R@1@394 NADH_dehydrogenase_subunit_7 +MSLPLTRKDLMIVNMGPQHPSMHGVLRLIVTLDGEDVIDCEPILGYLHRG +MEKIAENRTIIQYLPYVTRWDYLATMFTEAITVNAPEFLENIQIPQRASY +IRVIMLELSRIASHLLWLGPFMADLGAQTPFFYIFRERELIYDLFEAATG +MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLRGVIEYQQLITQNPIFL +ERVEGVGFISGEEAVNWGLSGPMLRASGIQWDLRKVDLYESYNQFDWKVQ +WQKEGDSLARYLVRIGEMRESIKIIQQAVEKIPGGPYENLEVRRFKKAKN +SEWNDFEYRFLGKKPSPNFELSKQELYARVEAPKGELGIYLVGDDSLFPW +RWKIRPPGFINLQILPQLVKKMKLADIMTILGSIDIIMGEVDR +>NC_001666@ZemaCp092@ndhh@116456@117637@R@1@394 NADH_dehydrogenase_subunit_7 +MSLSLKRKDLMIVNMGPQHPSMHGVLRLIVTLDGEDVIDCEPILGYLHRG +MEKIAENRSIIQYLPYVTRWDYLATMFTEAITVNAPEFLENIQIPKRASY +IRVIMLELSRIASHLLWLGPFMADLGAQTPFFYIFRERELIYDLFEAVTG +MRMMHNYFRIGGVAADLPYGWMDKCLDFCDYFLQGVVEYQELITQNPIFL +ERVEGVGFISGEEAVNWGLSGPMLRASGIQWDLRKIDPYESYNQFDWKVQ +WQKEGDSLARYLVRVGEMRESIKIIQQAVEKIPGGPYENLEARRFKKAKN +PEWNDFEYRFLGKKPSPNFELSKQELYVRVEAPKGELGIYLVGDDSLFPW +RWKIRPPGFINLQILPQLVKKMKLADIMTILGSIDIIMGEVDR +>NC_001879@NitaCp089@ndhh@123937@125118@R@1@394 NADH_dehydrogenase_subunit_7 +MTAPTTRKDLMIVNMGPQHPSMHGVLRLIVTLDGEDVVDCEPILGYLHRG +MEKIAENRTIIQYLPYVTRWDYLATMFTEAITINGPEQLGNIQVPKRASY +IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYIFRERELIYDLFEAATG +MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLTGVAEYQKLITRNPIFL +ERVEGVGIIGGDEALNWGLSGPMLRASGIEWDLRKVDHYESYDEFDWQVQ +WQREGDSLARYLVRIGEMTESIKIIQQALEGIPGGPYENLEIRRFDRLKD +PEWNDFEYRFISKKPSPTFELSKQELYVRVEAPKGELGIFLIGDQSVFPW +RWKIRPPGFINLQILPQLVKRMKLADIMTILGSIDIIMGEVDR +>NC_002186@MeviCp103@ndhh@107611@108792@R@1@394 NADH_dehydrogenase_subunit_7 +MTMLQTKTDPMVISMGPHHPSMHGVLRLIVTLDGENVIDCEPVLGYLHRA +MEKIAENRTIVQYLPYVTRWDYLATMFTEAITVNAPEKLANIEVPKRASY +IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYILREREMIYDLFEAATG +MRMMHNYFRIGGVASDLPYGWVDKCLDFSDYFLPKVDEYERLITNNPIFL +KRVRDVGFISREEAINWGLSGPMLRASGVQWDLRKVDNYECYGELDWNVQ +WQSDGDCLARYLVRLGEMRESTKIIQQALKAIPGGPYENLEARRLSKGRK +SEWNNFEYQFVGKKPSPTFKIPKQEHYVRVEAPKGELGVFLMGDDNVFPW +RWKIRSPGFINVQILPELVRGMKLADIMTILGSIDIIMGEVDR +>NC_002202@SpolCp091@ndhh@119776@120957@R@1@394 NADH_dehydrogenase_subunit_7 +MAVPTTRKDLMIVNMGPHHPSMHGVLRLIVTLDGEDVIDCEPIVGYLHRG +MEKIAENRTIIQYLPYVTRWDYLATMFTEAITVNGPEQLGNIQVPKRASY +IRVIMLELSRIASHLLWLGPFMADIGAQTPFFYILRERELIYDLFEAATG +MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLIGLTEYQKLITRNPIFL +ERVENVGIIGGEEAINWGLSGPMLRASGIQWDLRKVDHYECYDEFDWEVQ +WQKEGDSLARYLIRIGEMAESVKIIQQALEGIPGGPYENLEIRRFNRIKY +PEWNDFEYRFISKKPSPAFELSKQELYVRVEAPKGELGIFLIGDQSVFPW +RWKIRPPGFINLQILPQLVKKMKLADIMTILGSIDIIMGEVDR +>NC_002693@OeelhCp103@ndhh@127260@128441@R@1@394 NADH_dehydrogenase_subunit_7 +MNVTTTRKDLMIVNMGPHHPSMHGVLRLILTLDGEDVIDCEPILGYLHRG +MEKIAENRTVIQYLPYVTRWDYLATMFTEAITINGPEQLGNIQVPKRASY +IRIIMLELSRIASHLLWLGPFMADIGAQTPFFYIFRERELVYDLFEAATG +MRMMHNYFRIGGVAADLPYGWIDKCLDFCDYFLTAVSEYQKLITRNPIFL +ERVEGVGIIGGEEAINWGLSGPMLRASGIEWDLRKVDRYECYGELDWEIR +WQKEGDSLARYLVRMSEMTESIKIIQQALEGIPGGPYENLEIRCFDREKD +PEWDGFEYRFISKKPSPTFELPKQELYVRVEAPKGELGIFLIGDQSGFPW +RWKIRPPGFINLQILPQLVKRMKLADIMTILGSIDIIMGEVDR diff --git a/detectors/cds/test/test.db/ndhi.fst b/detectors/cds/test/test.db/ndhi.fst new file mode 100644 index 0000000..a2a13ce --- /dev/null +++ b/detectors/cds/test/test.db/ndhi.fst @@ -0,0 +1,50 @@ +>AC_000188@LyesCp076@ndhi@120525@121028@R@1@168 NADH_dehydrogenase_subunit_I +MLPMITEFINYGQQTIRAARYIGQGFMITLSHANRLPVTIQYPYEKLITS +ERFRGRIHFEFDKCIACEVCVRVCPIDLPVVDWKLETDIRKKRLLNYSID +FGICIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALGRLPMSVI +DDYTIRTISNLPQINNE +>NC_000927@NeolCp117@ndhi@145747@146268@D@1@174 NADH_dehydrogenase_subunit_I +MFDFLTSLQTYRQEAAQAAQYIGQGFGVTFDHMSRRPITIHYPYEKLIPS +ERFRGRIHFEFDKCIACEVCVRVCPINLPVVDWDYQKSVKKKQLRSYSID +FGVCIFCGNCVEYCPTNCLSMTEEYELSVYDRHELNFDHVALGRVPTSVV +QDTLVTPVLGLGYLPKGELSSLP +>NC_000932@ArthCp078@ndhi@119244@119762@R@1@173 NADH_dehydrogenase_subunit_I +MLPMITGFMNYGQQTLRAARYIGQGFMITLSHTNRLPVTIQYPYEKLITS +ERFRGRIHFEFDKCIACEVCVRVCPIDLPVVDWKLETNIRKKRLLNYSID +FGICIFCGNCVEYCPTNCLSMTEEYEFSTYDRHELNYNQIALGRLPMSVI +DDYTIRTIWNSPQTKNGVNPLI +>NC_001319@MapoCp083@ndhi@99779@100330@R@1@184 NADH_dehydrogenase_subunit_I +MFSIINGLKNYNQQAIQAARYIGQGFLVTLDHMNRLPTTIQYPYEKLIPS +ERFRGRIHFEFDKCIACEVCVRVCPINLPVVDWELKKTIKKKQLKNYSID +FGVCIFCGNCVEYCPTNCLSMTEEYELSTYNRHELNYDQIALGRLPISII +EDSTIENIFNLTSLPKGKIEGHIYSRNITNIVN +>NC_001320@OrsajCp092@ndhi@110000@110536@R@1@179 NADH_dehydrogenase_subunit_I +MFPMVTGFMGQQTIRAARYIGQSFIITLSHTNRLPITIHYPYEKSITSER +FRGRIHFEFDKCIACEVCVRVCPIDLPLVDWRFEKDIKRKQLLNYSIDFG +VCIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALSRLPISIMGD +YTIQTIRNSTQSKIDEEKSWNSRTITDY +>NC_001666@ZemaCp090@ndhi@113707@114249@R@1@181 NADH_dehydrogenase_subunit_I +MFPMLTGFISYGQQTIRAARYIGQSFIITLSHTNRLPITIHYPYEKSITS +ERFRGRIHFEFDKCIACEVCVRVCPIDLPLVDWRFEKDIKRKQLLNYSID +FGVCIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALSRLPISIM +GDYTIQTIRNSPQSKIDEEKSWNSRTITDY +>NC_001879@NitaCp087@ndhi@121108@121611@R@1@168 NADH_dehydrogenase_subunit_I +MLPMITEFINYGQQTIRAARYIGQGFMITLSHANRLPVTIQYPYEKLITS +ERFRGRIHFEFDKCIACEVCVRVCPIDLPVVDWKLETDIRKKRLLNYSID +FGICIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALGRLPMSVI +DDYTIRTISNLPQIKNE +>NC_002186@MeviCp101@ndhi@105946@106476@R@1@177 NADH_dehydrogenase_subunit_I +MFNFIDNVQTYSKEALQAAKYIGQGFMVTFDHMNRRAITIQYPYEKLIPS +ERFRGRIHFEFDKCIACEVCVRVCPINLPVVNWEFQKEKKKKQLQTYSID +FGVCIFCGNCVEYCPTNCLSMTEEYELSVYDRHELNYDNFALGRLPTMVN +NDSMVKGIKGLGYLPKGIIEGHIDNQ +>NC_002202@SpolCp089@ndhi@116981@117493@R@1@171 NADH_dehydrogenase_subunit_I +MFPMVTGFINYGQQTIRAARYIGQSFMITLSHANRLPVTIQYPYEKLITS +ERFRGRIHFEFDKCIACEVCVRACPIDLPVVDWKLETDIRKKRLLNYSID +FGICIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALGRLPISIT +DDYTIRTILNSPQTKEKACD +>NC_002693@OeelhCp101@ndhi@124541@125038@R@1@166 NADH_dehydrogenase_subunit_I +MFPMVTGFMNYGQQTVRAARYIGQGFMITLSHANRLPVTIQYPYEKLITS +ERFRGRIHFEFDKCIACEVCVRVCPIDLPVVDWKLETGVRKKRLLNYSID +FGVCIFCGNCVEYCPTNCLSMTEEYELSTYDRHELNYNQIALGRLPMSVI +DDYTIRTILNSAQIK diff --git a/detectors/cds/test/test.db/psac.fst b/detectors/cds/test/test.db/psac.fst new file mode 100644 index 0000000..bde2496 --- /dev/null +++ b/detectors/cds/test/test.db/psac.fst @@ -0,0 +1,30 @@ +>AC_000188@LyesCp065@psac@118564@118809@R@1@82 photosystem_I_subunit_VII +MSHSVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKAKQIASAPRTEDCVG +CKRCESACPTDFLSVRVYLWHETTRSMGLAY +>NC_000925@PopuCp189@psac@164452@164697@R@1@82 photosystem_I_subunit_VII +MAHSVKVYDTCIGCTQCVRACPCDVLEMVPWDGCKAKQIASAPRTEDCIG +CKRCETACPTDFLSVRVYLGAETTRSMGLAY +>NC_000926@GuthCp035@psac@33008@33253@D@1@82 photosystem_I_subunit_VII +MSHSVKVYDTCIGCTQCVRACPCDVLEMVAWDGCKAGQIASAPRTEDCIG +CKRCETACPTDFLSVRVYLGGETTRSMGLAY +>NC_000927@NeolCp112@psac@138977@139222@D@1@82 photosystem_I_subunit_VII +MSHSVKIYDTCIGCTQCVRACPTDVLEMVPWGGCKAAQIASAPRTEDCVG +CKRCESACPTDFLSVRVYLGAETTRSMGLAY +>NC_000932@ArthCp075@psac@117318@117563@R@1@82 photosystem_I_subunit_VII +MSHSVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKAKQIASAPRTEDCVG +CKRCESACPTDFLSVRVYLWHETTRSMGLAY +>NC_001319@MapoCp080@psac@98289@98534@R@1@82 photosystem_I_subunit_VII +MAHAVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKANQIASAPRTEDCVG +CKRCESRCPTDFLSVRVYLGNETTRSMGLSY +>NC_001320@OrsajCp089@psac@108020@108265@R@1@82 photosystem_I_subunit_VII +MSHSVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKAKQIASAPRTEDCVG +CKRCESACPTDFLSVRVYLGPETTRSMALSY +>NC_001603@EugrCp046@psac@74937@75893@R@3@82 photosystem_I_subunit_VII +MSHSVKIYNTCIGCTQCVRACPTDVLEMVPWDGCKAGQIASSPRTEDCVG +CKRCESACPTDFLSVRVYLGSETSRSMGLAY +>NC_001631@PithCp145@psac@103521@103766@D@1@82 photosystem_I_subunit_VII +MAHSVKIYDTCIGCTQCVRACPTDVLEMIPWEGCKAKQIASAPRTEDCAG +CKRCESACPTDFLSVRVYLWHETTRSMGLAY +>NC_001666@ZemaCp087@psac@111760@112005@R@1@82 photosystem_I_subunit_VII +MSHSVKIYDTCIGCTHCVRACPTDVLEMIPWDGCKAKQIASAPRTEDCVG +CKRCESACPTDFLSVRVYLGPETTRSMALSY diff --git a/detectors/cds/test/test.db/rpl2.fst b/detectors/cds/test/test.db/rpl2.fst new file mode 100644 index 0000000..f4ac988 --- /dev/null +++ b/detectors/cds/test/test.db/rpl2.fst @@ -0,0 +1,70 @@ +>AC_000188@LyesCp030@rpl2@86038@87528@R@2@275 ribosomal_protein_L2 +MAIHLYKTSTPSTRNGTVDSQVKSNPRNNLIYGQRRCGKGRNARGIITAR +HRGGGHKRLYRKIDFRRNEKDIYGRIVTIEYDPNRNAYICLIHYGDGEKR +YILHPRGAIIGDTIVSGTEVPIKMGNALPLTDMPLGTAIHNIEITLGKGG +QLARAAGAVAKLIAKEGKSATLKLPSGEVRLISKNCSATVGQVGNVGVNQ +KSLGRAGSKRWLGKRPVVRGVVMNPVDHPHGGGEGRAPIGRKKPTTPWGY +PALGRRSRKRNKYSDNLILRRRSK +>AC_000188@LyesCp087@rpl2@153816@155306@D@2@275 ribosomal_protein_L2 +MAIHLYKTSTPSTRNGTVDSQVKSNPRNNLIYGQRRCGKGRNARGIITAR +HRGGGHKRLYRKIDFRRNEKDIYGRIVTIEYDPNRNAYICLIHYGDGEKR +YILHPRGAIIGDTIVSGTEVPIKMGNALPLTDMPLGTAIHNIEITLGKGG +QLARAAGAVAKLIAKEGKSATLKLPSGEVRLISKNCSATVGQVGNVGVNQ +KSLGRAGSKRWLGKRPVVRGVVMNPVDHPHGGGEGRAPIGRKKPTTPWGY +PALGRRSRKRNKYSDNLILRRRSK +>NC_000925@PopuCp126@rpl2@103379@104263@R@1@295 ribosomal_protein_L2 +MAIRLYRAYTPGTRNRTVSTFSEITTDKPEKSLINKHHFCKGRNNRGVIT +CRHKGGGHKQRYRLIDFKRNRHNIIAKVASIEYDPNRNARIALLHYLDGE +KRYILHPRSLSVGAIVVSGPMAPIEVGNALPLSTIPLGTAVHNIELRPYC +GGQIVRSAGTYAQIVAKEGNFVTVKLPSSEVRMIRKECYATIGQVGNIDA +SNITLGKAGRSRWLGKRPTVRGVVMNPVDHPHGGGGEGKSPIGRSRPVTP +WGKPALGVKTRNPNKYSNPYVLLVVNKVYLTYNLILKYNVEINT +>NC_000926@GuthCp113@rpl2@100540@101367@D@1@276 ribosomal_protein_L2 +MGIRIYKSYTPGTRNRSSSDFVEITKSKPEKSLLRKKLSCAGRNNRGLIT +VRHKGGGHKQRYRLVDFKRNKLDIPAIVASVEYDPNRNARIALLHYQDGE +KRYILHPKKLAVGDKIYSGINVPIEIGNAMPLYNVPLGTAVHNVELIPGR +GGQIVRSAGTSAQVVAKDGQVVTIKMPSNEVRMIYKNCYATIGEVGNADI +KNIRLGKAGRKRWLGIRPSVRGVVMNPCDHPHGGGEGRSPIGRAKPVTPW +GKPALGVKTRRQNKYSDFCIIRSRN +>NC_000927@NeolCp022@rpl2@15904@16731@R@1@276 ribosomal_protein_L2 +MGIRFYRAHTPGTRNRSVSDFHEITTSTPTKSLTHANHRARGRNHSGSIT +TRWRGGGHKRLYRQIDFRRDKVGVLARVATVEYDPNRSARIALLHYQDGS +KRYILHPQGLAIGAEVMSSPEAPISIGNALPLVNMPLGTEVHNIELRPYN +GGQLVRAAGAVAQLVAKEGGFGTLRMPSGEVRLVAKDCWATVGQVGHVES +INLTLGKAGRSRWLDRRPRVRGSVMNACDHPHGGGEGRCPIGHPGPLTPW +GKPALGQRTRARKKYSDALLVRRRK +>NC_000932@ArthCp064@rpl2@84337@85843@R@2@275 ribosomal_protein_L2 +MAIHLYKTSTPSTRNGAVDSQVKSNPRNNLICGQHHCGKGRNARGIITAR +HRGGGHKRLYRKIDFRRNAKDIYGRIVTIEYDPNRNAYICLIHYGDGEKR +YILHPRGAIIGDTIVSGTEVPIKMGNALPLTDMPLGTAIHNIEITLGRGG +QLARAAGAVAKLIAKEGKSATLKLPSGEVRLISKNCSATVGQVGNVGVNQ +KSLGRAGSKCWLGKRPVVRGVVMNPVDHPHGGGEGRAPIGRKKPVTPWGY +PALGRRTRKRKKYSETLILRRRSK +>NC_000932@ArthCp085@rpl2@152806@154312@D@2@275 ribosomal_protein_L2 +MAIHLYKTSTPSTRNGAVDSQVKSNPRNNLICGQHHCGKGRNARGIITAR +HRGGGHKRLYRKIDFRRNAKDIYGRIVTIEYDPNRNAYICLIHYGDGEKR +YILHPRGAIIGDTIVSGTEVPIKMGNALPLTDMPLGTAIHNIEITLGRGG +QLARAAGAVAKLIAKEGKSATLKLPSGEVRLISKNCSATVGQVGNVGVNQ +KSLGRAGSKCWLGKRPVVRGVVMNPVDHPHGGGEGRAPIGRKKPVTPWGY +PALGRRTRKRKKYSETLILRRRSK +>NC_001319@MapoCp072@rpl2@79137@80514@R@2@278 ribosomal_protein_L2 +MAIRLYRAYTPGTRNRSVPKFDEIVKCQPQKKLTYNKHIKKGRNNRGIIT +SQHRGGGHKRLYRKIDFQRNKKYITGKIKTIEYDPNRNTYICLINYEDGE +KRYILYPRGIKLDDTIISSEEAPILIGNTLPLTNMPLGTAIHNIEITPGK +GGQLVRAAGTVAKIIAKEGQLVTLRLPSGEIRLISQKCLATIGQIGNVDV +NNLRIGKAGSKRWLGKRPKVRGVVMNPIDHPHGGGEGRAPIGRKKPLTPW +GHPALGKRSRKNNKYSDTLILRRRKNS +>NC_001320@OrsajCp069@rpl2@81180@82664@R@2@274 ribosomal_protein_L2 +MAKHLYKTPIPSTRKGTIDRQVKSNPRNNLIHGRHRCGKGRNSRGIITAR +HRGGGHKRLYRKIDFRRNQKDISGRIVTIEYDPNRNAYICLIHYGDGEKG +YILHPRGAIIGDTIVSGTKVPISMGNALPLTDMPLGTAIHNIEITRGRGG +QLARAAGAVAKLIAKEGKSATLRLPSGEVRLVSQNCLATVGQVGNVGVNQ +KSLGRAGSKCWLGKRPVVRGVVMNPVDHPHGGGEGKAPIGRKKPTTPWGY +PALGRRTRKRKKYSDSFILRRRK +>NC_001320@OrsajCp109@rpl2@132454@133938@D@2@274 ribosomal_protein_L2 +MAKHLYKTPIPSTRKGTIDRQVKSNPRNNLIHGRHRCGKGRNSRGIITAR +HRGGGHKRLYRKIDFRRNQKDISGRIVTIEYDPNRNAYICLIHYGDGEKG +YILHPRGAIIGDTIVSGTKVPISMGNALPLTDMPLGTAIHNIEITRGRGG +QLARAAGAVAKLIAKEGKSATLRLPSGEVRLVSQNCLATVGQVGNVGVNQ +KSLGRAGSKCWLGKRPVVRGVVMNPVDHPHGGGEGKAPIGRKKPTTPWGY +PALGRRTRKRKKYSDSFILRRRK diff --git a/detectors/cds/test/test.db/rpl23.fst b/detectors/cds/test/test.db/rpl23.fst new file mode 100644 index 0000000..7a6ef00 --- /dev/null +++ b/detectors/cds/test/test.db/rpl23.fst @@ -0,0 +1,30 @@ +>AC_000188@LyesCp026@rpl23@87547@87828@R@1@94 ribosomal_protein_L23 +MDGIKYAVFTDKSIRLLGKNQYTSNVESGSTRTEIKHWVELFFGVKVIAM +NSHRLPGKSRRMGPIMGHTMHYRRMIITLQPGYSIPPLRKKRT +>AC_000188@LyesCp083@rpl23@153516@153797@D@1@94 ribosomal_protein_L23 +MDGIKYAVFTDKSIRLLGKNQYTSNVESGSTRTEIKHWVELFFGVKVIAM +NSHRLPGKSRRMGPIMGHTMHYRRMIITLQPGYSIPPLRKKRT +>NC_000925@PopuCp127@rpl23@104311@104613@R@1@101 ribosomal_protein_L23 +MDSIDSRDLLDLVKYPIITDKTTKLLEENQYCFAVDPNATKINIKAAIQY +IFNVQVTGVNTCHPPKKKRSIGRFIGKRPHYKKAIITLASKDSINLFPET +>NC_000926@GuthCp112@rpl23@100237@100524@D@1@96 ribosomal_protein_L23 +MHALIDLVKYPLITDKATRLLELNQYTFLTSRVATKTDIKNAIEFLFNVK +VISINTCLLPLKRKRLGKFVGSKPRYKKAVVTLEKNNTINLFSEN +>NC_000927@NeolCp023@rpl23@16871@17149@R@1@93 ribosomal_protein_L23 +MIIDLVKRPVITEKATRILEKNQYTFDVELSLTKPKIKALIEKAFKVEVV +SVNTHRPPRRKRRLGTTQGYLPRYKRAIITLKRGFMIPLTPF +>NC_000932@ArthCp065@rpl23@85862@86143@R@1@94 ribosomal_protein_L23 +MDGIKYAVFTDKSIRLLGKNQYTFNVESGSTRTEIKHWVELFFGVKVIAM +NSHRLPGKVKRMGPILGHTMHYRRMIITLQPGYSIPPLRKKRT +>NC_000932@ArthCp084@rpl23@152506@152787@D@1@94 ribosomal_protein_L23 +MDGIKYAVFTDKSIRLLGKNQYTFNVESGSTRTEIKHWVELFFGVKVIAM +NSHRLPGKVKRMGPILGHTMHYRRMIITLQPGYSIPPLRKKRT +>NC_001319@MapoCp073@rpl23@80550@80825@R@1@92 ribosomal_protein_L23 +MNQVKYPVLTEKTIRLLEKNQYSFDVNIDSNKTQIKKWIELFFNVKVISV +NSHRLPKKKKKIGTTTGYTVRYKRMIIKLQSGYSIPLFSNK +>NC_001320@OrsajCp071@rpl23@82683@82964@R@1@94 ribosomal_protein_L23 +MDGIKYAVFTEKSLRLLGKNQYTFNVESGFTKTEIKHWVELFFGVKVVAV +NSHRLPGKGRRMGPILGHTMHYRRMIITLQPGYSIPLLDREKN +>NC_001320@OrsajCp108@rpl23@132154@132435@D@1@94 ribosomal_protein_L23 +MDGIKYAVFTEKSLRLLGKNQYTFNVESGFTKTEIKHWVELFFGVKVVAV +NSHRLPGKGRRMGPILGHTMHYRRMIITLQPGYSIPLLDREKN diff --git a/detectors/cds/test/test.db/rpl32.fst b/detectors/cds/test/test.db/rpl32.fst new file mode 100644 index 0000000..7cf400e --- /dev/null +++ b/detectors/cds/test/test.db/rpl32.fst @@ -0,0 +1,30 @@ +>AC_000188@LyesCp036@rpl32@114504@114671@D@1@56 ribosomal_protein_L32 +MAVPKKRTSTSKKRIRKNIWKRKGYWVALKAFSLAKSLSTGNSKSFFVRQ +TKINK +>NC_000925@PopuCp022@rpl32@16239@16418@D@1@60 ribosomal_protein_L32 +MAVPKKRTSKAKKNARKANWKNQAKTEAQKALSLAKSVLTGKSNGFVYNT +LEVADAIVE +>NC_000926@GuthCp026@rpl32@24770@24931@D@1@54 ribosomal_protein_L32 +MAVPKKRTSRSKTNSRFANWLNKSNLQAQRAISKAKSITNKKNTVNDETI +ETE +>NC_000927@NeolCp122@rpl32@149220@149447@D@1@76 ribosomal_protein_L32 +MAVPKKRKSKSRANSQNHVWKREIVKQARRAVSLAKALLGGNTNFLLVSP +GPTTPIKPNPKKQTGRRPRSQRRRT +>NC_000932@ArthCp072@rpl32@113449@113607@D@1@53 ribosomal_protein_L32 +MAVPKKRTSISKKRIRKKIWKRKGYWTSLKAFSLGKSLSTGNSKSFFVQQ +NK +>NC_001319@MapoCp076@rpl32@93886@94095@D@1@70 ribosomal_protein_L32 +MAVPKKRTSKSKTRIRKAIWKNKANKSALRAFSLAKSILTNRSKSFYYTI +NDKLLNSSKSISTSKLDES +>NC_001320@OrsajCp086@rpl32@104352@104543@D@1@64 ribosomal_protein_L32 +MAVPKKRTSMSKKRIRKNLWKKKTYFSIVQSYSLAKSRSFSGVSEHPKPK +GFSRQQTNNRVLG +>NC_001603@EugrCp047@rpl32@75928@76092@R@1@55 ribosomal_protein_L32 +MAVPKKKMSKSRRNSRKSNWKKKVLKKVLFALSLGKSFEANTNVNFSFGD +KLPQ +>NC_001631@PithCp150@rpl32@107399@107611@R@1@71 ribosomal_protein_L32 +MAVPKKRTSRSKKKIRKNVRKGKAYRAAIKAFSLAKSISTGHSKSFYCIV +NDDSSGSSESKLTAIDLDDP +>NC_001666@ZemaCp084@rpl32@108127@108306@D@1@60 ribosomal_protein_L32 +MAVPKKRTSMSKKRIRKNLWKKKTYFSIVQSYSLAKSRSFSRGNEHPKPK +GFSGQQANK diff --git a/detectors/cds/test/test.db/rps15.fst b/detectors/cds/test/test.db/rps15.fst new file mode 100644 index 0000000..cd3fe81 --- /dev/null +++ b/detectors/cds/test/test.db/rps15.fst @@ -0,0 +1,30 @@ +>AC_000188@LyesCp029@rps15@124632@124895@R@1@88 ribosomal_protein_S15 +MVKNSVISVISQEEKKGSVEFQVFNFTNKIRRLTSHLELHKKDYLSQRGL +KKILGKRQRLLAYLAKKNRVRYKELINRLDIRETKTR +>NC_000932@ArthCp081@rps15@123296@123562@R@1@89 ribosomal_protein_S15 +MIKNIVISFEEQKEESRGSVEFQVFSFTNKIRRLTSHLELHRKDYLSQRG +LRKILGKRQRLLAYLSKKNRVRYKELINQLNIRELKTR +>NC_001319@MapoCp086@rps15@103433@103699@R@1@89 ribosomal_protein_S15 +MSKNLFMDLSSISEKEKGSVEFQIFRLTNRVVKLTYHFKKHGKDYSSQRG +LWKILGKRKRLLAYLFKTNFVSYENLIIQLGIRGLKKN +>NC_001320@OrsajCp083@rps15@100818@101090@D@1@91 ribosomal_protein_S15 +MKKKGGRKIFGFMVKEEKEENWGSVEFQVFSFTNKIRRLASHLELHKKDF +SSERGLRRLLGKRQRLLAYLAKKNRVRYKKLISQLDIRER +>NC_001320@OrsajCp095@rps15@114028@114300@R@1@91 ribosomal_protein_S15 +MKKKGGRKIFGFMVKEEKEENWGSVEFQVFSFTNKIRRLASHLELHKKDF +SSERGLRRLLGKRQRLLAYLAKKNRVRYKKLISQLDIRER +>NC_001631@PithCp139@rps15@101136@101402@D@1@89 ribosomal_protein_S15 +MINNLSISSSLIPDKQRGSVESQVFYLTNRVLRLTQHLQLHGRDYSSQRG +LWKILSKRKQLLVYLSKRDKLRYDDLIGQLGIRGLKTR +>NC_001666@ZemaCp082@rps15@104729@104965@D@1@79 ribosomal_protein_S15 +MVKEEKQENRGSVEFQVFSFTNKIRRLASHLELHKKDFSSERGLRRLLGK +RQRLLAYLAKKNRVRYKKLISQLDIREK +>NC_001666@ZemaCp093@rps15@117772@118008@R@1@79 ribosomal_protein_S15 +MVKEEKQENRGSVEFQVFSFTNKIRRLASHLELHKKDFSSERGLRRLLGK +RQRLLAYLAKKNRVRYKKLISQLDIREK +>NC_001879@NitaCp090@rps15@125230@125493@R@1@88 ribosomal_protein_S15 +MVKNSVISVISQEEKRGSVEFQVFNFTNKIRRLTSHLELHKKDYLSQRGL +KKILGKRQRLLAYLSKKNRVRYKELINQLDIRETKTR +>NC_002186@MeviCp104@rps15@109145@109417@R@1@91 ribosomal_protein_S15 +MLKKKIIKTHANHTNDTGSTQVQVSLLSSRVAQLTKHLNNHKNDYSSQRG +LKKLLGQRKRLLKYLFVKDPLGYNNLIIQLGIRPGKSLVN diff --git a/detectors/cds/test/test.db/rps7.fst b/detectors/cds/test/test.db/rps7.fst new file mode 100644 index 0000000..0f9187e --- /dev/null +++ b/detectors/cds/test/test.db/rps7.fst @@ -0,0 +1,50 @@ +>AC_000188@LyesCp008@rps7@98721@99188@R@1@156 ribosomal_protein_S7 +MSRRGTAEKKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYRAVKKI +QQKTETNPLSVLRQAIRGVTPDITVKARRVGGSTHQVPIEIGSTQGKALA +IRWLLAASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRA +FAHFR +>AC_000188@LyesCp022@rps7@142156@142623@D@1@156 ribosomal_protein_S7 +MSRRGTAEKKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYRAVKKI +QQKTETNPLSVLRQAIRGVTPDITVKARRVGGSTHQVPIEIGSTQGKALA +IRWLLAASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRA +FAHFR +>NC_000925@PopuCp103@rps7@92209@92679@R@1@157 ribosomal_protein_S7 +MSRRNTAKKRFASPDPLYKSRLVSMLTVRILKSGKKTLAQRIIYQALDIV +KERTETDPLNVLEKAIRNITPLVEVKARRVGGSTYQVPIEVRAYRGTNLA +LRWITRFSRERSGKSMSMKLANEIMDAANETGNSIRKREETHRMAEANKA +FAHYRY +>NC_000926@GuthCp136@rps7@111745@112215@D@1@157 ribosomal_protein_S7 +MSRRSTTKKKLALPDPIYNSRLVNMLTVRILKEGKKHLAQRIIYNAFDII +KQRTGEDAILVFESAIKKVTPLVEVKARRIGGSTYQVPMEVRAFRGTNLA +LRWITKYARERAGKSMSMKLANEIMDAANETGSSIRKREEIHRMAEANKA +FAHYRF +>NC_000927@NeolCp044@rps7@48318@48788@D@1@157 ribosomal_protein_S7 +MSRRNTAVKRSISSDPVYNSQLIHMMISHILKEGKKALAYRLMYDAMKRI +EKTTQQDPILVVERAVRNATPTIEVKARRMGGSIYQVPLEVKPERGTALA +LRWILLAARNRTGRDMVAKLSNELMDASNRIGNAVRKRDEMHRMAEANKA +FAHIRV +>NC_000932@ArthCp069@rps7@97478@97945@R@1@156 ribosomal_protein_S7 +MSRRGTAEEKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYRALKKI +QQKTETNPLSVLRQAIRGVTPDIAVKARRVGGSTHQVPIEIGSTQGKALA +IRWLLGASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRA +FAHFR +>NC_000932@ArthCp088@rps7@140704@141171@D@1@156 ribosomal_protein_S7 +MSRRGTAEEKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYRALKKI +QQKTETNPLSVLRQAIRGVTPDIAVKARRVGGSTHQVPIEIGSTQGKALA +IRWLLGASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRA +FAHFR +>NC_001319@MapoCp002@rps7@892@1359@D@1@156 ribosomal_protein_S7 +MSRKSIAEKQVAKPDPIYRNRLVNMLVNRILKNGKKSLAYRILYKAMKNI +KQKTKKNPLFVLRQAVRKVTPNVTVKARRIDGSTYQVPLEIKSTQGKALA +IRWLLGASRKRSGQNMAFKLSYELIDAARDNGIAIRKKEETHKMAEANRA +FAHFR +>NC_001320@OrsajCp076@rps7@87944@88414@R@1@157 ribosomal_protein_S7 +MSRRGTAEKRTAKSDPIFRNRLVNMVVNRIMKDGKKSLAYQILYRAVKKI +QQKTETNPLLVLRQAIRRVTPNIGVKTRRNKKGSTRKVPIEIGSKQGRAL +AIRWLLEASQKRPGRNMAFKLSSELVDAAKGGGGAIRKKEATHRMAEANR +ALAHFR +>NC_001320@OrsajCp103@rps7@126704@127174@D@1@157 ribosomal_protein_S7 +MSRRGTAEKRTAKSDPIFRNRLVNMVVNRIMKDGKKSLAYQILYRAVKKI +QQKTETNPLLVLRQAIRRVTPNIGVKTRRNKKGSTRKVPIEIGSKQGRAL +AIRWLLEASQKRPGRNMAFKLSSELVDAAKGGGGAIRKKEATHRMAEANR +ALAHFR diff --git a/detectors/cds/test/test.db/ycf1.fst b/detectors/cds/test/test.db/ycf1.fst new file mode 100644 index 0000000..cb7986a --- /dev/null +++ b/detectors/cds/test/test.db/ycf1.fst @@ -0,0 +1,353 @@ +>AC_000188@LyesCp019@ycf1@125297@130972@R@1@1892 ycf1_protein +MIFQSFLLGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRALVM +EEGTEKKVSATTGFITGQLMMFISIYYAPLHLALGRPHTITVLALPYLLF +HFFWNNHKHFFDYGSTTRNSMRNLSIQCVFLNNLIFQLFNHFILPSSMLA +RLVNIYLFRCNNKILFVTSGFVGWLIGHILFMKWLGLVLVWIRQNHSIRS +NKYIRSNKYLVLELRNSMARIFSILLFITCVYYLGRIPSPILTKKLKEAS +KTEERVESEEERDVEIETASEMKGTKQEQEGSTEEDPYPSPSLFSEEGWD +PDKIDETEEIRVNGKDKIKDKFHSHLTETGYNNINTSNSPIYDYQDSYLN +NNNTGNLENCKLQLLDKKNENQEQDLFWFQKPLVSLLFDYNRWNRPFRYI +KNNRFEQAVRTEMSQYFFDTCKSDGKQKISFTYPPSLSTFWKMIKRKIPL +LSLQKTLPNELDTQWVSTNKEKSNNLNKEFLNRLEILDKESLSLDILETR +TRFCNDDTKKEYVPKMYDPLLNGLYRGTIKKGVSSSIINNTLLENWEKRV +RLNRIHTIFLPNIDYQEFEQKAYTIDKKPLSTEIDEFLTLINELGNEAKS +SLNLKGLSLFSDQEQRRANSEKRTKFVKFVFNALDPNETKSGKKSIGIKE +ISKKVPRWSHKLITELDQQMGEFKDRASMDHQLRSRKAKRVVIFTDNKAT +KDAEEEVALISYSQQSDFRRGIITGSMRAQRRKTFISKLFQANVHSPLFV +DRITPLRLFSFDISELIKPILKNWTDKEGEFKILESREEQTKREEKKEKD +KKEDNKRKEQARIAIEEAWDTIPLAQIIRGYMLITQSILRKYILLPALII +AKNIGRMLFLQLPEWSEDLQEWNREMQIKCTYNGVQLSETEFPKNWLRDG +IQIKILFPFCLKPWHISKLYPSRRELMKKQKQKDDFCFLTVWGMEAELPF +GSPRKRPSFFEPIFKELEKKIGKFKKKYFLTLKILKGKTKLFRKVSKETT +KLFIKSIGFLKKIKKELSKVNLIVLFRFKEISESNETKKEKDYLISNQII +NESFRQIESGNWPNSSLIETKMKDLTNRTSTIKNKIERITKEKKKVTPEI +DINPNKTNNIKKFESPKKIFQILKSRNTRVIWKFHYFLKLFIQRLYINLF +LSIINIPRITTQLFLKSTNKLIEKFISNNEINQEKINNKKKIHFMFISTI +KKSLYNISKKNSHILCDLSYLSQAYVFYKLSQTQVINFSKFRSVLQYNTT +SCFLKTKIKDYFKTLGIFHSELKHKKLQSYRINQWKNWLRWHYQYDLSQI +RWSRLMPKKWRTRVNQSCMAQNKNRNLNKWNSYEKDQLLHYKKENDSELY +SLSNEKDNFKKCYGYGLLAYKSINYENKSDSFFSRLPFEVQVKKNLEISY +NSNTSKHNFVDMPGNLHINNYLRKGNILDRERNLDRKYFDWKIIHFSLRQ +KGDIEAWVKIDTNSNPNTKIGINNYQIIDKIEKKGVFYLTTHQNPEKTQK +NSKKFFFDWMGMNEKIFNRPILNLEFWFFPEFVLLYNVYKIKPWIIPSKF +LLFNLNTNKNVSQNKNQNFFLPSNKKIKIKNRSQEAKEPPSQRERGSDIE +NKGNLSPVFSKHQTDLEKDYVESDTKKGKNKKQYKSNTEAELDLFLKRYL +LFQLRWNGALNQRMFENIKVYCLLLRLINPTKITISSIQRREMSLDIMLI +QANLPLTDLMKKGVLIIEPIRLSVKDNGQFIMYQTIGISLIHKSKHQTNQ +RYREQRYVDKKNFDEFILQPQTQRINTEKTHFGLLVPENILWSRRRRELR +IRSFFNSWNWNVVDRNSVFCNETNVKNWSQFLGERKPLYKDKNELIKFKF +FFWPNYRLEDLACMNRYWFDTNNGSRFSILRIHMYPRLKIN +>NC_000932@ArthCp070@ycf1@109405@110436@D@1@344 hypothetical_protein +MMVFQSFILGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRARV +MDEGEEGTEKKVSATTGFIAGQLMMFISIYYAPLHLALGRPHTITVLALP +YLLFHFFWNNHKHFFDYGSTTRNEMRNLRIQCVFLNNLIFQLFNHFILPS +SMLARLVNIYMFRCNNKMLFVTSSFVGWLIGHILFMKWVGLVLVWIQQNN +SIRSNVVIRSNKYKFLVSELRNSMARIFSILLFITCVYYLGRIPSPIFTK +KLKGTSETGGTKQDQEVSTEEAPFPSLFSEEGEDLDKIDEMEEIRVNGKD +KINKDDEFHVRTYYNYKTVSENLYGNKENSNLEFFKIKKKEDH +>NC_000932@Arthcp087@ycf1@123884@129244@R@1@1787 Ycf1 +MMVFQSFILGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRARV +MDEGEEGTEKKVSATTGFIAGQLMMFISIYYAPLHLALGRPHTITVLALP +YLLFHFFWNNHKHFFDYGSTTRNEMRNLRIQCVFLNNLIFQLFNHFILPS +SMLARLVNIYMFRCNNKMLFVTSSFVGWLIGHILFMKWVGLVLVWIQQNN +SIRSNVVIRSNKYKFLVSELRNSMARIFSILLFITCVYYLGRIPSPIFTK +KLKGTSETGGTKQDQEVSTEEAPFPSLFSEEGEDLDKIDEMEEIRVNGKD +KINKDDEFHVRTYYNYKTVSENLYGNKENSNLEFFKIKKKEDHFLWFEKP +FVTLVFDYKRWNRPNRYIKNDKIENIVRNEMSQYFFYTCQSDGKERISFT +YPPNLSTFFEMIQKRIPSFTKEKKTFDQVSTYWSLIHEEKRENLKKEFLN +RIEALDKEWSVENILEKTTRFCYNEAKKEYLPKIYDPFLHGISRGRIKKL +PPFQIITETYRKNNLGGSWINKIHGLLLKINYKKFEQTIEKFNRKSLSIE +KKLSFFSEPQQEEKINSEEEIKTFKFLFDIVRTDSNDQTLIKNFMDFPEI +NKKVPRWSYKLISELEELEGENEENVPMEPGIRSRKAKRVVVFTDKEPHG +EIYTNLKDNQNSDQNDEMALIRYSQQSDFRREIIKGSMRSQRRKTVIWEF +FQAKVHSPLFFDRIDKLFFFSFDIWGLKKKIIKNFIWKKKIDKKEEEQSK +REETRRIEIAETWDSFLFAQIIRGSLLVTQSILRKYIILPLLIIIKNSVR +MLLFQFPEWSQDLKDWKREMHVKCTYNGVQLSETEFPRNWLTDGIQIKIL +FPFYLKPWHKSKFQASQKARLKKTKDKGEKNDFCFLTVWGMETELPFGSA +QRKPSFFEPISKELKKRIKKLKKKSFVVLKIFKERAPIFLKVAKETKNWI +LKNFIFIKGISKRNLIPLFGPREIYELNEPKKDSIISNQMIHELSVQNKS +LEWTNSSLSEKKIKNLIDRKKTIRNQIEEISKEKQNLTNSCTKLRYDSKI +IESSKKIWQTFKRKNTRLIRKSIFFFKFCIEQMSIAIFLGIINIPRITTQ +LFFESTKKILDKYIYKNEENGEKKKNTLYFISTIKNLISNKKKMSYDLCS +LSQAYVFYKLSQIKVSNFCKLKAVLEYNICITSFFVKNKIKVFFQEHGIF +HYELKNKTFLNSEVNQWKNWLRSQYQYNLPQISWARLVTQNWKNKINKDS +LVLNPSLTKEDSYEKKKFDNYKKQKFFEADSLLNPKHNVKKDSIYNLFCY +KSIHSTEKNFDMSIGIALDNCLVSSFLEKYNIRGMGEIRHRKYLDWRILN +FWFTKKVTIEPWVDTKSKKKYINTKVQNYQKIDKITQTDLANKKRNFFDW +MGMNEEILNQRITNFEFFFFPEFFLFSSTYKMKPWVIPIKLLLLNFNENI +NVNKKIIRKKKGFIPSNEKESLRFYNLNKEEKESAGQVELESDKETKRNP +EAARLNQEKNIEENFAESTIKKRKNKKQYKSNTEAELDLFLTRYSRFQLR +WNCFFNQKILNNVKVYCLLVRLNNPNEIAVSSIERGEMSLDILMIEKNFT +FAKLMKKGILIIEPVRLSVQNDGQLIIYRTIGISLVHKNKHKISKRYKKK +SYINKKFFEKSITKYQNKTVNKKKNNYDFFVPEKILSPKRRREFRILICF +NLKKKNARDTNSRFDKNIQNLTTVLHKKKDLDLDKDKNNLINLKSFLWPN +FKLEDLACMNRYWFNTTNGNHFSMIRIRMYTRFPIP +>NC_001879@NitaCp151@ycf1@125891@131599@R@1@1903 Ycf1 +MMIFQSFLLGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRALV +MEEGTEKKVSATTGFITGQLMMFISIYYAPLHLALGRPHTITVLALPYLL +FHFFWNNHKHFFDYGSTTRNSMRNLSIQCVFLNNLIFQLFNHFILPSSML +ARLVNIYLFRCNSKILFVTSGFVGWLIGHILFMKWLGLVLVWIRQNHSIR +SNKYIRSNKYLVLELRNSMARIFSILLFITCVYYLGRIPSPILTKKLKEA +SKTEERVESEEERDVEIETASEMKGTKQEQEGSTEEDPYPSPSLFSEERW +DPDKIDETEEIRVNGKDKIKDKFHSHLTETGYNNINTSNSPIYDYEDSYL +NNNNTGNTEIFKLQLLDKKNENKDLFWFQQPLVSLLFDYNRWNRPFRYIK +NNRFEQAIRTEMSQYFFNTCKSDGKQRISFTYPPSLSTFWKMIKRRIPLL +SLQKTLPNELDNQWISTNKEKSNNLNKEFLNRLEVLDKESFSLDILETRT +RLCNDDTKKEYVPKMYDPLLNGPYRGTIKKKFSPSIINNTSLENLKERVR +INRIHTIFLPNTDYQELEQKVDTVAKKPLSTEIDEFLTLINEFGNEPKSS +LNLKDLSLFSDQEQGRVNSEKRTKFVKFVFNAIAPNGTTSEKKSIGIKEI +SKKIPRWSHKLITELEQQSGDYQEGVPLDHQIRSRKAKRVVIFTANNQNN +DPDTKDTDTADQDQTKEVALIRYSQQPDFRRGIIKGSMRAQRRKTVIWKL +FQANVHSPLFLDRITPPFLFSFDISGLIKPIFRNWSGKEGEFKILESREE +QTKREEKKEKDKKGENKRKEKARIEIAEAWDTIPFAQIIRGYMLITQSIL +RKYIVLPSLIIAKNLGRMLVLQLPEWSEDLQEWNREMHIKCTYNGVQLSE +TEFPKNWLKDGIQIKILFPFCLKPWHISKLYSSRGELMKKKKQKDDFCFL +TVWGMEAELPFGSPRKRPSFFEPIFKELEKKIGKFKKKYFITLKVFKGKI +KLFRRISKETKKWLIKSSLFIKKMKKELSKVNPIVLFRLKEIDESNETKK +EKDSLMSNQIINESFSQIESGNWPNSSLIESKMKDLTDRTSTIKNQIERI +TKEKKKVTPEIDISPNKTNNIKKFESPKKIFQILKRRNTRLIWKFHYFLK +LFIQRLYIDLFLSIINIPRINTQLFLESTNKLIDKYISNNEINQEKINNQ +KKIHFISTIKKSLYNISKKNSHIFFDLSYLSQAYVFYKLSQPQVINLSKL +RSVLQYNRTSFFLKTKIKDYFRTLGIFHSELKHKKLQSYRINQWKNWLRR +HYQYDLSQIRWSRLMPQKWRNRVNQGCMAQNRNLNKWNSYEKDQLIHYKK +ENDSELYSLANQKDNFQKCYRYDLLAYKSINYEKKNDSFISRLPFQVNKN +LEISSNSNTSKHNLFDMLGNLHINNYLRKGNILYIERNLDRKYFDWKIIH +FSLRQKEDIEAWVKIDTNSNPNTKIGINNYQIIDKIDKKGFFYLTIHQNP +ENNQKNSKKAFFDWMGMNEKILNRPILNLEFWFFPEFVPLYNVYKIKPWI +IPSKLLLLNLNTNENVSQNKNINKNQKQNFFLRSNKKIKNRIQEAKEPAS +QGEKERGSDIENKGNLGPVLSKHQNALKKDYAESDTKKGKKKKQYKSNTE +AELDLFLKRYLLFQLRWNDALNQRMIENIKVYCLLLRLINPSKIAISSIQ +RREMSLDIMLIQKNLTLTELMKKGILIIEPIRLSVKNNGQFIMYQTIGIS +LVHKSKHQTNQRYPEQRYVDKKNFDEFILQPQTQRINTDKNHFDLLVPEN +ILWSRRRRELRIRSLFNSLNWNGIDRNSVFCNENNVKNWSQFLDERKPLY +KEKNELIKLKFFLWPNYRLEDLACMNRYWFDTNNGSRFSILRIHMYPQLK +IN +>NC_002202@SpolCp093@ycf1@121596@127097@R@1@1834 ycf1_protein +MIFQSFLLGNLVSLCMKIINSVVVVGLYYGFLTTFSIGPSYLFLLRAQVM +EEGEEGTEKKVSGTTGFIMGQLMMFISIYYTPLHLALGRPHTITVLALPY +LLFHFFWNNHKHFFDYGSTSRNSMRNLSIQCVFLNNLIFQLFNYFILPSS +MLARLVNIYMFRCNNKMLFVTSSFVGWLIGHILFMKWVGLVLVWIQQNNS +IRSNKYLVSELRNSMARIFSILFFITCVYYLGRMPSPIFTNKLKQMLETN +EIEEETNLEIEKTSETKETKQEEEGFTEEDPSPSLFSEEKEDPDKIDETE +KIRVNGKDKTKDEFHLKEACYKNSPTSYSGNQDISKLEILKKEKKILFWF +QKPLIFLLFDYKRWNRPMRYIKNNRFENAVRNEMSQYFFYTCQNDGKQRI +SFTYPPSLSIFWEMIQRKISLATTEKFLYDDELYNYWIYTNEQKKNSLSN +EFANRITVLDKGLFYIDVLDKKTRLCKSKNEYLQKDHDPLLNGSYRGIIK +KTLLPFINNDETTVKKLIDEIFINKIHSVLGNCNNYQEFEYKKDPFKKNP +ISSKIRHFVTLMSQFDGESTFNQKGISLLSEHKQICSEDPEIFFKFLVDT +IIADSFTQTIPKESIGIKEISKKVPHWSYQLIDESEQEEMENEKQVSWPH +QIRSRSGKEVVFFTDKQENTDNPTPNTADISEQADEVVLTRYPQESDFRR +DIIKGSMRSQRRKIVIWELFQANIHSPLFLDRTNKSSFFSITFSRLIKRI +FKNYMGKNPELDISNYKEEELKKKEKAKEHKKDKEKKQEQIRLDIAETWD +TIPGAQIIRSLILLTQSILRKYILLPLLITGKNIGRILLFQLPEWSDDFK +EWTSEMHIKCTYNGVQLSEKEFPKNWLTDGMQIKILSPFCLKPWHKSMIR +PYHQDKKKKEQNQIDAFCFLTVVGLETDIPFGPPRKRPSFFQPIFKQLDK +KIEKLIKGNFQVRKRLKEKILFFLKLQNETNNWIIEIFPFFKKIIRKMST +VNTIGVFGLKEASSEIKSEKDSRIKNHMIHESSVQIRFLNQTNSSVTEKK +MKDLANRTRIIKNKIEKISNDKLKMSPKKTRYGTKNLGQILKRRNARLIR +NSNYILKFFRERIYGDIFLYIINIPKINTQLFLESTKNGIDKSIYNNESI +TKTNKNRIQFISTINKKFLPFLSTSKNNSKIISDFSFLSQAYVFYKLSQA +KILNLYKLRLVLQYRGISLFLKNEIKDFFGTQGITNSELKTKKLPNSGMN +QWKNWLKLKNNYQYNLSQLKWSRLVPQKWRNRVTEHCEVENTNLYQNEEL +INSKKHLLLLPDQKYNFQKNYRYDVLSYKFFNYKNKNDSYRYSYGLPFQV +NKNQEFSYTYNYNINNNKFIDMWWNIPISNFSYLEKTKIMDIDKNIDRKY +LDFKILDFSLRNKIDIEDWIDISTSINENTKTEPRNYQIVEKINKKSLVY +STIYQEIKQSDQKNKLFDWMGMNEKILSRPISNLEFWFFSEFFSFYNAYK +MKPWVIPINLLFSNSNVSEKFSKNKSINRKKKTNPFIPSNEKKSFELENR +NQDEKELVSKEDLGSYVQENYEKDIEEDYISFIDIKKPIKQKQPKSVIEA +EFDLFLKRYLLFQLKWADSLNEKLMDNIQVYCLVLRLINPIEILISSIER +KELSMDIMLDRKDFNCPNWKQKRVLIIEPIRLSIRGDGQFLLYQTIGISL +VHKSKHQNNQKRYSENVDKKFLGERNKNNFDLLAPENLLSPRRRRELRIL +LCLNSRNNNGVNTNPMENRVKNCNQFFDEKKDLDRDKNTLRNLKFFLWPN +YRLEDLACMNRFWFDTNNGSRFSILRIHMYPQF +>NC_002693@OeelhCp105@ycf1@129224@136615@R@1@2464 Ycf1 +MVNLVYVCMKINNSVVMVGLYYGFISAFSIGSSYLFLLRPRFLNDDPDAI +EKKASETAGFFTGQLLIFISILYGPLHLALGRPHTILLLLAPYFFFHYLF +SNSGQWPSQRFAFPLLTKSMRNRRFQLVFLNNLLFQLFSLSLLGRPMLTR +LSYIYIFRCNNKMLFVLSSFVGWLIGHILVLKWAGLVFVWLLQVIRSKTM +KYITCNVLIPATKYIIEKWRNSFVAGLIREILAMKQVESALVRIKNSKLL +DDARWWIRGSSLISGLKINIRFYARLILRGFENVYVGAKFRQDMEHLFSI +ILFAIFLLYLDQTPLLYADPADKKLQLQRKLSNETQAARAEKKLEERLTK +KFEAQRRAQRAAQRQALQEFKQGVVESYLAKQVAKDANQIQAQKDEKQIQ +AEQKARRIRAEQVVQYTFWLIEAQRREMEIEAARAMQEAYKGMLAAQEGY +VEEGVQEKQEGFPEELISPSPIFHSEEREENPKLLILKEKISILKKKISI +LKKKISILKEKNDLFSFEIPIITSLFDPQKPLRPLRYIKTCAGVEKAVKN +EMSQYFFYACRSDGKQRICFTYPPSLATFWEMIQRKMASRFPRIYAKAKW +RALRWSAPGSYRQWISRNKKKKNSLSTEFQNRIKTLDKKKSLLNVLARRK +RSSLLNVLARRKRSSLQNVLETRKRLCNYKTNKTKKEYLPEKEYLPEIAD +PFLTGALRGKSDPEVDDGGRKTSDLIKVVFLKNNITMATLRNKNDDDLRE +QKNAIALLSRMKNPVNKLHLLFVNERDYPFVKTLVNRINGPAVPKKKKKI +SKSKQKNVKSKQKNVKSKQKNVKSKQKNVKSKQNEIKRKVNEIKRKVNEI +KRKQNESYPRGVKFGATPKTEINPHGIRFDAATIEKYSFATGYSYSPPSF +DDILFHAFVTEPQRNKKAVIELEEEINKKVPRWSYQLIDELEQLEGAEGE +TQFSDHEIRILPFKRVAVFTEKDSKKRKPLIDEQGNFVRHRKTYAIRFLG +HMSDFRRGLIKGSARQDRRKAYVCRTTQVNARSPLFALGPRTFLDGLVNL +AVQVKFFYETRIKGEKIVDDDDDNEKDEFKVMIPDTKSIVAETREMLKQA +GAEDGQSYEDVEDDIRIENVTEMWENIDYGQVIRTFILLLHIFLRKKVVF +PAFIIGKNIARMLLLQATEWKIDFARLKRERYAICTYNGMKVSEKIAFDQ +FPPDWADDGIQILVTNPFYLKPWYRSKTRSIQKDPKKEKDPKKEKGPKKE +PWYRFKTRFIQKDPKKEKGPKKEKGPKKEPWYRRFFFQKDPKKEKGPKKG +KAQFEGDRGVRFLTSFGILTDRPFGDLITPDWGVFFNPIRNELKKKIRQF +EKKHSIILSKRFRNVLKKTKKWFIKSFLFLKRARLKRHPIELSGGRETPE +FTRSQKDIDNLKNEQDFRMSRNPRISESLLQGPVRALKDDSLPEEKVADP +EKEPSDLDNELRAVWDEIDKVTKERKKIVFTPKPDSPDKLVQAKKNILKK +LERIKSRRHKFYFLRIRKSYYVLLFFIKRISRNIKRIYLNPLERAISIRK +IHPQRFFEFSKKMIEKSIGIGKTETNKETVYKTKKKKKKKNPFISIFKES +LYDKDIRISENDIKLGDTWNGYKYKRKKATDTSDLASMSQAYVFYKLYQT +QQTQLIHLDKLRYVLQYDGTSRFLKKELKDYFEAQELFHSKLKHKNSLNS +GKNQWKNWLKAQHQYSVSPIIWNSLSPQKWRTKVNQERMDENTDLNKRYS +NEKRKQFFEANSLDDEENVVETYLGQRAGDIKNSIKSYSYDLFSYQSINS +EDKYVCINNKQKNSYNYNRRKVNLVDSPEGIALSNQFLVQNDLLDLYTFP +DRKYVPWRLFPGSLIGGNDKDKDRFVKMWTATNSGNAVKYWTAANGNTSI +KPGVFWTFQNSQRTKKQNPLFDWRGMNTELPNRCISDLKGWFFFSELLKL +DLRYQVKPWILSKNLLFENLIFENQEENPNLIQNPIEDGRKNVIQNENEN +DPIEDGRQNVIQNENENAIQNLIDFFLEKKNSPKDTNQELHAQAKARIWD +ALVASLKQKREQKERKNKRIAQLIEKKKQKEIEKQKRKIEKQKRKKEKIE +NAKKKIENEKKKIETEEEKIEKEKRKKERKKEKLKKKVAKNIEKLKNKVA +KNVAKNIEKLKKQRAKNIARMEEEDKKARKKRKRKVQVQENKIPYTAFGS +DKWQRPIAEYPKSGDIRNFQVILPEDDDEDDEEDRLDELKLNAYELSRIQ +KITDEKRMKRNLLSSIKRERLKMEFSTRNNSLATIMLTHGIFSIEPLRIS +RQNQDASFLIYQLIKISLVEQLDPYDHNDSFELTEKYRARRNFFMPKTNA +ETMHKSDSDLFVPETILSTKRRRELRILISFYSRRGKRKNRIYKNPVFWK +YVKNCGEVVDNSEKKKKKLIKSFLWPNYRLEDLACMNRYWFNAQNGSRFS +MLRIRMYPRLKIR +>NC_002694@LocoCp080@ycf1@120497@125878@R@1@1794 hypothetical_protein +MIFQSFILDNLVSLCLKIINSVIVVGLYYGFMTTFSTGPSYLFLLRAHVM +EEGTEKKISATTGFITGQLVMFISIYYAPLHIALDRPHTITVITLPYLLL +YFLGNNQKNFLNYVYKNQNSIRHFSIQRIFFQNLFFQLLNPFFLPSSILM +RLANIYIFQSNNKVLFLTSSFVGWLIGHVFFMKWIGLMLVWIQEKNNSIK +STVAIRSNKGVLAKFRKSMFQIFLIFFFITCLYYLGRIPPIYFFTPKMSE +IKERGEIEKREGEIDIEINSQRAGSKQEQKITAEEKLSPYLFSKKNNNLD +KIKEENDIFGFQKPLVTILFDYNRWNRPLRYIKNDRFENVVRNEISQFFF +FTCQSDGKERISFTYPPNLSTFQKMMEMKISLFTRDIISYEELSNSWRST +NEEKKKKLTNEFLNRVEVLDKESLPVDIFENRIRLCNDEKKQKYLTKEYD +PFLNGPCRGQIQKWFSPPIQKETYKKNSLFINKIHGILFSNTNNYPKFEQ +KKNIFDRKSLLTDINFFFNLITKFSRKSVSSLNFEGLYLFPKDNKGKMSS +KKKKFLFDTIRPDLNDNKIVNLQKCIGINEIVKKLPRWSYNLIDELEQLE +GKKKVEYHQIRSRKAKRVVLLTKNSQNDDNYDETTDTDNTEKKKELALIR +YSQQPDFRRDIIKGSIRAQRRKTVTCKLFQRSVDSPLFLEKMEKTSFFCF +DILDSSKIFFMFKNWIRKKKELKNSDYTDEKAKESQKKEEEKIKKNEKEE +KRRIEIGEAWDSIIFAQVIRGCLLITQSILRKYILLPSLIITKNIVRILL +FQFPEWSEDFRDWQREMYIKCTYNGVQLSETEFPKKWLTDGIQIKILFPF +RLKPWHRSKLRFTEKKKDPLKNKKVKKKNFCFLTIFGMEVELPFSGYPRN +RFSFFDPILKELKKKMKKLKNNFFLILKIVNERTKNFITTLKETSKRIIQ +SILKKVLFLNKKIKKLYNYLFLFRFKKIDELNQNKKNFPITKNNPIIYES +TILIQAINKTNCSLTEKKIKAINAKTKKIIKKIERMTKENKGGFLISEIN +SNSKKTSSNTKGLELEKKILQILQRRNVQLTHKLYSFFKFLLNFMKKVYT +DIFLCIVSVPRINVQFFLESTKKIINQSIYNKKTNEEIIDKTNQSIIHFI +SIINKSSNTKNTNSAANSYEVSALSQAYVFFKISQIQVLNVYKYKFKYVF +DYDGRSFFIKDEIKDYFFGIQGIIHSKLRHKNSPVSLKNQWTNWLKVHYQ +YDLSQNRWSRLVQKNLKNRINKHRLDQNKDLTKCDSYKKTQLIVSKNKKQ +QVDFLVNLLIQKKIKKQSRYDLLLYKFINYAEKKELSIYGYRSPFQANKK +RAISYDYNTQKKEFFDRMDDISIKNYIAEDAIRYIEQNRDRKYFDWVVMD +VKIQNNSISNLQFSFFFKFLRFYDAYRNKPWIIPIKFLFLHFSVNQNFNK +IKNIIEKKRRIDIFKPWKKKKILEVELETPNRAKKEYTSRVDLNKPSLSN +QEKDIEEDYGESDSKKGGKDKNKKKYKNKIEAEVNLLLRKYLNFHLNWKG +SLNKRVINNVKVYCLLIRLKNIKQIAISSIQRGELSLDIMMIQNEKDSTL +TGFRKKKEFIEKGIFIIEPVRLSRKNNEQFFMYETARLLLIHKSKRQINQ +RNPEKSDLDKQIFYKNIPPKRDQRITQNKEKKHYALVVIENILSARRRRE +LRILICFNPRSINSMPRKTIFDNENKINNCCQVFAKNKDLDKEKKILMNL +KLILWPNYRLEDLACINRYWFDTYNGSRFSIVRIHMYPRLKMR +>NC_003119@MetrCp012@ycf1@13390@18672@R@1@1761 hypothetical_chloroplast_RF1 +MIYQLFILDRLVGLWLKILNSAIVMGLYYGFLTTFSIGPSYLFLIRARVM +DKGTETEIAATTGFITGQLMMFISIYYAPLHLALIRPHTITVLTLPYLFF +NFVYKNNKHYYSADSHFYLDLDYGYKNPNSIRKFRIYKVFFNNLFFQLSN +PLLFPSSILLRLMNIYLFRSNNKLLFLTSSFLGWLIGHIFLMKCIGLILL +VWSKQKNSIKSKLTMRFDKYILLQLRNYVGQIFVVFSFVIVVHYLGRTPV +PYLYTYTDEILEYDEKQKDEINGETEIDVEIDSEQEQNGSIEDEEDILSY +LFPKKDKTLENIEQDNNLLALEKPLVTTLFDYRKWNRPLRYIKNDHFERV +VRDENSQFFFHICQSDGKERISFTYPPDLSSFLKIMEKKMDLFTKDKISY +NDNELSNYWSSNNKEKRKKLSNEFFKRAKVLDKKYKKYKKFIPVDVFENR +IRLSNDKRKIKYLTKIYDPFLNGPFRGQSFSPSIQNETYTTNSILINKIH +GLLLINSNYPEFDNSNYPEFDNSNYPEFEQKIDQFDRKFLLTEIGFFFNL +ISQFSEKSVSSFNFDGLYLFPEHEQVKIYSEEKKRKKKFLFEAIRTDQNN +QTIFNRKKCTGINEISKQVPRWSYELIDELEQMTERLTKEFQIRSAKAER +MVIFNGNTDSLTLNIGPRNDNDAIPEVDLNHEFFLVNFLREPDFDRDIIK +GSMRPLRRKIATTKLSQGNAQPHSPIFLEMIDPLYFIFGDLFDDLSQIFK +EMFRKPGTDNSEFVEFQERLEHKYEEDAKDDAEIRRLKIEEDWESILYGL +IIRSFVLLIQSFFRKYILLPSLIITKNIIRILLFQNPEWSEDFRDWSREV +HIKCTYQGIPVSDKELPKNWFDEGIQIRILNPFVLKAWHKSKVQSTEKKK +KKRSTEKKYTENKNFWFLTGYGTLVESYLDEGFPRDPLSIFGPVLKTIRK +QLKKDLKKHFFLVLKFLNERKKWFPTMLKKIENWNIKRILKSILFRFKII +DELSESKKTSTISKNNSKIEVIEVIEESPVKMESINWTNSSFTEKRIKDL +NVKTKTIIKQIETMTEEKKEGILTSEINLNSNKTTYDAKRLELQKNNLQI +LQRRFVRLIRKSYSFFKIFIEGVYIDILLCISSIARIHRQRFLDFLESTD +KILNVKKPIYDKKKKMEEMEERFENLSVSRLISILEKSENITNMNSQNSW +DVSSLSSLSQEYVFYKLSQIQFSNGSKFKIRSILESPGRSFFLKNEIKDY +FFRMQGTYNSKLRHKKRSDSLMNPWTNWFKVLYQYDLPEKRWSRLVSQNW +RNRINEHRVAQNKDLVEYDSYEKNQLIWKELILSKKQEQEGDLLKIEIKN +KIKKQYRYDLFSYQYLNFANKKKSSIYGYRSPNKNQAISYNYNISIQNYL +EEYDILDMEKNLEKNLDRKYFNWMGMNVKRKKTSRPKDKFLIPGFWFFSK +LSKLYCAYKMNPWILPIKFFVLQLDNLELTTEEYVNTVDEDLKSVSYYYK +GSDSKYRTDLKGERDFLLSKYLGFYLHCDSSDEEIGMDNTNLFCLLLRMK +KFNKIVIMSIKKLELDIEMLVDSRTKDFCYTECRDTEDLKERLIFFIEPI +RLPRKKHEQSLLYQTIRLPLIHKSKTRKSWSWKKKKSRVDQKITENKDKN +LYDLFVPENLLSTRRRRELRILTCFNPRNRNTVHRKTINDNENQIKNVSQ +VLTKNKDLDSETKKLMNFKLFLWPNYRLEDLACINRYWFNTHNGSHFSIL +RIHMYPRLKD +>NC_003386@PsnuCp088@ycf1@112439@117550@R@1@1704 hypothetical_protein +MIGRLYMKKLKNLFLFLSSLCPVFPWISQISLVMPFGLYYGFLTALPIGP +SQILSIRTFFLEGNRSGIICILGSMMGQFVILLSIYCSPLYVMLVKPHLM +TLLVIPYMFYYWYRTKNPSRYYILHPIKSLTHAHTRNLLLDSFIFQLLNP +ILLPNPVLTRLLNLFLFRYSSNVFFLTSSLLGWLCGHILFINSIKLLLFR +IEHDSPIIYILMKRSISRTFSILISITFFLYLGRSPVPLITKKFADEITL +SDQKIKENLWEESLWLYRPWPTSFFDQYRWNRPIRYIPNSKSSHNGFVKK +QVSKFFYDECITDGKNAISFASQPSLSIFKKQLMNYLHNSDISISTKDSY +KGWIETKREKRDALNNEFKDRIQFVYNSSTIEEAMENKTGFSHDRNHFLV +KVNDPFLSGSSRIRIPNKKYSSSLLKLHDSKDQTMKISKKTKRKHTRNKM +RNWIFNKHKKWQHNKFPLPWEPIPTKAEKVFWRILNESENPIILEMLTTL +NSIKEKNYQFRITWEHIFQLPRIEKAIFLFRSKQEIEDSIFRYPSHLSLK +NLTLFNIFTRSKNIFYSAKIAVSPILQIEEMQKELPRYNSRLRSDRIDAV +NVDVDIRQRKIKNLGPRKGKLEDKEKEKEKAAQTQTEVKKEREKEKEERV +IKRFQNQSDFRRKLVKGSIRARRRKTGIWRLYQSGTHSPFFLRMKEIPIS +FQSSINALRLNKMKDERAILGIGKELRPFNLYKKRSKADRLTIAARFDFP +IAHAGRGVLLIIQSNIRKYVILPILIICKNIGRIMLFQSPEWKEDWAEWN +QEIHIKCTYDGIEVSHRHLPAHWFKEGLQIKILYPFHLKPWHIHRTNNIN +DLRNEAQIQKEISDFGKQRKLSFSYLTIWGYQTSSVFGSMKKRPSFWRPI +ANALKKKLQRNLFSKLTWISHFFYEIILLSRTFIISKKPNNIPEMSIQSN +ELRYDVSDYELIQKYPNSNEKNDYVVMNEISIESNNRNGKEISHESQDQY +KDNFNNIRSFNDIETLLTDISGTSVEESYRDRIETYLRLNKKNHRYAINI +RLIWNKQLVQTQQEFSRFRRIIMQFMHKGYRLAKRFLTKFYREIFRRFTF +SIQLSIQLVLRLTKNITKLSEKNKVYQNLNLLKKNEQNLKIDSSRNKPVL +SQAYVFQKLWHARTRTKIDVHYLVQSLEREIVNSIENNELKASKLKDLKW +NEHNYLNDHIKDLLEIQGLLKETQTFTEKNWKEWLHCFTRYQISSKIEYG +IVPQKWKNEVKKRWKSNTNKLDKNKEYKTLEKENKYSLYETNNMLKQRIN +NRNNYCEFYNLLYSFIDSTKASNIIKLPIQQKGKEDPIQYINDINKIHEN +IHLNSKKKYKRPQFQSISTEKGDIDSNLMLWLLPNLLDTKPESVTNSLDS +YSFEMYLSQNEDKDSLKKEIRFNAKKLNLDTKEPTSDAMKPTSDTKELIS +DTNEPTSDIKSDDQSENQNKPLKEKSIRERKHHRPIPQVKWKSKSVEKKM +QRINNLTSFLSVIEDRKNMENYIISFCMKMGIDIDLLNSFFTNTEDELSI +QLLDDSAHRLPRLLNDQTLVRKMVSILLNFEKQFEEGITSKISSQSISSI +YRTEKKYSVNSYNLEDIMLSRRYRELRILNSLILEKQYVNFDHWIDKSEK +YPFLNLPSQVQIIKRFLWPTYRLEDLACMNRFWFNTNNGSRFAMLKLRMY +CPD +>NC_004115@ChglCp095@ycf1@114383@118735@R@1@1451 hypothetical_chloroplast_RF1 +MITTYSTFLFNFLSQFQYLVNIPEPLILFGLYYGFLTTLPISFSHIVVIR +NRLIEGKTSSVMAFCGLITGQLCMIGTIYYTPLYKLFIKPHLILLLSIIY +SFFYWQRLRNNQNYDDLREAQSLINVRNFFSFFDSFVFQILNPILLPTPI +FFRLNNVFLFRYSNNLNFFLSFFIGSLIGNFLFFNALNWIRYRFEQDSNV +IYPVLKLLINKSIIPIVFCICLIPIAKYSHIPFCTMKQKEGQSSYSFDKN +WPNIIFDSNQPHRPIRIFSETKTDDNLNINDNLSKKQTSQFFFKECISDG +NVRISYTYPSTLANFQTDLSSSFQDFSLSEQSFDNLYSNWKLEKLSRKDN +LNNLLLTKIKLLNNKKEWFYKHFQNKFGTFIKDDNNYNKFVKKSNDVRLK +QSSKIQIKKSKLLTSDIRDISTTQSGFYDLKKNKLKSFISQKFKMNSNNS +TLPVWNHLNKQLLQNELKRIKKQLQDKTKNIKENDFNNLKLLKSNIETID +NTINDIHHNKIKQITSVDLIKIFATNNKTLLLETLAFNKKITQKDNFNFN +KLFQHKNKKFTTNSGNENTYLNLNDIFKNIKRLPKWRTFSKHVVYDEVSD +IRRRAIKSNSKLKIANKDSDIIIFEYKKSLNFRARLPKGSLRARRKNKFT +WKLFHNNLNSPFFIRSKQLLNKTDIPFLKYNENYLNFFKNFISPDKNINY +LNNDISEMRRQELLFKWDKTNVHILRSMVLVGQAFFRKYIKLPIFIFFKN +LSRQLLYQPSEWTKDWSNWMNEWYIFCYYDGTELAKDQWPEMWLQRGIQI +KLINPFYIKPWYIQKSFIKNKQNKKTRTSYLTVFGSQQELPFGKKIRMPS +FWKPVRREVSKSIKLKLYFPFLTLQKNTIILFEKVFNKKRINEDNKTIEK +SILNKKNEQLILKKDEVIPNNKSIAGKLSKLDFHNQNITKTSIKNATKQI +LIKNEYNSLLKENKNLFTKNKIVFLKIKNILNKLNLKLIKVKINFTYKIK +TVLKIISRNLLKFYSIIQFQLENLGRNNSNDLSYKNQLSYQKDFPNFNNF +CLNQANIIQNLCKNNILKHKKLNQNFQINSKNLNQTNIIDVNPENIKAQD +FKNLLENIYTFTPTINLWDKLSTNNWKISVQNNWKQKSYNNYDLTKKALV +SKNLNFISYFYQNNLINNLNKKIKHTKIFNLSKNYLSLNNLNQNQIKNFD +FQNSLNNNITYKKNIKNFTIRQNVPSQLRRWDWKNNKIKKFVNRLLQKNT +ILLKEEVFNLIPFFDRFTIQNPMIRNWSHPISSILDDEIFTYELLDTFLQ +INKNIDFLHTKQIEDNLSSNSNQAIASLPLSSTTAENFLYYLTTVEDLIS +IEDKKELKILNSLNFNKSTPNYIKTNVVEKSLNENLSKNLQSILSKETLD +SINNTQILKKFLWASYRCEDLACMNRFWFSTNNGSRFGTLRLRLYPNLKN diff --git a/detectors/cds/test/test.db/ycf2.fst b/detectors/cds/test/test.db/ycf2.fst new file mode 100644 index 0000000..729ecc3 --- /dev/null +++ b/detectors/cds/test/test.db/ycf2.fst @@ -0,0 +1,466 @@ +>AC_000188@LyesCp004@ycf2@88196@95032@D@1@2279 Ycf2_protein +MRGHQFKSWIFELREILREIKNSHHFLDSWTQFNSVGSFIHIFFHQERFL +KLFDPRIWSILLSRNSQGSPSNRYFTIKGVILFVVAVLIYRINNRNMVER +KNLYLIGLLPIPMNSIGPRNDTLEESVGSSNINRLIVSLLYLPKGKKISE +SCFLNPKESTWVLPITKKCSMPESNWGSRWWRNWIGKKRDSSCKISNETV +AGIEILFKEKDLKYLEFLFVYYMDDPIRKDHDWELFDRLSLRKSRNRINL +NSGPLFEILVKHWISYLMSAFREKIPIEVEGFFKQQGAGSTIQSNDIEHV +SHLFSRNKWAISLQNCAQFHMWQFRQDLFVSWGKNPPESDFLRNVSRENW +IWLDNVWLVNKDRFFSKVQNVSSNIQYDSTRSSFVQVTDSSQLKGSSDQS +RDHLDSISNEDSEYHTLINQREIQQRKERSILWDPSFLQTERKEIESGRF +PKCLSGYSSMSRLFTEREKQMINHLFPEEIEEFLGNPTRSVRSFFSDRWS +ELHLGSNPTERSTRDQKLLKKQQDLSFVPSRRSEKKEMVNIFKIITYLQN +TVSIHPISSDPGCDMVPKDEPDMDSSNKISFLNKNPFFDLFHLFHDRNRG +GYTLHYDFASEERFQEMADLFTLSITEPDLVYHKGFAFSIDSCGLDQKQF +LNEARDESKKKSLLVLPPIFYEENESFSRRIRKKWVRISCGNDLEDPKPK +IVVFASNNIMEAVTQYRLIRNLIQIQYSTYGYIRNVLNRFFLMNRSDRNF +EYGIQRDQIGKDTLNHRTIMKYTINQYLSNLKKSQKKWFEPLILISRTER +SMNRDPDAYRYKWSNGSKSFQEHLEQSVSKQKSRFQVVFDRLRINQYSID +WSEVIDKKDLSKSLRFFLSKSLLFLSKLLLFLSNSLPFFCVSFGNIPIHR +SEIYIYEELKGPNDQLCNQLLESIGLQIVHLKKLKPFLLDDHDTSQKSKF +LINGGTISPFLFNKIPKWMIDSFHTRNNRRKSFDNPDSYFSMIFHDQDNW +LNPVKPFHRSSLISSFYKANRLRFLNNPHHFCFYWNTRFPFSVEKARINN +SDFTYGQFLNILFIRNKIFSLCVGKKKHAFWGRDTISPIESQVSNIFIPN +DFPQSGDETYNLYKSFHFPSRSDPFVRRAIYSIADISGTPLTEGQIVNFE +RTYCQPLSDMNLSDSEGKNLHQYLNFNSNMGLIHTPCSEKDLSSEKRKKW +SLCLKKCVEKGQTYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNL +IFLDTFSDLLPILSSSQKFVSIFPDIMHGSGISWRILQKKLCLPQWNLIS +EISSKCLHNLLLSEEMIHRNNESPLISTHLRSPNAREFLYSILFLLLVAG +YLVRTHLLFVSRASSELQTEFERVKSLMTPSSMIELRKLLDRYPTSEPNS +FWLKNLFLVALEQLGDSLEEIRGSASGGNMLGPAYGVKSIRSKKKDWNIN +LIEIIDLIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKNVNGDWIDEKI +ESWVANSDSIDDEEREFLVQFSTLTTENRIDQILLSLTHSDHLSKNDSGY +QMIEQPGAIYLRYLVDIHKKHLMNYEFNPSCLAERRIFLAHYQTITYSQT +SCGENSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATNSY +VPFITVFLNKFLDNKSKGFLLDEIDIDDSDDIDDSDNLDASDDIDRDLDT +ELELLTRMNGLTVDMMPEIDRFYITLQFELAKAMSPCIIWIPNIHDLDVN +ESNDLSLGLLVNHLSRDCERCSTRNILVIASTHIPQKVDPALIAPNKLNT +CIKIRRLLIPQQRKHFFTLSYTRGFHLEKKMFHTNGFGSITMGSNARDLV +ALTNEVLSISITQKKSIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQ +IGRAVAQNVLLSNCPIDPISIYMKKKSCNEGDSYLYKWYFELGTSMKRLT +ILLYLLSCSAGSVAQDLWSLSVPDEKNGITSYGLVENDSDLVHGLLEVEG +ALVGSSRTEKDCSQFDNDRVTLLLRPEPRNPLDMMQKGSWSILDQRFLYE +KYESEFEEGEGEGALDPQEDLFNHIVWAPRIWRPWGFLFDCIERPNELGF +PYWSRSFRGKRIIYDEEDELQENDSGFLQSGTMQYQTRDRSQGLFRISQF +IWDPADPLFFLFKDQPPGSVFSHRELFADEEMSKGLLTSQTDPPTSLYKR +WFIKNTQEKHFELLINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLFLS +NGTLLDQMPKTLLRKRWLFPDEMKIGFM +>AC_000188@LyesCp055@ycf2@146312@153148@R@1@2279 Ycf2_protein +MRGHQFKSWIFELREILREIKNSHHFLDSWTQFNSVGSFIHIFFHQERFL +KLFDPRIWSILLSRNSQGSPSNRYFTIKGVILFVVAVLIYRINNRNMVER +KNLYLIGLLPIPMNSIGPRNDTLEESVGSSNINRLIVSLLYLPKGKKISE +SCFLNPKESTWVLPITKKCSMPESNWGSRWWRNWIGKKRDSSCKISNETV +AGIEILFKEKDLKYLEFLFVYYMDDPIRKDHDWELFDRLSLRKSRNRINL +NSGPLFEILVKHWISYLMSAFREKIPIEVEGFFKQQGAGSTIQSNDIEHV +SHLFSRNKWAISLQNCAQFHMWQFRQDLFVSWGKNPPESDFLRNVSRENW +IWLDNVWLVNKDRFFSKVQNVSSNIQYDSTRSSFVQVTDSSQLKGSSDQS +RDHLDSISNEDSEYHTLINQREIQQRKERSILWDPSFLQTERKEIESGRF +PKCLSGYSSMSRLFTEREKQMINHLFPEEIEEFLGNPTRSVRSFFSDRWS +ELHLGSNPTERSTRDQKLLKKQQDLSFVPSRRSEKKEMVNIFKIITYLQN +TVSIHPISSDPGCDMVPKDEPDMDSSNKISFLNKNPFFDLFHLFHDRNRG +GYTLHYDFASEERFQEMADLFTLSITEPDLVYHKGFAFSIDSCGLDQKQF +LNEARDESKKKSLLVLPPIFYEENESFSRRIRKKWVRISCGNDLEDPKPK +IVVFASNNIMEAVTQYRLIRNLIQIQYSTYGYIRNVLNRFFLMNRSDRNF +EYGIQRDQIGKDTLNHRTIMKYTINQYLSNLKKSQKKWFEPLILISRTER +SMNRDPDAYRYKWSNGSKSFQEHLEQSVSKQKSRFQVVFDRLRINQYSID +WSEVIDKKDLSKSLRFFLSKSLLFLSKLLLFLSNSLPFFCVSFGNIPIHR +SEIYIYEELKGPNDQLCNQLLESIGLQIVHLKKLKPFLLDDHDTSQKSKF +LINGGTISPFLFNKIPKWMIDSFHTRNNRRKSFDNPDSYFSMIFHDQDNW +LNPVKPFHRSSLISSFYKANRLRFLNNPHHFCFYWNTRFPFSVEKARINN +SDFTYGQFLNILFIRNKIFSLCVGKKKHAFWGRDTISPIESQVSNIFIPN +DFPQSGDETYNLYKSFHFPSRSDPFVRRAIYSIADISGTPLTEGQIVNFE +RTYCQPLSDMNLSDSEGKNLHQYLNFNSNMGLIHTPCSEKDLSSEKRKKW +SLCLKKCVEKGQTYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNL +IFLDTFSDLLPILSSSQKFVSIFPDIMHGSGISWRILQKKLCLPQWNLIS +EISSKCLHNLLLSEEMIHRNNESPLISTHLRSPNAREFLYSILFLLLVAG +YLVRTHLLFVSRASSELQTEFERVKSLMTPSSMIELRKLLDRYPTSEPNS +FWLKNLFLVALEQLGDSLEEIRGSASGGNMLGPAYGVKSIRSKKKDWNIN +LIEIIDLIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKNVNGDWIDEKI +ESWVANSDSIDDEEREFLVQFSTLTTENRIDQILLSLTHSDHLSKNDSGY +QMIEQPGAIYLRYLVDIHKKHLMNYEFNPSCLAERRIFLAHYQTITYSQT +SCGENSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATNSY +VPFITVFLNKFLDNKSKGFLLDEIDIDDSDDIDDSDNLDASDDIDRDLDT +ELELLTRMNGLTVDMMPEIDRFYITLQFELAKAMSPCIIWIPNIHDLDVN +ESNDLSLGLLVNHLSRDCERCSTRNILVIASTHIPQKVDPALIAPNKLNT +CIKIRRLLIPQQRKHFFTLSYTRGFHLEKKMFHTNGFGSITMGSNARDLV +ALTNEVLSISITQKKSIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQ +IGRAVAQNVLLSNCPIDPISIYMKKKSCNEGDSYLYKWYFELGTSMKRLT +ILLYLLSCSAGSVAQDLWSLSVPDEKNGITSYGLVENDSDLVHGLLEVEG +ALVGSSRTEKDCSQFDNDRVTLLLRPEPRNPLDMMQKGSWSILDQRFLYE +KYESEFEEGEGEGALDPQEDLFNHIVWAPRIWRPWGFLFDCIERPNELGF +PYWSRSFRGKRIIYDEEDELQENDSGFLQSGTMQYQTRDRSQGLFRISQF +IWDPADPLFFLFKDQPPGSVFSHRELFADEEMSKGLLTSQTDPPTSLYKR +WFIKNTQEKHFELLINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLFLS +NGTLLDQMPKTLLRKRWLFPDEMKIGFM +>NC_000932@ArthCp066@ycf2@86474@93358@D@1@2295 Ycf2 +MKGHQFKSWIFELREIVREIKNAHYFLDSWTQFNSVGSFIHIFFHQERFR +KLLDPRIFSILLLRNSQGSTSNRYFTIKGVVLFVVAALLYRINNRNMVES +KNLYLKGLLPIPMNSIGPRNDTSEESFGSCNINRLIVSLLYLTKGKKISE +SCFRDPKESTWVLPITQKCIMPESNWSSRWWRNWIGKKRGFCCKISNETV +AGIDISFKEKDIKYLEFLFVYYMDDPIRKGHDWELFDRLSPSKRRNIINL +NSGQLFEILVKDWICYLMFAFREKIPIEVEGFCKQQGAGSTIQSNDIEHV +SHLFSRNKWAISLQNCAQFHMWQFHQDLFVSWGKNPHESDFFRKISRENW +IWLDNVWLVNKDRFFSKVRNVSSNIQYDSTRSSFVQVTDSSQLNGSSDQF +IDPFDSISNEDSEYHYHTLINQREIQQLKERSILLDPSFIQTEGREIESD +RFPKYLSGYSSMPRLFTEREKRMNNHLLPEESEEFLGNPTRAIRSFFSDR +WSELHLGSNPTERSTRDQKLLKKEQDVSFVPSRRSENKEIVNIFKIITYL +QNTVSIHPISSDLGCDMVPKDELDMDSSNKISFLNKNPFFDLFHLFHERK +RGGYTLRHESEERFQEMADLFTLSITEPDLVYHKGFAFSIDSYGLDQRQF +LKEVFNFRDESKKKSLLVLPPIFYEENESFYRRLRKIWVRISCGNYLEDQ +KRVVFASNNIMEAVNQYRLIRNMIQIQFQYSPYGYIRNVLNRFFLMKRPD +RNFEYGIQRDLIGNDTLNHRTIMKDTINQHLSNLKKSQKKWFDPLIFLSQ +TERSINRDPNAYRYKWSNGSKNFQEHLEHFVSERKSRFQVVFDQLCINQY +SIDWSEVIDKKDLSKSLRFFLSKLLRFFLSKLLLFLSKLLLFLSNSLPFF +FVSFENIPIHRSEIHIYELKGPNDQLCNQLLESIGLQIVHLKKLKPFLLD +DHNTSQKSKFLINGGTISPFLFNKIPKWMIDSFHTRKNRRKSFDNTDSAY +FSIVSHDQDNWLNPVKPFQRSSLISSFSKANRLRFLNNPHHFCFYCNKRF +PFYVEKARLNNSDFTFTYGQFLTILFIHNKTFSSCGGKKKHAFLERDTIS +PSSIESQVSNIFISNDFPQSGDERYNLYKSFHFPIRSDPLVRRAIYSIAD +ISGTPLIEGQRVNFERTYCQTLSDMNLSDSEEKSLHQYLNFNSNMGLIHT +PCSEKYLQRKKRSLCLKKCVDKGQMDRTFQRDSAFSTLSKWNLFQTYMPW +FFTSTGYKYLNLIFLDTFSDLLRILSSSQKFVSIFHDIMHGLDISWRILQ +KKLCLPQRNLISEISSKSLHNLLLSEEMIHRNNESSLISTHLRSPNVREV +LYSILFLLLVAGYIVRTHLLFVSRAYSELQTEFEKIKSLMIPSYMIELRK +LLDRYPTSELNSFWLKNLFLVALEQLGDCLEEIRGSGGNMLWGGDPAYGV +KSIRSKKKDLKINFIDIIDLISIIPNPINRITFSRNTRHLSHTSKEIYSL +IRKRKNVSGDWIDDKIESWVANSDSIDDKEREFLVQFSTLRAEKRIDQIL +LSLTHSDHLSKNDSGYQMIEQPGTIYLRYLVDIHKKYLMNYEFNTSCLAE +RRIFLAHYQTITYSQTSCGANSFHFPSHGKPFSLRLALSPSRSILVIGSI +GTGRSYLVKYLATNSYVPFITVFLNKFLDNKPKGFFIDDIDIDDSDDIDA +SNDIDRELDTELELLTMMNALTMDMMLEIDRFYITLQFELAKAMSPCIIW +IPNIHDLDVNESSYLALGLLVNSLSRDCERCSTRNILVIASTHIPQKVDP +ALIAPNKLNTCIKIRRLLIPQQRKHFFTLSYTRGFHLEKKMFHTNGFESI +TMGSSARDLVALTNEALSISITQKKSIIDTNTIRSALHRQTWDLRSQVRS +VQDHGILFYQIGRAVAQNVLISNCPIDPISIYMKKKSCNEGDSYLYKWYF +ELGTSMKKFTILLYLLSCSAGSVAQDLWSLPVPDEKNRITSYGFVENDSD +LVHGLLEVQGALVGSSRTEKDCSQFDNDRVTLLFRSEPRDPLYMMQDGSC +SIVDQRFLYEKYESEFEEGEGEGVLDPQQIEEDLFNHIVWAPRIWRPRGF +LFDCIERPNELGFPYSAGSFRGKRIIYDEKYELQENDSEFLQSGTMQYQR +RDRSSKEQGFFRISQFIWDPADPLFFLFKDQPFVSVFSHREFFADEEMSK +GLLTSQTDPPTSIYKRWFIKNTQEKHFELLIQRQRWLRTNSSLSNGFFRS +NTRSESYQYLSNLFISNGTLLDRMTKTLLKKRWLFSDEMKIGFM +>NC_000932@ArthCp083@ycf2@145291@152175@R@1@2295 Ycf2 +MKGHQFKSWIFELREIVREIKNAHYFLDSWTQFNSVGSFIHIFFHQERFR +KLLDPRIFSILLLRNSQGSTSNRYFTIKGVVLFVVAALLYRINNRNMVES +KNLYLKGLLPIPMNSIGPRNDTSEESFGSCNINRLIVSLLYLTKGKKISE +SCFRDPKESTWVLPITQKCIMPESNWSSRWWRNWIGKKRGFCCKISNETV +AGIDISFKEKDIKYLEFLFVYYMDDPIRKGHDWELFDRLSPSKRRNIINL +NSGQLFEILVKDWICYLMFAFREKIPIEVEGFCKQQGAGSTIQSNDIEHV +SHLFSRNKWAISLQNCAQFHMWQFHQDLFVSWGKNPHESDFFRKISRENW +IWLDNVWLVNKDRFFSKVRNVSSNIQYDSTRSSFVQVTDSSQLNGSSDQF +IDPFDSISNEDSEYHYHTLINQREIQQLKERSILLDPSFIQTEGREIESD +RFPKYLSGYSSMPRLFTEREKRMNNHLLPEESEEFLGNPTRAIRSFFSDR +WSELHLGSNPTERSTRDQKLLKKEQDVSFVPSRRSENKEIVNIFKIITYL +QNTVSIHPISSDLGCDMVPKDELDMDSSNKISFLNKNPFFDLFHLFHERK +RGGYTLRHESEERFQEMADLFTLSITEPDLVYHKGFAFSIDSYGLDQRQF +LKEVFNFRDESKKKSLLVLPPIFYEENESFYRRLRKIWVRISCGNYLEDQ +KRVVFASNNIMEAVNQYRLIRNMIQIQFQYSPYGYIRNVLNRFFLMKRPD +RNFEYGIQRDLIGNDTLNHRTIMKDTINQHLSNLKKSQKKWFDPLIFLSQ +TERSINRDPNAYRYKWSNGSKNFQEHLEHFVSERKSRFQVVFDQLCINQY +SIDWSEVIDKKDLSKSLRFFLSKLLRFFLSKLLLFLSKLLLFLSNSLPFF +FVSFENIPIHRSEIHIYELKGPNDQLCNQLLESIGLQIVHLKKLKPFLLD +DHNTSQKSKFLINGGTISPFLFNKIPKWMIDSFHTRKNRRKSFDNTDSAY +FSIVSHDQDNWLNPVKPFQRSSLISSFSKANRLRFLNNPHHFCFYCNKRF +PFYVEKARLNNSDFTFTYGQFLTILFIHNKTFSSCGGKKKHAFLERDTIS +PSSIESQVSNIFISNDFPQSGDERYNLYKSFHFPIRSDPLVRRAIYSIAD +ISGTPLIEGQRVNFERTYCQTLSDMNLSDSEEKSLHQYLNFNSNMGLIHT +PCSEKYLQRKKRSLCLKKCVDKGQMDRTFQRDSAFSTLSKWNLFQTYMPW +FFTSTGYKYLNLIFLDTFSDLLRILSSSQKFVSIFHDIMHGLDISWRILQ +KKLCLPQRNLISEISSKSLHNLLLSEEMIHRNNESSLISTHLRSPNVREV +LYSILFLLLVAGYIVRTHLLFVSRAYSELQTEFEKIKSLMIPSYMIELRK +LLDRYPTSELNSFWLKNLFLVALEQLGDCLEEIRGSGGNMLWGGDPAYGV +KSIRSKKKDLKINFIDIIDLISIIPNPINRITFSRNTRHLSHTSKEIYSL +IRKRKNVSGDWIDDKIESWVANSDSIDDKEREFLVQFSTLRAEKRIDQIL +LSLTHSDHLSKNDSGYQMIEQPGTIYLRYLVDIHKKYLMNYEFNTSCLAE +RRIFLAHYQTITYSQTSCGANSFHFPSHGKPFSLRLALSPSRSILVIGSI +GTGRSYLVKYLATNSYVPFITVFLNKFLDNKPKGFFIDDIDIDDSDDIDA +SNDIDRELDTELELLTMMNALTMDMMLEIDRFYITLQFELAKAMSPCIIW +IPNIHDLDVNESSYLALGLLVNSLSRDCERCSTRNILVIASTHIPQKVDP +ALIAPNKLNTCIKIRRLLIPQQRKHFFTLSYTRGFHLEKKMFHTNGFESI +TMGSSARDLVALTNEALSISITQKKSIIDTNTIRSALHRQTWDLRSQVRS +VQDHGILFYQIGRAVAQNVLISNCPIDPISIYMKKKSCNEGDSYLYKWYF +ELGTSMKKFTILLYLLSCSAGSVAQDLWSLPVPDEKNRITSYGFVENDSD +LVHGLLEVQGALVGSSRTEKDCSQFDNDRVTLLFRSEPRDPLYMMQDGSC +SIVDQRFLYEKYESEFEEGEGEGVLDPQQIEEDLFNHIVWAPRIWRPRGF +LFDCIERPNELGFPYSAGSFRGKRIIYDEKYELQENDSEFLQSGTMQYQR +RDRSSKEQGFFRISQFIWDPADPLFFLFKDQPFVSVFSHREFFADEEMSK +GLLTSQTDPPTSIYKRWFIKNTQEKHFELLIQRQRWLRTNSSLSNGFFRS +NTRSESYQYLSNLFISNGTLLDRMTKTLLKKRWLFSDEMKIGFM +>NC_001568@EpviCp27@ycf2@22045@28695@D@1@2217 Ycf2 +MKEHPFPYKSWILELREIKNSHYFLDSWTKFNSVGSYINIFSHQERFIKL +FDPRILSILLSRNSQGSTSNRYFTIKGVILFVVAVLIYRINNRNMVEIKN +IYWRGLLPIPMNSIGPRNDTLEELVGSYNINRFIVSLLYLTKGKNISESF +FLNLKESTLVLPITKKCSMPESNWGSRWWRNWTGKNRDYSCKISNETVAG +IEILFKEKDKKYLEFIFFYYMDDPIRKDRDWELFDRLSPSKRLNKINFYS +GPLFEILVKRRIYYLMSAFREKIPIEVVKGFFKQQKVGSTIQSNDIEHVS +HFFSRNKRAISLKNSAQFNMWQFRQDLLVSWGENPHESDFLRNVSRANWI +WLNNVWLVNKYRFCRKVRNVSSNIKYKYDSTRSRSSFVQVTDSSQLKGSY +YKSSGHFYSVISNEDSEYHTLINQREIKPLKSIFFDPSFLQTEATEIESD +QLQKRPSGYSSTLFTEHEKQMINHMLPEEIEEFIGNPTRLVHSFLSDRWS +ELHLGSNPTERSTRDHKLLKKQQDLSFVPSRRSENKELVNILKIITYLKN +TVSIHPISSDPGCDGVLKDEPDMDSSNKISVFNKNTFIYLFHLFHDWNRV +GYTLNLHHDFELEERFQEKADLFTLSITEPDLVYHKGFSFSIYMDQKQKM +VVFASNNIMEAVNQSRFIRNMIKIQYSTYGYIRNVLHRFFLMNRSDHNLE +YEIKRDQIGKDTLNHRTIIKYMINQHLSNFKKSQNKWFNPILFFSRTERS +VNRNPDAYRYKRSNGSNNFLEHLEHFVSEQKSHFKFKIVFDLIRFNQYSI +DWSAFIDTKDLSKPLRFFLSKLLFFLSNSLPFFCVSFGNIPIHRSEIYIY +ELKDPNDQLCNQFLEPIDLKIVHLKKRKPFLLGYHGTSRKLKLLITGGRP +FLFNKIPRCMIDSFHTINNRSKSFDNTDSYLSMIFHNKDNWLNLVKPFHR +SSLISYFYKANRLQFLNNPHNFCFYCNTRLPFYVEKAHIHNYYFTYGQFL +NILFIRNKIFSLCVDKKKHAFWGGRDTISPIESQVSKIFIPKNFPQSGDE +TYNLSQPFHFPSRYDPFVRLIANIYGTPLTEGQIVNLGRTYCQPLSDMNL +SDSEGKNFHQYLNFNSNMGLIHTPCSDKYLPSEKRKKRSLCINKYKCVEK +GQMYRTFQRKVAFSTLSKWNLFQTYMPWFLTSAGYKYINLIFLDTFSELL +SILSSSKKFVSIFNNIMHGSGISWRIINKKRCLPQWNLISEISSKCLHNL +LLSEETIRQNNESPLISTHLRSPNVREFLYSILFLLLVVGYLVRTHLLFV +SRASSELQTEFKRVKSLMIPSSMIELRKLLNRYPTPASNSFWLKNLFIVA +MEQLVYSLEEIRASGGNLLGPAYGVKSICSKNKYFNINLIDLIPNPINRI +IFSRNMRHLSHTSKEIYSLIRKRKNVNGDWIDDIIESWVANSDSIDDEER +EFLVQFSALTTEKRIYQILLSLTHSDHLSKNDSGYKMIEQPGAIYLRYLV +DIHKKYLLNYECNTSCLVERRVFLAHSQTITYSQTSRGTNTLHFPSQGKP +FSISLALSPSKGILVIGSIGTGRSFLVKYLATNSYVPFITVFLNKFLDNK +PKGFLVDDNDDNDSSDDIYASDDINSDLDTELELITMMNALTMDMMLELD +RFFTTLQLELAKAMSPWIIWIPNIHDLDVNESNYLSFGLLVNHLSERCST +NNIIVIASTHIPKKVDPALLAPNKLNTCIKIRRLLIPQQRKHFCTLSYTR +GFHLENKIFHTNGFGSITMGSSARDLVALTNEALSISITQNKSILDTNTI +RSALHRQTWDLRSGVRSFQDNGILSYQIGRAITQNVLLSNCPIDPISIYM +KKKSCTCNGGDYYFYKWYFGLGTSMKKLTILLYLLSCSAGSVAQDLWSLP +GPAEKNGITSYGLVENDSDLVRGLLEVEGALVGSSRTEKDCSPFDNDRVI +FTLILRPEPGNPLDIIKKGSCSIFDHRFIYEKYESEFEEGYGEGALDPQQ +IEEDLFNHIVWAPRIWRPWGFIFYCIERPNELGFPYWSRSFRGKRIVYDK +DEEGELQENDSELLKSGTVQYQTRDRSSKEQGLLKINQFIWDPADPLFFL +LKDQPPGSVFSHRRFFADEEMSKGLLTSQKDPPTSIYKRWFIKNTQEQHF +ELLINRQRWLRTKSSLSKSNGSFRSNTLFESYQYLSTLFLSNGTLFDKMT +KTLLIKRWLFPDEMQM +>NC_001568@EpviCp32@ycf2@61133@67783@R@1@2217 Ycf2 +MKEHPFPYKSWILELREIKNSHYFLDSWTKFNSVGSYINIFSHQERFIKL +FDPRILSILLSRNSQGSTSNRYFTIKGVILFVVAVLIYRINNRNMVEIKN +IYWRGLLPIPMNSIGPRNDTLEELVGSYNINRFIVSLLYLTKGKNISESF +FLNLKESTLVLPITKKCSMPESNWGSRWWRNWTGKNRDYSCKISNETVAG +IEILFKEKDKKYLEFIFFYYMDDPIRKDRDWELFDRLSPSKRLNKINFYS +GPLFEILVKRRIYYLMSAFREKIPIEVVKGFFKQQKVGSTIQSNDIEHVS +HFFSRNKRAISLKNSAQFNMWQFRQDLLVSWGENPHESDFLRNVSRANWI +WLNNVWLVNKYRFCRKVRNVSSNIKYKYDSTRSRSSFVQVTDSSQLKGSY +YKSSGHFYSVISNEDSEYHTLINQREIKPLKSIFFDPSFLQTEATEIESD +QLQKRPSGYSSTLFTEHEKQMINHMLPEEIEEFIGNPTRLVHSFLSDRWS +ELHLGSNPTERSTRDHKLLKKQQDLSFVPSRRSENKELVNILKIITYLKN +TVSIHPISSDPGCDGVLKDEPDMDSSNKISVFNKNTFIYLFHLFHDWNRV +GYTLNLHHDFELEERFQEKADLFTLSITEPDLVYHKGFSFSIYMDQKQKM +VVFASNNIMEAVNQSRFIRNMIKIQYSTYGYIRNVLHRFFLMNRSDHNLE +YEIKRDQIGKDTLNHRTIIKYMINQHLSNFKKSQNKWFNPILFFSRTERS +VNRNPDAYRYKRSNGSNNFLEHLEHFVSEQKSHFKFKIVFDLIRFNQYSI +DWSAFIDTKDLSKPLRFFLSKLLFFLSNSLPFFCVSFGNIPIHRSEIYIY +ELKDPNDQLCNQFLEPIDLKIVHLKKRKPFLLGYHGTSRKLKLLITGGRP +FLFNKIPRCMIDSFHTINNRSKSFDNTDSYLSMIFHNKDNWLNLVKPFHR +SSLISYFYKANRLQFLNNPHNFCFYCNTRLPFYVEKAHIHNYYFTYGQFL +NILFIRNKIFSLCVDKKKHAFWGGRDTISPIESQVSKIFIPKNFPQSGDE +TYNLSQPFHFPSRYDPFVRLIANIYGTPLTEGQIVNLGRTYCQPLSDMNL +SDSEGKNFHQYLNFNSNMGLIHTPCSDKYLPSEKRKKRSLCINKYKCVEK +GQMYRTFQRKVAFSTLSKWNLFQTYMPWFLTSAGYKYINLIFLDTFSELL +SILSSSKKFVSIFNNIMHGSGISWRIINKKRCLPQWNLISEISSKCLHNL +LLSEETIRQNNESPLISTHLRSPNVREFLYSILFLLLVVGYLVRTHLLFV +SRASSELQTEFKRVKSLMIPSSMIELRKLLNRYPTPASNSFWLKNLFIVA +MEQLVYSLEEIRASGGNLLGPAYGVKSICSKNKYFNINLIDLIPNPINRI +IFSRNMRHLSHTSKEIYSLIRKRKNVNGDWIDDIIESWVANSDSIDDEER +EFLVQFSALTTEKRIYQILLSLTHSDHLSKNDSGYKMIEQPGAIYLRYLV +DIHKKYLLNYECNTSCLVERRVFLAHSQTITYSQTSRGTNTLHFPSQGKP +FSISLALSPSKGILVIGSIGTGRSFLVKYLATNSYVPFITVFLNKFLDNK +PKGFLVDDNDDNDSSDDIYASDDINSDLDTELELITMMNALTMDMMLELD +RFFTTLQLELAKAMSPWIIWIPNIHDLDVNESNYLSFGLLVNHLSERCST +NNIIVIASTHIPKKVDPALLAPNKLNTCIKIRRLLIPQQRKHFCTLSYTR +GFHLENKIFHTNGFGSITMGSSARDLVALTNEALSISITQNKSILDTNTI +RSALHRQTWDLRSGVRSFQDNGILSYQIGRAITQNVLLSNCPIDPISIYM +KKKSCTCNGGDYYFYKWYFGLGTSMKKLTILLYLLSCSAGSVAQDLWSLP +GPAEKNGITSYGLVENDSDLVRGLLEVEGALVGSSRTEKDCSPFDNDRVI +FTLILRPEPGNPLDIIKKGSCSIFDHRFIYEKYESEFEEGYGEGALDPQQ +IEEDLFNHIVWAPRIWRPWGFIFYCIERPNELGFPYWSRSFRGKRIVYDK +DEEGELQENDSELLKSGTVQYQTRDRSSKEQGLLKINQFIWDPADPLFFL +LKDQPPGSVFSHRRFFADEEMSKGLLTSQKDPPTSIYKRWFIKNTQEQHF +ELLINRQRWLRTKSSLSKSNGSFRSNTLFESYQYLSTLFLSNGTLFDKMT +KTLLIKRWLFPDEMQM +>NC_001879@NitaCp068@ycf2@88885@95727@D@1@2281 Ycf2 +MRGHQFKSWIFELREILREIKNSHHFLDSWTQFNSAGSFIHIFFHQERFL +KLFDPRIWSILLSRNSQGSTSNRYFTIKGVILFVVAVLIYRINNRNMVER +KNLYLIGLLPIPMNSIGPRNDTLEESVGSSNINRLIVSLLYLPKGKKISE +SCFLNPKESTWVLPITKKCSMPESNWGSRWWRNWIGKKRDSSCKISNETV +AGIEILFKEKDLKYLEFLFVYYMDDPIRKDHDWELFDRLSLRKSRNRINL +NSGPLFEILVKHWISYLMSAFREKIPIEVEGFFKQQGAGSTIQSNDIEHV +SHLFSRNKWAISLQNCAQFHMWQFRQDLFVSWGKNPPESDFLRNVSRENW +IWLDNVWLVNKDRFFSKVQNVSSNIQYDSTRSSFVQVTDSSQLKGSSDQS +RDHLDSISNEDSEYHTLINQREIQQRKERSILWDPSFLQTERKEIESGRF +PKCLSGYSSMSRLFTEREKQMINHLFPEEIEEFLGNPTRSVRSFFSDRWS +ELHLGSNPTERSTRDQKLLKKQQDLSFVPSKRSENKEMVNIFKIITYLQN +TVSIHPISSDPGCDMVPKDEPDMDSSNKISFLNKNPFFDLFHLFHDRNRG +GYTLHYDFESEERFQEMADLFTLSITEPDLVYHKGFAFSIDSCGLDQKQF +LNEARDESKKKSLLVLPPIFYEENESFSRRIRKKWVRISCGNDLEDPKPK +IVVFASNNIMEAVTQYRLIRNLIQIQYSTYGYIRNVLNRFFLMNRSDRNF +EYGIQRDQIGKDTLNHRTIMKYTINQYLSNLKKSQKKWFEPLILISRTER +SMNRDPDAYRYKWSNGSKNFQEHLEQSVSEQKSRFQVVFDRLRINQYSID +WSEVIDKKDLSKPLRFFLSKSLLFLSKLLFFLSNSLPFFCVSFGNIPIHR +SEIYIYELKGPNDQLCNQLLESIGLQIVHLKKWKPFLLDDHDTSQKSKFL +INGGTISPFLFNKIPKWMIDSFHTRNNRRKSFDNPDSYFSMIFHDQDNWL +NPVKPFHRSSLISSFYKANRLRFLNNPHHFCFYWNTRFPFSVEKARINNS +DFTYGQFLNILFIRNKIFSLCVGKKKHAFWGRDTISPIESQVSNIFIPND +FPQSGDETYNLYKSFHFPSRSDPFVRRAIYSIADISGTPLTEGQIVNFER +TYCQPLSDMNLSDSEGKNLHQYLNFNSNMGLIHTPCSEKDLSSEKRKKRS +LCLKKCVEKGQMYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNLI +FLDTFSDLLPILSSSQKFVPIFHDIMHGSGISWRILQKKLCLPQWNLISE +ISSKCLHNLLLSEEMIHRNNESPLISTHLRSPNAREFLYSILFLLLVAGY +LVRTHLLFVSRASSELQTEFEKVKSLMIPSSMIELRKLLDRYPTSEPNSF +WLKNLFLVALEQLGDSLEEIRGSASGGNMLGPAYGVKSIRSKKKDWNINL +IEIIDLIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKNVNGDWIDDKIE +SWVANSDSIDDEEREFLVQFSTLTTENRIDQILLSLTHSDRLSKNDSGYQ +MIEQPGAIYLRYLVDIHKKHLMNYEFNPSCLAERRIFLAHYQTITYSQTS +CGENSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATNSYV +PFITVFLNKFLDNKPKGFLLDEIDIDDSDDIDDSDNLDASDDIDRDLDTE +LKLLTRMNGLTMDMMPEIDRFYITLQFELAKAMSPCIIWIPNIHDLDVNE +SNDLALGLLVNHLSRDCERCSTRNILVIASTHIPQKVDPALIAPNKLNTC +IKIRRLLLPQQRKHFFTLSYTRGFHLEKKMFHTNGFGSITMGSNARDLVA +LTNEVLSISITQKKSIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQI +GRAVAQNVLLSNCPIDPISIYMKKKSCNEGDSYLYKWYFELGTSMKRLTI +LLYLLSCSAGSVAQDLWSLSGPDEKNGITSYGLVENDSDLVHGLLEVEGA +LVGSSRTEKDCSQFDNDRVTLLLRPEPRNPLDMMQNGSCSILDQRFLYEK +YESEFEEGEGEGALDPQEDLFNHIVWAPRIWRPWGFLFDCIERPNELGFP +YWSRSFRGKRIIYDEEDELQENDSEFLQSGTMQYQTRDRSSKEQGLFRIS +QFIWDPADPLFFLFKDQPPGSVFSHRELFADEEMSKGLLTSQTDPPTSIY +KRWFIKNTQEKHFELLINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLF +LSNGTLLDQMTKTLLRKRWLFPDEMKIGFM +>NC_001879@NitaCp102@ycf2@146903@153745@R@1@2281 Ycf2 +MRGHQFKSWIFELREILREIKNSHHFLDSWTQFNSAGSFIHIFFHQERFL +KLFDPRIWSILLSRNSQGSTSNRYFTIKGVILFVVAVLIYRINNRNMVER +KNLYLIGLLPIPMNSIGPRNDTLEESVGSSNINRLIVSLLYLPKGKKISE +SCFLNPKESTWVLPITKKCSMPESNWGSRWWRNWIGKKRDSSCKISNETV +AGIEILFKEKDLKYLEFLFVYYMDDPIRKDHDWELFDRLSLRKSRNRINL +NSGPLFEILVKHWISYLMSAFREKIPIEVEGFFKQQGAGSTIQSNDIEHV +SHLFSRNKWAISLQNCAQFHMWQFRQDLFVSWGKNPPESDFLRNVSRENW +IWLDNVWLVNKDRFFSKVQNVSSNIQYDSTRSSFVQVTDSSQLKGSSDQS +RDHLDSISNEDSEYHTLINQREIQQRKERSILWDPSFLQTERKEIESGRF +PKCLSGYSSMSRLFTEREKQMINHLFPEEIEEFLGNPTRSVRSFFSDRWS +ELHLGSNPTERSTRDQKLLKKQQDLSFVPSKRSENKEMVNIFKIITYLQN +TVSIHPISSDPGCDMVPKDEPDMDSSNKISFLNKNPFFDLFHLFHDRNRG +GYTLHYDFESEERFQEMADLFTLSITEPDLVYHKGFAFSIDSCGLDQKQF +LNEARDESKKKSLLVLPPIFYEENESFSRRIRKKWVRISCGNDLEDPKPK +IVVFASNNIMEAVTQYRLIRNLIQIQYSTYGYIRNVLNRFFLMNRSDRNF +EYGIQRDQIGKDTLNHRTIMKYTINQYLSNLKKSQKKWFEPLILISRTER +SMNRDPDAYRYKWSNGSKNFQEHLEQSVSEQKSRFQVVFDRLRINQYSID +WSEVIDKKDLSKPLRFFLSKSLLFLSKLLFFLSNSLPFFCVSFGNIPIHR +SEIYIYELKGPNDQLCNQLLESIGLQIVHLKKWKPFLLDDHDTSQKSKFL +INGGTISPFLFNKIPKWMIDSFHTRNNRRKSFDNPDSYFSMIFHDQDNWL +NPVKPFHRSSLISSFYKANRLRFLNNPHHFCFYWNTRFPFSVEKARINNS +DFTYGQFLNILFIRNKIFSLCVGKKKHAFWGRDTISPIESQVSNIFIPND +FPQSGDETYNLYKSFHFPSRSDPFVRRAIYSIADISGTPLTEGQIVNFER +TYCQPLSDMNLSDSEGKNLHQYLNFNSNMGLIHTPCSEKDLSSEKRKKRS +LCLKKCVEKGQMYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNLI +FLDTFSDLLPILSSSQKFVPIFHDIMHGSGISWRILQKKLCLPQWNLISE +ISSKCLHNLLLSEEMIHRNNESPLISTHLRSPNAREFLYSILFLLLVAGY +LVRTHLLFVSRASSELQTEFEKVKSLMIPSSMIELRKLLDRYPTSEPNSF +WLKNLFLVALEQLGDSLEEIRGSASGGNMLGPAYGVKSIRSKKKDWNINL +IEIIDLIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKNVNGDWIDDKIE +SWVANSDSIDDEEREFLVQFSTLTTENRIDQILLSLTHSDRLSKNDSGYQ +MIEQPGAIYLRYLVDIHKKHLMNYEFNPSCLAERRIFLAHYQTITYSQTS +CGENSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATNSYV +PFITVFLNKFLDNKPKGFLLDEIDIDDSDDIDDSDNLDASDDIDRDLDTE +LKLLTRMNGLTMDMMPEIDRFYITLQFELAKAMSPCIIWIPNIHDLDVNE +SNDLALGLLVNHLSRDCERCSTRNILVIASTHIPQKVDPALIAPNKLNTC +IKIRRLLLPQQRKHFFTLSYTRGFHLEKKMFHTNGFGSITMGSNARDLVA +LTNEVLSISITQKKSIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQI +GRAVAQNVLLSNCPIDPISIYMKKKSCNEGDSYLYKWYFELGTSMKRLTI +LLYLLSCSAGSVAQDLWSLSGPDEKNGITSYGLVENDSDLVHGLLEVEGA +LVGSSRTEKDCSQFDNDRVTLLLRPEPRNPLDMMQNGSCSILDQRFLYEK +YESEFEEGEGEGALDPQEDLFNHIVWAPRIWRPWGFLFDCIERPNELGFP +YWSRSFRGKRIIYDEEDELQENDSEFLQSGTMQYQTRDRSSKEQGLFRIS +QFIWDPADPLFFLFKDQPPGSVFSHRELFADEEMSKGLLTSQTDPPTSIY +KRWFIKNTQEKHFELLINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLF +LSNGTLLDQMTKTLLRKRWLFPDEMKIGFM +>NC_002202@SpolCp103@ycf2@142690@149085@R@1@2132 Ycf2 +MKGHQFKSWIFELREILREIKNSHYFLDSWTQFNSVGSFIHIFFYQERFL +KLFDPRIWSILLSPNSQGSTSNRYFTIKGVVLFVVVVLIYRITNRNMVER +KNLYLIGLFPIPMNSIGPRNDTLEKSFGSSNINRLIVSLLYLPKGKKISE +SYFLDPKESTWFLPITKKCIMPESNRGSRWWRNWIGKRRDSSCKISNETV +AGIEISFKEKDIQYLEFPFVYYMDDPIRKDHDWELFDCLSLFLRNVSREN +WIWLDNVRLVNKDRFFSKVRNVSSNIQYDFTRSSFVQVTDSSQLKESSDQ +SRDRSNSISNADSEYHTLINKREIQQLKERSILRDPSFLQTEGTEIESDR +FPKCLSGYSSMPRLFTAREKQMIIHLLPEEIEQLLENPTRSIRSFFSGRW +SELHLGSNPTERSTRDPQLLKKQQDVSFAPSRQSENKEMVNIFKIIKYLQ +NTVSIHPISSDPGCDMVPKDELDMDSSDKISFLNKNSFFDLFHLFHDRNR +GGYALHHDFESEEKFQEMADLFTLSITDPDLVYHRGFSFSIDSCGLDQKQ +FLNEVFNSRDESKKKSLLVLSPIFYEENESFYRRIRKKGVRISRNVLNRF +FLINRSDRSFEYGIQRDQIGNDTLNHRTIRKYMINQDFSNLKKSQKKWFD +PLIFLSRTERFMNRDPDAYRYKWFNGSKNFQEHLEHFVSEQKSRFQVVFD +QLRINQYSIDWSEVIDKKDLSKSLRFFLSKSLRFFLSKLLLFLSNSLPFF +FVSFGNIPINRSEIRIYELKGPNDQLYNPLVESIGLQIVHLKKWKAFLLD +DHDTFQKSKFLINGGTISPFLFNKIPKWMIDSFHTRNNSGKSFDNTDSYF +SMISHDQNNWLNPVKPFHRSSLISSFYKANQLRFLNNPHHFCFYCNKRFP +FYMEKARINNSDFTYRQFLNILFIHNKLFSLCVGKKKHAFLERDTISPIE +SQVSNIFLPNDFPIRSDLLVRRTIYSIADISGTPLTEGQLVHFERTYCQP +LSDMNLSDSEKKNLHQYLNFNSNMGFIYTPCSEKYLLSEKRKKRSLCLKK +CVEKGQMYRTFQRDSAFSTLSKWNLFQTYMPWFLTSTGYKYLNFLFLDTF +SDLLPILSSSQKFLSILHDIMHGSGISWRILQKKLCLPPWNLISEISSKC +LHNLLLPEEMIHRNNESPLIWTHLASPNVREFFYSILFLLFVAGYLVRTH +LLFVFRASSELQTEFERVKSLMIPSYMIELRKLLDRYPTSEPNSFWLKNL +FLVALEQLGDSLEEIRGSASGDNMLLGGGPGPAYGFKSIRSKKKYLNINL +IDILDLISIIPNPINRITFSRNTRHLSHTSKEIYSLIRKRKRVNGDWIDD +KIESWVASSDSIDDEEREFLVQFSTLTTEKRIDQILLSLTHSDHLSKNDS +GYQLIEQPGAIYLRYLVDIHKKYLMNYEFNTSCLAERRVFLAHYQTITYS +QTSCGANSFHFPSHGKPFSLRLALSPSRGILVIGSIGTGRSYLVKYLATN +SYVPFITVFLNKFLDNKPKGSLIDASDDIDRDLDTELELLTMMNALTMDM +MPEIDQFSITLQFELAKAMSPCIIWIPNIHDLDVNESNYLSLGLFVNYLS +RDCERGSTRNILVIASTHIPQKVDPALIAPNQLNTCIKIRRLRIPQQRKH +FFTLSYTRGFHLEKKMFHTNGFGSITMGSNVRDLVAFINEALSISITQKK +SIIDTNTIRSALHRQTWDLRSQVRSVQDHGILFYQIGRAVAQNVLLSNCP +IDPISTYMKKKSCNEGDSYLYKWYFELGTSMKKLTILLYLLSCSAGSVAQ +DLWSLPGPDEKNGITSYGLVENDSYLVHGLLEVEGALVGSSRIEKACSQN +DRVTLFLRPELRNPLDMMQNGSCSILDHRFLYEKYESELEEGEGALDPQQ +IEEDLFNHIVWAPRIWNPWGFLFDCIERPNELGFPYWARSFRGKRSIYDK +EDELQENDSEFLQSGTMQYQTRDRSSKEQGFFRISQFIWDPADPLFFLFK +DQPFVSVFSHREFFADEEISKGLLTSQMNPPISIFQRWFIKNTQEKHFEL +LINRQRWLRTNSSLSNGSFRSNTLSESYQYLSNLFLSNGTLLDQMTKTLL +RKRWLFPDEMKIGFMQEEKDFPFLSRKDMWP +>NC_002693@OeelhCp081@ycf2@92143@99165@D@1@2341 Ycf2 +MGNQRNRVNLNPFRFWVFELREILREIKNSRYPFNSVGSFIHIFVHQERF +LKLLDPRIWSVLRSQGSTGVVLFLVAVLIYRINNRNMIERKNIYLTGLLP +IPTNFAGPRNETLEESFLSSNINRLIVSLLHLPKGKRLSESCFLDPKEST +RVLPITKWRNWIGKRRDSSQLKGSSDQSRDHFDSIGTEDSEYHTLINQRE +IQQRKERSSLLDPSFLQTERTEIESDRFSKGLSGSSSKSRLFTEGEKEMN +NHLPPEEIEEFLGNPTRSILSFFSDEWSELHLGSNPTERSTVDQKLLKKE +QEVSFAPFRRSETKEIVNLFKTMAYLQKTVSIHPISSDPGCDMVPKDELD +SEERFQEMADLFTLSITEPDLVYHKGFAFSIDSSVLDQKQFLAEARDESK +KKSLLVLPPVFYQENESFYRRIRKRGVQISCGNDLEDPKPKIVVFASNNI +VEAVNQYRWIRNLIQIQYSTHGYIRNVLNRFFLMNRSDRNFEYGIQRDQI +GNDTLNHRTFMKYTINQHLSNLKKSQKKGSDPLILISRTERSVNRDPNAY +RYKWSKGSKNFQEHLEHFVSEQKSRFQVVFDRYRSIRNRYRSIRNRYRSR +INQYSSDRSEVSDKKDNRYRSRINQYSSDRSEVSDQKNLAKFRSFVFSKL +LLFLSNSLPFFFVSFGNTPPIQRSEIRVSELKGPNDRLCNQFLESIGLQL +VYLKKLKPFLLDDHETSQKSKLLFNKKPEGMIDSFHTRNNRGKSLDSYFS +MISHDQDNWLNPVKPFHRSSLISSFYKANRLRFLNNPHDFGFFCNKRFPF +YVDIKNLDFTYGQFLNILFIRNTKFSLCGDKKKHAFLERDTISSIESQVS +NLFKDFPQSGDERYNFYKYFHLAMRSDPLVRRAIYSIADISGTPLTEGQR +VNFERTYCQPLSDMNLSDSEGKNLYQYLNFNSNMGLIYSEKCFSSEKRKK +KKPEKRKEKKPEKRKEKKPEKRKEKKPEKRKEKKPEKRKEKKPEKRKEKK +PEKRKEKKQSLYLKQWVEKVQMDRALQGERVSLILSNWNLFKTYVMPFSL +TSTGYNLLKLMFLDTLGSYVMPLLRSSPKFVSICYAISDPCGISWRILQK +KLCLLQWNWISAISNKCFHKLLLSEESIHRNNESPSMTDLRWPNLGAFLY +SILFLLFVAGHLVFSHLLFLSQDFSELQRDFARAQSLMIPSYIVELRELL +DMYPAPRSFKKLFLAAREKLVNYLRWGGGRKSFLIHLFELLNITPNPIDR +IAFLKNTRHLSHTSKELYSLITELGDFSSLCSGQRYRYDQIIENVNGPCC +LIDDKIESWISNCDAIEDKEREFLVPFCNFTRETRIDQILLSLTHSDHLS +NNDSASQMSEEPGAFYLRHLVDIHKKGLMNYECNTSCLAERRIFLAHYQT +ITYSPCGDNRSHFPSHGKTFSLRLPLHPSRATLVIGSIGSGRSYLVKSLA +TNSYVPLITVVLNKFLKNWTPQGFDIHESGVYDEYGDDAEEANDYGASFF +DFLDNDSDDYEDRDSDDYDEPGASDDYEDRDMEDFVDSEMTEWLTKTNVP +LVYQLLDDEIDEFYITLQFELAKAMSPCILWIPNIHDLDAKESDYLSLGL +LVNHLSRDCGRRSTKNEILVIASTHIPQKVDPSLIGPDGLSTCIKTRRLL +VPQQQQCLFTLSYTRGFHLENKMFHTHTNEFESTILGPSVPDLVALTNEA +LSISITQKKSIIDTTTIRYALHRKTWDLEADRNLSPAKEHGTLFYQVGRA +FAHTVLLRNCPIDPISIYIKKNLCEAGDSSLYKWYFELGTSMKKLTILLY +LLTCSAGSIAQDLLSPPGPDEQNLITSYGLVENDSDLVHGLSDIVHGLLE +LEGALVGSSPTEEEVEGTEEEVEGTEEEVEGTEEEVEGTEEEVEGTEEEV +EGTEEEVEGTEDEEGEGTEEEVEGTEDEEGEGTEEEVEGTEDEEGEGTEE +EVEGTEDEEGEGTEDEEGEGTEEEVEGTEEEVEGTEDEEGEGTEKDSSQF +DNDRVTLLLRPKPRNPLDIQRLIYQHQKYESELEEDDDDDEDVFAPQKML +EDLFSELVWSPRIWHPWDFILDCEAEIPAEEIPEEEDPLPEEALETEVAV +WGEEEEGEADDEEDERLEAQQEDELLEEEDEELKEEEDELHEEEEEEEEE +EEEEEEDELHEEEEEEEEEDELQENDSEFFRSETQQPQARDGFSEEEGCF +RISQFMWVPGDPLSFLYKDTPFVEVLSYPEEATEISKELLRLLNPKTKRD +APKRARQRWWTKKKQDKHYELVLDRQRWLITKSSLSKSNGFFRSNTPSES +YQYLSNLFLSNRRLLDQITKTFFRKKWLFPDEMKIGFMEQ diff --git a/detectors/cds/test/test.ref b/detectors/cds/test/test.ref index 7449c64..4101ab6 100644 --- a/detectors/cds/test/test.ref +++ b/detectors/cds/test/test.ref @@ -45,28 +45,27 @@ FT AAAQSISYEIPLALCVLSISLRVIR" FT gene 42910..45121 FT /gene="ndhB" FT /locus_tag="" -FT CDS join(42910..43780,44367..45121) +FT CDS join(42910..43685,44365..45121) FT /codon_start=1 FT /transl_table=11 FT /gene="ndhB" FT /locus_tag="" FT /product="NADH dehydrogenase subunit 2" -FT /inference="similar to DNA sequence:NC_008535:CoarCp067" +FT /inference="similar to DNA sequence:AC_000188:LyesCp066" FT /translation="MIWHVQNENFILDSTRIFMKAFHLLLFDGSLIFPECILIFGLILL FT LMIDSTSDQKDIPWLYFISSTSLVMSITALLFRWREEPMISFSGNFQTNNFNEIFQFLI FT LLCSTLCIPLSVEYIECTEMAITEFLLFVLTATLGGMFLCGANDLITIFVAPECFSLCS FT YLLSGYTKKDVRSNEATMKYLLMGGASSSILVHGFSWLYGSSGGEIELQEIVNGLINTQ -FT MYNSPGISIALIFITVGIGFKLSPAPSHQWTPDVYEGVRFVREIPTSLSISEMFGFFKT -FT PWTCRREMLSPTPVVAFLSVTSKVAASASATRIFNIPFYFSSNEWHLLLEILAILSMIL -FT GNLIAITQTSMKRMLAYSSIGQIGYVIIGIIVGDSNDGYASMITYMLFYISMNLGTFAC -FT IVLFGLRTGTDNIRDYAGLYTKDPFLALSLALCLLSLGGLPPLAGFFGKLYLFWCGWQA -FT GLYFLVLIGLLTSVVSIYYYLKIIKLLMTGRNQEITPHVRNYRRSPLRSNNSIELSMIV -FT CVIASTIPGISMNPIIAIAQDSLF" -FT exon 42910..43780 +FT MYNSPGISIALIFITVGIGFKLSPAPSHQWTPDVYEGSPTPVVAFLSVTSKVAASASAT +FT RIFNIPFYFSSNEWHLLLEILAILSMILGNLIAITQTSMKRMLAYSSIGQIGYVIIGII +FT VGDSNDGYASMITYMLFYISMNLGTFACIVLFGLRTGTDNIRDYAGLYTKDPFLALSLA +FT LCLLSLGGLPPLAGFFGKLYLFWCGWQAGLYFLVLIGLLTSVVSIYYYLKIIKLLMTGR +FT NQEITPHVRNYRRSPLRSNNSIELSMIVCVIASTIPGISMNPIIAIAQDSLF" +FT exon 42910..43685 FT /gene="ndhB" FT /locus_tag="" FT /number=1 -FT exon 44367..45121 +FT exon 44365..45121 FT /gene="ndhB" FT /locus_tag="" FT /number=2 @@ -79,7 +78,7 @@ FT /transl_table=11 FT /gene="ndhD" FT /locus_tag="" FT /product="NADH dehydrogenase subunit 4" -FT /inference="similar to DNA sequence:NC_007898:LyesC2p017" +FT /inference="similar to DNA sequence:AC_000188:LyesCp081" FT /translation="MNYFPWLTIIVVFPIFAGSLIFFLPHKGNRVIRWYTICICILELL FT LTTYAFCYHFQSDDPLIQLVEDYKWIDFFDFHWRLGIDGLSIGPILLTGFITTLATLAA FT WPVTRDSRLFHFLMLAMYSGQIGLFSSRDLLLFFIMWELELIPVYLLLAMWGGKKRLYS @@ -98,7 +97,7 @@ FT /transl_table=11 FT /gene="ndhE" FT /locus_tag="" FT /product="NADH dehydrogenase subunit 4L" -FT /inference="similar to DNA sequence:NC_001879:NitaCp085" +FT /inference="similar to DNA sequence:AC_000188:LyesCp080" FT /translation="MILEHVLVLSAYLFSIGIYGLITSRNMVRALMCLELILNAVNINF FT VTFSDFFDNRQLKGDIFSIFVIAIAAAEAAIGLAIVSSIYRNRKSTRINQSNLLNN" FT gene complement(11509..13722) @@ -178,7 +177,7 @@ FT /transl_table=11 FT /gene="psaC" FT /locus_tag="" FT /product="photosystem I subunit VII" -FT /inference="similar to DNA sequence:NC_023792:CP89_p014" +FT /inference="similar to DNA sequence:AC_000188:LyesCp065" FT /translation="MSHSVKIYDTCIGCTQCVRACPTDVLEMIPWDGCKAKQIASAPRT FT EDCVGCKRCESACPTDFLSVRVYLWHETTRSMGLAY" FT gene 53817..55307 @@ -190,7 +189,7 @@ FT /transl_table=11 FT /gene="rpl2" FT /locus_tag="" FT /product="ribosomal protein L2" -FT /inference="similar to DNA sequence:NC_007898:LyesC2p002" +FT /inference="similar to DNA sequence:AC_000188:LyesCp030" FT /translation="MAIHLYKTSTPSTRNGTVDSQVKSNPRNNLIYGQRRCGKGRNARG FT IITARHRGGGHKRLYRKIDFRRNEKDIYGRIVTIEYDPNRNAYICLIHYGDGEKRYILH FT PRGAIIGDTIVSGTEVPIKMGNALPSTDMPLGTAIHNIEITLGKGGQLARAAGAVAKLI @@ -213,7 +212,7 @@ FT /transl_table=11 FT /gene="rpl23" FT /locus_tag="" FT /product="ribosomal protein L23" -FT /inference="similar to DNA sequence:NC_007898:LyesC2p003" +FT /inference="similar to DNA sequence:AC_000188:LyesCp026" FT /translation="MDGIKYAVFTDKSIRLLGKNQYTSNVESGSTRTEIKHWVELFFGV FT KVIAMNSHRLPGKSRRMGPIMGHTMHYRRMIITLQPGYSIPPLRKKRT" FT gene 14505..14672 @@ -249,7 +248,7 @@ FT /transl_table=11 FT /gene="rps7" FT /locus_tag="" FT /product="ribosomal protein S7" -FT /inference="similar to DNA sequence:NC_007898:LyesC2p007" +FT /inference="similar to DNA sequence:AC_000188:LyesCp008" FT /translation="MSRRGTAEKKTAKSDPIYRNRLVNMLVNRILKHGKKSLAYQIIYR FT AVKKIQQKTETNPLSVLRQAIRGVTPDITVKARRVGGSTHQVPIEIGSTQGKALAIRWL FT LAASRKRPGRNMAFKLSSELVDAAKGSGDAIRKKEETHRMAEANRAFAHFR" diff --git a/detectors/cds/tools/chlorodb/go_chlorodb.sh b/detectors/cds/tools/chlorodb/go_chlorodb.sh new file mode 100755 index 0000000..75ad7e5 --- /dev/null +++ b/detectors/cds/tools/chlorodb/go_chlorodb.sh @@ -0,0 +1,254 @@ +#!/bin/csh -f +# +# make ChloroDB's +# +# usage: copy genbank/embl files into 'DB_DIR/download' +# usage: [create a paramter.sh file in 'DB_DIR'] +# usage: go_chlorodb [DB_DIR] +# +unsetenv ORG_SOURCED + +setenv ORG_HOME `dirname $0`/../../../.. +source $ORG_HOME/scripts/csh_init.sh + +# +# which DB to process +# + +set DB_BASE = $DATA_DIR/cds/chlorodb # default location + +if ($#Argv > 0) then + set DB_BASE = $Argv[1]; Shift +endif + +set DB_BASE = `cd $DB_BASE && pwd -P` + +NeedDir $DB_BASE/download + +if (! -d $DB_BASE/info) mkdir $DB_BASE/info +if (! -d $DB_BASE/fasta) mkdir $DB_BASE/fasta + +cd $DB_BASE/info + +# +# params +# + +if (! -e $DB_BASE/parameters.sh) then + @ n = `find $DB_BASE/download -depth 1 -type f -print | wc -l` + @ cor_cutoff = $n / 2 + @ atg_cutoff = $n / 10 + @ dbs_cutoff = $n / 4 + if ($cor_cutoff == 0) @ cor_cutoff = 1 + if ($atg_cutoff == 0) @ atg_cutoff = 1 + if ($dbs_cutoff == 0) @ dbs_cutoff = 1 + echo "# sourced file" > $DB_BASE/parameters.sh + echo "" >> $DB_BASE/parameters.sh + echo "set CORE_NCDS_CUTOFF = $cor_cutoff" >> $DB_BASE/parameters.sh + echo "set CORE_START_ATG_CUTOFF = $atg_cutoff" >> $DB_BASE/parameters.sh + echo "set CORE_START_DFT_CUTOFF = $atg_cutoff" >> $DB_BASE/parameters.sh + echo "set CORE_START_OTH_CUTOFF = 10" >> $DB_BASE/parameters.sh + echo "set CORE_STOP_CUTOFF = $cor_cutoff" >> $DB_BASE/parameters.sh + echo "set CORE_SPLICE_CUTOFF = $atg_cutoff" >> $DB_BASE/parameters.sh + echo "" >> $DB_BASE/parameters.sh + echo "set SHEL_NCDS_CUTOFF = 10" >> $DB_BASE/parameters.sh + echo "" >> $DB_BASE/parameters.sh + echo "set CORE_DELTA = Inf" >> $DB_BASE/parameters.sh + echo "set CORE_COVMIN = 30" >> $DB_BASE/parameters.sh + echo "set CORE_PMAX = 1e-6" >> $DB_BASE/parameters.sh + echo "set CORE_IDMIN = 30" >> $DB_BASE/parameters.sh + echo "set CORE_SIZMIN = $cor_cutoff" >> $DB_BASE/parameters.sh + echo "" >> $DB_BASE/parameters.sh + echo "set SHEL_DELTA = 0.5" >> $DB_BASE/parameters.sh + echo "set SHEL_COVMIN = 30" >> $DB_BASE/parameters.sh + echo "set SHEL_PMAX = 1e-6" >> $DB_BASE/parameters.sh + echo "set SHEL_IDMIN = 30" >> $DB_BASE/parameters.sh + echo "set SHEL_SIZMIN = $dbs_cutoff" >> $DB_BASE/parameters.sh + echo "" >> $DB_BASE/parameters.sh + echo "set DUST_DELTA = 0.5" >> $DB_BASE/parameters.sh + echo "set DUST_COVMIN = 30" >> $DB_BASE/parameters.sh + echo "set DUST_PMAX = 1e-6" >> $DB_BASE/parameters.sh + echo "set DUST_IDMIN = 30" >> $DB_BASE/parameters.sh + echo "set DUST_SIZMIN = 10" >> $DB_BASE/parameters.sh + +endif + +source $DB_BASE/parameters.sh + +##set CMIN_COD = 0 +##set FMIN_COD = 0.01 + +# +# temporarily uncompress +# + +set ff = `find $DB_BASE/download -depth 1 -name \*.gz -print` + +if ($#ff != 0) then + Notify "uncompressing $#ff entries" + foreach f ($ff) + gunzip -f $f + end +endif + +# +# convert gbk/embl to fasta +# + +set ff = `find $DB_BASE/download -depth 1 \( -name \*.gbk -or -name \*.embl \) -print` + +Notify "convert $#ff gbk/embl entries to fasta" + +foreach f ($ff) + set nom = `basename $f:r` + set typ = $f:e + $AwkCmd -f $LIB_DIR/$typ.tofasta.awk $f > $DB_BASE/fasta/$nom.fst +end + +# +# get gbk/embl info +# + +Notify "get gbk/embl info for $#ff entries" + +echo "" | awk -v HEADONLY=1 -f $LIB_DIR/gbk.info.awk > db.info.txt # just get header + +foreach f ($ff) + set nom = `basename $f:r` + set typ = $f:e + $AwkCmd -f $LIB_DIR/$typ.oneliner.awk $f |\ + $AwkCmd -f $LIB_DIR/libutil.awk -f $LIB_DIR/$typ.info.awk |\ + egrep -v '^#' >> db.info.txt +end + +# +# get cds info +# + +Notify "get gbk/embl cds for $#ff entries" + +echo "" | awk -v HEADONLY=1 -f $LIB_DIR/gbk.cds_long.awk > db.cds.txt # just get header + +foreach f ($ff) + set nom = `basename $f:r` + set typ = $f:e + $AwkCmd -f $LIB_DIR/$typ.oneliner.awk $f |\ + $AwkCmd -v FASTA=$DB_BASE/fasta/$nom.fst -f $LIB_DIR/libutil.awk \ + -f $LIB_DIR/$typ.cds_long.awk |\ + egrep -v '^#' >> db.cds.txt +end + +# +# get fasta for prots +# + +Notify "get prots" +$AwkCmd -f $LIB_DIR/libutil.awk -f $LIB_DIR/cds2fasta.awk db.cds.txt > db.prot.fst + +# +# get introns +# + +Notify "get gbk/embl introns for $#ff entries" + +echo "" | awk -v HEADONLY=1 -f $LIB_DIR/gbk.intron.awk > db.intron.txt # just get header + +foreach f ($ff) + set nom = `basename $f:r` + set typ = $f:e + $AwkCmd -f $LIB_DIR/$typ.oneliner.awk $f |\ + $AwkCmd -v FASTA=$DB_BASE/fasta/$nom.fst -f $LIB_DIR/libutil.awk \ + -f $LIB_DIR/$typ.intron.awk |\ + egrep -v '^#' >> db.intron.txt +end + +# +# make models +# + +Notify "Making models" + +echo -n "" > db.models.params.txt +echo "CORE_NCDS_CUTOFF <- $CORE_NCDS_CUTOFF" >> db.models.params.txt +echo "CORE_START_ATG_CUTOFF <- $CORE_START_ATG_CUTOFF" >> db.models.params.txt +echo "CORE_START_DFT_CUTOFF <- $CORE_START_DFT_CUTOFF" >> db.models.params.txt +echo "CORE_START_OTH_CUTOFF <- $CORE_START_OTH_CUTOFF" >> db.models.params.txt +echo "CORE_STOP_CUTOFF <- $CORE_STOP_CUTOFF" >> db.models.params.txt +echo "CORE_SPLICE_CUTOFF <- $CORE_SPLICE_CUTOFF" >> db.models.params.txt +echo "SHEL_NCDS_CUTOFF <- $SHEL_NCDS_CUTOFF" >> db.models.params.txt + +$LIB_DIR/make.models.r |& Cat + +GetStatus +OnError then + Error 2 "model parameter too stringent" +endif + +# +# add matrices +# + +cp -f $PROG_DIR/matrices/* models + +# +# make subDBs +# + +if (-e db.core.pat.txt) then + Notify "Making core DB (take some time... please wait)" + $PROG_DIR/subdb/go_subdb.sh db.prot.fst db.core.pat.txt \ + $CORE_DELTA $CORE_COVMIN $CORE_PMAX $CORE_IDMIN $CORE_SIZMIN +endif + +if (-e db.shell.pat.txt) then + Notify "Making shell DB (take some time... please wait)" + $PROG_DIR/subdb/go_subdb.sh db.prot.fst db.shell.pat.txt \ + $SHEL_DELTA $SHEL_COVMIN $SHEL_PMAX $SHEL_IDMIN $SHEL_SIZMIN +endif + +if (-e db.dust.pat.txt) then + Notify "Making dust DB (take some time... please wait)" + $PROG_DIR/subdb/go_subdb.sh db.prot.fst db.dust.pat.txt \ + $DUST_DELTA $DUST_COVMIN $DUST_PMAX $DUST_IDMIN $DUST_SIZMIN +endif + +# +# recompress entries +# + +set ff = `find $DB_BASE/download -depth 1 -type f -print` + +if ($#ff != 0) then + Notify "recompressing $#ff entries" + foreach f ($ff) + gzip -f $f + end +endif + +# compress fasta + +set ff = `find $DB_BASE/fasta -depth 1 -name \*.fst -print` + +if ($#ff != 0) then + Notify "compressing $#ff fasta entries" + foreach f ($ff) + gzip -f $f + end +endif + +# install everything in proper directory + +foreach dir ("core" "shell" "dust") + if (-e $DB_BASE/$dir) \rm -r $DB_BASE/$dir + if ((-d db.$dir.pat.db) && (-e db.$dir.pat.db/Annot.lst)) then + Notify "installing $DB_BASE/$dir" + \mv -f db.$dir.pat.db $DB_BASE/$dir + endif +end + +if (-e $DB_BASE/models) \rm -r $DB_BASE/models +if (-d models) \mv -f models $DB_BASE + +Notify "Done" +exit 0 + diff --git a/detectors/cds/tools/chlorodb/matrices/blosum62.mat b/detectors/cds/tools/chlorodb/matrices/blosum62.mat new file mode 100644 index 0000000..37f3f29 --- /dev/null +++ b/detectors/cds/tools/chlorodb/matrices/blosum62.mat @@ -0,0 +1,29 @@ +# +# blosum62 substitution matrix +# with larger penalty for stops +# + A R N D C Q E G H I L K M F P S T W Y V B Z X * +A 4 -1 -2 -2 0 -1 -1 0 -2 -1 -1 -1 -1 -2 -1 1 0 -3 -2 0 -2 -1 0 -50 +R -1 5 0 -2 -3 1 0 -2 0 -3 -2 2 -1 -3 -2 -1 -1 -3 -2 -3 -1 0 -1 -50 +N -2 0 6 1 -3 0 0 0 1 -3 -3 0 -2 -3 -2 1 0 -4 -2 -3 3 0 -1 -50 +D -2 -2 1 6 -3 0 2 -1 -1 -3 -4 -1 -3 -3 -1 0 -1 -4 -3 -3 4 1 -1 -50 +C 0 -3 -3 -3 9 -3 -4 -3 -3 -1 -1 -3 -1 -2 -3 -1 -1 -2 -2 -1 -3 -3 -2 -50 +Q -1 1 0 0 -3 5 2 -2 0 -3 -2 1 0 -3 -1 0 -1 -2 -1 -2 0 3 -1 -50 +E -1 0 0 2 -4 2 5 -2 0 -3 -3 1 -2 -3 -1 0 -1 -3 -2 -2 1 4 -1 -50 +G 0 -2 0 -1 -3 -2 -2 6 -2 -4 -4 -2 -3 -3 -2 0 -2 -2 -3 -3 -1 -2 -1 -50 +H -2 0 1 -1 -3 0 0 -2 8 -3 -3 -1 -2 -1 -2 -1 -2 -2 2 -3 0 0 -1 -50 +I -1 -3 -3 -3 -1 -3 -3 -4 -3 4 2 -3 1 0 -3 -2 -1 -3 -1 3 -3 -3 -1 -50 +L -1 -2 -3 -4 -1 -2 -3 -4 -3 2 4 -2 2 0 -3 -2 -1 -2 -1 1 -4 -3 -1 -50 +K -1 2 0 -1 -3 1 1 -2 -1 -3 -2 5 -1 -3 -1 0 -1 -3 -2 -2 0 1 -1 -50 +M -1 -1 -2 -3 -1 0 -2 -3 -2 1 2 -1 5 0 -2 -1 -1 -1 -1 1 -3 -1 -1 -50 +F -2 -3 -3 -3 -2 -3 -3 -3 -1 0 0 -3 0 6 -4 -2 -2 1 3 -1 -3 -3 -1 -50 +P -1 -2 -2 -1 -3 -1 -1 -2 -2 -3 -3 -1 -2 -4 7 -1 -1 -4 -3 -2 -2 -1 -2 -50 +S 1 -1 1 0 -1 0 0 0 -1 -2 -2 0 -1 -2 -1 4 1 -3 -2 -2 0 0 0 -50 +T 0 -1 0 -1 -1 -1 -1 -2 -2 -1 -1 -1 -1 -2 -1 1 5 -2 -2 0 -1 -1 0 -50 +W -3 -3 -4 -4 -2 -2 -3 -2 -2 -3 -2 -3 -1 1 -4 -3 -2 11 2 -3 -4 -3 -2 -50 +Y -2 -2 -2 -3 -2 -1 -2 -3 2 -1 -1 -2 -1 3 -3 -2 -2 2 7 -1 -3 -2 -1 -50 +V 0 -3 -3 -3 -1 -2 -2 -3 -3 3 1 -2 1 -1 -2 -2 0 -3 -1 4 -3 -2 -1 -50 +B -2 -1 3 4 -3 0 1 -1 0 -3 -4 0 -3 -3 -2 0 -1 -4 -3 -3 4 1 -1 -50 +Z -1 0 0 1 -3 3 4 -2 0 -3 -3 1 -1 -3 -1 0 -1 -3 -2 -2 1 4 -1 -50 +X 0 -1 -1 -1 -2 -1 -1 -1 -1 -1 -1 -1 -1 -1 -2 0 0 -2 -1 -1 -1 -1 -1 -50 +* -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 -50 1 diff --git a/detectors/cds/tools/chlorodb/subdb/go_subdb.sh b/detectors/cds/tools/chlorodb/subdb/go_subdb.sh new file mode 100755 index 0000000..9365fec --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/go_subdb.sh @@ -0,0 +1,195 @@ +#!/bin/csh -f +# +# usage: go_subdb.sh prot.fst pat.txt [deltalen covmin pmax idmin sizmin] +# usage: prot.fst : proteins fasta file +# usage: pat.txt : text file containing patterns and names for families to extract +# usage: output directory containig subdbs : basename .db +# + +unsetenv ORG_SOURCED + +setenv ORG_HOME `dirname $0`/../../../../.. +source $ORG_HOME/scripts/csh_init.sh + +NeedArg 2 + +set ProtFile = $Argv[1]; Shift +set PatFile = $Argv[1]; Shift + +NeedFile $ProtFile +NeedFile $PatFile + +# +# parameters +# + +set Delta = 0.5 +set Covmin = 30 +set Pmax = 1e-6 +set Idmin = 30 +set Sizmin = 5 + +if ($#Argv > 0) then + set Delta = $Argv[1]; Shift +endif + +if ($#Argv > 0) then + set Covmin = $Argv[1]; Shift +endif + +if ($#Argv > 0) then + set Pmax = $Argv[1]; Shift +endif + +if ($#Argv > 0) then + set Idmin = $Argv[1]; Shift +endif + +if ($#Argv > 0) then + set Sizmin = $Argv[1]; Shift +endif + +# +# output directory +# + +set OutDir = `basename $PatFile:r`.db + +if (-d $OutDir) \rm -r $OutDir +mkdir $OutDir + +set OutLog = `basename $PatFile:r`.log + +echo -n '' > $OutLog + +alias Report 'egrep "^>" \!:1 | wc -l | awk -v P=`basename \!:1` -v H=\!:2 '"'{print H,P,"'$1}'"'"' >> $OutLog' + +# +# remove entries with bad symbols +# + +Notify "cleanup $ProtFile" + +Report $ProtFile "init_size" + +$AwkCmd -f $LIB_DIR/db.filter.sym.awk $ProtFile > P_$$ + +Report $ProtFile "cleanup_size" + +# +# select by name pattern +# + +Notify "select by patterns" + +mkdir D_$$ +mkdir E_$$ +mkdir F_$$ + +set noms = `awk '{print $1}' $PatFile` + +foreach nom ($noms) + set pat = `egrep "^$nom " $PatFile | awk '{print $2}'` + $AwkCmd -f $LIB_DIR/db.filter.pat.awk -v PAT="$pat" P_$$ > D_$$/$nom.fst + set n = `egrep '^>' D_$$/$nom.fst | wc -l` + Notify " pattern : $nom : $n" + Report D_$$/$nom.fst "pattern_filter" + if ($n <= $Sizmin) \rm -f D_$$/$nom.fst +end + +set ok = `ls D_$$ | wc -l` +if ($ok == 0) goto fin + +# +# select by length +# + +Notify "select by length" + +foreach f (D_$$/*.fst) + set nom = `basename $f:r` + $AwkCmd -f $LIB_DIR/db.getlen.awk $f > L_$$ + $LIB_DIR/db.filter.len.r L_$$ $Delta |\ + $AwkCmd '($NF == "TRUE") {print $2}' > M_$$ + $AwkCmd -v FILE=M_$$ -f $LIB_DIR/db.subdb.awk $f > E_$$/$nom.fst + Report E_$$/$nom.fst "length_filter" + set n = `egrep '^>' E_$$/$nom.fst | wc -l` + Notify " length filter : $nom : $n" + if ($n <= $Sizmin) \rm -f E_$$/$nom.fst +end + +set ok = `ls E_$$ | wc -l` +if ($ok == 0) goto fin + + +# +# select by similarity +# + +Notify "select by similarity" + +foreach f (E_$$/*.fst) + set nom = `basename $f:r` + + Notify " blasting $nom" + + makeblastdb -dbtype 'prot' -in $f >>& db.log + blastp -db $f -query $f -outfmt 7 > $f.blast.out + \rm -f $f.p?? + + $AwkCmd -v COVMIN=$Covmin -v PMAX=$Pmax -v IDMIN=$Idmin \ + -f $LIB_DIR/db.blastlink.awk $f.blast.out |\ + $AwkCmd -f $LIB_DIR/db.todl.awk > G_$$ + + ($LIB_DIR/db.cc.r G_$$ > $f.cc.txt) >>& db.log + + awk -v NAME=$nom -f $LIB_DIR/db.reportcc.awk $f.cc.txt >> $OutLog + + $AwkCmd -f $LIB_DIR/db.selcc.awk $f.cc.txt > S_$$ + $AwkCmd -v FILE=S_$$ -f $LIB_DIR/db.subdb.awk $f > F_$$/$nom.fst + + Report F_$$/$nom.fst "similarity_filter" + + set n = `egrep '^>' F_$$/$nom.fst | wc -l` + Notify " blast filter : $nom : $n" + if ($n <= $Sizmin) \rm -f F_$$/$nom.fst + +end + +set ok = `ls D_$$ | wc -l` +if ($ok == 0) goto fin + +# +# annotations +# + +echo -n "" > J_$$ + +foreach f (F_$$/*.fst) + $AwkCmd -f $LIB_DIR/db.annot.awk $f >> J_$$ +end + +awk '(NF >= 3) {print $1, $NF}' $PatFile | sort > A_$$ +sort J_$$ | egrep -v '^ *$' > B_$$ +join A_$$ B_$$ > F_$$/Annot.lst + +# +# copy files +# + +set n = `ls F_$$/* | wc -l` +Notify "copy $n files to $OutDir" + +\mv -f F_$$/* $OutDir + +# +# end +# + +fin: +Notify "output directory : $OutDir" + +\rm -r ?_$$ + + +exit 0 diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.annot.awk b/detectors/cds/tools/chlorodb/subdb/lib/db.annot.awk new file mode 100644 index 0000000..f000eca --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.annot.awk @@ -0,0 +1,39 @@ +# + +/^>/ { + N++ + na = split($1, a, "@") + if (a[na-1] > NEXMAX) NEXMAX = a[na-1] + NEX[a[na-1]]++ + ANNOT[$NF]++ +} + +END { + na = split(FILENAME, a, "/") + na = split(a[na], a, "\\.") + printf("%s %d ", a[1], N) + s = "" + for (i = 1 ; i <= NEXMAX ; i ++) { + if (NEX[i] != 0) + s = s "" i ":" NEX[i] "_" + } + gsub("_+$", "", s) + printf("%s ", s) + + s = (NEXMAX == 1) ? "MONEX" : "POLYEX" + printf("%s ", s) + + nmax = 0 + amax = "none" + for (e in ANNOT) { + if (ANNOT[e] > nmax) { + nmax = ANNOT[e] + amax = e + } + } + print amax + +} + + + diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.blastlink.awk b/detectors/cds/tools/chlorodb/subdb/lib/db.blastlink.awk new file mode 100644 index 0000000..0d9eb17 --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.blastlink.awk @@ -0,0 +1,48 @@ +# + +function min(x, y) { + return ((x < y) ? x : y) +} + +BEGIN { + if (COVMIN == "") COVMIN = 50 + if (PMAX == "") PMAX = 1e-6 + if (IDMIN == "") IDMIN = 30 +} + +/^#/ { + hitnum = 0; + next; +} + +{ + if ($1 == $2) next + + hitnum++; + + na = split($1, a, "@"); + if (na < 2) { + print "query file not properly formatted" > "/dev/stderr" + exit(1); + } + len1 = a[na]; + + na = split($2, a, "@"); + if (na < 2) { + print "bank file not properly formatted" > "/dev/stderr" + exit(1); + } + len2 = a[na]; + + id = $3 + 0.0; + ali = $4; + + covmin = ali * 100. / min(len1, len2); + + proba = $11 + 0.0; + + if ((covmin > COVMIN) && ((proba < PMAX) || (proba == 0)) && (id > IDMIN)) { + print $1, $2, hitnum, id, covmin, proba, ali, len1, len2; + } +} + diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.cc.r b/detectors/cds/tools/chlorodb/subdb/lib/db.cc.r new file mode 100755 index 0000000..2a69b8e --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.cc.r @@ -0,0 +1,18 @@ +#!/usr/bin/env Rscript +# + +require(igraph, warn.conflicts=F) + +args <- commandArgs(T) +path <- if(length(args) > 0) args[1] else 'graph.dl' + +g <- read.graph(path, format='dl') + +cc <- clusters(g) + +res <- cbind(V(g)$name, membership(cc)) + +write.table(res, quote=FALSE, row.names=FALSE, col.names=FALSE) + +quit(save="no") + diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.filter.len.r b/detectors/cds/tools/chlorodb/subdb/lib/db.filter.len.r new file mode 100755 index 0000000..13cb5a2 --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.filter.len.r @@ -0,0 +1,19 @@ +#!/usr/bin/env Rscript +# + +args <- commandArgs(T) +path <- if(length(args) > 0) args[1] else 'len.txt' +delta <- if(length(args) > 1) args[2] else 0.5 + +tab <- read.table(path, header=T) + +lmed <- median(tab$len) + +dlen <- lmed * as.numeric(delta) + +tab$ok <- (abs(tab$len-lmed)/lmed) <= delta + +write.table(tab, quote=F) + +quit(save='no') + diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.filter.pat.awk b/detectors/cds/tools/chlorodb/subdb/lib/db.filter.pat.awk new file mode 100644 index 0000000..c14baf4 --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.filter.pat.awk @@ -0,0 +1,10 @@ +# + +/^>/ { + split($1, a, "@") + ok = a[3] ~ PAT +} + +ok { + print $0 +} diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.filter.sym.awk b/detectors/cds/tools/chlorodb/subdb/lib/db.filter.sym.awk new file mode 100644 index 0000000..9ae9570 --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.filter.sym.awk @@ -0,0 +1,30 @@ +# +# +# + +function Check(seq) { + if (seq == "") return 0 + gsub("[ACDEFGHIKLMNPQRSTVWXY\n]+", "", seq) + return (length(seq) == 0) +} + +/^>/ { + if (Check(Seq)) { + print Name + printf("%s", Seq) + } + Name = $0 + Seq = "" + next +} + +{ + Seq = Seq "" $0 "\n" +} + +END { + if (Check(Seq)) { + print Name + printf("%s", Seq) + } +} diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.getlen.awk b/detectors/cds/tools/chlorodb/subdb/lib/db.getlen.awk new file mode 100644 index 0000000..117c90b --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.getlen.awk @@ -0,0 +1,10 @@ +# +BEGIN { + print "id len" +} + +/^>/ { + na = split($1, a, "@") + print substr($1, 2), a[na] +} + diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.reportcc.awk b/detectors/cds/tools/chlorodb/subdb/lib/db.reportcc.awk new file mode 100644 index 0000000..0acb7f9 --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.reportcc.awk @@ -0,0 +1,15 @@ +# +# + +{ + cnt[$NF]++ +} + +END { + n = asort(cnt) + printf("cc_size %s", NAME) + for (i = n ; i >= 1 ; i--) + printf(" %d", cnt[i]) + print "" +} + diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.selcc.awk b/detectors/cds/tools/chlorodb/subdb/lib/db.selcc.awk new file mode 100644 index 0000000..a621519 --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.selcc.awk @@ -0,0 +1,19 @@ +# + +{ + N[$NF]++ + E[$NF, N[$NF]] = $1 +} + +END { + cmax = 1 + nmax = N[1] + for (i in N) { + if (N[i] > nmax) { + nmax = N[i] + cmax = i + } + } + for (i = 1 ; i <= nmax ; i++) + print E[cmax, i] +} diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.subdb.awk b/detectors/cds/tools/chlorodb/subdb/lib/db.subdb.awk new file mode 100644 index 0000000..472b4f3 --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.subdb.awk @@ -0,0 +1,17 @@ +# + +BEGIN { + if (FILE == "") FILE = "db.sel.txt" + while (getline < FILE) + INC[$1] = $1 + close(FILE) +} + +/^>/ { + name = substr($1, 2) + ok = name in INC +} + +ok { + print $0 +} diff --git a/detectors/cds/tools/chlorodb/subdb/lib/db.todl.awk b/detectors/cds/tools/chlorodb/subdb/lib/db.todl.awk new file mode 100644 index 0000000..65c9a07 --- /dev/null +++ b/detectors/cds/tools/chlorodb/subdb/lib/db.todl.awk @@ -0,0 +1,21 @@ +# + +{ + node[$1]++ + node[$2]++ + link[++M] = $1 " " $2 +} + + +END { + for (n in node) + N++ + print "DL n=" N + print "format = edgelist1" + print "labels embedded:" + print "data:" + for (i = 1 ; i <= M ; i++) + print link[i] +} + + diff --git a/detectors/cds/tools/compare/go_compare.sh b/detectors/cds/tools/compare/go_compare.sh index 1305598..9cca5c2 100755 --- a/detectors/cds/tools/compare/go_compare.sh +++ b/detectors/cds/tools/compare/go_compare.sh @@ -47,8 +47,8 @@ $AwkCmd -f $LIB_DIR/libutil.awk -f $LIB_DIR/$PrdType.cds_short.awk > P_$$ Notify "compare bank to predictions" -$AwkCmd -f $LIB_DIR/libnws.awk \ - -f $LIB_DIR/compareCds.awk \ +$AwkCmd -f $LIB_DIR/libnws.awk \ + -f $LIB_DIR/compare.cds.awk \ R_$$ P_$$ > S_$$ # base statistics diff --git a/detectors/cds/tools/compare/go_summarize.sh b/detectors/cds/tools/compare/go_summarize.sh index d6f3ce7..04ac7c5 100755 --- a/detectors/cds/tools/compare/go_summarize.sh +++ b/detectors/cds/tools/compare/go_summarize.sh @@ -15,6 +15,8 @@ NeedArg 1 egrep '^#|^MATCH' $* | awk -f $LIB_DIR/summary.cmp.awk > compare.txt +Notify "text file: compare.txt" + $LIB_DIR/summarize_cmp.r diff --git a/detectors/cds/tools/lib/cds2fasta.awk b/detectors/cds/tools/lib/cds2fasta.awk new file mode 100644 index 0000000..41436e2 --- /dev/null +++ b/detectors/cds/tools/lib/cds2fasta.awk @@ -0,0 +1,19 @@ +# +# get fasta sequence from cds list +# +# [-v FIELD=13] CDS sequence +# [-v FIELD=14] Prot Sequence +# + +BEGIN { + if (CHARPERLINE == "") CHARPERLINE = 50 + if (FIELD == "") FIELD = 14 +} + +/^#/ { next } + +{ + name = $1 "@" $2 "@" $3 "@" $5 "@" $6 "@" $7 "@" $8 "@" int($9/3) + comment = $NF + PrintFasta($FIELD, name " " comment) +} diff --git a/detectors/cds/tools/lib/compareCds.awk b/detectors/cds/tools/lib/compare.cds.awk similarity index 100% rename from detectors/cds/tools/lib/compareCds.awk rename to detectors/cds/tools/lib/compare.cds.awk diff --git a/detectors/cds/tools/lib/embl.cds_long.awk b/detectors/cds/tools/lib/embl.cds_long.awk new file mode 100644 index 0000000..48fb098 --- /dev/null +++ b/detectors/cds/tools/lib/embl.cds_long.awk @@ -0,0 +1,97 @@ +# +# get cds features from embl (long version) +# +# -v FASTA + +# @include lib.embl.awk + + +BEGIN { + print "#locus locustag genefam gene from to strand nexon length status start stop dnaseq protseq product" + + if (HEADONLY != "") exit(0) + + if (MAXSPAN == "") MAXSPAN = 10000 + + if (FASTA == "") Error("No FASTA file specified", 1) + + if (! TestPath(FASTA)) Error("Fasta file: '" FASTA "' not found", 1) + + Seq = tolower(ReadFasta(FASTA)) +} + +/^ID / { + locus = $2 + gsub(";", "", locus) + incds = 0 + next +} + +/^FT CDS/ { + revstrand = match($3, "^complement") + s = substr($0, 22) + gsub("^complement", "", s) + ok = ! match(s, "complement|order") + nexon = Nexons(s) + SpanLocation(s, sloc) + spanlen = sloc[2] - sloc[1] + 1 + len = LenLocation(s) + ok = ok && (len < MAXSPAN) + cdsseq = ok ? SeqLocation(Seq, s, revstrand) : "XXX" + cstart = substr(cdsseq, 1,3) + cstop = substr(cdsseq, length(cdsseq)-2) + + gene = "none" + locustag = "none" + product = "none" + translation = "X" + incds = 1 + next +} + +(incds && /^FT [^ ]/) { + print locus, locustag, GeneFamily(gene), gene, sloc[1], sloc[2], (revstrand ? "R" : "D"), + nexon, len, (ok ? "Ok" : "Error"), cstart, cstop, cdsseq, translation, product + incds = 0 + next +} + +/^FT \/gene=/ { + split($0, a, "=") + gene = a[2] + gsub("^[^a-z,A-Z]+", "", gene) + gsub("\"", "", gene) + gsub(" ", "_", gene) + next +} + +/^FT \/locus_tag=/ { + split($0, a, "=") + locustag = a[2] + gsub("\"", "", locustag) + gsub(" ", "_", locustag) + next +} + +/^FT \/product=/ { + split($0, a, "=") + product = a[2] + gsub("\"", "", product) + gsub(" ", "_", product) + next +} + +/^FT \/translation=/ { + split($0, a, "=") + translation = a[2] + gsub("\"", "", translation) + gsub(" ", "", translation) + next +} + +END { + if (incds) { + print locus, locustag, GeneFamily(gene), gene, sloc[1], sloc[2], (revstrand ? "R" : "D"), + nexon, len, (ok ? "Ok" : "Error"), cstart, cstop, cdsseq, translation, product + } +} diff --git a/detectors/cds/tools/lib/embl.info.awk b/detectors/cds/tools/lib/embl.info.awk new file mode 100644 index 0000000..dda6cc2 --- /dev/null +++ b/detectors/cds/tools/lib/embl.info.awk @@ -0,0 +1,97 @@ +# +# get feature info from embl +# + +# @include libgbk.awk + +function GC(s, _local_, i, len) { + s = toupper(s) + len = length(s) + gsub("G|C", "", s) + return ((len - length(s)) * 100 / (len ? len : 1)) +} + +# +# rules +# + +BEGIN { + print "#locus orga len oklen gc nbCds nbCds_int0 nbCds_int1 nbCds_intsup1 perCds_noex meanCdsSize nbtRNA nbrRNA nboRNA" +} + +/^ID/ { + locus = $2 + gsub(";", "", locus) + next +} + +/^OS/ { + orga = substr($0, 6) + gsub(" ", "_", orga) + next +} + +/^FT source/ { + GetLoc($3, loc); + len = loc[2]; + next +} + +/^FT CDS/ { + meanCds = meanCds * nbCds + LenLocation($3) + nbCds++ + meanCds /= nbCds + n = Nexons($3) + if (n > 3) n = 3 + nbCdx[n]++ + next +} + +/^FT tRNA/ { + nbTrna++ + next +} + +/^FT rRNA/ { + nbRrna++ + next +} + +/^FT mRNA/ { + next +} + +/^FT .*RNA/ { + nbOrna++ + next +} + +/^SQ / { + inseq = 1 + seq = "" + next +} + +inseq && /^ / { + s = $0 + gsub("[0-9]+", "", s) + gsub(" ", "", s) + seq = seq "" s + next +} + +/^\/\// { + oklen = (len == length(seq) ? "ok" : "wrong") + gc = GC(seq) + print locus, orga, len, oklen, gc, nbCds+0, nbCdx[1]+0, \ + nbCdx[2]+0, nbCdx[3]+0, (nbCdx[1]+0)*100/Max(1, nbCds+0), \ + meanCds+0, nbTrna+0, nbRrna+0, nbOrna+0 + nbCds = nbTrna = nbRrna = nbOrna = len = inseq = meanCds = 0 + delete nbCdx + orga = locus = "?" +} + + + + + diff --git a/detectors/cds/tools/lib/embl.intron.awk b/detectors/cds/tools/lib/embl.intron.awk new file mode 100644 index 0000000..83dabb0 --- /dev/null +++ b/detectors/cds/tools/lib/embl.intron.awk @@ -0,0 +1,97 @@ +# +# get intron features from embl +# + +# @include libembl.awk + +BEGIN { + print "#locus locustag genefam gene from to strand intron_num intron_nb acceptor-donor status" + + if (HEADONLY != "") exit(0) + + if (FASTA == "") Error("No FASTA file specified", 1) + + if (! TestPath(FASTA)) Error("Fasta file: '" FASTA "' not found", 1) + + Seq = tolower(ReadFasta(FASTA)) +} + +/^ID / { + locus = $2 + gsub(";", "", locus) + next +} + +/^FT CDS/ { + revstrand = match($3, "^complement") + s = substr($0, 22) + gsub("^complement", "", s) + ok = ! match(s, "complement|order") + if (! ok) next + + na = ParseLocation(s, locs) + if (na < 2) next + + delete SINfo + Ninfo = 0 + + val = locs[1][1] + for (i = 2 ; i <= na ; i++) { + if (locs[i][1] < val) ok = 0 + val = locs[i][1] + } + if (! ok) next + + val = locs[1][2] + for (i = 2 ; i <= na ; i++) { + if (locs[i][2] < val) ok = 0 + val = locs[i][2] + } + if (! ok) next + + from = locs[1][2] + 1 + for (i = 2 ; i <= na ; i++) { + to = locs[i][1] - 1 + inseq = SeqLocation(Seq, (from - 4) ".." (to + 4), revstrand) + SINfo[++Ninfo] = from " " to " " (revstrand ? "R" : "D") " "\ + (revstrand ? na-i+1 : i-1) " " na-1 " "\ + substr(inseq, 1,4) "."\ + substr(inseq, 5,6) "-"\ + substr(inseq, length(inseq)-9, 6) "."\ + substr(inseq, length(inseq)-3, 4) " "\ + "ok" + from = locs[i][2] + 1 + } + + gene = "none" + locustag = "none" + next +} + +/^FT \/gene=/ { + split($0, a, "=") + gene = a[2] + gsub("^[^a-z,A-Z]+", "", gene) + gsub("\"", "", gene) + gsub(" ", "_", gene) + next +} + +/^FT \/locus_tag=/ { + split($0, a, "=") + locustag = a[2] + gsub("\"", "", locustag) + gsub(" ", "_", locustag) + next +} + +/^FT \/translation=/ { + for (i = 1 ; i <= Ninfo ; i++) + print locus, locustag, GeneFamily(gene), gene, SINfo[i] + Ninfo = 0 + next +} + +/^\/\// { + locus = "?" +} diff --git a/detectors/cds/tools/lib/embl.tofasta.awk b/detectors/cds/tools/lib/embl.tofasta.awk new file mode 100644 index 0000000..0485ffb --- /dev/null +++ b/detectors/cds/tools/lib/embl.tofasta.awk @@ -0,0 +1,36 @@ +# +# get fasta sequence from embl +# + +/^ID / { + locus = $2 + gsub(";", "", locus) + next +} + +/^SQ / { + inseq = 1 + nln = 0 + delete seq + next +} + +/^\/\// { + inseq = 0 + print ">" locus + for (i = 1 ; i <= nln ; i++) + print seq[i] + next +} + +inseq { + s = $0 + gsub(" ", "", s) + gsub("[0-9]+", "", s) + seq[++nln] = s + next +} + + + + diff --git a/detectors/cds/tools/lib/gbk.cds_long.awk b/detectors/cds/tools/lib/gbk.cds_long.awk new file mode 100644 index 0000000..e3f1c7a --- /dev/null +++ b/detectors/cds/tools/lib/gbk.cds_long.awk @@ -0,0 +1,99 @@ +# +# get cds features from genbank (long version) +# +# -v FASTA + +# @include libgbk.awk + +BEGIN { + print "#locus locustag genefam gene from to strand nexon length status start stop dnaseq protseq product" + + if (HEADONLY != "") exit(0) + + if (MAXSPAN == "") MAXSPAN = 10000 + + if (FASTA == "") Error("No FASTA file specified", 1) + + if (! TestPath(FASTA)) Error("Fasta file: '" FASTA "' not found", 1) + + Seq = tolower(ReadFasta(FASTA)) +} + +/^LOCUS/ { + locus = $2 + incds = 0 + next +} + +/^ CDS/ { + revstrand = match($2, "^complement") + s = substr($0, 22) + gsub("^complement", "", s) + ok = ! match(s, "complement|order") + nexon = Nexons(s) + SpanLocation(s, sloc) + spanlen = sloc[2] - sloc[1] + 1 + len = LenLocation(s) + ok = ok && (len < MAXSPAN) + cdsseq = ok ? SeqLocation(Seq, s, revstrand) : "XXX" + cstart = substr(cdsseq, 1,3) + cstop = substr(cdsseq, length(cdsseq)-2) + + gene = "none" + locustag = "none" + product = "none" + translation = "X" + incds = 1 + next +} + +(incds && /^ [^ ]/) { + print locus, locustag, GeneFamily(gene), gene, sloc[1], sloc[2], (revstrand ? "R" : "D"), + nexon, len, (ok ? "Ok" : "Error"), cstart, cstop, cdsseq, translation, product + incds = 0 + next +} + +/^ \/gene=/ { + split($0, a, "=") + gene = a[2] + gsub("^[^a-z,A-Z]+", "", gene) + gsub("\"", "", gene) + gsub(" ", "_", gene) + next +} + +/^ \/locus_tag=/ { + split($0, a, "=") + locustag = a[2] + gsub("\"", "", locustag) + gsub(" ", "_", locustag) + next +} + +/^ \/product=/ { + split($0, a, "=") + product = a[2] + gsub("\"", "", product) + gsub(" ", "_", product) + next +} + +/^ \/translation=/ { + split($0, a, "=") + translation = a[2] + gsub("\"", "", translation) + gsub(" ", "", translation) + next +} + +/^\/\// { + locus = "?" +} + +END { + if (incds) { + print locus, locustag, GeneFamily(gene), gene, sloc[1], sloc[2], (revstrand ? "R" : "D"), + nexon, len, (ok ? "Ok" : "Error"), cstart, cstop, cdsseq, translation, product + } +} diff --git a/detectors/cds/tools/lib/gbk.info.awk b/detectors/cds/tools/lib/gbk.info.awk new file mode 100644 index 0000000..3fdadc3 --- /dev/null +++ b/detectors/cds/tools/lib/gbk.info.awk @@ -0,0 +1,97 @@ +# +# get feature info from genbank +# + +# @include libgbk.awk + +function GC(s, _local_, i, len) { + s = toupper(s) + len = length(s) + gsub("G|C", "", s) + return ((len - length(s)) * 100 / len) +} + +# +# rules +# + +BEGIN { + print "#locus orga len oklen gc nbCds nbCds_int0 nbCds_int1 nbCds_intsup1 perCds_noex meanCdsSize nbtRNA nbrRNA nboRNA" +} + +/^LOCUS/ { + locus = $2 + next +} + +/^ ORGANISM/ { + orga = substr($0, 13) + split(orga, a, ";") + orga = a[1] + gsub(" ", "_", orga) + next +} + +/^ source/ { + GetLoc($2, loc); + len = loc[2]; + next +} + +/^ CDS/ { + meanCds = meanCds * nbCds + LenLocation($2) + nbCds++ + meanCds /= nbCds + n = Nexons($2) + if (n > 3) n = 3 + nbCdx[n]++ + next +} + +/^ tRNA/ { + nbTrna++ + next +} + +/^ rRNA/ { + nbRrna++ + next +} + +/^ mRNA/ { + next +} + +/^ .*RNA/ { + nbOrna++ + next +} + +/^ORIGIN/ { + inseq = 1 + seq = "" + next +} + +inseq && /^ +[1-9][0-9]*/ { + s = substr($0, 11) + gsub(" ", "", s) + seq = seq "" s + next +} + +/^\/\// { + oklen = (len == length(seq) ? "ok" : "wrong") + gc = GC(seq) + print locus, orga, len, oklen, gc, nbCds+0, nbCdx[1]+0, \ + nbCdx[2]+0, nbCdx[3]+0, (nbCdx[1]+0)*100/Max(1, nbCds+0), \ + meanCds+0, nbTrna+0, nbRrna+0, nbOrna+0 + nbCds = nbTrna = nbRrna = nbOrna = len = inseq = meanCds = 0 + delete nbCdx + orga = locus = "?" +} + + + + + diff --git a/detectors/cds/tools/lib/gbk.intron.awk b/detectors/cds/tools/lib/gbk.intron.awk new file mode 100644 index 0000000..32aa5be --- /dev/null +++ b/detectors/cds/tools/lib/gbk.intron.awk @@ -0,0 +1,96 @@ +# +# get intron features from genbank +# + +# @include libgbk.awk + +BEGIN { + print "#locus locustag genefam gene from to strand intron_num intron_nb acceptor-donor status" + + if (HEADONLY != "") exit(0) + + if (FASTA == "") Error("No FASTA file specified", 1) + + if (! TestPath(FASTA)) Error("Fasta file: '" FASTA "' not found", 1) + + Seq = tolower(ReadFasta(FASTA)) +} + +/^LOCUS/ { + locus = $2 + next +} + +/^ CDS/ { + revstrand = match($2, "^complement") + s = substr($0, 22) + gsub("^complement", "", s) + ok = ! match(s, "complement|order") + if (! ok) next + + na = ParseLocation(s, locs) + if (na < 2) next + + delete SINfo + Ninfo = 0 + + val = locs[1][1] + for (i = 2 ; i <= na ; i++) { + if (locs[i][1] < val) ok = 0 + val = locs[i][1] + } + if (! ok) next + + val = locs[1][2] + for (i = 2 ; i <= na ; i++) { + if (locs[i][2] < val) ok = 0 + val = locs[i][2] + } + if (! ok) next + + from = locs[1][2] + 1 + for (i = 2 ; i <= na ; i++) { + to = locs[i][1] - 1 + inseq = SeqLocation(Seq, (from - 4) ".." (to + 4), revstrand) + SINfo[++Ninfo] = from " " to " " (revstrand ? "R" : "D") " "\ + (revstrand ? na-i+1 : i-1) " " na-1 " "\ + substr(inseq, 1,4) "."\ + substr(inseq, 5,6) "-"\ + substr(inseq, length(inseq)-9, 6) "."\ + substr(inseq, length(inseq)-3, 4) " "\ + "ok" + from = locs[i][2] + 1 + } + + gene = "none" + locustag = "none" + next +} + +/^ \/gene=/ { + split($0, a, "=") + gene = a[2] + gsub("^[^a-z,A-Z]+", "", gene) + gsub("\"", "", gene) + gsub(" ", "_", gene) + next +} + +/^ \/locus_tag=/ { + split($0, a, "=") + locustag = a[2] + gsub("\"", "", locustag) + gsub(" ", "_", locustag) + next +} + +/^ \/translation=/ { + for (i = 1 ; i <= Ninfo ; i++) + print locus, locustag, GeneFamily(gene), gene, SINfo[i] + Ninfo = 0 + next +} + +/^\/\// { + locus = "?" +} diff --git a/detectors/cds/tools/lib/gbk.tofasta.awk b/detectors/cds/tools/lib/gbk.tofasta.awk new file mode 100644 index 0000000..195ebc5 --- /dev/null +++ b/detectors/cds/tools/lib/gbk.tofasta.awk @@ -0,0 +1,32 @@ +# +# get fasta sequence from genbank +# + +/^LOCUS/ { + locus = $2 + next +} + +/^ORIGIN/ { + inseq = 1 + nln = 0 + delete seq +} + +inseq && /^ +[1-9][0-9]*/ { + s = substr($0, 11) + gsub(" ", "", s) + seq[++nln] = s + next +} + +/^\/\// { + print ">" locus + for (i = 1 ; i <= nln ; i++) + print seq[i] +} + + + + + diff --git a/detectors/cds/tools/lib/install.rpackages.r b/detectors/cds/tools/lib/install.rpackages.r new file mode 100755 index 0000000..c6f9778 --- /dev/null +++ b/detectors/cds/tools/lib/install.rpackages.r @@ -0,0 +1,31 @@ +#!/usr/bin/env Rscript +# +# check and install required packages +# + +out <- function(...) { + cat(paste0('+ ', ..., '\n'), file=stderr()) +} + +installed <- function(package) { + package %in% rownames(installed.packages()) +} + +check <- function(package, repos="http://cran.univ-lyon1.fr") { + if (installed(package)) { + out("R package ", package, " installed") + } else { + out("Installing R package ", package, " from ", repos) + install.packages(package, repos=repos) + } + invisible(installed(package)) +} + +check("grid") +check("gridExtra") +check("vcd") +check("plotrix") +check("igraph") + +quit(save='no', status=0) + diff --git a/detectors/cds/tools/lib/make.models.r b/detectors/cds/tools/lib/make.models.r new file mode 100755 index 0000000..b2e0a74 --- /dev/null +++ b/detectors/cds/tools/lib/make.models.r @@ -0,0 +1,224 @@ +#!/usr/bin/env Rscript +# +# compute start, stop, splice-junctions models for core DB +# +# source("make.models.r") +# + +LIB_DIR <- Sys.getenv("LIB_DIR") +if (LIB_DIR == "") LIB_DIR = "." + +source(paste0(LIB_DIR, "/util.base.r")) +source(paste0(LIB_DIR, "/util.cons.r")) +source(paste0(LIB_DIR, "/util.modelio.r")) + +# ------------------------------- +# parameters +# ------------------------------- + +# core cutoffs + +source("db.models.params.txt") + +# ------------------------------- +# genome infos +# ------------------------------- + +notify("loading info table") +chromo <- read.table("db.info.txt", com="", head=T, stringsAsFactors=F) + +# ------------------------------- +# CDS +# ------------------------------- + +notify("loading cds table") +cds <- read.table("db.cds.txt", com="", header=T, stringsAsFactors=F) + +cds$start <- as.factor(cds$start) +cds$stop <- as.factor(cds$stop) + +cds <- cds[cds$status=="Ok",] +cds <- cds[cds$genefam!="none",] + +cds$categ <- "dust" + +x <- sort(table(cds$genefam), dec=T) +ok <- names(x[x >= CORE_NCDS_CUTOFF]) + +cds$categ[cds$genefam %in% ok] <- "core" + +x <- x[! names(x) %in% ok] +ok <- names(x[x >= SHEL_NCDS_CUTOFF]) + +cds$categ[cds$genefam %in% ok] <- "shell" + +# + +cds.ori <- cds + +cds.lst <- split(cds.ori, cds.ori$categ) + +# +# write out families +# + +# patterns & names + +invisible(lapply(cds.lst, function(cds) { + + x <- sort(table(cds$genefam), decreasing=T) + tab <- paste0("^", names(x), "$") + names(tab) <- names(x) + + y <- sapply(split(cds$gene, cds$genefam), function(g) { + head(names(sort(table(g), decreasing=T)), 1) + }) + + tab <- cbind(tab, y[names(x)]) + + categ <- unique(cds$categ) + f <- paste0("db.", categ, ".pat.txt") + notify("writing patterns for", categ, ":", f) + write.table(tab, file=f, quote=F, col.names=F, row.names=T) +})) + +# ------------------------------- +# Start models (core only) +# ------------------------------- + +if (! "core" %in% names(cds.lst)) { + notify("*** no gene found in core") + notify("*** please change parameters") + quit(save='no', status=1) +} + +cds <- cds.lst[["core"]] + +# +# start by genes +# + +tab <- split(cds$start, cds$genefam) + +fatg <- sapply(tab, function(x) table(x)["atg"]/length(x)*100) +names(fatg) <- names(tab) + +start.dft <- names(which(fatg >= CORE_START_ATG_CUTOFF)) +start.spc <- names(which(fatg < CORE_START_ATG_CUTOFF)) + +tab <- cds[cds$genefam %in% start.dft,] +tab <- table(tab$start) + +# default model + +x <- sort(tab[tab>=CORE_START_DFT_CUTOFF], decreasing=T) +write.model.start(x, "default") + +# gene specific models + +invisible(sapply(start.spc, function(g) { + x <- cds[cds$genefam == g,] + tx <- table(x$start) + tx <- sort(tx[tx>=CORE_START_OTH_CUTOFF], decreasing=T) + write.model.start(tx, g) +})) + +# ------------------------------- +# Stop models (core only) +# ------------------------------- + +# write default stop model + +tab <- table(cds$stop) +x <- sort(tab[tab>=CORE_STOP_CUTOFF], decreasing=T) +write.model.stop(x, "default") + +# ------------------------------- +# splice junctions +# ------------------------------- + +notify("loading intron table") +intron <- read.table("db.intron.txt", com="", header=T, stringsAsFactors=F) + +# remove invalid sequences + +intron$seq <- gsub("\\.|-", "", intron$acceptor.donor) + +lseq <- nchar(gsub("[^acgt]", "", intron$seq)) + +intron <- intron[lseq == 20,] + +# remove genes out of core + +intron <- intron[intron$genefam %in% cds$genefam,] + +# acceptors / donors + +intron$acc <- substr(intron$seq, 5, 6) +intron$don <- substr(intron$seq, 15, 16) + +# consensus + +cons.px <- cons.build(intron$acceptor.donor) +cons.px <- cons.px[,! is.nan(colSums(cons.px))] + +seq.px <- sapply(intron$acceptor.donor, function(s) gsub("[^acgt]", "", s)) + +conf.px <- cons.confusion(cons.px, seq.px) + +sfam <- split(conf.px$l2scor, intron$genefam) +sfam <- sfam[order(sapply(sfam, median))] + +# extract splice exceptions + +name.bad <- names(which(sapply(sfam, median) < 0)) +name.spc <- names(which(sapply(sfam[name.bad], length) >= CORE_SPLICE_CUTOFF)) +name.ok <- setdiff(unique(intron$genefam), name.bad) +name.bad <- setdiff(name.bad, name.spc) +name.list <- c(sapply(name.spc, function(x) x), list(default=name.ok)) + +cons <- lapply(name.list, function(x) cons.build(intron[intron$genefam %in% x, "acceptor.donor"])) + +# write junction models + +invisible(sapply(names(cons), function(n) write.model.splice3(cons[[n]], n))) +invisible(sapply(names(cons), function(n) write.model.splice5(cons[[n]], n))) + +# use uniform model for bad guys + +invisible(sapply(name.bad, function(n) write.unif.splice(3, n))) +invisible(sapply(name.bad, function(n) write.unif.splice(5, n))) + +invisible(write.unif.splice('', "none")) + +# ------------------------------- +# keep data for plotting +# ------------------------------- + +DB <- list() + +params <- list() + +params$CORE_NCDS_CUTOFF <- CORE_NCDS_CUTOFF +params$CORE_START_ATG_CUTOFF <- CORE_START_ATG_CUTOFF +params$CORE_START_DFT_CUTOFF <- CORE_START_DFT_CUTOFF +params$CORE_START_OTH_CUTOFF <- CORE_START_OTH_CUTOFF +params$CORE_STOP_CUTOFF <- CORE_STOP_CUTOFF +params$CORE_SPLICE_CUTOFF <- CORE_SPLICE_CUTOFF + +params$SHEL_NCDS_CUTOFF <- SHEL_NCDS_CUTOFF + +DB$params <- params +DB$chromo <- chromo +DB$cds.lst <- cds.lst +DB$intron <- intron +DB$cons <- cons + +notify("saving db.data.Rdata") +save(DB, file="db.data.Rdata") + +# ------------------------------- +# end +# ------------------------------- + +quit(save='no') diff --git a/detectors/cds/tools/lib/plot.models.r b/detectors/cds/tools/lib/plot.models.r new file mode 100755 index 0000000..223b091 --- /dev/null +++ b/detectors/cds/tools/lib/plot.models.r @@ -0,0 +1,424 @@ +#!/usr/bin/env Rscript +# +# plots models previously computed by make.models.r +# +# source("plot.models.r") +# + +require(vcd) +require(plotrix) + +LIBDIR <- Sys.getenv("LIB_DIR") +if (LIBDIR == "") LIBDIR = "." + +source(paste0(LIBDIR, "/util.base.r")) +source(paste0(LIBDIR, "/util.plot.r")) +source(paste0(LIBDIR, "/util.cons.r")) +source(paste0(LIBDIR, "/util.grid.r")) + +# ------------------------------- +# setup +# ------------------------------- + +OUT.DEV <- TRUE +OUT.TYPE <- "pdf" +OUT.FILE <- "models" + +if (OUT.DEV) uplot.init.dev(OUT.FILE, OUT.TYPE) + +# ------------------------------- +# Load data +# ------------------------------- + +notify("loading DB data") +load("db.data.Rdata") + +params <- DB$params +chromo <- DB$chromo +cds.lst <- DB$cds.lst +intron <- DB$intron +cons <- DB$cons + +# ------------------------------- +# Genomes infos +# ------------------------------- + +grd.titlepage("Species") +grd.textpage(lineno=1, "# org: ", nrow(chromo)) + +# +# general stats +# + +grd.hist(chromo, "len", main="Histogram of chromosome length") +grd.hist(chromo, "gc", pos.quant=c(0.75, 0.6), main="Histogram of chromosome GC") +grd.hist(chromo, "nbCds") +grd.fplot(chromo, "len", "nbCds") + +# +# nb cds no introns +# + +chromo$nbCds_Mono <- chromo$nbCds_int0 +chromo$nbCds_Poly <- chromo$nbCds_int1 + chromo$nbCds_intsup1 +chromo$percentPoly <- round(chromo$nbCds_Poly * 100 / (chromo$nbCds_Poly + chromo$nbCds_Mono)) + +grd.hist(chromo, "nbCds_Mono", main="Histogram of monoexonic Cds") +grd.hist(chromo, "nbCds_Poly", main="Histogram of polyexonic Cds") +grd.hist(chromo, "percentPoly", pos.sum=c(0.23,0.6), main="Histogram of % polyexonic") + +grd.fplot(chromo, "nbCds", "nbCds_Mono", TRUE, ablin=list(a=0, b=1, col=3)) +grd.fplot(chromo, "nbCds", "nbCds_Poly") + +# +# cds size +# + +grd.hist(chromo, "meanCdsSize", pos.quant=NULL, main="Histogram of Cds size") + +# ------------------------------- +# CDS +# ------------------------------- + +cds.all <- do.call(rbind, cds.lst) + +grd.titlepage("CDS") + +grd.textpage(lineno=1, "# core cds core cutoff: ", params$CORE_NCDS_CUTOFF) +grd.textpage(lineno=2, "# core cds shell cutoff: ", params$SHEL_NCDS_CUTOFF) + +grd.textpage(lineno=4, "# total cds: ", nrow(cds.all)) +grd.textpage(lineno=5, "# core cds: ", nrow(cds.lst[["core"]])) +grd.textpage(lineno=6, "# shell cds: ", nrow(cds.lst[["shell"]])) +grd.textpage(lineno=7, "# dust cds: ", nrow(cds.lst[["dust"]])) + +grd.textpage(lineno=9, "# total org: ", length(unique(cds.all$X.locus))) +grd.textpage(lineno=10, "# core org: ", length(unique(cds.lst[["core"]]$X.locus))) +grd.textpage(lineno=11, "# shell org: ", length(unique(cds.lst[["shell"]]$X.locus))) +grd.textpage(lineno=12, "# dust org: ", length(unique(cds.lst[["dust"]]$X.locus))) + + +grd.textpage(lineno=14, "# total families: ", length(unique(cds.all$genefam))) +grd.textpage(lineno=15, "# core families: ", length(unique(cds.lst[["core"]]$genefam))) +grd.textpage(lineno=16, "# shell families: ", length(unique(cds.lst[["shell"]]$genefam))) +grd.textpage(lineno=17, "# dust families: ", length(unique(cds.lst[["dust"]]$genefam))) + +uplot.setup(mfrow=c(2,2), xpd=NA) + +x <- sapply(cds.lst, nrow) +uplot.pie(x, main="CDS", text.r=1.1, col=c(3,2,4)) + +x <- sapply(cds.lst, function(cds) length(unique(cds$X.locus))) +uplot.pie(x, main="ORG", text.r=1.1, col=c(3,2,4)) + +x <- sapply(cds.lst, function(cds) length(unique(cds$genefam))) +uplot.pie(x, main="FAM", text.r=1.1, col=c(3,2,4)) + +uplot.setup(xpd=F) + +# +# plot genes cutoff +# + +cds.all <- do.call(rbind, cds.lst) +cds.byfam <- split(cds.all, cds.all$genefam) + +tab <- sort(sapply(cds.byfam, nrow), decreasing=T) +cols <- rep("red", length(tab)) +cols[tab >= params$SHEL_NCDS_CUTOFF] <- "blue" +cols[tab >= params$CORE_NCDS_CUTOFF] <- "green" +barplot(tab, col=cols, border=NA, main="# genes") + +cols <- cols[tab >= 50] +tab <- tab[tab >= 50] +barplot(tab, col=cols, border=NA, las=2, cex.names=0.5, main="# genes in core") +abline(h=params$CORE_NCDS_CUTOFF, col=1) +text(50, 200, "CORE_NCDS_CUTOFF", pos=3) + +# +# cds length for core +# + +invisible(sapply(c("core", "shell", "dust"), function(what) { + + cds <- cds.lst[[what]] + + x <- split(cds$length, cds$genefam) + x <- x[order(sapply(x, mean))] + + uplot.setup(mfrow=c(2,1)) + + boxplot(x, pars = list(boxwex = 0.8, staplewex = 0.5, outwex = 0.5, outcex = 0.1), + las=2, cex.axis=0.5, main=paste0(what, " genes - length distribution")) + + boxplot(x, pars = list(boxwex = 0.8, staplewex = 0.5, outwex = 0.5, outcex = 0.1), ylim=c(0,2000), + las=2, cex.axis=0.5, main=paste0(what, " genes - length distribution zoom")) + + uplot.setup() +})) + +# ------------------------------- +# starts & stops +# ------------------------------- + +cds <- cds.lst[["core"]] + +grd.titlepage("Starts and Stops") + +tab <- sort(table(cds$start), dec=T) +tab <- tab[tab >= 100] +tab <- tab / sum(tab) * 100 + +barplot(tab, log="y", las=1, ylim=c(0.1, 100), main="start frequencies (%)") +text(0.7, 50, round(tab[1], 2)) +text(1.9, 2.3, round(tab[2], 2)) +text(3.1, 2.3, round(tab[3], 2)) + +# +# start by org and gc +# + +x <- split(cds$start, cds$X.locus) + +fatg <- sapply(x, function(x) table(x)["atg"]/length(x)*100) +names(fatg) <- names(x) +chromo$fatg <- round(fatg[chromo$X.locus], 2) + +fgtg <- sapply(x, function(x) table(x)["gtg"]/length(x)*100) +names(fgtg) <- names(x) +chromo$fgtg <- round(fgtg[chromo$X.locus], 2) + +facg <- sapply(x, function(x) table(x)["acg"]/length(x)*100) +names(facg) <- names(x) +chromo$facg <- round(facg[chromo$X.locus], 2) + +grd.hist(chromo, "fatg", pos.quant=c(0.5, 0.6), main="Histogram of atg freq. by org") +grd.hist(chromo, "fgtg", main="Histogram of gtg freq. by org") +grd.hist(chromo, "facg", pos.sum=c(0.3, 0.6), main="Histogram of acg freq. by org") + +grd.fplot(chromo, "gc", "fatg", main="atg freq. by org GC", pos=c(0.2, 0.3)) +grd.fplot(chromo, "gc", "fgtg", main="gtg freq. by org GC") +grd.fplot(chromo, "gc", "facg", main="acg freq. by org GC") + +ter <- cbind(fatg, fgtg, facg) +colnames(ter) <- c("ATG", "GTG", "ACG") +igc <- cut(chromo$gc, breaks=quantile(chromo$gc, seq(0, 1, 0.1)), include.lowest=T, labels=1:10) +cols <- rainbow(10)[igc] +ternaryplot(ter, col=cols, cex=0.2, main="Start by org", labels="outside") + +# +# start by common genes +# + +x <- split(cds$start, cds$genefam) + +fatg <- sapply(x, function(x) table(x)["atg"]/length(x)*100) +names(fatg) <- names(x) + +fgtg <- sapply(x, function(x) table(x)["gtg"]/length(x)*100) +names(fgtg) <- names(x) + +facg <- sapply(x, function(x) table(x)["acg"]/length(x)*100) +names(facg) <- names(x) + +barplot(sort(fatg)[1:10], las=2, main="atg freq. by gene") +barplot(sort(fgtg, dec=T)[1:10], las=2, main="gtg freq. by gene") +barplot(sort(facg, dec=T)[1:10], las=2, main="acg freq. by gene") + +ter <- cbind(fatg, fgtg, facg) +colnames(ter) <- c("ATG", "GTG", "ACG") +ternaryplot(ter, col=1, cex=0.5, id=rownames(ter), main="Starts by genes", labels="outside") + +# ------------------------------- +# stops +# ------------------------------- + +# +# stop by org and gc +# + +tab <- sort(table(cds$stop), dec=T) +tab <- tab[tab >= 100] +tab <- tab / sum(tab) * 100 + +barplot(tab, log="y", las=1, ylim=c(0.1, 100), main="stop frequencies (%)") +text(0.7, 80, round(tab[1], 2)) +text(1.9, 30, round(tab[2], 2)) +text(3.1, 25, round(tab[3], 2)) + +x <- split(cds$stop, cds$X.locus) + +ftaa <- sapply(x, function(x) table(x)["taa"]/length(x)*100) +names(ftaa) <- names(x) +chromo$ftaa <- round(ftaa[chromo$X.locus], 2) + +ftag <- sapply(x, function(x) table(x)["tag"]/length(x)*100) +names(ftag) <- names(x) +chromo$ftag <- round(ftag[chromo$X.locus], 2) + +ftga <- sapply(x, function(x) table(x)["tga"]/length(x)*100) +names(ftga) <- names(x) +chromo$ftga <- round(ftga[chromo$X.locus], 2) + +grd.hist(chromo, "ftaa", pos.quant=c(0.7, 0.6), main="Histogram of taa freq. by org") +grd.hist(chromo, "ftag", pos.quant=c(0.8, 0.6), main="Histogram of tag freq. by org") +grd.hist(chromo, "ftga", pos.quant=c(0.8, 0.6), main="Histogram of tga freq. by org") + +grd.fplot(chromo, "gc", "ftaa", main="taa freq. by org GC", pos=c(0.2, 0.3)) +grd.fplot(chromo, "gc", "ftag", main="tag freq. by org GC") +grd.fplot(chromo, "gc", "ftga", main="tga freq. by org GC") + +ter <- cbind(ftaa, ftag, ftga) +colnames(ter) <- c("TAA", "TAG", "TGA") +igc <- cut(chromo$gc, breaks=quantile(chromo$gc, seq(0, 1, 0.1)), include.lowest=T, labels=1:10) +cols <- rainbow(10)[igc] +ternaryplot(ter, col=cols, cex=0.2, main="Stops by org", labels="outside") + +# +# stop by common genes +# + +x <- split(cds$stop, cds$genefam) + +ftaa <- sapply(x, function(x) table(x)["taa"]/length(x)*100) +names(ftaa) <- names(x) + +ftag <- sapply(x, function(x) table(x)["tag"]/length(x)*100) +names(ftag) <- names(x) + +ftga <- sapply(x, function(x) table(x)["tga"]/length(x)*100) +names(ftga) <- names(x) + +barplot(sort(ftaa), las=2, cex.names=0.5, ylim=c(0,100), main="taa freq. by gene") +barplot(sort(ftag), las=2, cex.names=0.5, ylim=c(0,100), main="tag freq. by gene") +barplot(sort(ftga), las=2, cex.names=0.5, ylim=c(0,100), main="tga freq. by gene") + +ter <- cbind(ftaa, ftag, ftga) +colnames(ter) <- c("TAA", "TAG", "TGA") +ternaryplot(ter, col=1, cex=0.3, id=rownames(ter), main="Stops by genes", labels="outside") + +# ------------------------------- +# splice junctions +# ------------------------------- + +grd.titlepage("Splice Junctions") + +grd.textpage(lineno=1, "# intron in core: ", nrow(intron)) + +# +# intron size +# + +intron$size <- intron$to - intron$from + 1 + +grd.hist(intron, "size", pos.quant=NULL, main="Histogram of intron size", br=1000, xlim=c(0,2000)) + +# +# nb intron / gene +# + +x <- split(intron, intron$genefam) +x <- x[order(sapply(x, function(x) mean(x$intron_nb)), decreasing=T)] + +nmax <- max(intron$intron_nb) +lintron <- lapply(x, function(x) x$intron_nb) +mintron <- sapply(lintron, function(x) table(factor(x, levels=1:nmax))) + +lintron0 <- table(cds[cds$nexon == 1,"genefam"])[names(lintron)] +mintron <- rbind("0"=lintron0, mintron) +mintron <- t(t(mintron)/colSums(mintron)) + +mintron[mintron==0] <- NA + +nn <- nrow(mintron) +xx <- mintron[nn:1,] +ll <- lapply(1:nn, function(i) xx[i,]) +mintron <- mintron[,do.call(order, c(ll, decreasing=T))] + +battleship.plot(mintron, maxxspan=0.3, maxyspan=0.3, + cex.labels=0.7, + main="% intron per polyexonic gene") + +# +# acceptors / donors +# + +tab <- sort(table(intron$acc), dec=T) +tab <- tab[tab >= 100] +tab <- tab / sum(tab) * 100 + +barplot(tab, log="y", las=1, ylim=c(0.1, 100), main="acceptor frequencies (%)") +text(0.7, 50, round(tab[1], 2)) +text(1.9, 3, round(tab[2], 2)) +text(3.1, 2.3, round(tab[3], 2)) + +tab <- sort(table(intron$don), dec=T) +tab <- tab[tab >= 100] +tab <- tab / sum(tab) * 100 + +barplot(tab, log="y", las=1, ylim=c(0.1, 100), main="donor frequencies (%)") +text(0.7, 50, round(tab[1], 1)) +text(1.9, 40, round(tab[2], 1)) +text(3.1, 15, round(tab[3], 1)) +text(4.3, 12, round(tab[4], 1)) + +# +# consensus all +# + +cons$all <- cons.build(intron$acceptor.donor) + +invisible(sapply(rev(names(cons)), function(what) { + cons.plot(cons[[what]], paste0("consensus ", what)) +})) + +# +# default consensus score by consensus length +# + +cons.def <- cons[["default"]] +cons.def <- cons.def[,! is.nan(colSums(cons.def))] +seq.def <- sapply(intron$acceptor.donor, function(s) gsub("[^acgt]", "", s)) + +epx <- apply(cons.def, 2, function(col) -sum(col * log(col, base=4))) +opx <- order(epx) + +conf.def <- lapply(seq(2, length(opx), by=2), function(n) { + pos <- head(opx, n) + notify(n, "/", length(opx)) + cons.confusion(cons.def, seq.def, thresh=0, pos=pos) +}) + +acc <- sapply(conf.def, function(x) x$acc) +sen <- sapply(conf.def, function(x) x$sen) +sel <- sapply(conf.def, function(x) x$sel) + +plot(sel, ylim=c(0.7, 1), pch=1, type="b", main="accuracy by nb consensus positions", ylab="") +lines(sen, type="b", pch=2) +lines(acc, type="b", pch=3) +legend(1, 0.95, c("sensit.", "select.", "accur."), pch=1:3, horiz=T, bty="n") + +# +# default consensus score by genes +# + +conf.def <- cons.confusion(cons.def, seq.def, thresh=0) +cons.histconf(conf.def) + +sfam <- split(conf.def$l2scor, intron$genefam) +sfam <- sfam[order(sapply(sfam, median))] + +boxplot(sfam, pars = list(boxwex = 0.8, staplewex = 0.5, outwex = 0.5, outcex = 0.1), + las=2, cex.axis=0.7, main="default junction logr score by genes") +abline(h=0) + +# +# end +# + +if (OUT.DEV) { + cat("+ plot file:", paste0(OUT.FILE, ".", OUT.TYPE), "\n") + invisible(dev.off()) +} + +quit(save='no') diff --git a/detectors/cds/tools/lib/summarize_cmp.r b/detectors/cds/tools/lib/summarize_cmp.r new file mode 100755 index 0000000..145564a --- /dev/null +++ b/detectors/cds/tools/lib/summarize_cmp.r @@ -0,0 +1,71 @@ +#!/usr/bin/env Rscript +# +# plot summary graphics of comparisons +# +# + +LIBDIR <- Sys.getenv("LIB_DIR") +if (LIBDIR == "") LIBDIR = "." + +source(paste0(LIBDIR, "/util.plot.r")) + +COLORS <- 2:10 + +# + +OUT.DEV <- TRUE +OUT.TYPE <- "pdf" +OUT.FILE <- "compare" +if (OUT.DEV) uplot.init.dev(OUT.FILE, OUT.TYPE) + +# + +tab <- read.table("compare.txt", header=T, comment.char="", stringsAsFactors=F) + +# + +par(xpd=NA) + +# + +sel <- c("cor", "alcor", "acc", "wrong", "over", "misstot") +tab$ptot <- rowSums(tab[,sel]) +for (s in sel) + tab[,paste0("p", s)] <- tab[,s] * 100 / tab$ptot + +colors <- head(COLORS, length(sel)) + +cols <- paste0("p", sel) +ord <- order(tab$pcor+tab$palcor+tab$pacc, decreasing=T) + +barplot(t(tab[ord,cols]), names.arg=tab$X.org[ord], + ylim=c(0,100), col=colors, las=2, cex.names=0.5) + +legend(0, 110, sel, fill=colors, cex=0.7, horiz=T) + +# + +sel <- c("cor", "alcor", "acc", "wrong", "over", "misschlo") +tab$rtot <- rowSums(tab[,sel]) +for (s in sel) + tab[,paste0("r", s)] <- tab[,s] * 100 / tab$rtot + +colors <- head(COLORS, length(sel)) + +cols <- paste0("r", sel) +ord <- order(tab$rcor+tab$ralcor+tab$racc, decreasing=T) + +barplot(t(tab[ord,cols]), names.arg=tab$X.org[ord], + ylim=c(0,100), col=colors, las=2, cex.names=0.5) + +legend(0, 110, sel, fill=colors, cex=0.7, horiz=T) + +# + +if (OUT.DEV) { + cat("# plot file:", paste0(OUT.FILE, ".", OUT.TYPE), "\n") + invisible(dev.off()) +} + +quit(save='no') + diff --git a/detectors/cds/tools/lib/summary.cmp.awk b/detectors/cds/tools/lib/summary.cmp.awk new file mode 100644 index 0000000..6d1898f --- /dev/null +++ b/detectors/cds/tools/lib/summary.cmp.awk @@ -0,0 +1,54 @@ +# +# + +function getOrg(s, _local_, a, na, org) { + na = split(s, a, "/") + na = split(a[na], a, "\\.") + return a[1] +} + + +BEGIN { + PROCINFO["sorted_in"] = "@ind_num_asc" + print "#org tot cor alcor acc wrong over misstot misschlo missoth" +} + +/MISSED in ChloroDB/ { + org = getOrg($1) + Org[org]++ + Cnt[org]["MISSCHLORO"] = $2 + next +} + +/MISSED not in ChloroDB/ { + org = getOrg($1) + Org[org]++ + Cnt[org]["MISSNOTCHLORO"] = $2 + next +} + +/^#/ { next } + +/^.*:MATCH/ { + org = getOrg($1) + Org[org]++ + split($NF, a, "\\.") + Cnt[org][a[1]]++ +} + +END { + for (org in Org) { + Cnt[org]["TOTAL"] = Cnt[org]["CORRECT"] + Cnt[org]["ALMOST_CORRECT"] \ + + Cnt[org]["ACCEPTABLE"] + Cnt[org]["WRONG"] \ + + Cnt[org]["MISSED"] + } + for (org in Org) { + print org, Cnt[org]["TOTAL"]+0, Cnt[org]["CORRECT"]+0, \ + Cnt[org]["ALMOST_CORRECT"]+0, Cnt[org]["ACCEPTABLE"]+0, \ + Cnt[org]["WRONG"]+0, Cnt[org]["OVERPRED"]+0, \ + Cnt[org]["MISSED"]+0, \ + Cnt[org]["MISSCHLORO"]+0, Cnt[org]["MISSNOTCHLORO"]+0 + + } + +} diff --git a/detectors/cds/tools/lib/util.base.r b/detectors/cds/tools/lib/util.base.r new file mode 100644 index 0000000..ea1690e --- /dev/null +++ b/detectors/cds/tools/lib/util.base.r @@ -0,0 +1,12 @@ +# +# R basic utilities +# + +# +# notify on stderr +# + +notify <- function(...) cat("+", ..., "\n") + + + diff --git a/detectors/cds/tools/lib/util.cons.r b/detectors/cds/tools/lib/util.cons.r new file mode 100644 index 0000000..707b503 --- /dev/null +++ b/detectors/cds/tools/lib/util.cons.r @@ -0,0 +1,109 @@ +# +# R consensus utilities +# + +# +# compute consensus +# + +cons.build <- function(seqs, backcount=1) { + xx <- do.call(rbind, sapply(seqs, strsplit, "", USE.NAMES=F)) + lv <- c("a", "c", "g", "t", ".", "-") + mx <- apply(xx, 2, function(x) table(factor(x, levels=lv)))[1:4,] + cx <- colSums(mx) + mx <- mx + backcount + mx[,cx==0] <- 0 + apply(mx, 2, function(x) x / sum(x)) +} + +# +# score consensus +# + +cons.score <- function(cons, seq, pos=1:ncol(cons)) { + seq <- strsplit(seq, "")[[1]] + if (length(seq) != ncol(cons)) { + warning("incompatible seq and cons size") + return(NA) + } + ppx <- sapply(pos, function(i) cons[seq[i],i]) + sum(log10(ppx+1e-6)) +} + +# +# logratio to uniform model score +# + +cons.logratio <- function(cons, seq, m0=NULL, pos=1:ncol(cons)) { + if (is.null(m0)) { + m0 <- matrix(rep(0.25, 4), nrow=4, ncol=ncol(cons)) + rownames(m0) <- c('a', 'c', 'g', 't') + } + + sc <- cons.score(cons, seq, pos=pos) + sc0 <- cons.score(m0, seq, pos=pos) + + 2 * (log(10^sc, base=2) - log(10^sc0, base=2)) +} + +# +# shuffle sequence +# + +seq.shuf <- function(seq) { + paste0(sample(strsplit(seq, "")[[1]], nchar(seq), replace=F), collapse="") +} + +# +# compute confusion matrix between actual and shuffled sequences +# + +cons.confusion <- function(cons, seq, m0=NULL, pos=1:ncol(cons), thresh=0) { + som <- function(x) sum(x, na.rm=T) + + res <- list() + res$l2scor <- l2scor <- sapply(seq, function(s) cons.logratio(cons, s, m0=m0, pos=pos)) + + seq <- sapply(seq, seq.shuf) + res$r2scor <- r2scor <- sapply(seq, function(s) cons.logratio(cons, s, m0=m0, pos=pos)) + + res$conf <- conf <- matrix(c(som(l2scor >= thresh), som(l2scor < thresh), + som(r2scor >= thresh), som(r2scor < thresh)), + nrow=2, byrow=T) + + res$acc <- sum(diag(conf)) / sum(conf) + res$sen <- conf[1,1] / sum(conf[1,]) + res$sel <- conf[1,1] / sum(conf[,1]) + + res +} + +# +# plot consensus +# + + +cons.plot <- function(cons, main="consensus") { + cols <- c("blue", "orange", "red", "green") + bp <- barplot(cons, col=cols, ylim=c(0,1), main=main) + plx <- apply(cons, 2, function(col) -sum(col * log(col+1e-6, base=4))) + lines(bp, plx, type="b", pch=19) + legend(0, 1.1, c("a","c","g","t"), fill=cols, horiz=T, xpd=NA, bty="n") + legend(20, 1.1, "entropy", pch=19, horiz=T, xpd=NA, bty="n") + invisible() +} + +# +# plot confusion scores histograms +# + +cons.histconf <- function(conf, main="junction logr score") { + lrh <- hist(c(conf$l2scor, conf$r2scor), br=50, plot=F) + lh <- hist(conf$l2scor, br=lrh$breaks, plot=F) + rh <- hist(conf$r2scor, br=lrh$breaks, plot=F) + xx <- rbind(lh$counts, rh$counts) / sum(lh$counts) + colnames(xx) <- lrh$mids + barplot(xx, col=c(3,2), beside=T, main=main) + legend(0, 0.1, c("true", "shuffled"), fill=c(3,2), horiz=F, xpd=NA) + invisible() +} diff --git a/detectors/cds/tools/lib/util.grid.r b/detectors/cds/tools/lib/util.grid.r new file mode 100644 index 0000000..f8d34cd --- /dev/null +++ b/detectors/cds/tools/lib/util.grid.r @@ -0,0 +1,93 @@ +# +# R misc grid plotting +# + +require(grid) +require(gridExtra) + +# +# get line height +# + +grd.lineheight <- function(s="X") { + convertHeight(unit(1,"strheight", s), "native", valueOnly=T) +} + +# +# quantile table +# + +grd.qtab <- function(df, what, cols, n=5) { + df <- df[order(df[,what], decreasing=T),cols] + sep <- head(df,1) + sep[] <- "-" + rbind(head(df, n), sep, tail(df, n)) +} + +# +# histogram with tables +# + +grd.hist <- function(df, what, cols = c(1,2, which(colnames(df) == what)), + breaks=50, pos.sum=c(0.2,0.6), pos.quant=c(0.7,0.6), cex=0.7, + main=paste0("Histogram of ", what), ...) { + hist(df[,what], breaks=breaks, xlab=what, main=main, ...) + if (! is.null(pos.sum)) { + pushViewport(viewport(pos.sum[1], pos.sum[2], gp=gpar(cex=cex))) + grid.table(x<-summary(df[,what]), rows=names(x)) + popViewport() + } + if (! is.null(pos.quant)) { + pushViewport(viewport(pos.quant[1], pos.quant[2], gp=gpar(cex=cex))) + grid.table(grd.qtab(df, what, cols), rows=NULL) + popViewport() + } + invisible() +} + +# +# plot with fit +# + +grd.fplot <- function(df, what.x, what.y, linfit=T, pos=c(0.2, 0.8), ablin=NULL, ...) { + plot(df[,what.x], df[,what.y], xlab=what.x, ylab=what.y, ...) + if (linfit) { + fit <- lm(df[,what.y] ~ df[,what.x]) + abline(fit, col=2) + pushViewport(viewport(gp=gpar(col=2))) + a <- sprintf("%.2e", coef(fit)[2]) + b <- sprintf("%.2e", coef(fit)[1]) + grid.text(paste0(what.y, " = ", a, " * ", what.x, " + ", b), + pos[1], pos[2], just="left") + pos[2] = pos[2] - 2 * grd.lineheight() + grid.text(paste0("R2=", round(summary(fit)$r.squared, 3)), + pos[1], pos[2], just="left") + popViewport() + } + if (! is.null(ablin)) + do.call(abline, ablin) + invisible() +} + +# +# write text +# + +grd.textpage <- function(..., lineno=0, left=0.1, top=0.9, cex=1, fact=1.4) { + txt <- do.call(paste0, list(...)) + pushViewport(viewport(gp=gpar(cex=cex))) + grid.text(txt, left, top-lineno*grd.lineheight()*fact, just="left") + popViewport() + invisible(txt) +} + +# +# title page +# + +grd.titlepage <- function(title, x=0.5, y=0.7, cex=3, ...) { + notify("processing", title) + grid.newpage() + grid.text(title, x, y, gp=gpar(cex=cex), ...) + invisible() +} diff --git a/detectors/cds/tools/lib/util.modelio.r b/detectors/cds/tools/lib/util.modelio.r new file mode 100644 index 0000000..76c725f --- /dev/null +++ b/detectors/cds/tools/lib/util.modelio.r @@ -0,0 +1,90 @@ +# +# R models I/O utilities +# + +# +# write start model +# + +write.model.start <- function(frq, what) { + dir.create("models", showWarnings=F) + fil <- paste0("models/start.", what, ".frq") + notify("writing start model:", fil) + cat("# start model :", what, "\n", file=fil) + for (x in names(frq)) + cat(x, frq[x]/sum(frq), frq[x], "\n", file=fil, append=T) + invisible(fil) +} + +# +# write stop model +# + +write.model.stop <- function(frq, what) { + dir.create("models", showWarnings=F) + fil <- paste0("models/stop.", what, ".frq") + notify("writing stop model:", fil) + cat("# stop model :", what, "(freq. ignored)\n", file=fil) + for (x in names(frq)) + cat(x, frq[x]/sum(frq), frq[x], "\n", file=fil, append=T) + invisible(fil) +} + +# +# write splice3 model +# [FIXME] positions are hard-coded +# + +write.model.splice3 <- function(cons, what) { + dir.create("models", showWarnings=F) + fil <- paste0("models/splice3.", what, ".frq") + notify("writing splice3 model:", fil) + .catcons <- function(i) { + cat(round(cons[c("a","c","g","t"), i]*100, 0), "\n", + file=fil, append=T) + } + cat("# 3' splice model :", what, "\n", file=fil) + cat("# A C G T\n", file=fil, append=T) + sapply(seq.int(1, 4), .catcons) + cat("splice\n", file=fil, append=T) + sapply(seq.int(6, 11), .catcons) + invisible(fil) +} + +# +# write splice5 model +# [FIXME] positions are hard-coded +# + +write.model.splice5 <- function(cons, what) { + dir.create("models", showWarnings=F) + fil <- paste0("models/splice5.", what, ".frq") + notify("writing splice5 model:", fil) + .catcons <- function(i) { + cat(round(cons[c("a","c","g","t"), i]*100, 0), "\n", + file=fil, append=T) + } + cat("# 5' splice model :", what, "\n", file=fil) + cat("# A C G T\n", file=fil, append=T) + sapply(seq.int(13, 18), .catcons) + cat("splice\n", file=fil, append=T) + sapply(seq.int(20, 23), .catcons) + invisible(fil) +} + +# +# write splice3/5 uniform model +# + +write.unif.splice <- function(pos, what) { + dir.create("models", showWarnings=F) + fil <- paste0("models/splice", pos, ".", what, ".frq") + notify("writing uniform splice", pos, "model:", fil) + cat("# 3'/5' splice null model", file=fil) + cat("# A C G T\n", file=fil, append=T) + cat("25 25 25 25\n", file=fil, append=T) + cat("splice\n", file=fil, append=T) + cat("25 25 25 25\n", file=fil, append=T) + invisible(fil) +} + diff --git a/detectors/cds/tools/lib/util.plot.r b/detectors/cds/tools/lib/util.plot.r new file mode 100644 index 0000000..056e4e6 --- /dev/null +++ b/detectors/cds/tools/lib/util.plot.r @@ -0,0 +1,105 @@ +# +# R plot utilities +# + +# +# setup graphic device +# tiff: high resolution 600 dpi +# pdf +# + +uplot.init.dev <- function(fname, type="pdf", width=7, height=7, resol=600, ...) { + fname <- paste0(fname, ".", type) + res <- NULL + if (type == "tiff") { + res <- tiff(fname, width=width, height=height, units="in", res=resol, ...) + } + if (type == "pdf") { + res <- pdf(fname, width=width, height=height, ...) + } + invisible(res) +} + +# +# convert pdf to tiff using ghostscript +# + +uplot.convert2tiff <- function(fname, resol=600) { + infile <- paste0(fname, ".pdf") + oufile <- paste0(fname, ".tif") + cmd <- paste0("echo quit | gs -r", resol, "-dBATCH -dNOPAUSE -sDEVICE=tiff12nc -sCompression=lzw -sOutputFile=", oufile, " ", infile) + system(cmd) +} + +# +# default plot setup +# + +uplot.setup <- function(mfrow=c(1,1), + las=1, + mgp=c(2, 0.7, 0), + oma=c(0, 0, 0, 0), + mar=c(4, 3, 3, 2), + cex.main=1, + font.main=1, + family='Helvetica', ...) { + par(mfrow=mfrow, las=las, mgp=mgp, oma=oma, mar=mar, cex.main=cex.main, font.main=font.main, family=family, ...) +} + +# +# pie plot +# + +uplot.pie <- function(tab, main="", labels=c("name", "val", "per"), text.r=0.5, text.col="black", text.cex=1, main.pos=c(0,0), main.col="black", ...) { + pie(tab, edges=2000, main="", labels="", ...) + text(main.pos[1], main.pos[2], main, cex=1.5, col=main.col) + prop <- tab/sum(tab) + theta <- 2*pi * (cumsum(prop) - prop/2) + lab <- list(name=names(tab), val=tab, per=sprintf("%d%%", round(prop*100))) + lab <- apply(data.frame(lab[labels]), 1, paste, collapse="\n") + if (length(lab) > 0) + text(text.r*cos(theta), text.r*sin(theta), lab, cex=text.cex, col=text.col) + invisible(NULL) +} + +# +# plot utility : color representation of a table +# + +uplot.table <- function(tab, col=heat.colors(100), with.lines=TRUE) { + image(as.matrix(tab), xaxt="n", yaxt="n", col=col) + nli <- nrow(tab) + nco <- ncol(tab) + dx <- 0.5 / (nli-1) + dy <- 0.5 / (nco-1) + xf <- (seq_len(nli)-1)/(nli-1) - dx + yf <- (seq_len(nco)-1)/(nco-1) - dy + if (with.lines) { + segments(xf, -dy, xf, 1+dy) + segments(-dx, yf, 1+dx, yf) + } + Axis(c(0,1), at=xf+dx, side=1, labels=rownames(tab), las=2, cex.axis=0.5, padj=0) + Axis(c(0,1), at=yf+dy, side=2, labels=colnames(tab), las=2, cex.axis=0.5, padj=0) + invisible(NULL) +} + +# +# plot utility : identify points within user's rectangle +# + +rect.identify <- function(data) { + if (is.null(dim(data))) data <- cbind(seq_along(data), data) + xy <- locator(n=2, type='n') + r <- matrix(c(range(xy$x), range(xy$y)), ncol=2, byrow=TRUE) + rect(r[1,1], r[2,1], r[1,2], r[2,2], border='red') + .in.range <- function(p, r) { + .in.int <- function(i) { + (p[i] >= r[i,1]) && (p[i] <= r[i,2]) + } + .in.int(1) && .in.int(2) + } + isel <- which(apply(data, 1, .in.range, r)) + points(data[isel,], col='red', pch=19) + isel +} + diff --git a/scripts/csh_init.sh b/scripts/csh_init.sh index 3f4e1a3..7099a7d 100644 --- a/scripts/csh_init.sh +++ b/scripts/csh_init.sh @@ -18,8 +18,8 @@ if ($?ORG_SOURCED == 0) then # o Verbose : default verbosity (may be changed by -v option) # - setenv AwkCmd "gawk" - setenv Verbose 0 + if ($?AwkCmd == 0) setenv AwkCmd "gawk" + if ($?Verbose == 0) setenv Verbose 0 # -------------------------------------- # don't change hereafter (normally) @@ -90,11 +90,15 @@ set path = ($SCRIPT_DIR $BIN_DIR $path) # alias should be sourced each time # -------------------------------------- -alias Debug 'if ($Verbose) echo "# "\!:* >> /dev/stderr' +alias Cout 'echo `date "+%Y-%m-%d %H:%M:%S"` "[OA \!:1]" \!:2-* >> /dev/stderr' -alias Notify 'echo "# "\!:* >> /dev/stderr' +alias Debug 'if ($Verbose) echo `date "+%Y-%m-%d %H:%M:%S"` "[OA DEBUG]" \!:* >> /dev/stderr' -alias Error 'echo "# Error "\!:2-*"" >> /dev/stderr; Exit \!:1' +alias Cat 'awk -v D="`date '"'"'+%Y-%m-%d %H:%M:%S'"'"'`" '"'"'{print D " [OA FILE ] " $0}'"'"' \!:* >> /dev/stderr' + +alias Notify 'Cout "INFO " \!:*' + +alias Error 'Cout ERROR \!:2-*; Exit \!:1' alias Exit 'set Stat = \!:1; Debug "<--- $0 [$Stat]"; exit \!:1' @@ -124,8 +128,6 @@ alias NeedFile 'if (! -e \!:1) eval Error 5 "\!:1 : file not found"' alias NeedDir 'if (! -d \!:1) eval Error 5 "\!:1 : directory not found"' -alias Cat 'awk '"'"'{print "# " $0}'"'"' \!:*' - alias AssignUndef 'if ($?\!:1 == 0) set \!:1=\!:2-*' # --------------------------------------