LOCUS sequence001 11370 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence001 VERSION sequence001 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..11370 /mol_type="genomic DNA" /organism="" /note="sequence001" misc_feature <1..1158 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_008762692.1:AMP-binding protein" /note="WP_008762692.1 AMP-binding protein (Bacteroides) [pid:59.4%, q_cov:96.6%, s_cov:67.7%, Eval:5.8e-132, partial hit]" /note="MGA_1" /locus_tag="LOCUS_0010" CDS 1541..3829 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MQNTGIELKILEMAGRIRDLREIIGLSTAEMALKTGVSEEEYIAC ENARRDLNFAFLYRCALALGVDVTDIIEGASPRLAGYTVTRKGDGQRIEQAHGMVYYNL ASAFKNRIAEPLLVVSAYSEEAQHADIELTTHEGQECDIIVSGSLKVQIGDHIEILKEG DSIYYDSDTPHGMIAVGGSDCVFYAIVLNPSGESIEKITHGGVREFTARPLKTPERKWI YEDYIDAKEDKNGVLEKISFKNEQSFNFAFDLVDRMGREQPDKLALLHIDKNHVERRFT FADIKRASSQTANYLKSLGIKRGDKVLLILKRHYQFWLVMIALHKLGAVAIPATNQLKE HDITYRLNKAGVKMVICTADDGVAEQVDISAKHAQTLEHKLIVNGEREGWRSFDEEYTL YTGKFDRPDDCPCGDEPMLMYFTSGTTGNPKIATHNFMYPLGHFVTAKYWHCVNPNGLH LTVSDSGWAKCAWGKLYGQWLCEAPLFVYDFDRFDAEDILPMFAKYQITTFCAPPTILR MLAKQDIGKYDLSSVEHMSTAGEALNPEVFRQFEAATGLQIMEGFGQTETTVALATLAG MKAKLGSMGKPVALYDIDLVDADGNTVDDGEVGEICIRIDKGSPCGLFRGYYKDEEKTE EVFRHGLYHTGDTAWRDEDGYYWYVGRVDDVIKSSGYRIGPFEIENVIMELPYVLECGV SAAPDEVRGQVVKASIVLTKGTEPTDELKKEIQQYVKTRTAPYKYPRIVVFKDELPKTT SGKIQRNKL" /locus_tag="LOCUS_0020" /note="WP_008762692.1 AMP-binding protein (Bacteroides) [pid:51.5%, q_cov:68.6%, s_cov:95.3%, Eval:1.2e-159, partial hit]" /note="MGA_2" CDS 3842..4507 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357453.1" /transl_table=11 /codon_start=1 /translation="MNHKRITLFAGHYGSGKTNIAVNYAMELAKTGKPVVIADLDIVNP YFRTKDSADELAALGIELISPEFANSNVDLPALPAQVYGVVQNKNRLAVLDIGGDDRGA YALGRYAPYILEENDFEMVFVANFMRPLTKTAEEALEVMREIELAGKIPFTAIVNNTNL GNLTDAETVEASNYEAKKLSEISGLPILFTSAEADVAPKVKLENVFPLNLQKKYFDIK" /locus_tag="LOCUS_0030" /note="WP_003357453.1 hypothetical protein (Clostridium botulinum) [pid:37.7%, q_cov:95.9%, s_cov:97.3%, Eval:1.0e-37]" /note="MGA_3" CDS 4531..4737 /product="4Fe-4S binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003420706.1" /transl_table=11 /codon_start=1 /translation="MAKVTFDTDTCKGCGLCVDACPKNLLVIAKDKINKKGHSPAEMTD MSQCIGCAFCATMCPDCVITVEK" /locus_tag="LOCUS_0040" /note="WP_003420706.1 4Fe-4S binding protein (Clostridioides) [pid:59.1%, q_cov:97.1%, s_cov:93.0%, Eval:9.3e-20]" /note="MGA_4" CDS 4754..5815 /product="3-methyl-2-oxobutanoate dehydrogenase subunit VorB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357407.1" /transl_table=11 /codon_start=1 /translation="MAEKVLMKGNEAIAEAAIRAGCRHYFGYPITPQTELAAYMAKRMP KIGGVFLQAESEISAINMVYGVAGTGLRVMTSSSSPGVSLKQEGISYIAGADLPALIIN VQRGGPGLGGIQPSQSDYFQATKGGGHGDYHLIVLAPASVQEMADLTATAFELAEKYRM PAMILADGTMGQMMEPVTLPEPVEYNPNHDWTVTGTKCERKHNIINSLYLVPEELEKKN FERFEKYKTIEENEVMYESYLMDDADYCVVAFGIAARVAKNAINEARAKGIKVGMIRPI TLWPFPTKVIREAADKVKAFISVELSMGQMIEDVKLASECLKPVYLCNRSGGMIPEPAQ ILEMIEKLDGGEN" /locus_tag="LOCUS_0050" /note="WP_003357407.1 3-methyl-2-oxobutanoate dehydrogenase subunit VorB (Clostridium) [pid:59.0%, q_cov:99.4%, s_cov:99.4%, Eval:1.2e-117]" /note="MGA_5" CDS 5815..6573 /product="thiamine pyrophosphate-dependent enzyme" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357567.1" /transl_table=11 /codon_start=1 /translation="MVVFEKPKSLTDAPLHYCPGCTHGIIHRLVAEAIDELGIEGKTIG VAPVGCAVMAYNYFACDMVEAAHGRAPAVATGLKRALPENIIFTYQGDGDLASIGMAET VHAATRNENITVIFVNNAIYGMTGGQMAPTSLPGQVTQTSPYGRDVKTVGYPIRVCEML SALDGPELIQRVAVNNVKNVKAAKKAIKKAFENQINGKGFSLIEVVSSCPTNWGMTPSK ALEWVETNMIPYYPLGVYKDRSAKEADAND" /locus_tag="LOCUS_0060" /note="WP_003357567.1 thiamine pyrophosphate-dependent enzyme (Clostridium) [pid:68.9%, q_cov:95.6%, s_cov:96.8%, Eval:5.3e-100]" /note="MGA_6" CDS 6566..7102 /product="2-oxoacid:acceptor oxidoreductase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357379.1" /transl_table=11 /codon_start=1 /translation="MTNSILIAGFGGQGVLFAGKFLAYKGLLEGKEISWLPSYGPEMRG GTANCSVIVSDSPVGSPIVSNPDILIAMNLPSFDKYENSANAGGYIFADSTLISKETAR DDVKAFYVPATQMAKDLGIPTLANMILMGKVIKETGVVSFDEMREALGKVVSAKRAELL ELNLKALEAGYNYCD" /locus_tag="LOCUS_0070" /note="WP_003357379.1 2-oxoacid:acceptor oxidoreductase family protein (Clostridium) [pid:51.4%, q_cov:98.3%, s_cov:97.7%, Eval:6.6e-46]" /note="MGA_7" CDS 7215..8282 /product="branched-chain amino acid aminotransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003244231.1" /transl_table=11 /codon_start=1 /translation="MLDIRIEKTLTPKEKPAKGTPLGFGHIFTDHMFVMNYTEGKGWHD ARIVPFDNISLSPASMVFHYGQEMFEGLKAYKGDDDKVYLFRPDMNAKRANASNDRLCI PRIPEEDFVQAIKAVVDVDRDWIPEEEGTSLYIRPFVIATDNFLGVAPSKTYLFMVILS PSGAYYASGLAPVGIWIEDEYVRAVRGGIGYAKTGGNYAASLAAQVKAHDGGYSQVLWL DGVDRKYIEEVGAMNIVFKISGKVVTPALNGSILPGITRNSVLQLCRDWGYEVEERKIS VDELIEAAHNGTLEEVWGTGTAAVVSPVGKLRYKDEVFTIGDGGIGELTQKLYDEITGI QWGRREDPNGWRVTV" /locus_tag="LOCUS_0080" /EC_number="2.6.1.42" /note="WP_003244231.1 branched-chain amino acid aminotransferase (Bacillus) [pid:59.9%, q_cov:99.2%, s_cov:96.7%, Eval:1.3e-122]" /note="MGA_8" CDS 8477..9766 /product="O-acetylhomoserine aminocarboxypropyltransferase/cysteine synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_013390162.1" /transl_table=11 /codon_start=1 /translation="MSERKIETKCVQGGYTPGNGEPRQIPIIQSTTFKYSTSEDMGKLF DLEAEGYFYSRLQNPTCDAVARKICELEGGSAAMLTSSGQAANFFAVFNIASCGDHVVS VSSIYGGTFNLFSVTMKKMGIDFTFVAPDCSDEELEAAFKPNTKAVFGETIANPALRVL DIERFANAAHAHGVPLIVDNTFATPVNCRPFEWGADIVTHSTTKYMDGHGAAVGGCIVD SGKFDWVKYADKFPGLTTPDDSYHGITYTERFGLAGAYITKATAQLMRDFGCTPAPQSA FLLNFGLESLHVRMERHCQNGLAVAKFLESHPMVSWVKYPDLEGDEDNALAKKYLPKGS CGVVSFGVKGGRKAAEKFMKELRLAAIETHVADARTCCLHPASATHRQMNDAELEAAGV GADLVRMSCGIESADDLIADIKQALDKVNN" /locus_tag="LOCUS_0090" /note="WP_013390162.1 O-acetylhomoserine aminocarboxypropyltransferase/cysteine synthase (Bifidobacterium bifidum) [pid:69.2%, q_cov:98.4%, s_cov:99.1%, Eval:6.8e-177]" /note="MGA_9" CDS 9779..10696 /product="homoserine O-succinyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965131.1" /transl_table=11 /codon_start=1 /translation="MPIKIPNTLPAAKTLTDENIFIMTETRAISQDIRPLRILILNLMP TKIDTETQLVRLIGNTPLQVEVELIHTASHQSKNTSEEHLLSFYKTFDQVKNQRFDGMI ITGAPVEMLEYEDVEYWDELCEIFEWTKTHVHSTFHICWGAQAGLYYHFGIQKKPLDAK LFGVFPHKVDYKNPILFRGFDDVFLAPHSRHSTVERADIEACPELKILASSEVAGVYAC MTQNGKQIFITGHSEYDAGTLAKEYFRDKNKGLEIQIPVNYFPNDDDTREPIVSWRAHA NLLYSNWLNYFVYQTTPYDLSEDL" /locus_tag="LOCUS_0100" /gene="metA" /EC_number="2.3.1.46" /note="WP_010965131.1 homoserine O-succinyltransferase (Clostridium) [pid:63.1%, q_cov:98.7%, s_cov:100.0%, Eval:1.0e-114]" /note="MGA_10" CDS 10713..11168 /product="acyl-CoA thioesterase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003244690.1" /transl_table=11 /codon_start=1 /translation="MVKHPKDSLTESVHIVVPKHLNGGNRLFGGTLLNWIDDVGAVAAR RHAGGMVTGASVDNVQFLGPAFQNETIICVGKVTYVGRTSMEVCVKSYAETLDGERRLI NVAYQVAVAIDENGKPVPVPALEPETDEEKAEYENAKKRKEFRNLYR" /locus_tag="LOCUS_0110" /note="WP_003244690.1 acyl-CoA thioesterase (Bacillus) [pid:40.6%, q_cov:94.0%, s_cov:83.1%, Eval:1.1e-20]" /note="MGA_11" ORIGIN 1 aaaaacttcg taatggtcgg cggatgccgc gagggttggc gcgactttga cgctgaatac 61 agcctcttta caggtaagtt tgagcgcacc cccgaatcct cctgcggaga tgacacagcc 121 ttaatgttct tcacatcggg cacaacaggc aatcccaaaa tggcggcaca caagcataca 181 tatgctttgg gacactttgt caccgccaaa tattggcact gctgtgagcg cgacggcttg 241 cacctcacaa tttccgacac cggctggggc aaatcccttt ggggcaagct ttatggccag 301 tggctctgcg agggtgccgt atttgtatat gactttgata agtttgatgc tgccgacatc 361 atgccgatgt ttgcaaaata tcagatcacg accttctgcg cacctccgac aatgctcaga 421 atgttcatca aggaagacct ctcaaagtat gatttaagct ccattcacca tatgaccact 481 gcaggcgaag ccctcaaccc cgaggtattc agacagtttg agcttgcaac cggcctgcag 541 ataatggaag gctttggtca gactgaaacc acccttgcaa ttgcaaacct tgttggcgac 601 acgcccaagc tcggatctat gggtaaggcg aacccgcagt ttgatgttga tatcgttgac 661 cccgacggca acagcttgcc cagcggtgaa gtcggcgaga tcgtcatcca caccgacaag 721 actgttccct gcggtctttt caaggaatat taccgcgacg cggaaaagac caccgacgct 781 tggcatgacg gactttatca cacaggcgac accgcttggc gtgatgagga cggctacttc 841 tggtatgttt cccgtatcga cgacgtcatc aagtcctccg gttaccgcat cggcccattc 901 gagatcgaat cggtcatcat ggaattgccg tatgtactcg aatgcggcgt ttccgccgta 961 cccgatgagg tcagaggcca gatcgttaag gcctcaatcg tcctcacaaa gggcaccgag 1021 ggcacagatg ctctcaagaa ggagatccag caatatgtta aggatcacac cgcaccttac 1081 aagtacccca gagttatcgt atttaaagat gaacttccca aaactatcag cggaaagatt 1141 caaagaaata agctttaatt gcggcttttg gtgttgacaa caatataggg acgtggtata 1201 atactgctgt aaagcataaa agcgttgacg aagaagggca gcttcttttc caatcaagag 1261 aaacggcgtt tggtgcgagc cgcaattgga gaaatgttgc ttgtagcttc cgagctgaga 1321 ggaagaaagg ctatatattt gccgagtaga ccctttccgt gattgctgcg ttaatgcata 1381 cggcttaata atgagcctga gtggcgcgaa ttcgcgcaat ttgagtggta ccgcgggata 1441 taattatgca ctgattatac tcgtctcaaa gaagtaatat ctttgggacg agtttttatt 1501 tcctgctccg cccaaatgat acaaagaaag gaagaagagt gtgcaaaaca ccggaattga 1561 attaaaaatt cttgaaatgg cgggccgaat tcgggatctg cgagagatca tcgggctttc 1621 aaccgctgaa atggcgctta aaacgggcgt ttccgaggaa gaatatatcg cttgtgaaaa 1681 tgcaaggcga gaccttaact tcgcattctt atatagatgt gcgcttgcct tgggcgttga 1741 cgtcaccgac attatcgagg gtgcatcccc ccgacttgcg ggatataccg ttacgcgcaa 1801 gggcgacggc cagcgaatcg agcaggccca cggcatggta tactataacc ttgcatctgc 1861 atttaaaaac agaattgcag agcctttgct ggttgtttcc gcatatagcg aagaggctca 1921 gcacgccgat attgagctta ccacccacga gggtcaggaa tgcgacatta ttgtcagcgg 1981 ttctttgaaa gttcagatcg gtgaccatat cgagatactt aaagaaggcg actcgatcta 2041 ttacgactcg gacacccctc acggtatgat cgctgtcggc ggaagcgact gtgtgttcta 2101 tgcgatcgtt ttgaatccgt cgggcgaatc aattgaaaag atcacccacg gcggcgtcag 2161 agagttcacc gcacgtcctt tgaagactcc cgaaagaaag tggatctatg aggactatat 2221 tgatgctaag gaagacaaaa acggcgtttt ggaaaagatc tcctttaaga acgaacaaag 2281 cttcaatttc gccttcgacc ttgtcgacag aatgggcaga gagcagcccg acaagctggc 2341 acttttgcat attgacaaaa accacgttga acgcagattt acctttgcgg acattaagcg 2401 tgcatccagc cagacagcca actatctcaa atcgcttggc atcaagcgcg gagataaggt 2461 cttgcttatt ttgaagcgcc attatcagtt ctggcttgta atgatcgctt tgcataagct 2521 tggggcagtt gcaattcccg caacaaacca gcttaaagag cacgacatca cctatcgcct 2581 caacaaagcg ggcgttaaaa tggtcatctg taccgccgat gacggcgttg ccgagcaggt 2641 ggatatttcc gccaagcacg cgcaaacgct tgagcataag ctgattgtca acggcgagcg 2701 cgaaggctgg cgaagctttg acgaggaata tactctttat acaggcaagt ttgaccgacc 2761 cgacgattgc ccctgcggcg acgaaccgat gcttatgtat ttcacatcgg gcacaacagg 2821 caaccccaaa attgccaccc acaactttat gtatcctttg ggacactttg ttaccgcgaa 2881 atattggcat tgcgttaacc ccaacggctt gcacctgacc gtttccgact cgggctgggc 2941 gaagtgtgca tggggtaagc tatatggaca gtggctctgc gaagctccgc tgtttgtata 3001 tgactttgac agattcgatg ccgaagacat tttgccgatg tttgcaaaat atcagattac 3061 aacattctgc gctccgccca caattttgcg aatgctcgca aagcaggata taggaaaata 3121 tgacctgagt tctgttgagc atatgtcaac tgcgggcgaa gccctcaacc ctgaggtctt 3181 cagacagttt gaagcggcaa caggcttgca gataatggaa ggcttcggcc agaccgaaac 3241 caccgttgcc cttgcaactc ttgcgggcat gaaagcaaag ctcggctcaa tgggcaaacc 3301 tgttgcgcta tatgatatcg acctggtgga tgctgacggc aacaccgttg acgacggtga 3361 agtcggcgaa atctgcatcc gaatcgacaa gggctcgcct tgcggactct tcagaggata 3421 ttataaggac gaagaaaaga ccgaagaagt attccgccac ggcctttatc acacaggcga 3481 caccgcttgg cgtgatgagg acggatatta ctggtatgtc ggacgagttg acgatgtcat 3541 taagtcgtca ggctaccgaa tcggcccctt cgaaattgaa aatgtcatta tggagcttcc 3601 ttatgtcctt gaatgcggcg taagtgccgc acccgacgag gtcagaggcc aggttgttaa 3661 ggcttccatc gtcctcacaa agggcaccga gccgacagac gagctgaaaa aggagattca 3721 acagtacgtt aaaacgagaa ctgcgcctta taaatatccg agaatcgttg tctttaagga 3781 tgaacttccc aagacgacca gcggaaagat tcagcgcaac aagctttaag gaaatgaact 3841 tatgaatcac aaacgcataa ctctttttgc agggcattac ggctcgggca aaacgaatat 3901 cgccgtcaat tatgctatgg agcttgccaa aacgggaaag ccggtggtga tcgccgacct 3961 tgatattgtt aacccgtatt ttcgcaccaa ggactcggca gacgaacttg ccgccttggg 4021 gatcgagctt ataagccctg aatttgccaa ctcaaatgtc gatctgcccg cgcttcccgc 4081 gcaggtctac ggagttgtgc aaaacaaaaa ccgcttggcg gttttggata tcggaggtga 4141 cgaccgaggc gcatatgcct tgggcagata cgcgccctat atcctcgagg aaaacgattt 4201 tgaaatggtg tttgttgcga actttatgcg ccccttaacc aaaacggcgg aagaagcgct 4261 tgaagtgatg cgcgagatcg agctggcggg aaagattccc ttcacagcta tcgtcaacaa 4321 cacaaatttg ggaaatctta ccgacgccga aacggttgaa gcttcaaatt atgaagccaa 4381 aaaactgagc gaaatttccg gcttgccgat tttgtttaca tctgccgagg ctgatgttgc 4441 gccaaaggtt aaacttgaaa acgttttccc gctcaacctg caaaagaaat attttgatat 4501 aaaataaccc attcaatagg aggttctatc atggcaaagg ttacatttga taccgatacc 4561 tgcaagggct gtgggctgtg cgttgatgcc tgccccaaaa atcttctggt tatcgccaag 4621 gacaagatca acaaaaaggg tcactctccc gcagagatga ccgatatgtc gcagtgcatc 4681 ggctgtgcat tctgtgccac catgtgcccc gactgtgtaa tcaccgttga aaagtaagga 4741 ggttttgcat atcatggctg aaaaagtttt aatgaagggc aacgaagcaa tcgcagaagc 4801 cgcaatcaga gcaggctgcc gccattactt cggctatccc atcactcccc agacagagct 4861 tgccgcatat atggctaaaa gaatgcccaa gatcggcggc gttttccttc aggctgaaag 4921 cgaaatttcc gctatcaata tggtatacgg cgttgcggga acaggcttgc gcgttatgac 4981 gagctcgtcc tctcccggag tgtccttgaa gcaggagggc atttcctata ttgcgggtgc 5041 agatcttcct gcactcatca tcaacgttca gcgcggcggc cccggtttgg gcggtattca 5101 gccctctcag tcggactatt tccaggccac aaagggcggc ggacacggcg actatcacct 5161 tattgttttg gctcccgcat cggtgcagga aatggctgac cttacagcaa ccgcatttga 5221 gcttgccgaa aagtaccgta tgcccgcaat gatcttggct gacggcacaa tgggccagat 5281 gatggagccc gtaaccctgc ccgagcctgt ggaatataac ccaaaccacg attggaccgt 5341 tacaggtaca aagtgcgaaa gaaagcacaa tataatcaac tcgctctatc tcgttcccga 5401 ggagcttgaa aagaagaact tcgaacgctt tgaaaagtat aagaccattg aggaaaacga 5461 ggtcatgtac gagtcctatc ttatggacga tgctgactat tgcgttgttg ccttcggcat 5521 tgcggcacga gttgcaaaga acgcaattaa cgaagcaaga gcgaagggca tcaaggtggg 5581 tatgataaga cccatcaccc tttggccttt ccccacaaag gtgatcagag aagcggctga 5641 taaggttaag gcatttatca gcgtcgagct ttcaatgggc cagatgatcg aggacgttaa 5701 gcttgcaagc gaatgcttga agcctgttta cctttgcaac cgttcgggcg gtatgattcc 5761 cgaacctgcg cagattcttg aaatgatcga aaaactcgac ggaggtgaaa actgatggta 5821 gtatttgaaa aacccaagtc cttaactgat gcacccttgc attattgccc cggttgcacc 5881 cacggaatta ttcaccgact tgttgccgaa gcaatcgacg agctgggcat tgagggcaag 5941 accatcggtg ttgctcctgt cggatgtgcc gttatggcat ataactactt cgcctgcgat 6001 atggttgaag ctgctcacgg cagagcgcct gccgttgcaa caggcttaaa gagagctttg 6061 cccgaaaaca ttatctttac atatcagggc gacggcgacc ttgcatccat cggtatggcg 6121 gaaaccgttc acgccgcaac aagaaacgaa aacatcaccg taatttttgt taacaacgca 6181 atttacggta tgaccggcgg ccagatggct cccacatcac tccccggaca ggtcacccag 6241 acttctcctt acggaagaga tgttaaaact gtcggctatc ccatcagagt ttgtgagatg 6301 ctttccgcac tcgacggccc cgagcttatt cagcgtgttg ccgttaacaa cgtcaagaac 6361 gtcaaggcag ccaagaaggc aattaagaag gcttttgaaa accagatcaa cggcaagggc 6421 ttctctctca ttgaagttgt ttcctcttgc cccaccaact ggggtatgac tccctcaaag 6481 gctttggaat gggtcgaaac aaatatgatt ccttattacc ccttgggcgt atataaggac 6541 agaagcgcaa aggaggccga cgcaaatgac taacagtatt ttaattgcag gcttcggcgg 6601 acagggcgtt ttgtttgcag gtaagttttt ggcatataag ggacttttgg agggcaagga 6661 aatttcctgg cttccctcat acggccctga aatgcgcggc ggcacagcaa actgctcggt 6721 aatagtcagc gattcacccg ttggctcacc tatcgtttcc aatcccgaca ttttgatcgc 6781 aatgaatctg cccagctttg ataaatatga aaacagcgca aacgcaggcg gatatatctt 6841 tgcagactca acactcatct ccaaggaaac tgcaagagat gatgttaagg ctttctatgt 6901 tcccgcaaca cagatggcaa aggaccttgg aattcccaca cttgcaaata tgattttaat 6961 gggcaaggtc attaaggaaa cgggcgttgt aagcttcgat gaaatgcgcg aggctttggg 7021 caaggtcgtt tctgccaagc gtgcagagct tttggaactt aacttgaagg ctttggaagc 7081 aggatataac tattgtgact aaaaacactt gataaaaact taaaaatgtg ttagtgtgaa 7141 ataagactgc tgtattatat aacagccttg gcttgtttca cacttgcttt attaaacata 7201 ggaggcataa ggatatgctt gatattagaa ttgaaaaaac tttaaccccc aaggaaaagc 7261 ccgcaaaggg cacacctctc ggattcggcc atattttcac cgaccatatg tttgttatga 7321 actataccga gggcaaggga tggcatgacg caagaatcgt tccctttgat aatatttctc 7381 tttctcccgc atcaatggta ttccattacg gacaggaaat gtttgaaggc ttaaaggcat 7441 ataagggcga cgacgataag gtatatcttt tccgccccga tatgaacgca aagcgcgcaa 7501 acgcttcaaa cgaccgcctt tgcatcccca gaatccccga ggaggacttt gttcaggcaa 7561 ttaaggcagt tgttgatgtt gatagagatt ggattcctga ggaagaggga accagcttat 7621 atatccgtcc ctttgttatt gcaactgata atttcttggg cgttgcccct tcaaagacat 7681 atttgtttat ggttatcctc tcgccttccg gcgcatatta tgcaagcggt ttggcacctg 7741 tcggcatctg gatcgaggat gaatatgtaa gagctgtacg cggcggtatc ggatatgcaa 7801 aaacaggcgg caactatgcc gcatccttgg cagcacaggt taaggctcac gacggcggat 7861 atagccaggt tttgtggctt gacggcgttg acagaaagta tatcgaagaa gtaggagcca 7921 tgaacatcgt tttcaagatt tcgggcaagg tggtaacccc tgctctcaac ggctcaattt 7981 tgccgggtat tacaagaaac tccgttcttc agctttgccg cgattggggc tatgaagttg 8041 aagaaagaaa gatcagcgtt gatgagctga ttgaagccgc acacaacggc acccttgagg 8101 aagtttgggg aacaggcact gcggctgttg tttctcccgt cggaaagctc cgctataagg 8161 acgaggtatt caccatcggt gacggcggaa tcggagagct gacccagaag ctttatgatg 8221 agataacagg tatccaatgg ggtagacgcg aagaccccaa cggctggaga gttaccgtat 8281 aattttcaca gacaaattcg ggaattcggc aagattgcaa agcaatattg tcgaattcac 8341 agcgaccgca tcaacactta cctttatagc aaattaagac ggtcgcttgg ctacctgctc 8401 ggacacgcct tcggcgtacc cctcacagac ggcgccttaa atcagcaaac ccaaccactt 8461 aacaggagtg ataaaaatga gcgaaagaaa aattgaaacc aaatgcgttc agggcggata 8521 tacccccggc aacggcgagc ccagacagat tccgataatc cagtccacca cctttaaata 8581 ttccaccagc gaggacatgg gcaagctttt cgaccttgaa gcggaaggat atttctattc 8641 ccgtctgcaa aaccccacct gcgacgctgt tgcgcgcaaa atttgcgagc ttgagggcgg 8701 aagtgccgca atgcttacat cttcgggtca ggcggcaaac ttcttcgccg ttttcaacat 8761 tgcatcctgc ggcgaccatg ttgtttccgt ttcatccatc tatggcggaa ccttcaacct 8821 cttctccgtt acaatgaaaa agatgggcat cgactttacc ttcgttgcac ccgattgctc 8881 cgacgaggag ctggaagctg catttaagcc caacaccaag gctgttttcg gcgaaacaat 8941 tgcaaaccct gcgctcagag tgctcgatat cgagcgtttt gcaaatgccg cgcacgctca 9001 cggcgttccg cttattgtgg acaacacctt tgcaacgcct gtaaactgcc gaccctttga 9061 atggggcgca gatattgtca cacattccac caccaagtat atggacggcc acggtgcggc 9121 tgtcggcgga tgcattgtcg attctggcaa gtttgattgg gtcaagtatg ccgacaaatt 9181 ccccggactt acaacacccg atgatagcta ccacggcatt acctataccg agcgattcgg 9241 attggcagga gcatacatca ccaaggcaac agcacagctt atgcgtgact ttggttgcac 9301 acccgcgccc cagagcgcat tccttttgaa tttcggactt gagagcctgc acgtcagaat 9361 ggaacgccac tgtcaaaacg gtcttgctgt tgcgaagttc cttgaaagcc acccgatggt 9421 aagctgggtc aaatatcccg accttgaggg ggatgaggac aacgctttgg caaagaaata 9481 tctgcccaag ggttcctgcg gagttgtaag ctttggcgtt aagggcggaa gaaaagccgc 9541 cgagaagttt atgaaggagc ttagactcgc cgcaattgaa acccacgttg cagacgcaag 9601 aacctgctgt ttgcaccctg caagcgccac ccaccgccag atgaacgatg ccgagcttga 9661 agcggcaggc gttggagcag accttgtgag aatgtcctgc ggtatcgagt cggccgacga 9721 cctgattgca gatatcaagc aggcgcttga caaagttaac aactaacgga gaaactaaat 9781 gccgattaaa attccaaaca cactccctgc ggcgaaaacg ctgacagacg aaaatatatt 9841 tataatgacc gaaaccaggg cgatatcgca ggatatccgc cctcttcgga ttttgatttt 9901 aaatttgatg cccacaaaga tcgacaccga aactcagctt gtgcgcctta tcggtaacac 9961 acccttgcag gtcgaggtcg agcttatcca tacggcgtcg caccaatcga aaaacacctc 10021 tgaggagcat cttttgagct tctataagac ctttgaccag gtgaaaaacc agcgctttga 10081 cggcatgata atcacaggcg cgcccgttga aatgcttgaa tatgaggatg tcgaatattg 10141 ggatgagctt tgcgagatct ttgagtggac aaagacccac gttcattcca ccttccacat 10201 ctgctggggc gcgcaggcgg gactttatta tcacttcgga attcagaaaa agccccttga 10261 tgcgaagctc ttcggagttt tccctcacaa ggtggattat aaaaacccga ttttgttccg 10321 cgggtttgac gatgtgttct tagcacctca ttcaagacat tcaactgttg agcgggcgga 10381 tatcgaagct tgtcccgagc ttaaaattct tgcatccagc gaagttgcag gcgtttatgc 10441 ttgcatgacc caaaacggca agcagatctt cattaccggc cactcggaat atgacgcagg 10501 cacccttgca aaggaatact tcagagataa aaacaagggg cttgaaattc aaatccccgt 10561 caactatttc ccgaacgatg acgacacccg cgaacctatc gtttcctggc gggctcatgc 10621 gaatttactc tactccaact ggttaaacta ctttgtatat cagacaacgc cttacgattt 10681 gtctgaggat ctataaggag tgagaacgaa ttatggttaa acacccgaag gatagcttga 10741 cggagagtgt gcatatcgtt gtgccaaagc atttgaatgg cggaaaccga cttttcggcg 10801 gaacgctttt gaattggatc gacgatgtgg gcgcagttgc tgcccgccgc cacgcaggcg 10861 gaatggttac gggagcgtcg gttgacaatg ttcaattttt aggccctgcg tttcaaaatg 10921 aaacaatcat ctgtgtcggc aaggtgacat atgtgggcag aacctcgatg gaggtctgcg 10981 tcaagtcata tgccgagacc cttgacggcg aacgcaggct cataaatgtg gcatatcagg 11041 ttgcggttgc aattgatgaa aacggcaagc ctgtgcctgt gcccgctttg gagcccgaga 11101 cagatgagga aaaagcagaa tatgaaaacg caaaaaagcg aaaagaattc agaaacctct 11161 accgctaacg gtggaggttt tgcttttttg tgcgaatctc accgcgcggc tacctgcacg 11221 actcgccgca ttcgcggcac ccgagcagac agccgcgctt ttgcggcggc agccaaggcg 11281 ttttgcttgc gcaaaacgcc ttccttgcgc ccttcgggcg caaggcgacg gagctgaaag 11341 ctccgtcggg ctgccgcctc gcaagcgcaa // LOCUS sequence002 11363 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence002 VERSION sequence002 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..11363 /mol_type="genomic DNA" /organism="" /note="sequence002" CDS 140..1423 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLLAIILAVAMVMSMAVVAYADEAELSGNYPKYEVLFSKVYET PLAGDWSWCGSDTLGLNTATFDAAVRTDGALMVMELGTNTNWWQLQINGLFFYHGGDNN ADLGPAAAGVTSFNGATNHYIVMPCDAMLAKAEELGVTGDIKVSGGNGAGVVEAIYVIA PKAEEEAPEAIDVTIYENEAGNTFTADATTYLDPWGGFGICSEVNGQNVGNISLPELIT YAEMEGAELVITFAGGGIWGGSKPETEVQFNCWDTEEDLQVKFDIATLPSGVNKGVVKF EALISKLEALGLTTADIRNLGVQVWASEFKLHTVAIHVPAPEVEEETYRGSGYFMTGEE THAMIIGKAIITSNHEFDEDGDCKYCGHHVDVEVEDIIVEQPTESTEEESEDITVEEPK EDTNPGTGLTLAVIPAIVALAAVVISKR" /locus_tag="LOCUS_0120" /note="MGA_13" CDS 1703..2059 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MENKVKVRIIGREYTLGTDNSPEYTLELAEKLDLTMNKLLATSKS LSGIDVAILAALDAMDEAAKATANADNIRLQIGEYVTSADKARQSYDNAKREIALLKKR IEELEAKLSGSRLF" /locus_tag="LOCUS_0130" /note="MGA_14" CDS 2059..4128 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MATYTSKKPEVLSPCGGMESLYAALRSGADAVYVGGKSFSARRGA VNFTADELKEAVRECHRYGVLIYQAINTAALDSELEALAAEIKTACDVGVDGIIVQDLA TMAIAKAACPDMPLHASTQMTIHTAEGVLQARELGFSRCVVARELPLDTISELCKLDTE IEAFVHGALCMSVSGHCYLSAMIGSRSANRRGCAGACRLPFSCGKRSDDKYALSLKDMS YASHAKELCDAGVASLKIEGRMKRPEYVAAATDAMRKAVDGEKYDTDRLRAIFSRSGFT DGYLTKKLGADMFGARVKEDVTGARDVIPELRELYRAERKKFVVSFDFSATENCPVSLT ASDGENSVTVYGENPQIANNRPTEAEAIIKQLSKLGETVYDAGEISAHIGTGLMVPLSA INELRRKAIAELDEKRIETLTKIKEFKSEELSLRFPQPRIRKIPQLRVSVQSVKTLALM NLNDIEYVILPLSQAGAYLDLGYDPEKAILSLPRYMHREADVINKLEKAKELGFNRAEC TNIAHIRICKSFGILPFGGFGLNITNSLSVREYEALGLREITLSYELKAAQMNKIHASV PVGFLAYGKLPLMLTVNCPIAAQVGCKSCTGQLTDRTGAQFPISCHKDLGYYELLNSAV LHLEDRIDDFNLDVATLYFTDESPEEAQRVVKNYREGVRPNGEYTKGLYYRGIE" /locus_tag="LOCUS_0140" /note="WP_012048131.1 U32 family peptidase (Clostridium botulinum) [pid:45.3%, q_cov:41.7%, s_cov:38.1%, Eval:4.6e-67, partial hit]" /note="MGA_15" CDS 4297..4737 /product="dUTP diphosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005808844.1" /transl_table=11 /codon_start=1 /translation="MKLTFKKLKDNATIPHSATKTSAGLDLHACLDEPMTIGVGEIKTV PTGIACAPEREDVVMLVFVRSSLGRKFGLTLANSVGVIDSDYRGEILVPMVNHGSEPYT IQDGERFAQLVVTPVIFPEICLSDELDETERGVNGFGSTGKL" /locus_tag="LOCUS_0150" /gene="dut" /EC_number="3.6.1.23" /note="WP_005808844.1 dUTP diphosphatase (Desulfitobacterium) [pid:50.7%, q_cov:98.6%, s_cov:95.4%, Eval:5.5e-35]" /note="MGA_16" CDS complement(4632..6005) /product="sodium:alanine symporter family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000956710.1" /transl_table=11 /codon_start=1 /translation="MKFLTALSDAVFGLPTVAVIICMGIYYSLSLGFIQLKAKTMMKVF KQSLKGSAFSACATSLAATVGTGSVVGVAMAISLGGAGAIFWMWVSAFFGMALAYAEGV LSIKFRVKTKDGYQGGMMYSMEQGLGSRPMGATYALFATLASLGMGVMAQTNSASVSLE SEFSLDPKICGIVLAILMAFCVFSKSETVGKICSLGVPILAASYILLMLGVIAVNYKSL PEAISSIFAGAFGIRPIIGGGVGYTVKVALTQGIRRGVFSNEAGLGTTAAIHAGAKNIT PREQGYMNMFEVFVDTFVICTLTALAILSSGADISSSGVDMLISACETAFGSLSGGLIA VCVAGFAVATAVGWSQIGKSAFLYVTKGKFSGIYNIIYIVCAFLGAITSLEAVFTLSDI FNGLMALPCLTALMLLSSHVKREAQSLPVEPKPLTPRSVSSSSSDRHISGNITGVTTS" /locus_tag="LOCUS_0160" /note="WP_000956710.1 sodium:alanine symporter family protein (Streptococcus) [pid:40.9%, q_cov:95.0%, s_cov:99.3%, Eval:6.4e-88]" /note="MGA_17" CDS 6039..6479 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRKYTPKIAALYTIQVLIFLVSVLITALAILYLSSFRILMSVLII ICWALATLFGLWLLPMYFRRTVMYLGTGEISIHSGLLFLWREHMKISAVQYVSLIKVPL SGLTGFNFVLVHGLGGTVILPFLSKPDADEIIAVLNLRISEQ" /locus_tag="LOCUS_0170" /note="MGA_18" CDS 6598..8073 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTIKGRQHPIKLFSYTTKYFWLLIIPVLRSLYAIFFEGDSWERWI TGAWVDLLVLAAIIGFAYLRWSSVEFMFDDKSLTVQKGIFFTVSEQVFYPQISTVSIYQ GFLYRALGACTVKIGTNAGMLDKADVSIVMKRSDADKFYQAMRASRVKSLNYSVSPNKL RLLVFSFIFSSSFSGVALIIALLLEAGSMIDRRAEAQFVLNTLTEALNKAAIYVPPILA GVALFLGITWVLSFASNIFYFWDHILTKCSDTLYIRSGLITKRRSIISLDKINFVDFRQ NLLARLFKISSLNVHAAGFGDTGRSEMSAIMPITTKKELVSTIREVFPEYPAPKITLRS DIKSYKGFYVWPFWCLIIPLCGFLVLKNLAPEWYAVAEPAMIISLIPALWLTVVKTAAL FSTGIGFEKGYVSLRYAKFFAFHTVIMPKSRITKIELRQSVFQRINGTCTLKIYSAADS KKVHRIHGLRMDRAMNMLDNNGYDLYFTENPEG" /locus_tag="LOCUS_0180" /note="MGA_19" tRNA 8172..8248 /product="tRNA-Met" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0010" /note="Aragorn_1" tRNA 8251..8325 /product="tRNA-Glu" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0020" /note="Aragorn_2" CDS complement(8701..9516) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEVWVKFFSEGFFGYAEKGNFKYYSLAHFIPLILLALAIYLTYRY RDKLKNWKHEENLRFAFAFVMLLAEMSYFWRLLYVGSSNPEMTTLLDKLPLQVCEWTCI CAIFMITKKSELLYQVCFYVCLTIGIFPLLTPSVISQTGPAYFRYYQFWLEHILPIVAV FYMTFVHGFRPKFKGIALSTGFMMALAAMALICNFNIEGANYLYLARGTTDGGGSIMDV LIKIAPSVWARLAFLTVVVLAMFFLAYGIYRGICKLASKKSEHKAKIPV" /locus_tag="LOCUS_0190" /note="MGA_21" CDS complement(9543..10376) /product="polysaccharide deacetylase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963680.1" /transl_table=11 /codon_start=1 /translation="MFKMRFPGGLKKTFTLSYDDNLYDDIRLMELMQKHGIKGTFNLSS DINREESEAPEGRWPRMTLAEALDNYPKYGVEVAVHGLRHRDFTKITEPELYYEISADK ANLEVRYNRVIRGAAYPYGSWNQTAVEALKKCGIKYCRTVWCDQNFTIPSGDGWLALKA TCHHNVPNLMELAKNFAGLDPNECKMFYVWGHTAEFRNDNNWNVIEELLEFIGEREDIW YATNIDICEYCLAYEKLEYSAAPDSNMVYNPTAKEIWLEHFGHVFSVKPGETVKI" /locus_tag="LOCUS_0200" /note="WP_010963680.1 polysaccharide deacetylase family protein (Clostridium) [pid:39.9%, q_cov:98.2%, s_cov:97.0%, Eval:6.0e-47]" /note="MGA_22" CDS 10552..11319 /product="TatD family hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435866.1" /transl_table=11 /codon_start=1 /translation="MLSHIFETHSHYDAEQFDGIREQLIESLFERNIAGIIHAATDIKS SEFGIETANKYERFYTSVGFHPEYASEVPENAIEVLKELAKKDKVVAIGEIGLDYHYEG YDREAQIELFRAQLELANELNLPVIVHSRNATEDTLEILRELRPRGVMHCFSGSAETAK ELIEMGFYISLTGVLTFKNAKKASKVMEALPLDRFMLETDCPYMAPEPHRGELCDSSMI RFTAQKAAEIKGISLEQMLMATEENAKRFFGIK" /locus_tag="LOCUS_0210" /note="WP_003435866.1 TatD family hydrolase (Clostridioides difficile) [pid:47.5%, q_cov:98.4%, s_cov:99.6%, Eval:2.8e-64]" /note="MGA_23" ORIGIN 1 cataaaccga tacctattat tgatgttttg cacagaaaga tatttgaaag gctaaaaact 61 attgactttt tgcgcaagtt cgcgttataa ttatcctgtt aaattgcctt taacaaatta 121 tattaggagg acaatatata tgaaaaaact tttggcaatt attttggcag ttgctatggt 181 aatgtccatg gcagttgttg cttatgctga cgaggctgaa ctctctggaa actatcctaa 241 gtacgaagtt ctctttagca aggtttatga aacacccctt gcaggcgatt ggtcatggtg 301 cggttcagat actctcggtt tgaacactgc tacttttgac gctgctgtaa gaactgacgg 361 cgctttgatg gttatggaac ttggcaccaa tactaactgg tggcagctcc agatcaatgg 421 tttgttcttc taccacggcg gcgacaacaa cgctgacctt ggtcctgcgg ctgctggcgt 481 aaccagcttc aacggcgcaa ccaatcacta catcgtaatg ccttgcgatg ctatgctcgc 541 aaaggctgaa gaactcggcg ttaccggcga cattaaggtt tccggcggta acggtgccgg 601 cgttgtagaa gcaatctatg ttattgctcc caaggctgag gaagaagctc ctgaagctat 661 cgacgttact atctacgaaa acgaagcagg caacaccttc actgctgatg ctaccaccta 721 cctcgatcct tggggaggct tcggtatctg ctctgaagta aacggccaga acgttggtaa 781 catttccttg cccgaactta tcacatacgc tgaaatggaa ggcgcagaac tcgttatcac 841 cttcgcaggc ggcggaatct ggggcggctc caagcccgaa actgaagttc agttcaactg 901 ctgggatact gaagaagatc ttcaggttaa gttcgatatc gcaaccttgc ccagtggcgt 961 taacaagggc gttgttaagt tcgaagccct catctccaag ctcgaggctt tgggcttgac 1021 caccgctgac atcagaaacc tcggtgttca ggtttgggca agcgaattca agctccacac 1081 cgttgcaatt cacgttcccg ctcccgaagt tgaggaagaa acctaccgtg gctccggtta 1141 cttcatgacc ggcgaagaaa cccatgctat gatcatcggc aaggcaatca tcacttctaa 1201 ccacgaattc gacgaagacg gcgactgcaa gtactgcggc caccacgttg acgttgaagt 1261 tgaagacatc attgttgaac agcccaccga atctaccgaa gaagagtccg aggatatcac 1321 cgttgaagag cccaaggaag ataccaaccc cggtaccggc cttactctcg ctgtaatccc 1381 cgcaatcgta gcactcgctg cagttgtaat ctccaagaga taatttaaca actcacaata 1441 acattctccc gctccgagca atcggggcgg gagttttttg tatgcgggca ggcacacagg 1501 cctgccccta tggcaatata agggcgaccc tatgtggtcg cacgaaaacc gcaggacgga 1561 tgaggtgtca gctttgccga tggagagggc atagtacggt atctgcacct ttttctcaaa 1621 aatcccccgc aaaaccttgc aatctcgcaa tatataatgt ataatcaaat tgacatatta 1681 tagattaacg gagggcaaat atatggaaaa caaggtgaaa gtaagaatca tcggcagaga 1741 atatacttta ggtaccgata actcccccga atatactctt gagcttgccg aaaagcttga 1801 tttgacaatg aacaagcttt tggcaaccag caaatcttta agcggaattg acgttgcaat 1861 tttagcagcg ttggatgcta tggacgaggc tgcaaaggca actgcaaacg ccgacaatat 1921 ccgtctgcag atcggcgaat atgttacctc cgctgacaag gcaagacaga gctatgacaa 1981 cgccaagcgc gagatcgccc ttttgaaaaa gcgcattgaa gagcttgaag caaagcttag 2041 cggctcgcgt cttttctgat ggcaacatac acttctaaaa aaccggaggt tttgtcccct 2101 tgcggcggca tggagtcgct ttatgccgct ttgcgctcgg gagcagatgc cgtatatgta 2161 ggcggaaaga gcttttccgc cagaagaggc gccgttaatt tcaccgctga tgagctaaaa 2221 gaagctgtcc gcgaatgtca tagatacggc gttttgattt atcaggcgat caacaccgcc 2281 gcacttgatt cggaacttga ggcccttgcc gccgaaatca aaactgcttg cgatgtgggc 2341 gttgacggaa taatcgttca ggatttggcg actatggcga ttgcaaaagc tgcttgcccc 2401 gatatgccgt tgcacgcttc aactcaaatg accattcaca cagccgaggg cgttttgcag 2461 gcgcgtgagc tcggtttttc gcggtgtgtc gttgcccgcg agctaccgct tgatacaata 2521 agcgagcttt gcaaacttga tacggaaatt gaggcatttg ttcacggcgc tttgtgtatg 2581 tccgtgtcgg gacattgcta tttaagtgcg atgataggct cccgctcggc aaaccgacgg 2641 ggatgcgcgg gagcttgccg tctgcccttt tcctgcggca aacgcagtga cgataaatat 2701 gccctatcct tgaaggatat gtcatacgct tcccatgcaa aggagctatg cgatgcaggg 2761 gttgcatctt taaaaatcga gggacgaatg aagcgccccg aatatgtcgc cgcggcaacg 2821 gatgcaatgc gcaaggccgt tgacggcgaa aaatatgata ccgatcgctt gagagcaatt 2881 ttttctcgaa gcggatttac cgacggatat ttgacaaaaa agttgggtgc tgatatgttc 2941 ggcgcgcgtg ttaaggaaga tgtcacgggt gcgagggatg taatcccgga actgcgtgag 3001 ctttaccgcg cagagcgcaa gaagtttgtg gtaagctttg atttttccgc cactgaaaac 3061 tgtcccgttt ctcttacggc aagcgacggc gaaaacagcg taacggtata tggtgagaat 3121 ccccaaattg caaacaaccg ccccaccgag gcagaagcaa tcatcaaaca gctttcaaag 3181 cttggcgaaa cggtatatga tgcgggcgag atttctgcgc atatcggcac ggggctgatg 3241 gtaccattat cggcaatcaa cgagctaagg cgaaaggcaa ttgccgagct tgacgaaaaa 3301 cgcattgaaa ccttgacaaa aatcaaagaa ttcaagagcg aggagctgag tcttcgattc 3361 cctcagccaa gaatcagaaa aattccgcag cttcgcgtga gcgttcaaag cgtcaagact 3421 cttgcgctga tgaatctgaa cgatattgaa tatgtcattt tgccattatc gcaggcggga 3481 gcatatttgg acttggggta tgacccggaa aaggcaattt tgagtctgcc gcggtatatg 3541 catcgcgagg cggatgtcat aaataagctc gaaaaggcga aagagctcgg atttaatagg 3601 gcagagtgca cgaatatcgc ccacataaga atatgcaaaa gctttggaat tttgcccttt 3661 ggcggatttg gactgaatat tacaaattcg ctgtcggtgc gcgaatatga agctttgggg 3721 cttcgggaaa ttaccctttc atatgagctt aaagccgcac agatgaacaa aattcacgca 3781 tcggtgcccg ttggcttttt ggcatacggc aagttgccgc taatgctaac ggtcaactgt 3841 ccaattgcgg cacaggttgg ttgcaagagc tgtacaggtc agctcaccga ccgcacagga 3901 gcgcagttcc cgatttcctg ccacaaggat ctgggatatt atgagctttt gaattcggca 3961 gtcttgcatc ttgaggatcg aattgacgac tttaaccttg atgtcgcaac gctgtatttc 4021 accgatgaat ctcccgagga agctcaaagg gtggttaaaa actaccgcga gggcgtaagg 4081 ccgaacggag agtataccaa ggggctatac taccgcggta tcgaataaaa caaaacattg 4141 cgcgctgata cggcgccgcc aattttcccg cccccctaat gtgggcggga aaatccgcca 4201 agaagcgcga cgcgcttctt ggcctgcgcc gccctgcggg cggcgaggcg gcgcctcgca 4261 agcgcataac tattcgcaat gaaggagcaa caaaaaatga aactcacctt caaaaaactc 4321 aaagacaacg caaccattcc ccattccgcc accaaaacca gcgcgggact ggatctgcac 4381 gcttgccttg acgagccgat gacgatcggt gtcggagaga tcaaaacggt gcccacaggc 4441 atcgcttgtg cgcccgagcg ggaagatgtt gtaatgctgg tgtttgtgcg ctcatccttg 4501 ggaagaaaat ttggccttac tcttgccaat tctgtcgggg tgatcgattc tgattatcgc 4561 ggggaaattt tggttccgat ggtcaatcac ggaagtgagc cgtatacaat tcaggacggc 4621 gagcgctttg ctcagcttgt tgtgacaccc gtgatattcc ccgaaatatg tctgtcggat 4681 gagctggatg aaactgagcg gggagttaac ggcttcggtt cgacaggcaa gctttgagcc 4741 tcgcgcttta cgtgactgct caaaagcatc agcgccgtta agcatggcag agccattaag 4801 ccgttaaaga tgtcgctgag cgtgaatact gcttcaaggc tagttatcgc tcccaagaac 4861 gcgcagacga tgtatatgat gttatatatt ccgctgaatt tgccttttgt cacatataaa 4921 aatgcgcttt tgccgatttg cgaccagccc accgctgttg caaccgcaaa tcctgcaacg 4981 caaacggcaa tcagcccgcc cgaaagggaa ccaaaagctg tttcgcaagc ggaaatcagc 5041 atatccacac cgcttgatga tatgtccgcg cccgaggaca agattgcaag tgcagtcagc 5101 gtgcatataa caaacgtatc gacaaatact tcaaacatat tcatatatcc ttgttcgcgg 5161 ggtgtgatat ttttggctcc tgcgtgaatt gccgcggtcg tgcccaaacc tgcttcgttt 5221 gaaaatacac ctcggcggat gccttgggtt agggcaacct tgacagtata tcccactccg 5281 ccaccgatta tcgggcggat gccgaaggct cccgcaaaaa ttgacgatat ggcttcgggc 5341 aatgatttat aattcacggc gatgacgccg agcatcaaaa gaatatacga ggcagccaaa 5401 atcgggacgc ccaacgagca gatttttcca acggtttctg attttgaaaa tacgcagaaa 5461 gccataagaa tggcgagaac gatgccgcag attttcgggt caagcgaaaa ctcgctctca 5521 aggctgactg aggctgaatt tgtttgtgcc attacgccca taccaaggga agcgagcgtt 5581 gcaaaaaggg catacgtagc acccatggga cgtgaaccga gcccttgctc cattgaatac 5641 atcattccgc cttgataacc gtctttggtt ttaacgcgga atttgatgct taaaacgccc 5701 tcggcatatg caagagccat tccgaagaat gcagacaccc acatccaaaa aattgcacct 5761 gcaccgccca gcgatattgc cattgcgacg ccgacaacgc tgcctgtacc cacggttgcg 5821 gcaagtgatg tggcgcaggc ggaaaatgcg cttcctttaa ggctttgctt gaaaactttc 5881 atcattgttt tggctttaag ctgaataaac ccaagggaaa gcgaataata aatacccata 5941 catatgatta ctgcgacagt aggcaacccg aaaacggcat cacttaatgc agttagaaat 6001 ttcaaaaaca cacccccact accgaaagga ggacaacaat gcgaaaatat accccaaaaa 6061 ttgccgcact ttataccatt caggtgctta tattcttagt atccgtgttg atcactgcgt 6121 tggcaatttt atatctgtcc tcatttagaa ttcttatgag tgtgctgata attatatgct 6181 gggcattggc cacacttttt gggctgtggc ttttgccgat gtatttcaga agaactgtta 6241 tgtatctcgg cacaggggag ataagcatcc actcggggct tttgttcctc tggcgggagc 6301 atatgaagat aagcgctgtg caatatgtca gcctgataaa agttcccctt tcgggattga 6361 cgggctttaa cttcgtgctg gttcacggac tcggcggtac tgttatattg ccgtttcttt 6421 caaagcccga tgcagatgag attattgcag ttttaaactt gcggataagc gagcagtagg 6481 cacgctacgc gccacctgct tacacacccc catcgggggt acgtttcgca gacggcgctc 6541 cgcttcaatg acgcatcgat cagccaaccc aaaatccaca agaaaggagc cgataatatg 6601 accattaaag gcagacagca cccgatcaag ctgttcagct atacaactaa atatttctgg 6661 cttcttatca tccccgtgct gagaagctta tatgcgatat tcttcgaggg tgactcgtgg 6721 gagcgttgga taacaggcgc atgggttgac cttttggttt tagctgccat catcggcttt 6781 gcatatctgc ggtggtcgag cgttgaattc atgtttgatg acaagtcact gactgtgcaa 6841 aaaggaatct ttttcaccgt cagcgagcag gttttttatc cccaaatttc tacagttagt 6901 atatatcaag gatttttata cagagcgttg ggcgcttgca ccgttaaaat cggcacaaac 6961 gcaggaatgc ttgacaaagc agacgtcagt atcgttatga aaaggtccga tgcggataag 7021 ttttatcagg caatgagagc atcgcgagtt aaaagcctta actattccgt gtcaccgaat 7081 aagctcaggc ttttggtgtt ctcctttatc ttttcgtcct ccttctcggg cgttgcgctg 7141 ataattgctt tgcttcttga ggcagggtcg atgatcgacc gccgcgccga ggcacagttt 7201 gttttgaaca ccttgaccga agctctgaac aaagcggcaa tatatgtccc gccgatattg 7261 gcaggcgttg cgctgttttt gggcatcacc tgggttcttt cctttgcaag caacatcttt 7321 tatttttggg atcacatttt aacaaaatgt tccgacactt tgtatatccg ctcgggacta 7381 attacaaaac gccggagcat aataagcctt gataagatca actttgttga ctttcggcag 7441 aatcttttgg cgaggctgtt taaaatatcc tcgctgaatg ttcacgctgc aggctttggt 7501 gacacaggca gaagcgaaat gtccgcaatt atgccgataa ccaccaaaaa agagctggta 7561 tccaccatta gagaggtctt ccccgaatat cctgcgccga agataacttt gcgctcggat 7621 atcaaaagct ataagggttt ttatgtctgg ccgttttggt gtttaattat tcctctttgc 7681 ggatttttgg tactaaaaaa cctggcaccc gagtggtatg ccgtggcgga accggcaatg 7741 ataatcagcc tgattcccgc gctgtggctg acagttgtta aaacagcggc gctcttttca 7801 acaggcatcg gatttgaaaa agggtatgtg agtttgcgat atgcaaagtt tttcgcattc 7861 catacagtca taatgccgaa atcgcggata acaaaaattg aactgcgcca gtcggtattt 7921 cagcgcataa acggcacctg caccttaaaa atctattctg ccgcagacag caagaaggtt 7981 caccgcattc acggcctgcg aatggacagg gcgatgaata tgctggacaa taacgggtat 8041 gacttatatt tcaccgagaa tcccgaggga taaaacaaat gaaaattttt tcgaaaattt 8101 ttgaaaaagg tattgacaaa tctctcggag ttgattataa tgtacaagtc accttgagtg 8161 atatggcttt tggctttata gctcagctgg ctagagcact cggttcatac ccgaggtgtc 8221 actggttcaa atccagttaa agccaccatc ggcccgttgg tcaagcggct aagacaccgc 8281 cctttcacgg cggaaacatg agttcgattc tcgtacgggt caccaaaaaa tccatccgat 8341 taagtcggat ggatttttta ttcaaccgga aggcttggtg ttcaggaaca agttgccctg 8401 cggaatagcc ttcataatga aaagcaagag gataaaataa gaaaggacag ggaatttttt 8461 acgttctctg tccttttcat tagtgacaaa atctatgcga tatgtttgct tgcgcaaacg 8521 cgatatattc tcgcttacgc ttcgattgcg atataacctc ccggttggtc ggttgcaata 8581 tgatataaat ccgcaaacgc ccgcagggca tatcgcatcg aagatatatc gcacgtcgca 8641 gcgtatatcg caaatctcgt aagagattta tatcgttgta acctgctctt gagcaggtta 8701 ctaaacgggg atttttgctt tatgttccga ttttttagat gcaagtttgc agatgccgcg 8761 gtatatgccg tatgcaagga agaacattgc cagcacgaca accgtaagaa atgcaagtct 8821 tgcccaaacg cttggcgcaa ttttaattag cacatccatt attgaaccgc cgccgtcggt 8881 ggtgcctctt gcgagataaa gatagttcgc accttcgatg ttgaagttgc agatgagcgc 8941 cattgccgcc aaagccatca taaagccggt tgaaagggca atgcctttaa acttgggacg 9001 gaagccgtgg acaaaggtca tatagaacac ggcaacgatc ggcaaaatat gctcgagcca 9061 gaactgataa taacggaaat atgcagggcc cgtctgcgat attacagagg gagttaacag 9121 cgggaagatg ccgatcgtca ggcagacata gaagcagacc tgataaagaa gctcgctctt 9181 tttggttatc ataaatatcg cacatataca ggtccactcg cagacctgca agggcagctt 9241 gtccagcagg gttgtcattt cggggttgct gcttccgaca tacagaagcc gccagaaata 9301 tgacatttcc gccaatagca tcacaaacgc aaaggcaaaa cgcaggttct cctcatgctt 9361 ccaattttta agcttgtcgc gatagcgata tgtaagataa attgccaggg caagcaaaat 9421 aagcggaatg aaatgagcga gtgaatagta tttaaagttg cctttttcag cgtatccgaa 9481 gaaaccttcg ctgaaaaact taacccaaac ttccataatt aagtcctcct attggccggc 9541 ggtcagattt taactgtttc gccgggctta acgctgaata catggccaaa atgctcaagc 9601 caaatttcct tggcggtggg gttataaacc atattcgaat cgggagctgc ggaatattca 9661 agcttttcat atgccaagca atactcgcag atgtcgatat tggtggcgta ccagatgtcc 9721 tcgcgttcgc cgatgaattc aagaagctct tcaattacat tccagttgtt gtcattgcgg 9781 aattctgcgg tatgtcccca aacatagaac atcttgcatt cattcgggtc aagccctgcg 9841 aaattctttg ccaattccat gaggttgggc acattgtggt ggcaggtggc tttcaaagcc 9901 agccaaccgt cgcccgaggg aattgtgaag ttctggtcac accagactgt gcggcaatat 9961 ttgatcccgc actttttgag agcttcaacc gcagtctgat tccagcttcc gtaagggtat 10021 gccgcaccgc ggatgacgcg gttatatctt acctctaagt ttgccttgtc ggcggaaatt 10081 tcgtaatata gctcgggctc ggttatcttg gtaaaatcgc ggtgacgcaa accgtgaaca 10141 gcaacctcga caccatattt gggatagtta tccaaagctt ctgccaaagt cattctcggc 10201 cagcgtccct cgggggcttc gctttcttcg cggttgatat ccgagctgag gttgaatgtg 10261 cctttaatgc cgtgcttttg catcagctcc atcaagcgga tatcatcgta aagattgtca 10321 tcatagctga gggtgaaggt cttttttaaa ccgccgggaa atctcatttt aaacattatc 10381 aaatcatcct ttcatgggtg ttgcattttt ggggtgaaca tattaaaata ctaatatgac 10441 tataaccatt ataaaacagc gggaaagact tttcaacagg aaagaacgct ttttgttgat 10501 tagttataag ttgttcccgc aagatttgta tatattttaa ggagaagcaa aatgctgtca 10561 cacatttttg aaacccattc gcattatgat gccgagcagt tcgacggaat cagagagcag 10621 ttgattgaaa gtctgtttga aagaaatatc gcaggaatca ttcatgcggc aacggacatt 10681 aaatccagcg aattcggaat tgaaaccgca aataaatatg agagatttta tacatccgta 10741 ggcttccatc ccgaatatgc aagcgaggtg cctgaaaacg ccattgaggt tttgaaagag 10801 cttgcaaaga aggacaaggt ggttgcgatc ggtgagatcg ggcttgatta tcactatgag 10861 ggatatgacc gcgaggcgca aattgagctt ttccgcgcac agcttgagct tgcaaacgag 10921 cttaatttgc ccgttatcgt tcactctcgc aatgcgacgg aggacacact tgaaattttg 10981 cgtgagttga gaccgagagg agttatgcac tgcttttccg gctcggctga aacagcaaaa 11041 gagcttattg aaatgggatt ttatatcagc ctgacaggtg ttctgacatt taaaaatgca 11101 aagaaagcca gcaaggtgat ggaagcgttg ccgcttgata ggtttatgct tgaaaccgac 11161 tgcccatata tggcgccgga gcctcacaga ggcgagcttt gcgattcgtc gatgattaga 11221 ttcactgcac aaaaggccgc ggaaattaag ggcatcagcc ttgagcagat gttgatggcg 11281 actgaggaaa atgcgaagag gttctttggg attaagtgat cggtgctgcg gaacctacgt 11341 ttgcgcatag ctaagcgatg ggc // LOCUS sequence003 10663 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence003 VERSION sequence003 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..10663 /mol_type="genomic DNA" /organism="" /note="sequence003" misc_feature <1..783 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011860677.1:phosphoribosylformylglycinamidine synthase" /note="WP_011860677.1 phosphoribosylformylglycinamidine synthase (Clostridioides difficile) [pid:62.7%, q_cov:100.0%, s_cov:20.5%, Eval:1.3e-96, partial hit]" /note="MGA_24" /locus_tag="LOCUS_0220" CDS complement(1022..2500) /product="glycoside hydrolase family 43 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010890799.1" /transl_table=11 /codon_start=1 /translation="MVKKLVMVLLAMTMCLCLCTPISAENPIVQTCFTADPAPMVYGDT VYVYVGEDAIGDGGNYNMPHWRCYSTTDMVKWTDHGAVMRSDDFEWALPGSAWAAQCIE RNGKFYLYTTVTTEEFGGGRAIGVGVSDSPTGPFEDALGKPLAGPNWIYIDPTVFIDDD GQAYLYWGNPTLHVVKLKKNMIALDGEIKEFSMTYKAFGQMIDPDGSHDDCYEEGPWVH KRNGIYYLVYAGYGTPESICYSTSDSPTGGWEYQGIIMNNKNSFTIHPGIIEFKGKNYF FYHGGDLEGSAWNLRAVCVAEFEYNEDGTIPLIIQTTKGVEAIATLDPYSRVEAETICW SEGLKTDMAENGMYVTDVDNGDYIKVENVDFSDGGAINFIANIKANANAIIDVRLDSMF GELAASLNVKKTQDWENIKCNCENITDVHDVYILFRTEAEDALEIDYWQFLREGDEVVT TAEADISTPVVAVAVFVIVAGLAVILVATRKKKK" /locus_tag="LOCUS_0230" /note="WP_010890799.1 glycoside hydrolase family 43 protein (Clostridium acetobutylicum) [pid:47.5%, q_cov:92.7%, s_cov:99.6%, Eval:2.9e-118]" /note="MGA_25" CDS complement(2530..4053) /product="cellulase family glycosylhydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010920215.1" /transl_table=11 /codon_start=1 /translation="MAIKICKNGSASFKNNVLFCVGTGKMGLALHKEYYDQLALVQKEI GFKHIRGHGLFCDDMAIYQENTDREGNTTIEYNFTYLDRVVDSYLSVGIRPFLELGFMP YKLKSAENYVFHWRGNTSPPKSYEAWQELIKATLNHLISRYGEEEVLSWPIEVWNEPNL PGFWYKADMEEYFKLYTMSANAVKAVDERFKVGGPAICGGADEKWMRGFLNFCRETNPP LDFITRHHYTTHFPKPQGHYGYASLMGTREALDTLKNVRAMIDEYDEFKDLPFYITEFN TSYIPNCPMHDTNENAAELARTLSEIGDYTDGYSYWTFGDVFEEQGVPHSLFHGGFGMV ADRCIPKPTFYTFKFFKELKGECIWRGENGVITREKNGTLKGVLWNVTRDSKTDLLHLD FDIDTEAGEYMLLTQTVDEEVCNPLKAWHDLGEPKMPSESEIELIRGCARPLCKTERIA SEGTLALGFDIKKNGLVYFETKIAPMKGDRGYDYARVTMGENKWEEEHQ" /locus_tag="LOCUS_0240" /note="WP_010920215.1 cellulase family glycosylhydrolase (Caulobacter vibrioides) [pid:31.5%, q_cov:90.3%, s_cov:93.2%, Eval:1.0e-65]" /note="MGA_26" CDS 4213..5532 /product="SGNH/GDSL hydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963858.1" /transl_table=11 /codon_start=1 /translation="MKPKKYIALFVALIMLGSLVGCGANTSSNGVSPEELEQPDIIIDV TDSNGDASESTTSHTTETKEETTEMTTENTVEATYRKYSAIPEFVKLIGRTYLDDEDVL WIPQSAGGIEFLANGSDLRITLAGDNSATPFSDSAVRYAIYINGERVADQMMKSSDLTL GINLPEGENKVRFVKLSESANGIIGIKHISILSTQDIKPTPESSLKIEFIGDSITCGYG VDDENREHHFSTETENATKTFAYKAAQILGADYSMVCYSGHGIISAFTGDGKINESGVV PKIYTQVGKTWDHSFKVNVNELEWDFDGFDADIVVINLGTNDNSYVKGDADRAKEFEAG YVDFLKLIRKNNPNAHIVCALGIMGADLYGSVEASAETFTKETGDDNISCLKFGTIMGN EGYSADWHPTEATQTRCADELIQHLITISDEAKALYEANN" /locus_tag="LOCUS_0250" /note="WP_010963858.1 SGNH/GDSL hydrolase family protein (Clostridium) [pid:29.3%, q_cov:77.2%, s_cov:88.5%, Eval:6.0e-27]" /note="MGA_27" CDS complement(5582..6508) /product="diacylglycerol kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003233894.1" /transl_table=11 /codon_start=1 /translation="MNKKLLFVYNPHSGMQVIARNLAKIIDYFTKSGYDVTAHPTQAKG DCMATVERLCNSYDLCVFAGGDGTLNEAINGMINADCNKPYGYIPCGSTNDFSHSVGIP RQTMEAAKVAVEGKPIAYDVGKLNERYFTYVAAFGTLTEVSYSTPQETKNALGFLAYVL EGIVALGQMKSFQIEFESDVRSGSGDYLIGLVSNTLHVAGMKNFLGKDISLDDGLFEVI LIKRPQDLLELNSILTSVAKQELDSEYIDYFKADRLSVKCAEGLSWTLDGENGGRHVVS NISCHTKALAVKTNGKKNQFELSNLDG" /locus_tag="LOCUS_0260" /EC_number="2.7.1.107" /note="WP_003233894.1 diacylglycerol kinase (Bacillus) [pid:36.1%, q_cov:89.0%, s_cov:90.8%, Eval:7.1e-47]" /note="MGA_28" CDS complement(6545..6862) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGLFSRKKKQVTPTYKELERFDGKPLQYAVERIDGQEKVLGKSGG IIILEDAVVVMCEAKEIFRCKLEGATVAELLSGNGAEISGYDAYTGEKRYVVAHYSYYR K" /locus_tag="LOCUS_0270" /note="MGA_29" CDS complement(6872..7447) /product="Maf family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001226275.1" /transl_table=11 /codon_start=1 /translation="MLENINVILASKSPRRRELMEFIKHEFEIIPSLKEEVVPEGLDIE DIPAFLAAQKALDISRDRRDSLVIGCDTVVTLGGVIMGKPSDETDAKAMLMRLSGRTHT VISGVCLCYMGRTMTFTEKTSVTFYDLTEDEIDSYIASGSPLDKAGAYGIQDGAALFVK KIDGDYYNVVGLPVAKLAREIKTLIKLV" /locus_tag="LOCUS_0280" /note="WP_001226275.1 Maf family protein (Bacillus) [pid:52.0%, q_cov:93.7%, s_cov:93.7%, Eval:7.7e-46]" /note="MGA_30" CDS 7577..8443 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSEFLHLILHTLEHTFLDSIKMLPFLFGVYLLIEFLEHKAENKIE DLLRRLGPFGPVGGAVLGCLPQCGFSVAASNLYSGRLISLGTLMAVFIATSDEAIPILL TNPGRGQDILRLLVAKMVIAVVAGLFIDAVLKFFRKRVNEEAPPYSDLCENCGCENHSI LYSAFKHTLQIFIFLFAVSFVFGFVIELVGEDTLNKVLMSDSLIQPFLAALIGLIPNCA PSVILTELYVSGAVSFGSVVAGLSTGAGMGLVVLFKTNKNLKQNLAIMGALYAIGAVSG LIINLVF" /locus_tag="LOCUS_0290" /note="MGA_31" CDS complement(8803..9498) /product="M23 family metallopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003360546.1" /transl_table=11 /codon_start=1 /translation="MKKVKFSKNGRVGKWLYVTLCIGVVAISAATVAGYRHAMNSLTDN LVNNEPNEPLEDIDYSEVDAILKDIEKQQAEANAQVTQDIQSELEAVFYEQAVYMPVAN GDVIGEFSFGELVKSSTGVWRTHDGVDLKADPGDPVKSMTGGTVTDVYNDQLWGNCIAI DHGDAITGYYFGLTADALVNVGDKVDAGQIIGYVGETELEADMEPHLHFALKLADQWID PISYIEPYK" /locus_tag="LOCUS_0300" /note="WP_003360546.1 M23 family metallopeptidase (Clostridium botulinum) [pid:26.6%, q_cov:98.3%, s_cov:96.8%, Eval:2.2e-14]" /note="MGA_32" CDS 9714..10193 /product="QueT transporter family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003434065.1" /transl_table=11 /codon_start=1 /translation="MKNLSTKRLAKLAVVSAIYVALTLSLSFMAYGNIQFRIAEALMLL CFYKKDYGISLILGCLIVNLFSPMGLVDVVFGTLATVVAVALIYISPNIYVASLMPVVS NAIIVGAEIWWAFDMPFAISAIEVAAGEFVCVSILGVVLFKVLEKNSRFMRMIRE" /locus_tag="LOCUS_0310" /note="WP_003434065.1 QueT transporter family protein (Clostridioides difficile) [pid:45.0%, q_cov:88.7%, s_cov:89.8%, Eval:6.6e-30]" /note="MGA_33" ORIGIN 1 attcccgtat tccccggcac taactgtgaa tttgactcgg ccaaggctat ggacgatgca 61 ggtgcagaaa gtaagattat cgtaatcaac aacctgtcag cagaaggtat tcagagaagt 121 gttgaacagt atgcaaacga gcttaaaact gcacagatgg tattcatccc cggtggattc 181 tcgggcggtg acgagcccga cggctccggc aagttcatta cagccttctt cagaaatgcc 241 gcaattaaag acggcgttca cgaacttttg aacaatcgtg acggtttgat gtgcggcatc 301 tgcaacggct tccaggcact catcaagttg ggtcttgtgc cttacggcaa gatcatcgac 361 accgatgaaa actgcccgac cttgaccttc aataccatcg cccgccacca gtcgagaatt 421 gtcagaacaa gaattgcttc caacaagtcg ccttggttgg cgctcacaaa tgtcggcgat 481 atatacaatg ttccgatttc ccacggcgag ggcagattcc ttgcaagcga ggagcttatt 541 aaggagcttg ccgcaaacgg ccagatcgca acgcagtatg ttgacctttc gggcaatgcc 601 accagcgaca ttcacttcaa ccccaacgat tcgatgtatg ccatcgaggg tatcacctct 661 cccgacggca gagtattcgg taaaatgggt cactcggaga gaatcggcgc aggactttac 721 aaaaacattc ccggcgaata tgacattaag atgttcaagg ctgcggttaa gtattttaag 781 taaacattat cttataaggg gaaccccgaa cgggttcccc ttatattatc ccctcctgca 841 tcggcttcgc tcgcgctcac gagcgtaaat gaatttacgc tctgcgccga ttaaggaata 901 aaatccgagg caaagccccg gattttatat gcttatgcta tatttcaccc caaacgggtt 961 cccctttttg tttgtgcata aaaagagccg tcccaaatcg gaacggctca tatatattta 1021 tttacttttt cttttttctt gttgcaacga gaatcactgc caagccagca acgattacaa 1081 ataccgcaac agctacaaca ggtgttgata tatcagcctc ggctgttgtt accacctcgt 1141 cgccctcgcg caaaaactgc caatagtcaa tttcaagcgc atcctcagcc tcggttcgga 1201 aaagaatata tacatcgtga acatctgtaa tgttttcaca attgcatttg atgttttccc 1261 agtcctgagt ctttttgacg ttcaggcttg ccgccaactc tccgaacatc gaatcaaggc 1321 ggacatcaat tattgcattg gcgtttgctt ttatgtttgc gatgaagtta attgcgcctc 1381 cgtctgaaaa atctacattt tcaaccttga tatagtcgcc gttgtcaaca tccgtaacat 1441 acattccgtt ttcagccatg tctgtcttta agccctcact ccaacatata gtttcagctt 1501 caactcggct gtaagggtca agagttgcaa tcgcttctac gcccttggtg gtttggatta 1561 tcaaaggaat agtgccatcc tcgttatatt caaattcagc gacgcacacc gctcttaagt 1621 tccatgcgct tccttcaaga tccccgccat gatagaagaa ataattcttc cctttaaatt 1681 caatgatacc ggggtgaatt gtaaaggaat ttttattgtt cattattatg ccctgatatt 1741 cccaaccgcc ggtcggtgaa tcggaagttg aatagcaaat gctttctggt gttccatagc 1801 ccgcatatac aagatagtat atcccgttgc gcttatgtac ccaagggcct tcctcataac 1861 agtcatcgtg gcttccgtca gggtctatca tctgtccgaa agctttatat gtcatgctga 1921 attctttaat ttcaccgtca agtgcaatca tattcttttt aagcttaaca acatgcaagg 1981 tgggatttcc ccaatataaa tatgcttgac cgtcatcgtc gataaaaacc gtgggatcga 2041 tatatatcca attgggtcct gccaacggtt tgccaagagc atcctcaaaa ggtccggtcg 2101 ggctgtccga aacgccgacg cctattgctc tgccgccgcc aaactcttcg gtagtaactg 2161 ttgtatacaa ataaaacttt ccgtttcgtt cgatacactg tgcagcccaa gcgcttccag 2221 gcaatgccca ctcgaagtcg tcacttcgca taactgcgcc gtgatccgtc cattttacca 2281 tatcggttgt ggaataacat ctccaatgag gcatattata gtttccgcca tcaccgattg 2341 cgtcctctcc cacatataca taaacagtat ccccatatac catcggtgca gggtctgcag 2401 taaagcaagt ctgaacgatc gggttttctg cgctaatagg tgtgcaaagg caaagacaca 2461 ttgtcattgc caacaaaacc ataactaatt ttttaaccat aacgtttctc ctagcagatt 2521 tttatataat tactgatgct cttcttccca cttgttttcg cccatggtta cgcgagcgta 2581 atcatatccg cggtcgccct tcatgggtgc aatcttcgtt tcaaaataaa caaggccgtt 2641 tttctttatg tcaaagccaa gcgcaagggt tccttcgctt gcaattctct cggttttgca 2701 aagaggtctt gcgcagccgc gaataagctc gatttcgctt tcagagggca ttttcggctc 2761 gcctaaatcg tgccaagcct ttaaggggtt gcaaacctct tcatccaccg tttgggtcag 2821 gagcatatac tcccctgcct cggtgtcaat atcaaaatca agatgcaaca ggtcggtttt 2881 tgaatctctt gtaacattcc acaaaacgcc tttaagagtg ccgttctttt cgcgggtgat 2941 aactccgttt tcgcctcgcc aaatacattc accctttaac tccttgaaga acttgaaggt 3001 atagaaagtg ggcttgggaa tacatctgtc agcaaccata ccgaagccgc cgtggaaaag 3061 cgaatggggc acgccctgct cctcaaatac gtctccgaag gtccaatagg aatatccatc 3121 ggtataatcg cctatttctg agagggtgcg cgcaagctcg gccgcgtttt cattggtgtc 3181 gtgcatcggg cagttgggaa tatatgaggt gttaaactcg gtgatataga agggcagatc 3241 cttgaactcg tcatattcgt cgatcattgc gcggacgttt ttaagggtgt caagcgcttc 3301 gcgggtaccc ataagggagg catagccgta atgtccctgg ggcttgggaa aatgagtggt 3361 atagtggtga cgggtgataa aatcgagggg cggatttgtt tcacggcaga aattcaaaaa 3421 tcctcgcatc catttttcat ccgctccgcc gcagattgca ggaccaccaa ccttaaagcg 3481 ttcatcgacc gccttgacgg cattcgcact cattgtatat agcttgaaat attcctccat 3541 atccgcttta taccagaagc cgggcaggtt aggctcgttc cagacttcga tcggccagga 3601 gagaacttct tcctcgccat atcgggatat aaggtgatta agggttgctt tgatcagttc 3661 ctgccaagcc tcatagcttt tcgggggcga ggtgtttccg cgccaatgga aaacataatt 3721 ctcggcagat ttgagcttat agggcataaa gccaagctcc aaaaagggtc tgattccgac 3781 gctcaaatag ctgtcaacaa cacggtccaa atatgtaaag ttatattcaa tggtggtgtt 3841 gccctcgcgg tcggtattct cctgatatat cgccatatcg tcacagaaaa ggccgtggcc 3901 gcgaatatgt ttaaagccga tctccttttg aacgagcgcc agctggtcat aatattcctt 3961 gtgaagcgca aggcccattt tgccggtgcc gacacagaac aaaacattgt tcttgaagct 4021 cgcgctgccg ttcttgcaaa tcttaatagc cataaaatat atcctccctg aaagtatcca 4081 agtaaaaata aatgcttata attttagttt atttatgaaa cagcgatctg tcaatgataa 4141 aacgcatttt gttattgatt ttttcttttc tgcaagttat aattttatta atatcaccat 4201 aggggagaag atatgaaacc aaaaaaatat attgctttat ttgttgcact cataatgctc 4261 ggatcattag tcggatgcgg agcgaacacc tcatcgaacg gagtatcccc cgaagaattg 4321 gagcagccgg acattattat tgatgtaacc gactcaaatg gagatgcttc cgaaagcaca 4381 acctctcata ctactgaaac gaaagaggag accaccgaaa tgacaactga aaatactgta 4441 gaagctacat acagaaaata tagcgctatc cccgagtttg taaagctcat cggcagaaca 4501 tatttggatg acgaagacgt tttatggatc cctcagtcgg caggcggaat tgaatttttg 4561 gctaacggtt ccgaccttcg cattaccctt gcgggcgaca acagcgcaac gccattcagc 4621 gacagcgctg taagatatgc aatatatatc aacggcgagc gcgttgctga ccagatgatg 4681 aaatcatccg acctgaccct tggaattaat ctccccgagg gcgaaaacaa ggtcagattt 4741 gtgaaattgt ccgaatcggc aaacggcatt attggcatta aacatatcag cattctttca 4801 acgcaggaca ttaagcccac gcccgaaagc tcccttaaaa ttgaattcat tggcgactcg 4861 atcacctgcg gatacggtgt tgacgacgaa aaccgcgagc accacttttc cactgaaacc 4921 gagaatgcca ccaagacttt tgcttataaa gctgctcaga ttttaggtgc tgattacagc 4981 atggtatgct atagcggaca cggaatcatt tccgcattta cgggagacgg aaagatcaac 5041 gaatcgggcg ttgtgccgaa aatatataca caggtcggca aaacttggga ccattctttc 5101 aaagttaacg tcaatgagct tgaatgggac ttcgacggat ttgacgccga tatcgttgta 5161 attaacctcg gtaccaacga caattcatat gtcaagggcg atgccgacag agcaaaggaa 5221 tttgaagcgg gatatgttga tttcctcaag ctgataagaa aaaacaatcc caatgctcac 5281 attgtttgtg ctttgggtat tatgggcgct gacctttacg gcagtgttga agcttccgca 5341 gagacattta caaaggaaac aggcgatgat aacatcagct gtttgaaatt tggcactatt 5401 atgggcaacg aaggctattc cgcagactgg catcccaccg aagccaccca gacaagatgc 5461 gcagacgagc ttatccaaca tctcatcaca ataagcgatg aggcgaaggc tctttatgag 5521 gcaaataact gatagtataa caaaaaatgt ccgtaccgat tcggtgcgga cattttgttt 5581 tttatccatc cagattgctc agctcaaact gatttttctt gccgttggtt ttaaccgcca 5641 acgccttggt atggcaactt atgttgctga caacgtggcg tcccccgttt tcgccgtcaa 5701 gagtccagga aagcccctca gcgcacttga cactcaagcg gtcagccttg aaatagtcga 5761 tatattcgct gtcaagctcc tgcttggcaa cgctggtcaa aatgctgtta agctccaata 5821 aatcctgcgg acgcttgatt aaaataacct caaacagacc gtcatcaagg gaaatatcct 5881 tacccaaaaa gtttttcatt cccgcaacgt gcaaggtgtt gctgacaagt ccgataagat 5941 aatcacccga accggagcgc acatcgcttt caaattcaat ttggaaggat ttcatctgtc 6001 ccagcgcgac aatcccctca agcacatatg ccaaaaaacc cagggcgttc ttggtctcct 6061 gcggagtgct gtatgacacc tcggtcaggg ttccgaatgc ggcgacatat gtgaaatagc 6121 gctcgttgag cttgccgacg tcatatgcga tgggcttgcc ctctaccgcg accttcgccg 6181 cttccatcgt ctggcgcgga attcccaccg agtgggaaaa gtcgttggtc gagccgcagg 6241 gaatatagcc atatggcttg ttgcagtctg catttatcat tccgttgatg gcttcgttaa 6301 gggtgccgtc ccctcctgca aatacgcaaa ggtcatagct gttgcaaagc cgctcgacag 6361 ttgccataca gtcgcccttc gcctgagtgg ggtgggctgt aacgtcatat ccgcttttgg 6421 tgaaatagtc aattattttt gcgaggtttc ttgcaatcac ctgcataccc gagtggggat 6481 tataaacgaa tagtagcttt ttgttcatct tgtgtcactc ctgaaaattg aacaaacaaa 6541 agggttattt tctgtaatat gaatagtggg caacgacata tcttttctca ccggtatatg 6601 catcatagcc ggaaatttca gcgccgtttc cgctcaaaag ttccgcaacg gttgcaccct 6661 caagcttaca gcgaaagatc tctttcgcct cgcacataac gacaacggca tcctctaaaa 6721 taatgatacc acccgatttg cccaagacct tctcctgtcc gtcgattctc tcaacggcat 6781 actgcaaagg cttgccgtcg aaacgctcaa gctctttata tgtgggtgtt acctgctttt 6841 tctttcttga aaaaagtccc atattgtcac ctcaaacaag tttgatcagt gttttgatct 6901 cacgcgcaag ctttgcaaca ggcagcccga ctacattata ataatctccg tcaatttttt 6961 tgacgaaaag agccgcgccg tcctgaattc catatgctcc cgctttatcg agcggtgagc 7021 cgcttgcgat gtatgaatct atctcatcct cggtcaggtc ataaaatgta actgatgtct 7081 tttcggtgaa tgtcatcgtc ctgcccatat agcaaaggca tacaccgctg ataaccgtgt 7141 gagttctgcc cgaaagacgc ataagcatcg cttttgcgtc ggtttcgtca ctcggctttc 7201 ccattattac tccaccgaga gtgacaacag tgtcacatcc gataaccagg ctgtcgcgac 7261 ggtcgcggga tatatcaagc gccttctgtg ccgccaaaaa tgcgggaata tcctcaatat 7321 caagcccttc gggaacaact tcctctttca gcgaggggat gatttcaaat tcgtgcttga 7381 tgaattccat cagctcccgt ctgcggggag attttgaagc aaggataacg tttatatttt 7441 caagcataac gctcagtcct ttcaattata tcatagtaat tctaccacat aatgcaaaca 7501 aaatcaactt gacgaaagtg attctatgaa ttataatttt tatgatttgt tttatttaat 7561 gttgaaagga aaaaatatgt cggaattttt gcatttgatt ttgcacacct tggagcacac 7621 attccttgat tcaattaaga tgctcccctt tttgttcggc gtatatctgc tcattgagtt 7681 tttggagcac aaagccgaga ataaaattga agacctgtta agacgtttgg gcccattcgg 7741 ccctgtgggc ggtgctgtgc tgggatgtct gcctcaatgc ggattctccg ttgcggcatc 7801 taacctatat tcgggaaggc tcataagttt gggcaccctt atggcggtat tcatcgccac 7861 cagcgacgag gcgataccca tacttttgac caaccccggc agaggtcagg atattttgag 7921 gcttttggtc gcaaagatgg tcattgcggt cgtcgcgggt ctttttatcg acgcggtgct 7981 caaattcttc cgcaagcgcg taaacgaaga ggctccgcca tattcagatc tttgcgaaaa 8041 ctgcggatgc gagaatcatt cgattctcta ctcggcattt aagcacacct tgcagatatt 8101 cattttcctg tttgctgtgt cctttgtgtt tggatttgta attgagctgg tcggtgagga 8161 tacactgaac aaagttttga tgagcgacag ccttattcaa ccattcttag cggcacttat 8221 cgggctgatt cccaactgcg ctccgtcggt tattttaact gagctgtatg taagcggagc 8281 ggtttccttc gggtctgtgg ttgcaggact ttcaacaggc gcagggatgg gacttgtggt 8341 gcttttcaag accaacaaga atctaaaaca aaacctcgcg ataatgggag ctttgtatgc 8401 tattggcgca gtttcggggc tgataattaa tttggtgttt taagttataa aaggcaggca 8461 cataggcctg ccttttaaaa tgcggaaact tgtttccgct attcatgtcg cgtcagcgac 8521 aattcatgat gtttaatcaa ttcatgtgcg aagcacaatt catttatcta attacttgta 8581 ggggcggacc cgtgtgtccg cccgaagccc tctccgtcac gctacgctcc gcgccacctg 8641 cttacactgt tccttcggaa cgcgcttcgc agacggcgct ccgctcgacc gagcgaggcg 8701 tggcagacgc ggcaccgcgc cgaaggtgcg gtggtttgcg gcgtgccgtg ccgagcggtc 8761 ggggcaggcc cgcaggcctg cccctatctt cacggtaaat gcttacttat acggctcgat 8821 ataggatatc gggtcgatcc actggtcggc aagcttcaag gcaaagtgca aatgtggctc 8881 catatctgct tcaagctctg tttcgccgac gtagccgatg atctgccctg catcgacctt 8941 gtcgcccaca ttcacaagag catccgctgt caacccgaaa taatagccgg taatggcatc 9001 gccgtggtcg attgcaatgc agtttcccca aagctggtca ttatatacat ccgtaacagt 9061 accgccggtc atagatttta cagggtcgcc cggatctgct ttaaggtcaa caccgtcgtg 9121 ggttcgccaa acacctgtgg atgacttgac aagctcacca aaggaaaact cgccgatgac 9181 atcgccgttt gcaacgggca tatataccgc ctgctcatag aataccgcct caagctccga 9241 ttggatatcc tgtgtcacct gtgcgtttgc ttccgcctgc tgtttttcaa tgtctttcaa 9301 aatggcgtcg acttccgaat agtctatgtc ctccaagggc tcattaggct cattgttgac 9361 aaggttgtcc gtcaatgaat tcatcgcgtg acgataaccc gcaacggttg ccgcagaaat 9421 tgccacaact ccgatgcaaa gagtaacata tagccatttg ccgacacggc cgttttttga 9481 gaatttaact tttttcatat tccataactc gctttctccg gcagattaag tattttgatg 9541 actgtgccgg ctcaacctaa gtattaacag gttttggcgg aatattcacc ataaaacaaa 9601 atatgataag ttgacaaacg gcacaaacag gtgtatatta ttcgttggca aaaccaaacg 9661 gggtgttcct tgcctaacca tcccgaaaat aaaacaagga gtaattgaat attatgaaga 9721 acttatcgac caaacggctg gcaaagctgg cagttgtcag tgcgatatat gtagcgctga 9781 ccttatccct tagctttatg gcatacggaa acattcagtt tcgaattgcc gaggcgctga 9841 tgcttctgtg tttctataaa aaggactacg gaatcagcct gatactcgga tgcctgatcg 9901 tcaacctgtt cagtcccatg ggtcttgttg atgtcgtgtt cggaacgctt gcaactgttg 9961 ttgcagttgc acttatttac atcagcccga atatctatgt tgcatcgctt atgcctgttg 10021 tttcaaacgc cataatcgtc ggcgctgaaa tttggtgggc attcgatatg ccttttgcaa 10081 tctcggcgat tgaagttgcc gcgggcgaat ttgtctgcgt gagcatattg ggcgtggtgc 10141 tgtttaaagt tttggagaaa aacagccgtt ttatgcgtat gattagagaa tgataagaaa 10201 aagcacctct cggggtgctt tttgttttaa tgaagattgc ccttaggggg aatgaggtgt 10261 ttcgcctgat atctctccct cagtcagcta cgctgacggc tccctcatca gagggagcct 10321 tagaggtgtc gcctgcggcg aaagatttaa tgcgcccgcg cccttaccgc tcggcaccac 10381 cggcgctgcc gcgcttttcg gtgacgcctc gctccgtaca taaaaaaatt ttacccgaag 10441 tgcaatattt cagcgctccg ggttgtatta taatatgaaa gagctcgcaa ggtctgcata 10501 acgatccctg ctcttgatca tgtcttcagg attttccccg tcagaaatgg cggggaaaat 10561 ctttttttac aatttgaaca ggctgacaac accgtagctg agtatcagca caataattcc 10621 cgcaatcacc actccgccaa aaatcgacca gaaagcgtgc ttg // LOCUS sequence004 9924 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence004 VERSION sequence004 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..9924 /mol_type="genomic DNA" /organism="" /note="sequence004" CDS 171..1178 /product="3-deoxy-7-phosphoheptulonate synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003439427.1" /transl_table=11 /codon_start=1 /translation="MIVILKKNPDKVQLDRLISWLEKSGIGVHTSVGHSETVLGLIGDT SKVDIDLITQLDIVDTVKRVQEPYKNANRKFHPENTVINVGNAHIGDGSLTLIAGPCSV ESEEQICLIAESVKKSGAHLLRGGAFKPRTSPYSFQGLREEGLRLLTVAKQQTGLPIVT EIMDISQMDNFEKFDVDVIQVGARNMQNFELLKALGTMRRPILLKRGLSNTYEELLMSA EYIMAGGNNQVMLCERGIRTFETYTRNTLDVAAIPVLKTLSHLPIIIDPSHSAGKSALV APLSCAAVAGGADGLIIEVHNDPSHAMCDGPQCIKPDTFADLVGKLEAIHEAIR" /locus_tag="LOCUS_0320" /gene="aroF" /EC_number="2.5.1.54" /note="WP_003439427.1 3-deoxy-7-phosphoheptulonate synthase (Clostridioides difficile) [pid:62.3%, q_cov:99.7%, s_cov:98.8%, Eval:4.2e-112]" /note="MGA_34" CDS 1178..2038 /product="prephenate dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964211.1" /transl_table=11 /codon_start=1 /translation="MKNAVGIIGLGLIGGSMAKAVREYIGRAPEGYAEKIFGTDLNKSY VKRALDEGIIDGELTDDMFADCKLVMVAIPPRAAAKWIKENAKKLTGSVLVDLCGVKRY ICDIVRPLATAHGFTFVGGHPMAGKEVGGYENSAASLFKGASMILTPDDDTDIAQMDEL SEFYKAIGFGRVTICSSERHDEVIAYTSQLAHIASSAYIKSPTAQNHRGFSAGSYKDLT RVARLDENMWTELFMANREPLINELELLIKNLCDYRDVLAEGDENTLREMLKNGRELKE SAGGK" /locus_tag="LOCUS_0330" /note="WP_010964211.1 prephenate dehydrogenase (Clostridium) [pid:31.9%, q_cov:95.8%, s_cov:94.8%, Eval:2.7e-37]" /note="MGA_35" CDS 2247..2771 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTTIKVNAGKPYDVKIGAGILSSLGKDIRALMGGLRAAVITDSNV APLYLDGVLKNLEAAGYETDSFVFKAGEESKTAETLVEILEFLAMMGYTRTDVVIALGG GVVGDITGFAAAIYLRGIDFVQIPTTLLAAVDSSVGGKTAIDLKAGKNLAGAFKQPRLV IMDTDTIKTLP" /locus_tag="LOCUS_0340" /note="WP_010942668.1 3-dehydroquinate synthase (Geobacter sulfurreducens) [pid:51.4%, q_cov:98.9%, s_cov:47.8%, Eval:3.4e-44, partial hit]" /note="internal stop codon at [2769:2771](+)" /note="MGA_36" CDS 2790..3296 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAEAIKYGVLFDEELFESFAEDVTDEMLESVIAKCVQHKANIVER DEFDRGERKLLNLGHTIGHAIEKASGYTVAHGHAVAAGMAMIARSCEALGIAEKGTAER IERMLEKYHLPTNYDCDPARLAGLALSDKKREGTTISLILPEKIGKCIIKDEPVARLKE YIQKF" /locus_tag="LOCUS_0350" /note="WP_010964212.1 3-dehydroquinate synthase (Clostridium) [pid:40.1%, q_cov:98.8%, s_cov:48.3%, Eval:2.5e-25, partial hit]" /note="internal stop codon at [2769:2771](+)" /note="MGA_37" CDS 3589..4851 /product="3-phosphoshikimate 1-carboxyvinyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964213.1" /transl_table=11 /codon_start=1 /translation="MNKFDIKITPNILSGLVPAIGSKSDIHRLLICAGLCDEETIIKGV TRSDDIDATAECLRQLGVGVDFQGRICVVTPNATAVDSPLLDCRESGSTLRFMLPVAAA LSDNARFVGSGRLPKRPIGDLVDAMEKGGVSFSSPSLPLEISGKLKAGVYLLPGNVSSQ YVSGLLMALSITEGESEVVLTSDLESTSYVNMTISTLSMFGAQVIRTERGYKISGQRRL RSPGRAVADGDWSNAAFFICAGAFKDEVTVTGLDPFSAQGDKKVCEFLKRFGAAVISVN SQVTVSADNLLACDIDLTDTPDLLPILAVVATNAKGTSRFSGAKRLKLKESDRLLTVAD MINSLGGDAKVLPDGIIVTGKPLVGGVVDSHNDHRIVMAAAIASTLCSEPVTITNAHAV NKSYPAFFEDFKRLGGEASVI" /locus_tag="LOCUS_0360" /gene="aroA" /EC_number="2.5.1.19" /note="WP_010964213.1 3-phosphoshikimate 1-carboxyvinyltransferase (Clostridium) [pid:37.9%, q_cov:97.9%, s_cov:97.4%, Eval:4.7e-74]" /note="MGA_38" CDS 4841..5917 /product="chorismate synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861346.1" /transl_table=11 /codon_start=1 /translation="MSSEFGKLFKVSVFGESHGEAIGCVINGLPAGEKIDLERLYAFMK RRAPGSGLSTPRKEEDRPRFLSGIRDGVLTGAPLCAIIENKDTRSGDYAFGDTPRPGHA DYTAAVKYKGQADMRGSGHFSGRLTAPLCIAGGIALQLLEKKGIYIGAHLQSVGHLMDE DFPLHPTKELFEEIAKKPLAVISDDALEAFSEEIQATRRRKDSVGGCIEVAAIGIPAGL GEPMFDGIENRLAQAIFGIPAVKGLEFGMGFASARLNGSQNNDEFCIENGKVMTRTNNA GGVLGGITTGMPLTFRAAMKPTPSIGIKQNTVKLSTFEDATVEIKGRHDPCVAVRAVPV FEAVTAAVIYDIILEEKI" /locus_tag="LOCUS_0370" /gene="aroC" /EC_number="4.2.3.5" /note="WP_011861346.1 chorismate synthase (Clostridioides difficile) [pid:50.0%, q_cov:98.6%, s_cov:99.2%, Eval:6.7e-95]" /note="MGA_39" CDS 5917..7056 /product="prephenate dehydratase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861347.1" /transl_table=11 /codon_start=1 /translation="MDLKDIRQRIDEIDDKLIELFIERMGLSKEVAEYKAATGTPILNM TREREILKKVCDKAGDMDLYAHRLYSTILELSRALQQEHIPQNTGVRKQVEASLNKNYD AFPRGGMIACQGTEGAYGQMAADRMFPQGHLVFFKTFEAVFDAVESGFCDFGVLPIENS SNGSVRETYDLLQTKNCKIVRSERLCIRHELMAKPGTKLSDIKTIISHEQAIGQCSKFL KSLGDKVSVVAVSNTAVAAEQVANCADGSVAAIASHATAHLYGLEPVVKDIMDSDNNYT RFVCIAKDHQLYPGSDHVGLILALQHKPGALYDILAKMAALEVNLIKLESCPVVGHDFE FMFFFEMQANVRDPKILGMLEAIEASCEQFVYLGNYLEA" /locus_tag="LOCUS_0380" /gene="pheA" /EC_number="4.2.1.51" /note="WP_011861347.1 prephenate dehydratase (Clostridioides difficile) [pid:34.7%, q_cov:98.9%, s_cov:98.2%, Eval:2.1e-54]" /note="MGA_40" CDS 7284..8522 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSKLYGLIGRKLGHSYSVPIHFALGNDAYKLFEMEPEEIGKFVSN PDLGGINVTVPYKLEVMQYLDEISPEALEIGAVNTVVRRNGKLYGYNTDEYGFRVMLDA AKISLFGKKVMILGDGGASKTAQYCARRLGAREIVVIDVANNTPEYLAKHIDTEILINC TPVGMKPNYIQSAVELEQFPACEGVVDVIYNPLRTKLIMDAEVRGIKHIGGLLMLTAQA KRAHELFFDTAVSDDFALKCAANLFKENENIVLVGMPGSGKSTVGKILGEMSGRKVYEL DEMIAKAAGKTIPEIFASDGEEGFRKIESQIVFEASKNNGAVIITGGGAVTREENYYPL HQNSRIYEIKRDLNTLATDGRPLSKDLETLKRMYDIRKPMYEHFADVSFENSSTAEECA KKVWEEFCEDFSY" /locus_tag="LOCUS_0390" /note="WP_003439416.1 shikimate dehydrogenase (Clostridioides difficile) [pid:39.8%, q_cov:56.3%, s_cov:93.3%, Eval:2.0e-37, partial hit]" /note="MGA_41" CDS 8503..8937 /product="type II 3-dehydroquinate dehydratase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964217.1" /transl_table=11 /codon_start=1 /translation="MKILVINGPNLNMLGIREPAIYGNRTYNDLIKMIKEHCDAKGIDV EFYQSNHEGDLVDKIQSAFGNTDGIVINPGAYTHTSVALLDAVKSVGIPTVEVHISDPD TREEFRKVSYIRLGCIATIKGKGFEGYLEAVDVLEKRHNR" /locus_tag="LOCUS_0400" /gene="aroQ" /EC_number="4.2.1.10" /note="WP_010964217.1 type II 3-dehydroquinate dehydratase (Clostridium) [pid:56.8%, q_cov:96.5%, s_cov:96.5%, Eval:2.7e-39]" /note="MGA_42" tRNA 9633..9709 /product="tRNA-Pro" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0030" /note="Aragorn_3" ORIGIN 1 ctcaaatccg ccgtccgcag gacctcccct ctgcggaggg gagccgagag ggtttggagc 61 gcctcgtcgt gcacccacct catccgtcag cttcgctgac accttcccct caaggggaag 121 gctatcagca ttcaaataca agggcaatac ccattaaagg agaaatcaat atgatagtaa 181 ttttaaagaa aaaccccgac aaagttcagc ttgaccgact tataagctgg cttgaaaaga 241 gcggtatcgg tgttcacacc tccgttggcc actcggaaac cgttttgggt cttatcggtg 301 acacctcgaa ggtcgatatc gaccttatta cccagcttga cattgttgac accgttaagc 361 gtgttcagga accgtataag aacgcaaacc gcaaatttca ccccgaaaat actgttatca 421 acgtgggcaa tgcccatatc ggcgacggaa gtctgaccct tattgcaggc ccttgctcgg 481 ttgaatcgga agaacagatc tgccttattg cggaaagcgt taaaaagagc ggcgcccacc 541 ttttgcgcgg aggcgcattc aagccgagaa cctcgccata ttccttccag ggacttcgcg 601 aagagggcct tcgacttttg accgttgcaa aacagcagac aggtttgcct attgtcaccg 661 aaattatgga catcagccag atggataatt ttgaaaagtt tgatgtcgac gtaattcagg 721 tcggcgcaag aaatatgcag aactttgagc ttttaaaggc tctgggaacc atgcgcagac 781 ccattttgct caagcgcgga ctttcaaaca cctatgaaga gcttttaatg agcgccgaat 841 acattatggc gggcggcaac aaccaagtaa tgctctgcga gcgcggaatc agaacctttg 901 aaacatatac ccgcaacacc cttgacgttg cggcgattcc cgttttgaag accctttccc 961 atcttcccat aatcatcgac cccagccact cggcaggtaa atccgcgctt gttgcgcctc 1021 tttcctgcgc ggcagttgca ggcggagcag acggactcat catcgaggtt cacaacgacc 1081 cctcacacgc tatgtgtgac ggccctcagt gcattaagcc tgataccttt gctgatctgg 1141 tcggaaaact cgaagcaatt cacgaggcga taagataatg aaaaacgcag taggcatcat 1201 cgggctcggt ctcatcggcg gctcgatggc aaaagctgta agagaataca ttgggcgtgc 1261 ccctgaaggg tatgccgaga agatttttgg cactgacctc aacaaaagct atgttaaacg 1321 cgcacttgac gaaggaataa tcgacggcga gctgacagac gatatgttcg ccgattgtaa 1381 gctggttatg gttgcaattc cgcccagagc cgcggcaaag tggataaaag aaaacgcaaa 1441 aaagctgacc ggctcggtgc tggtcgacct ctgcggcgtt aaaagatata tttgcgatat 1501 tgtaagacct cttgcaaccg cgcacggttt cacctttgtg ggcggacatc ccatggcggg 1561 caaagaggtc ggaggatatg aaaattcagc cgcttcgctt ttcaagggtg cttcaatgat 1621 actcacccct gatgatgaca ccgacattgc acagatggat gagcttagcg agttttataa 1681 agctatcggc ttcggcagag tcaccatttg ctcgtcagag cgacacgacg aggtgattgc 1741 atatacctct cagttggcgc acattgcatc aagtgcatac attaaaagcc cgacggctca 1801 aaaccatcgg ggcttttccg caggaagcta taaagacttg acaagagttg caagactgga 1861 cgaaaatatg tggacggagc tgtttatggc taaccgcgaa ccgctgataa atgagcttga 1921 gcttctgatt aaaaatctct gcgactaccg cgatgttctc gccgagggcg atgaaaacac 1981 ccttcgcgaa atgcttaaaa acggcagaga gcttaaagag agtgcgggag gaaagtgacc 2041 ccctgcggcg cgatgatgtt ccggctgacg gcggattgcc ctctccgtca gctccgctga 2101 cacctctccc gcagggagag tctaaaaggt gtcggcttcg ccgacagatt gcgggtcccc 2161 tccgtcacga cccttcgggt cacgacggcc gccgccccgc ctttaatgaa ttgttgcttc 2221 gcaacattaa aaggagccaa accaaaatga ccaccatcaa agttaatgca ggaaaaccct 2281 atgacgttaa gatcggcgcg ggaattttaa gttccctcgg caaggatatc cgcgcgctta 2341 tgggcggctt gcgcgccgcc gttataaccg actcaaacgt agcacctctg tatcttgacg 2401 gggtgcttaa aaatcttgaa gcggcgggat atgaaacgga cagctttgtt tttaaggcag 2461 gagaggaatc gaaaaccgcc gaaacgctgg ttgaaatact cgaatttttg gcgatgatgg 2521 gctatacccg cacagatgtt gtgatcgccc tcggcggcgg agttgtggga gatattacgg 2581 gctttgccgc tgctatatat cttcgcggaa tcgactttgt tcaaattccc accacccttt 2641 tggctgcggt tgattcatct gtcggcggaa agacagcgat cgaccttaaa gcaggcaaaa 2701 accttgcggg tgcatttaaa cagccccgcc tggtaataat ggataccgac acaattaaga 2761 ctctgcccta atttgaattt gcaaacggca tggcagaagc aattaaatac ggcgtattgt 2821 ttgacgaaga acttttcgaa agcttcgctg aagatgtcac cgacgaaatg cttgaaagcg 2881 taattgcaaa atgtgtccaa cataaagcaa acattgttga gcgggacgaa tttgaccgcg 2941 gtgagcgcaa gcttttgaac ctcggccaca ccatcggcca cgccattgaa aaagcatcgg 3001 gatataccgt tgcacacggc cacgcagttg ccgcaggaat ggcgatgatc gcccgctcct 3061 gcgaagccct cggaattgcc gaaaaaggca ctgccgaaag aattgagcgg atgcttgaaa 3121 aataccatct ccccacaaac tatgactgcg accccgcaag gcttgcagga cttgctcttt 3181 cggacaaaaa acgcgagggc acaaccataa gtctgatttt gcccgagaag ataggcaagt 3241 gcattattaa ggacgagccg gttgcgagat tgaaggaata tatccaaaag ttctgattcg 3301 ggagcaggta cttcctcgca aacagacccc atacaatagg ggcggacaca taggtccgcc 3361 cacagaaacg cacaacttca aaaatgttgt ttcgcttaca agattttgac aagaatcctc 3421 tttaagaatc ttggcggcac agataacaaa aatattgcta aagaatttat tgaattattg 3481 aggggcaggc ttatgtgcct gcccgccaag tcgcattgat ttatcgggcg accacatagg 3541 gtcgccccta tataaaatca ccatcccacc acaaaggaac ccaaaacaat gaacaaattt 3601 gacattaaga tcacccccaa catactttcg ggacttgtac ctgcaatcgg ctccaagtcg 3661 gatatccacc gccttttgat ctgtgcggga ctttgcgacg aggaaacgat aattaaaggt 3721 gtcacccgaa gcgacgatat tgatgcaact gccgaatgtc tgcgccagct tggcgtcggc 3781 gttgattttc aaggcaggat ctgcgttgta acacccaacg ccaccgccgt tgattccccc 3841 ttgctggact gccgcgaaag cggttcgacc cttaggttta tgctgcccgt tgcggcggcg 3901 ctcagcgaca atgcgcgctt tgtcggctcg ggcagacttc ccaagcgacc catcggcgac 3961 cttgtggatg caatggaaaa gggcggtgtg agcttctcaa gcccatcact tccgcttgaa 4021 atttcgggca agctcaaagc aggcgtatat cttttgccgg gaaatgtcag ctcccagtat 4081 gtttcgggac ttttaatggc actttccatc accgagggcg agagcgaggt tgttttaaca 4141 agcgaccttg aatccacctc atatgtaaat atgacaattt caaccctttc gatgttcggc 4201 gcacaggtaa tccgcaccga gagaggttat aaaatatcgg gacagcgcag acttagatcc 4261 cccggcagag cggttgccga cggcgactgg tcaaatgccg catttttcat ctgcgcgggc 4321 gcatttaagg acgaggtcac cgttacgggt cttgacccgt tttcggcaca gggcgacaaa 4381 aaggtctgcg aatttttgaa gcgcttcggt gcggcagtta tcagcgtgaa ttcgcaggtg 4441 acggtatccg ctgacaacct gcttgcctgc gatattgacc tgaccgacac ccccgacctt 4501 ctgccgattc tggctgttgt tgcaactaat gccaagggca ccagccgatt ttcgggcgca 4561 aaacgcttaa agcttaaaga atccgaccga cttttgaccg ttgctgatat gataaattct 4621 ttgggcggcg atgctaaggt gttgccagac ggcataattg taacaggcaa gccccttgtg 4681 ggcggtgtgg tggattctca caacgaccac cgaatcgtaa tggcggcggc aatcgcctcg 4741 accctgtgtt cggagcctgt gaccattaca aatgctcatg cggtcaacaa gtcatatccc 4801 gcattctttg aagatttcaa acgcttagga ggagaagcaa gtgtcatctg aattcggcaa 4861 gctttttaaa gtcagcgttt tcggcgaatc tcacggcgag gcaataggct gtgtaatcaa 4921 cggcttacct gcaggcgaga agatcgacct tgagaggctt tatgcattta tgaagcgccg 4981 tgcccccggc tcgggccttt caactccccg aaaagaggag gacagacccc gatttttgtc 5041 ggggatccgc gacggtgttt tgacaggtgc acctttgtgt gcaataattg aaaacaagga 5101 cacccgctcg ggcgattatg cctttggcga caccccccga cccggtcatg ccgactatac 5161 ggcggcggtg aaatataagg gtcaagccga tatgcgcggc tcgggacatt tttccggcag 5221 acttacagca cctctttgca ttgcgggcgg aatcgctttg cagcttttgg aaaagaaggg 5281 catttatatc ggcgcgcatc ttcaatcggt gggacattta atggacgagg attttccttt 5341 gcaccctacc aaggagcttt ttgaggaaat tgcaaaaaag ccgttggcag ttatcagcga 5401 cgatgcgctt gaggcatttt ccgaggaaat tcaagccacc cgccggcgaa aggattctgt 5461 cggcggatgt attgaagttg cggcgatcgg aattcccgca gggctgggag agccgatgtt 5521 tgacggaatt gaaaaccgat tggctcaggc aattttcgga attcccgcag ttaaaggtct 5581 tgaattcgga atgggctttg catcggcaag acttaacgga agccagaata acgatgaatt 5641 ctgtattgaa aacggcaaag ttatgacccg cacaaacaac gcaggcggag ttttgggcgg 5701 cattacaacg ggaatgcctt taaccttccg cgcggcgatg aagccgacac ccagcatcgg 5761 aattaaacaa aacaccgtta aactttcaac atttgaagat gcaacggttg aaattaaagg 5821 cagacacgac ccctgcgtag cggtaagagc tgtgcctgtt tttgaagccg tcaccgcggc 5881 ggttatatat gacattattt tggaggaaaa aatctaatgg acctgaagga tataagacag 5941 agaattgacg aaattgacga caagctgatc gagcttttca ttgaaagaat gggactttca 6001 aaggaagttg cggaatataa agccgcaaca ggcacaccca ttctcaatat gacccgcgag 6061 cgcgaaattt tgaagaaggt atgcgataag gcaggagata tggaccttta tgcacaccgc 6121 ctttattcga caattttaga gctgagccgt gctcttcagc aggagcatat tccccagaac 6181 acaggtgtca gaaagcaggt cgaggcatcg cttaacaaaa actatgatgc atttccccgc 6241 ggcggaatga tcgcctgtca gggcacagaa ggagcatacg gccagatggc ggcagacaga 6301 atgttccccc agggacattt ggtgttcttc aagacctttg aagcggtgtt cgatgctgtt 6361 gaatcgggat tttgcgactt cggcgttctg ccaattgaaa actcctccaa cggctctgta 6421 agagaaacat atgacctttt gcagaccaaa aactgcaaga tcgtcagaag cgagcgcctt 6481 tgcatccgcc acgagctgat ggcaaagccg ggcaccaagc tttcggatat taaaacaatc 6541 atctcccacg agcaggcaat cggccagtgc tcgaaattct taaaatcatt gggcgataag 6601 gttagtgttg tcgctgtcag caacaccgct gttgcggcag agcaggttgc aaactgcgcc 6661 gacggaagcg ttgcggcgat tgcaagccac gccaccgcgc atctttacgg acttgagcct 6721 gttgtcaagg acattatgga ctcggacaac aactataccc gctttgtttg catcgccaag 6781 gatcatcagc tttatcccgg ttccgaccac gttggattga ttttggcact tcagcacaag 6841 cccggcgctc tgtatgacat cttggcaaag atggcggcgc ttgaggttaa ccttatcaag 6901 ctggaaagct gtcctgttgt tggtcacgat tttgagttta tgttcttctt tgagatgcag 6961 gcaaatgtac gcgatcccaa gattttaggt atgcttgaag cgattgaagc aagctgtgag 7021 cagtttgttt atttgggtaa ttatttagag gcgtgatgtt ccaaggggac ataaatgtcg 7081 aaacgaactt cattgagggg cgaccctatg tggtcgcccc tcctctacag gaattttgca 7141 ccgcccttac cgctcgccac caccggcgct gccgcgctgt tcggtgacgg ctcgctgctc 7201 tgcaatttct ccaaacaacg aatgaattga tgcatacgca tcatggtttg cgccgtcggc 7261 gcatttttta gaggtgaaaa ctcatgtcaa aactttacgg ccttatcggc agaaagctgg 7321 gacacagcta ttcggttccg atacactttg cccttggcaa cgatgcctat aaactctttg 7381 aaatggagcc tgaggagatc ggcaaatttg tttcaaaccc cgatctgggc ggcatcaatg 7441 taacggtgcc ttataaactc gaggtcatgc aatatctcga tgagatctcc cccgaggcac 7501 ttgaaatcgg cgctgtcaac accgttgtca gacgaaacgg caagctatat ggatacaaca 7561 ccgatgaata cggcttccga gtaatgctcg atgcggcaaa aatttcgctt ttcggcaaaa 7621 aggttatgat tttgggcgac ggcggagctt caaagaccgc gcagtattgc gcgcgcagac 7681 tcggtgcccg cgagatcgtt gtcattgatg ttgcaaacaa cactcccgaa tatctcgcga 7741 agcatataga caccgagata ctcattaact gcacacctgt cggaatgaag ccgaattata 7801 ttcaatcggc ggtggaactc gaacaattcc ccgcttgtga gggcgtggtg gatgttatat 7861 acaatcctct tcgcaccaag ctgataatgg atgccgaagt cagaggcatc aagcatatcg 7921 gcggactctt aatgctgaca gcgcaggcaa aacgcgccca cgagctgttc ttcgataccg 7981 ccgtttcgga cgattttgcc ctcaaatgcg cggcaaacct ctttaaggaa aacgaaaaca 8041 tcgttttggt gggtatgccc gggtcgggaa aatccaccgt cggcaaaatt ttgggcgaga 8101 tgtcaggccg caaggtctat gagctggacg agatgatagc caaagccgca ggaaaaacca 8161 ttcccgagat tttcgcttca gacggcgaag agggcttccg caaaattgaa tcgcaaattg 8221 tttttgaagc ctcaaaaaac aacggcgcgg tcataatcac cggcggcgga gctgtaaccc 8281 gcgaggaaaa ctactatcct ttgcaccaga actcgaggat ttatgagata aagagggatc 8341 ttaataccct tgcaacagac ggcaggcccc tttcgaagga tcttgaaacg ctgaaaagga 8401 tgtatgatat aagaaaaccg atgtatgagc actttgcgga tgtgagtttt gaaaacagct 8461 ccacggcgga agaatgtgca aagaaggttt gggaggaatt ctgtgaagat tttagttatt 8521 aacgggccga atttgaatat gcttggcatc agagagcctg caatttacgg caaccgcaca 8581 tataatgacc tcataaagat gataaaagag cactgcgatg caaaaggcat cgacgtcgag 8641 ttttatcagt cgaaccacga gggcgacctt gtcgataaga ttcaatcggc attcggcaac 8701 accgacggta tcgtcatcaa tccgggggca tatacccaca caagcgttgc acttttggat 8761 gcagtcaaat cggtgggaat accaactgtc gaggtgcata taagcgaccc cgacacccga 8821 gaggaattca gaaaagtttc ctatatccgc cttggatgca ttgcaacaat caagggcaaa 8881 ggctttgagg gatatcttga agcggtggat gtgttggaaa agaggcataa ccgatgaata 8941 aagccgatat agtgatgctt gtaatcggag ttgcctttgc aatcgccttg ttttttggca 9001 tcagatatca cgttaagaac cgcaaagagg attgttctgc aataactccc atatcggtag 9061 tattcttttt gctgtttccc gctctgcctt ttgctttgac gagcggttat tttctttcaa 9121 agcttgtcga taccaaattt gacatcacta tgtggatagt tggtgcgttt gcagcattga 9181 cagttctcac gatggtttta atgccgatta tcggcatttt gcgctgtgat accatagtgg 9241 aagccaaatt gatatcctgg gagtatcatg gcggcggaag aaacggtcct gcccgccgca 9301 gattggtttt tgcatatgaa tttgagggca agaagtataa atgcgcgaca aactcgcaat 9361 tgctcagagg ggaatttgcg caattcaagt tgaaagaaaa gtatgatatt tacatatcga 9421 aaaagctacc gacgctttgc cgcccttggc gcagaataat gcaatatgaa atatacggta 9481 tgatttgcgg tgtggcattg gttttggtat gcttgccgat gtttttgggg aaatgagtaa 9541 ggggcgacca cgcagggtcg ccctttaaca ttgcaaatat tttcaaaaaa cagttgcaaa 9601 cgcaaaaatc ttatgatata ctaacatagt tacgaggtgt ggctcagttt ggtagagcgc 9661 cacgttcggg acgtggaagc cgtgggttcg aatcccgtca cctcgaccat aaaaacaaaa 9721 agactcctgc aaaggggtct tttgttttta tgagtggaat tggcgagtaa gaagaacgcg 9781 tcacctctct gcaggcactt caagaagccg cgaagcgggt tcttgacaaa gtttttccga 9841 gcaaagcgag gaaacacttt tggcacctcg accataaaaa tgaatttgag ccccgatttt 9901 gagaagcaaa ctattatttc tatc // LOCUS sequence005 9805 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence005 VERSION sequence005 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..9805 /mol_type="genomic DNA" /organism="" /note="sequence005" CDS 106..924 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGGNIKAVYVQAGDTVNEGDLIAEYETYELDLEIELKELEVYREE LEYQIAIEKGESETVKNKELLDVQLMQNELDKLYAEKDATKLYAGVSGTVSYVKTLSPG DWVNPGETIATIIDITDLYIKISPNSEMGEFLIGRPITIRYEGQYFDGTIVSNKSGKLW DEETKAAQVDENGEFILGEESEAVIVKFNDMIPESSAVGNIADTLLILDKRENVIVISA NLIKSSGGINYVYVFKDNQKVQVNVTIGLESGSLCEITSGLEEGDEVIIR" /locus_tag="LOCUS_0410" /note="WP_005791602.1 efflux RND transporter periplasmic adaptor subunit (Bacteroides fragilis) [pid:23.9%, q_cov:98.2%, s_cov:74.0%, Eval:1.1e-08, partial hit]" /note="MGA_44" CDS 1003..3825 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRNTKWMVICLLIGFIMATAMTSAIPIYMDASLQRMLIKDMQAYQ EENNEYPGVYAVSKTIVSGTSAKNQRATVNNVYAKSADRFNQLLVPFITYKCYTADSYL YVSSIESEELSMLKLGGMSEIDDHITILEGRMYEPGKRDDGVYEVICTEKSLQLTQLTL NQVYEVTNILNPGATIKLEIVGVFDLANPTDTYWSEGMKNYDNTLLVDFDTLVGNENKS TGVTTADGIIFTGVVNLTSVDCRYIINYPEMDMNIIEHVRNCFEYHSELYKEENCTFRV PAREVLDQYAEKAASLKYILLMLDIPVVLMLIFYLFMVSQLNIESEKNEIAMLKSRGAS SWQILRIYAYETLILGGISALVGPFVGLGLCNILGVSNGFLEFVNRPALQARLSLAAFL YAVAAVAVFFVTTLVPIVPASRVSIVAHKQSHAKSVQKPAWQKMYLDFILTFGSVLWLY FHNRQEQKLIEQGIADVASTMNPLMFAASTVFILGAALICVRFYPYVIRLIYKIGQKRW SPAAYFSLNNISRSSTGREKFIMIFLILTVALGIFSANTARAINRNTEERIKYNLGADA VIQEAWKTTRVKIYSEEDGGETSVTQYTEPEFSKYSELAGVETATPVFKRDSVQIKYED KTTTNVQIMGIVPHQFADVCWFRDNLLPVHINYYINALSECQDGVIISSSYQEKNGIKL GDVVSFKWSKNDWFEATVVAVVDFWPTMNPYEKNSSGDYRDFAILNFDYINALTITEPY EVWLSLDDETPIADLYQSVIDMDITATRLDVARQMVTSSKTDATLQGVNGALTLGFITI MAMCFIGFLIYWILSIKGRTLQFGILRAMGMSFKEIIAMIVYEQILVSGVSIFLSIIIG GIASDLFVPLFQVLYNVTDQVPPFVVVSQRSDYIKLYVIVGIMLVVGFLVIARLIKSIN INKALKLGED" /locus_tag="LOCUS_0420" /note="MGA_45" CDS complement(3910..4116) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKMVGLRKIRKQKKLSQLKVAMDLHISREALSYYENGHRSPDLEM LVKMSSYFKVSIDFLITGNEYDQ" /locus_tag="LOCUS_0430" /note="WP_002267623.1 helix-turn-helix domain-containing protein (Streptococcus mutans) [pid:50.0%, q_cov:88.2%, s_cov:20.3%, Eval:5.6e-09, partial hit]" /note="MGA_46" CDS 4216..4335 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKVLFIIGTVILVGLGTWIAISVKKRFTLANTYAEYKY" /locus_tag="LOCUS_0440" /note="MGA_47" CDS 4371..4652 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGKGKAIAGLVLSIIGVVLGVLNGWFSVVGLPVAIVGLVLSVSGG KQLRANDLPHGIATAGLVLGIIAVVFTAIAFFTCGICVVCASALGAAA" /locus_tag="LOCUS_0450" /note="MGA_48" CDS 4715..5470 /product="prolipoprotein diacylglyceryl transferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002680889.1" /transl_table=11 /codon_start=1 /translation="MKPFFSLFDRQIPVYGVMWFVGIFFAGVVALLICNRRKIERYDIV YSAVYSLIGGLIGSKLLFVLVSLKTIIDNALPIEAVIKGGFVFYGGLIGGIVGLYVYVK QFKLSAAPFFDVYAIVLPLGHAFGRIGCHFAGCCFGIEYSGPFAVEYNYSLSGVPINTP LLPIQLIESVVLIVVFGILLFAYFRHISDGMCAVLYTVIYSICRFALEFLRGDQDRGIA ILSTSQWISILFLATTVIYLIIKNKKQCN" /locus_tag="LOCUS_0460" /EC_number="2.4.99.-" /note="WP_002680889.1 prolipoprotein diacylglyceryl transferase (Treponema denticola) [pid:35.4%, q_cov:96.0%, s_cov:94.2%, Eval:1.0e-34]" /note="MGA_49" CDS complement(5485..6114) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNVKSGILKEIAHTGPKSRAELSRILGVCPSRITEVCASLLDQGA LCPCGYREGYARGRKNLLLDIDCSYKFALGVGISKDIICVGLTTLKGEALGKELIEAKG ELNFWTVYDAVKTAANKILRECCLSKEQILGIGVSMTASAVSALNIDISDGLLPEGYRA ADGIPMLFEPLDDYLEYAGQYLNISPDGLYMFGCAKVTRDLFIYGK" /locus_tag="LOCUS_0470" /note="MGA_50" CDS complement(6104..7552) /product="HAMP domain-containing sensor histidine kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459501.1" /transl_table=11 /codon_start=1 /translation="MTTSSSKPKKQPLTLRATIWIYFAVFTVAMLMFLWVFQVLSLDQY YEFSVKRNVTMASNLITQNFSRSNPTAVASLVEDIAYKNKMTIAITDRNGNVITVSDFM GNFSVITSDHGFRLFEYRNRVLMSSTSTIMETIVNERIETTEILYGALIPQTTYMIFIN ATFEPIDSTVDIIKDQFVYISALLLFAALWVSLLMSKNLSKPIVQITNSASKMAKGDYA ANFESGSYAEINELAQTLNYAAQEISKVDTLRNDLIANVSHDLRTPLTMIKAYAEMIRD LSGDKPEKRNEHLGVIIQETDRLSALVSNMLELSKLQSGTMSIEYSKVGLEGFVESVLS RYQHLSEMDGFEFMYESDGDCICYGDRAKLEQVMYNFVNNAINYSGDSRKIIIRTHILP YTVRIEVVDFGKGIEKDKLPLIFDRYYRGDRTKRDVVGSGLGLSIVKEILRLHKTKYGV QSEIDKGSTFWFEVERIKENSNER" /locus_tag="LOCUS_0480" /note="WP_011459501.1 HAMP domain-containing sensor histidine kinase (Desulfitobacterium hafniense) [pid:25.1%, q_cov:97.1%, s_cov:98.1%, Eval:7.4e-42]" /note="MGA_51" CDS complement(7533..8213) /product="response regulator transcription factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_054938388.1" /transl_table=11 /codon_start=1 /translation="MPRILIVDDEAKISEVVREYAEFEGMDVTEAVDGMDAVEKVRSNS ESFDCIVLDIMMPRLDGYSACKEIKKIKNIPVIMLSARGEEYDKLFGFEVGVDDYVVKP FSPKELMARIKVAIKRGSAPENSDVIRYKGLVINFAARDVTIDGKRVQMTPKEYDILFY LARNMNIAMSREKLLEEVWGFDFYGDDRTVDTHIKMLRNSLGPYRDLIVTLRGMGYKFD DIKQ" /locus_tag="LOCUS_0490" /note="WP_054938388.1 response regulator transcription factor (Moorella) [pid:52.3%, q_cov:97.3%, s_cov:96.9%, Eval:5.6e-63]" /note="MGA_52" ORIGIN 1 cagcctgtcc ttatcaacat aaggagtaag tgcattgtag tgtgaagcac cgaggcagaa 61 aataaggctg tcatcaagct cgtaagggct caacggtctt gctctgtggg cggaaatatc 121 aaggctgtat atgttcaggc aggcgatacc gtcaatgagg gtgacctgat tgcggaatat 181 gaaacctatg agttggacct tgagatcgag ctcaaggagc ttgaggtata ccgtgaagag 241 cttgaatacc agattgcaat tgaaaagggc gaaagcgaaa cagttaagaa caaggagctt 301 ttggacgttc agcttatgca gaatgagctt gacaagcttt atgccgaaaa agacgctacc 361 aagctttatg caggagtaag cggcactgtt tcatatgtca aaactctctc ccccggcgac 421 tgggtcaacc ccggtgaaac cattgcaacc atcatcgaca tcacagatct ttacataaag 481 atttccccca acagcgagat gggcgaattt ttgatcggca gaccgatcac cattcgctat 541 gaaggccagt atttcgacgg caccatcgtt tccaacaagt cgggcaagct ttgggatgaa 601 gaaaccaagg ctgctcaggt tgatgaaaac ggcgaattca tcctcggtga ggaatctgag 661 gctgtaatcg ttaagtttaa cgatatgatc cccgaatcct ccgctgtcgg aaacattgct 721 gacacccttt tgatcttgga taagcgcgaa aacgtaattg ttatctccgc aaacctgatc 781 aagtcctcgg gcggcatcaa ttatgtatat gttttcaagg acaatcagaa ggttcaggtc 841 aacgtaacca tcggacttga gagcggctcg ctttgcgaga tcacttccgg tcttgaagag 901 ggcgacgagg taatcatcag ataattaacc ttttttgatt tatctcggct ctcatcataa 961 ttaaactgga ggaaagaaaa tgctcacttt attgttcaga aaatgcgcaa tacaaagtgg 1021 atggtaatct gccttctcat cggatttatt atggcgacag ccatgacgag tgcgatcccg 1081 atatatatgg acgcatcctt gcagagaatg ctcatcaagg atatgcaggc ttatcaggaa 1141 gagaacaacg aatatcccgg tgtatatgcc gtttcaaaaa ccattgtcag cggcacctcg 1201 gcaaagaatc agcgcgcaac agttaacaat gtctatgcta aatctgccga ccgctttaac 1261 cagcttttgg tgcccttcat aacatataaa tgttataccg ccgactcata tctttacgtt 1321 tccagcatcg aatcggaaga actctcaatg ctcaagctgg gcggtatgag cgaaattgat 1381 gaccacatca caattctcga gggcagaatg tatgagcccg gcaagcgtga tgacggtgtc 1441 tatgaagtca tctgtaccga aaagtcgctt cagcttacac agctgaccct taatcaggta 1501 tatgaagtta caaatatttt gaatcccggc gcaacaatca agcttgagat cgtcggtgtg 1561 ttcgatcttg caaatccgac cgacacttat tggtcggagg gtatgaagaa ctatgacaac 1621 accttgcttg tcgactttga caccctcgtc ggtaacgaaa acaagtcaac aggtgttaca 1681 actgccgacg gtatcatctt taccggcgtt gttaacctga cctctgttga ctgccgctat 1741 atcatcaact atcccgaaat ggatatgaat atcattgagc atgttcgaaa ctgtttcgaa 1801 tatcattcgg agctctataa ggaagaaaac tgcaccttca gagttcctgc aagagaagtt 1861 ttggatcagt atgccgaaaa ggctgcttct ttgaagtata ttcttttgat gcttgatatc 1921 cctgttgttt tgatgcttat cttctatctt ttcatggtaa gccagctcaa catcgaatcg 1981 gaaaagaacg aaattgcaat gctcaagtcc cgcggtgcgt cctcttggca aattcttaga 2041 atttatgctt atgagaccct cattttgggt ggaatttccg cacttgtcgg accctttgta 2101 ggcttgggac tttgcaacat tctgggtgta tccaacggtt tcttggaatt tgtaaaccgt 2161 cctgcacttc aggcgagact ttcgcttgct gcattcttat atgcagttgc ggctgttgca 2221 gtattctttg ttaccaccct ggtgcctatt gttcctgcat ccagagtttc aatcgttgca 2281 cacaagcaat cccacgccaa gagcgtgcaa aagcccgctt ggcagaagat gtatcttgat 2341 tttattctga cctttggctc cgttttgtgg ctctatttcc acaaccgcca ggagcagaag 2401 ctcatcgagc agggcattgc cgacgttgca tcaacaatga acccgcttat gtttgctgca 2461 tccaccgtat ttattttggg tgctgcgctc atctgcgtaa gattctatcc ttatgttatc 2521 cgtcttatct ataagatcgg acagaagaga tggagccctg cggcttattt ctctctcaac 2581 aatatcagcc gttcttcaac aggcagagag aagttcatta tgatcttctt gatccttacc 2641 gttgcactcg gcatcttctc tgcaaatacc gcaagagcga tcaaccgcaa taccgaagag 2701 cgaatcaagt ataatcttgg tgctgatgct gttattcagg aagcttggaa gaccacccga 2761 gttaagatct actcggaaga ggacggcgga gaaacctctg tcacacagta taccgagcct 2821 gaattctcga aatatagcga gcttgcaggc gtcgaaaccg ctacccctgt tttcaagcgc 2881 gacagcgttc aaattaaata tgaagacaag accacaacca acgttcagat catgggcatt 2941 gtgcctcatc agtttgctga tgtctgctgg ttcagagata acctcttgcc tgtacatatc 3001 aactactata tcaatgctct gagcgaatgc caggacggcg taatcatctc cagctcttat 3061 caggaaaaga acggaattaa gcttggcgac gttgtttcct tcaagtggtc gaagaacgac 3121 tggttcgaag caacagttgt tgcagttgtc gacttctggc cgactatgaa tccttatgaa 3181 aagaactcct cgggcgacta ccgcgacttt gcaattttga actttgacta tatcaacgcg 3241 cttaccatca ccgagcctta tgaagtttgg ctctcgttgg acgatgaaac ccccatcgcc 3301 gacctttatc agtcggttat cgatatggac atcaccgcta cacgtctgga tgttgcaaga 3361 cagatggtaa catcctcgaa gaccgatgcc acattgcagg gcgttaacgg tgcgctgacc 3421 ttgggcttca tcaccattat ggcgatgtgc ttcatcggct tcctcattta ttggattctc 3481 tcaattaagg gcagaactct ccagttcggt attctgcgag caatgggtat gtccttcaag 3541 gagatcattg cgatgatcgt atatgagcag atactcgttt ccggtgtatc tatcttcctt 3601 tcaatcatca tcggcggcat cgcatccgac ctcttcgttc ctctgttcca ggtgctctat 3661 aatgtcaccg accaggtacc tcctttcgta gtggtatccc agagaagcga ctatattaag 3721 ctttatgtaa tcgtcggaat tatgcttgtt gtcggcttcc ttgtaattgc aagacttatc 3781 aagtcgatca acatcaacaa ggccctcaag cttggcgagg actaaaaaac cagctcccat 3841 caaaatcgga tgggagcttt ttttgcgttt atttggttga acaacaaagg cctctgctgt 3901 catgtggcct tactggtcat attcatttcc ggtaattaaa aagtcaatag aaaccttaaa 3961 atacgacgac atctttacaa gcatttccag atccggagat ctatgaccgt tttcataata 4021 agaaagagct tctctactaa tgtgtaaatc catagcaact ttaagctggc tgagcttttt 4081 ctgcttcctt atttttctta acccgaccat cttcatgata aactcctatt ttttcgaaat 4141 taatacttga cattagtgta acactgtgtt acactaataa atgtaacaat ttgttacatt 4201 ttacgaggag gaattatgaa aaaagtttta tttatcatag ggacagttat acttgtcgga 4261 ctgggcactt ggattgccat aagcgttaaa aaacgcttca ctttagcgaa cacatatgcc 4321 gaatacaaat attaggcatt gatgttattc ttaggagggg aggtaatatt ttgggtaagg 4381 gaaaagctat tgccggcttg gtgctcagca ttatcggcgt tgttcttggt gtacttaacg 4441 gatggttctc tgttgttggt ttgcccgttg caatcgtagg attggttctt tcagtttccg 4501 gcggaaaaca attgagagca aatgatttgc cgcacggtat cgcaactgca ggcttagttc 4561 tcggtataat tgctgttgta ttcactgcta ttgcattctt cacatgcggc atttgtgttg 4621 tttgcgcatc tgctcttggt gcagcagcat aacaatcatt tgagttgcca cagtatagtt 4681 tctatactgt ggtaacttac tattgaggtg aattatgaag ccgttttttt ctttatttga 4741 taggcaaata cctgtatatg gcgtcatgtg gtttgtcggg atttttttcg ccggtgttgt 4801 tgctttgcta atatgtaaca gacgcaaaat tgaacgatat gacattgttt attctgctgt 4861 ttatagtttg attggtggac ttattgggtc aaaacttctt tttgtcttgg tgtctttaaa 4921 gactattatc gacaatgctc tgccgattga agccgttatt aagggtggat ttgtttttta 4981 tggcggactg attggtggca tagtaggttt atatgtttat gttaagcagt ttaaattgag 5041 cgcggcacct ttttttgacg tgtatgcgat tgtgttaccg cttggtcatg cttttggacg 5101 cattggctgt catttcgctg gatgctgttt tgggattgag tatagcggtc cttttgctgt 5161 agagtataat tactctttaa gtggagtacc cataaacact cctttgctgc cgatacaact 5221 tatagaatcg gtcgtgttaa ttgttgtttt cggtattttg ctgtttgcat attttcgaca 5281 tattagtgac ggaatgtgtg cagttttata taccgttatt tattcgatat gcagatttgc 5341 cttggaattt ttaagaggcg atcaagatcg tggaatagca attctgtcaa catctcaatg 5401 gataagcata ctgtttttgg cgacaacagt tatatatctt attataaaaa ataaaaagca 5461 gtgcaattaa aagcactgct tttatcattt accgtatatg aacaaatctc ttgtgacttt 5521 tgcgcagccg aacatataca gcccgtcggg gctgatgtta agatattgtc ctgcatactc 5581 taaatagtca tccagcggtt caaacagcat cggaattccg tctgctgctc tgtagccctc 5641 gggaagaagc ccgtcgctga tgtcgatatt cagcgcactg accgctgaag cggtcatcga 5701 aacgccgatg ccaagaatct gttctttgct taaacagcat tcacgcaaaa tcttgtttgc 5761 ggcggtttta accgcatcgt atacagtcca aaaattcagc tcgccctttg cttcaatcag 5821 ctctttgccc aatgcctcgc ctttaagggt ggtcagacct acgcagatga tatccttcga 5881 tattccaacg cctaaggcga atttatatga gcagtcgata tccagaagca ggtttttgcg 5941 ccctctggca tatccttcac ggtatccgca gggacaaagc gcgccttggt cgagaagcga 6001 tgcacaaacc tcggtgattc tcgaggggca aacgcccaat atgcgggaaa gctccgcacg 6061 ggatttcggt cccgtgtggg caatttcctt taaaattccc gatttaacgt tcattgctgt 6121 tctccttgat gcgctcaacc tcaaaccaga atgttgagcc cttgtctatc tcgctttgaa 6181 cgccatactt tgtcttgtgc aatcgcaaaa tttccttgac gattgaaaga cccaagccgg 6241 agccgacgac gtcgcgcttg gtgcggtcgc ctctgtaata tcggtcgaat atcagcggga 6301 gcttgtcctt ttcaatgccc ttgccgaagt cgacgacctc gattctcacg gtatatggca 6361 aaatgtgagt gcggattatg atcttgcgcg agtcaccgct atagttgatc gcattgttga 6421 caaagttata cataacctgt tcaagcttcg ctctgtcacc atagcagatg cagtcgccgt 6481 ccgactcata cataaattca aagccgtcca tttcgctcag atgctgatat cgcgagagca 6541 cgctttcaac aaaaccttcc agcccgacct ttgaatattc aatactcatt gttccgcttt 6601 gaagctttga aagctcaagc atattgctta caagtgccga caatcggtcg gtttcctgaa 6661 tgatgacccc aaggtgttcg tttcgctttt caggcttatc gcccgaaaga tctctgatca 6721 tctcggcata tgctttgatc atcgttaagg gggtcctcaa atcgtgggat acgttggcaa 6781 tgaggtcgtt tctcaatgta tcgacctttg agatctcctg cgcggcatag ttaagggttt 6841 gagcaagctc gttaatttca gcgtatgaac cgctttcaaa gttggcggca tagtcgccct 6901 ttgccatttt cgatgcgctg tttgtaatct gcacgatagg ctttgaaagg ttcttcgaca 6961 ttaaaagaga aacccaaagc gccgcaaaca gcaagagcgc gctgatatat acaaactggt 7021 ctttaatgat atcaacggtc gagtcaatag gctcgaaggt ggcgttaatg aatatcatat 7081 aggtagtctg gggaatgagc gcgccgtata atatctcggt ggtttcaatg cgctcgttca 7141 caattgtctc cataatggta ctggttgaag acattaagac gcggtttcga tattcaaaca 7201 gtctgaagcc gtggtcactt gtaatgaccg agaagtttcc cataaagtcg gaaacagtga 7261 tgacatttcc gtttcggtcg gtgattgcaa tggtcatctt gtttttatat gcgatatcct 7321 caaccaacga agctacagcc gtggggtttg acctgctgaa gttctgggtg atgaggttgg 7381 atgccattgt tacattccgc ttgacggaaa attcgtaata ttggtctaaa gacaaaacct 7441 gaaagaccca caggaacata agcattgcaa cggtgaatac ggcaaagtat atccagatgg 7501 tcgcccttaa ggtcaatggc tgtttttttg gtttactgct tgatgtcgtc aaatttatac 7561 cccattccgc gaagagtcac aattaaatct ctgtatgggc caaggctgtt tctgagcatt 7621 ttaatgtggg tgtcaacggt tctgtcgtca ccgtagaagt caaatcccca cacttcttca 7681 aggagctttt cgcggctcat tgcaatgttc atatttcttg cgagatagaa caaaatgtca 7741 tattccttag gtgtcatctg cacacgcttg ccgtcgatgg ttacatctct ggctgcgaag 7801 ttgatgacaa gtcctttata gcggatgaca tcggagtttt cgggggcgct tccgcgctta 7861 attgcaacct tgattctcgc cataagctcc ttgggggaga agggcttgac cacatagtcg 7921 tcaacgccaa cctcaaagcc gaagagcttg tcatattctt cgcctctggc ggagagcatt 7981 atgacgggaa tgtttttgat ctttttgatc tccttgcagg cagagtagcc gtcaagacgg 8041 ggcatcataa tgtccaaaac gatacagtcg aagctctcgg agttggagcg caccttttca 8101 acggcatcca taccgtcgac cgcttccgtg acatccatgc cctcaaattc ggcatattcc 8161 cttacgacct cgctgatctt cgcttcgtca tcaacgatta aaattcttgg cattttttca 8221 ttcctcctat attgatagat tcggttaatt atattatagc aataaaatgt gtcaaaatta 8281 tgaaattctt ctaacaataa tataaaagca ggttcttgtt atttgccgat gtgtgtgata 8341 caataacatt acaaatatgt ttgcgaggaa ttgcgtatga aaaagacata tgtcacaacc 8401 atgccgaacc atatcggcgc atttttaaaa gcaagccagt gtttttctgc gcttggaata 8461 aatatcacac gtgtcagcta taacaaagcg gtggattccc acacgctgtt tattgatgcc 8521 gagggcacac ccgaacagct tgctcttgcc gacatcgagc ttgagaagat cggatatttg 8581 cacaaggatc gaaaagaatc gagcatcttg ctgatcgagt gctatttaaa agatgagccg 8641 ggaagtgtga cggatatttt ggcacttata aatgaatttg actttaatat ttcatatatc 8701 agctatcagg gcaacgattc ggacaaccag cttttcaaaa tgggtctgaa tgtcaacgac 8761 aacgaccgaa tcaatgagtt tttatcagaa gccgagaaaa tttgcaagct tagggtcatt 8821 gactataaca gctcggaaaa ggtatatgat aacagcattt tctataacac atatgtcacc 8881 ggactttcaa agatgatgga gctttcggag gagctgaagc aaaagctttt ggtacacgtc 8941 aatcttgcga tgcagaccct tgatgaaacg ggcttatcgc catatcgcac atttgacagc 9001 atctcgaaat ttgccgagct tttggcgctt tcaaagggca aaaattttgt ccctcgaatc 9061 accgagcata agatctccga aaacacaaca attacaacca tcgagccgcc ctgcggaagc 9121 aatgtgacga ttattaaaag taacggcaaa tatcttttca tcgacaccgg ctatgcttgc 9181 tatgaggcgg agatgctccc gataattaaa agcatcgttc ccgagtttga cgagattgaa 9241 aagaacgtcc taattaccca cgccgacctt gaccattgcg gtttgctctc gatgtttgac 9301 aatattattg caagcgccaa gagcaaaaag atcttgacgg atgaatttga tggcagggat 9361 agcttccgcg agcaaaaccc gcttcacaag ccatatatca acatctgcaa gattttaact 9421 tcatatcaac cgccgaatcc cgaaaagatc acggtcgctt gggatgagcg ggaaaacatg 9481 acagagccgc tgacacagat cggtatattc gattttgagg agctgcactt tgaggtatat 9541 gagggcttgg gaggacatct gccgggagaa atcgttctga ttgactattc aaagcacatc 9601 gccttcacag gggatgtata tatcaatatg cagggactta ccccgcagca ggcggagtat 9661 aaccaatatg ccccgatttt gatgacctcg gtagacagcg acccgaagct ctgcgccctt 9721 gaaagaaagg caattatgca acgcctgggc gttggtgagt ggaagatatt cggcgcacac 9781 ggactcaaaa aggattactc cgtta // LOCUS sequence006 9516 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence006 VERSION sequence006 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..9516 /mol_type="genomic DNA" /organism="" /note="sequence006" CDS 1208..3862 /product="cation-translocating P-type ATPase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002377094.1" /transl_table=11 /codon_start=1 /translation="MKSYAKSVDEVLRELNATAEGLTTEQAKERLEKYGPNKLKEGEKP TLLQRFIAQLKDPMLIILLIAAAVSALTGMLAQENEWAEVIIILAVVLLNAILGVFQES KAEAAIEALQTMTAATCKVLRDGKMVILHSDELVPGDVVLLEAGDAVPADGRLIENASL KIEEAALTGESVPVNKALDILGLGEETEDIPLGDRKNMCYMGSTVVYGRGKAVITETGM DTEMGKIAGALAATAEEQTPLQRKLDELGKLLSKMVLGICVFIFAFNLFMEGDFHLEVI LDTFMVAVSLAVAAIPEGLATVVTVVLSIGVTKMSKRNAVIRRLTAVETLGCTQVICSD KTGTLTQNKMTVVDHIGDTKLVATAMALCSDANLNEENQAEGEPTECALVNFAYAEGLH KADLEKLTPRVDEAPFDSSRKMMSTVHDLGGSFIQYTKGGPDVVLAKCNYYYEDGQALP MTEEKRAEIMAANKAMADKALRVLAAAKRDWASRPTDNTAEYLEQDLVFLGLTGMIDPV RPEVKAAIEECRSAGIRAVMITGDHKDTAVAIAKELGIITDASEAITGAELDDISDDDI CEFVKRYGVYARVQPEHKTRIVTAWKKNGAITAMTGDGVNDAPSIKSADIGVGMGITGT DVTKNVADMVLADDNFATIVSAVGEGRRIYDNIRKAIQFLLASNMSEVLGVFFASLLGF ILLNPVHLLFINLVTDCFPALALGMEAAEPDTMNRPPRNSKEGIFAGGLFFDIAYQGIL VTLITIAAYLIGAYFEFGAGFFATLREVGESGHGMTMAFLTMSMCEIFHSFNLRSQRKS IFSLKSHNKVLWAAMLGSLVLTTLVLEVPFIANAFGFTTIGWDEYAIALVLAIVVIPIV EIVKLVQRLIKKH" /locus_tag="LOCUS_0500" /note="WP_002377094.1 cation-translocating P-type ATPase (Enterococcus) [pid:46.8%, q_cov:99.1%, s_cov:97.9%, Eval:2.2e-218]" /note="MGA_55" CDS 4127..4276 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTKKLILVALLIAMVFQITACSAVGKAEDNMTNRSLYSLGNVSRL NGKL" /locus_tag="LOCUS_0510" /note="MGA_56" CDS 4263..4469 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGSFEIYVNGVKKTTIFTSQNGGWGEAYTERCVWLFSPEEMEIEI RPTEESKGKEVTIVAIGLVDNTK" /locus_tag="LOCUS_0520" /note="MGA_57" CDS complement(4828..5616) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGSADYEIDYIFDITGKYPAIRGLDYMSDDFKGVNKRAIEWWNEG GIVTIMWHTGADFNGEWSHCMNTEVADWDKTLTEGTAEYEAFVAGMYKAAQALLELQEE GVPVIWRPFHEFDGRWFWWGKGGAENFKKLWQLMYTRYTDHWGLNNLIWVLPYSGNGEA YDMWYPGDEYCDVIGADSYAGGVQHGLYEKLTEISDAGKPYCFHECGTAPTAEELETTP WTWFMIWHTSHLTDGNSLKDLNALYNHKYVITRDELPDFK" /locus_tag="LOCUS_0530" /note="WP_026468327.1 glycosyl hydrolase (Amycolatopsis balhimycina) [pid:42.2%, q_cov:100.0%, s_cov:58.6%, Eval:1.0e-56, partial hit]" /note="internal stop codon at [5650:5652](-)" /note="MGA_58" CDS complement(5650..5823) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRVLSVLIVIVTVISIFAGCGKTPANSDYVSVCELSNPNATDEA KKVYDSICSLSG" /locus_tag="LOCUS_0540" /note="MGA_59" CDS complement(5845..8034) /product="alpha-galactosidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012584017.1" /transl_table=11 /codon_start=1 /translation="MGIVYNEKNRVFKLDTKNTSYIMGVADSFGYLLHYYYGKKLSTCD VEYLGRIYEPPFTPDKNARDKLSFLDCAPMEYPTGGIGDFRNHCLEILTEQGHNAVELA YKSHTITSGKPALEGLPATFASDNECTTLTVLLSDDILGLDVELIYSAFEELDVITRSV KIINRAQAPIYLTKVLSACLDMDNNDFSLMSLHGSWARERHIQYRKIGYGRQSVLSERG ETSHQDHCFIALTTPGITQTTGEVYSMHFVYSGNFVAETEVNQFDTARTVMGISPYNFK WKLAGGEAFQAPEVVMTYSANGLGDMTRTHHELYRKHLIRSPYRNQKRPILINNWEATY FNFNTEKIIAIAREASQLGIEMLVLDDGWFGNRFDDNRALGDWIVNEEKLPGGLKYLAE EINKLGMKFGIWLEPEMISPDSDLYRAHPDWAIAVPGRVAGLCRNQYVLDLTRKEVLEY TWGQIKAVLNSANIDYVKWDMNRQLADLGSLGLDADRQGELYHRYVLAVYELQERLVRE FPHILLENCSGGGARFDPAMLYFSPQIWCSDDTDALERLSIQEGTALIYPLSSMGAHVS DCPNHTTGRVTPFRTRGHVALAGTFGYELDVTRIPENDRNTIPEQVAMYHKYNDLVREG DYYRLASYSENRYYDAWMVVSKDGGEALLTFVQVLGRANHKSRRIRLQGLDATATYIIE STDKRYKGDALMYAGLPIDNMWGDFQSKLIHLIRE" /locus_tag="LOCUS_0550" /EC_number="3.2.1.22" /note="WP_012584017.1 alpha-galactosidase (Dictyoglomus turgidum) [pid:48.1%, q_cov:98.9%, s_cov:98.8%, Eval:3.1e-207]" /note="MGA_60" CDS complement(8242..9066) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKINQSIYPYNIEARKLPIHLTGIGGTEWQSHVVRVHGYQWHQIL FCDKGSGVLKYDNTYMPVEANTFFFLPAGYPHEYYSENANWDVKWVTFDGYAVNHIISL LDMTSPVVIKPNDPNALKKMFSKMLSAQTSDKLYGDLICSGLIYEYVIEFHRNMNNKAN KVISKRNNLLMPVLNYMDENFRSNFSMADLAESVGISPQHLCRVFKSAMNMRPNEYLTL LRIRESKHLLETSDLPISEIATQSGFPDAGYFSTVFKKHEGMTPMEYKNSLR" /locus_tag="LOCUS_0560" /note="WP_038966772.1 AraC family transcriptional regulator (Bradyrhizobium diazoefficiens) [pid:38.8%, q_cov:35.8%, s_cov:29.9%, Eval:1.6e-12, partial hit]" /note="MGA_61" ORIGIN 1 gtcggcatat gttgcaacaa ttctgacctc gccgtcaggc attgtgaatt gggtcttttc 61 gctgtttgca tctgaaatgg ttatctctcc ggaaattacc acccaaccgt taaacacctt 121 tccctttgga gccttgtctg cggttattga aaccacatct cccttaacag cttcctgctt 181 gtttgccttt ccgttggtta cgttaacggt gtagccctcc agcttataaa tagagaatgt 241 ggcggggttg ctttcatatc cgttgatcag acctcgcgag ttatagttga gaacaatgct 301 tcccgaactg aatgtgaatg tatcctcggc tctgccaatg gtgaaaacat cgccgtcatt 361 ttcaaacgtt gcggtaattg cgcagtcgtt agttcgggtg aatttaacat atcccttatc 421 gcatttaatt ttccatccgc cgtcggcctt ttcaaaggag aattcctttc ccgcaaagtc 481 gccgtaggtg tgatgagcat agtcgccgca gaacaaaaat ccgtcaaatt cagtctgccc 541 ttgggcaacc attgcactaa cgatggattc aattatcgcc tggcctgcct cgttgccgtc 601 aatgtgttga aaatccgaag ccgccaaaac ggttgtaacc gtgcctgcag atgtgctgct 661 tgaattcgcg ccggaaagat cagaccccga tgatggagag tatacaaccc acacaataat 721 tccgattatc gccagcagac atgccgctac ggtctatact tttgcaacat aaagcttttt 781 gtttttcata ttaaacatct ccgcttttga atttgttttc aatttaagta tacaataatt 841 gcagtcaaat tgaaagagca attactaata tctttttata aaaacagttg cattttctac 901 acttttgaag atttcgcaat cttttttcct ttgatagtat accttagtgc gaaagctatc 961 ttacgttttt aaaacctgcg tggacaagcc catgcttgtg agcacatatg tgcaatctca 1021 aatagcacca aatattttga atcaatgcgg gaatgttaaa taatatggtt tttcatactt 1081 atttcggatg tgacaggaca tataatacac tttggttaaa aaatcttcct cacaacccct 1141 tgtatcagtc tgttaaatgt tgtataatgg tatgtatgat tttctcaata attaaaggag 1201 aatttttatg aaaagttatg ctaaatccgt tgatgaagtt cttcgcgagc tgaatgctac 1261 cgctgaggga cttaccacag agcaggccaa ggaaagactt gaaaagtatg gccccaacaa 1321 gctgaaggaa ggcgaaaagc ccactctgct ccagagattt atcgctcagc ttaaggaccc 1381 aatgcttatc atcctcttga ttgccgccgc tgtcagtgcg ctgaccggta tgcttgccca 1441 agaaaatgaa tgggcagagg taatcatcat tttggccgtt gttcttttaa acgcaatttt 1501 gggtgtattc caggaaagta aggctgaagc ggcaattgaa gcacttcaga ctatgaccgc 1561 tgcaacctgt aaggttcttc gtgacggcaa aatggtaatc ctgcattcgg acgagctggt 1621 acccggcgac gttgttttgc tcgaagcggg agatgccgta cctgccgacg gacgcctgat 1681 tgagaacgct tctttgaaga ttgaagaagc tgcgctcaca ggtgaatcgg tgcccgtcaa 1741 caaagcgctc gatattctcg gtcttggtga ggaaacagaa gatattcctt tgggcgaccg 1801 caagaatatg tgctatatgg gctccaccgt tgtatacggc cgcggcaagg cagtcattac 1861 cgaaacaggt atggacaccg aaatgggtaa gattgcaggc gcattggccg caaccgcaga 1921 agagcagact cctttgcagc gcaagcttga cgagcttgga aagctcctct ccaagatggt 1981 attgggcatc tgcgtattca tttttgcatt caacctcttc atggaaggcg atttccacct 2041 tgaagtaatc ctcgacacct ttatggttgc ggtttccttg gctgttgccg caattcccga 2101 aggcttggca accgttgtaa ccgtagtttt gtccatcggt gtaacaaaaa tgtccaagcg 2161 caacgccgta atccgcagac ttaccgctgt tgaaaccttg ggctgtaccc aggtcatctg 2221 ctcggataag acaggtaccc tcactcagaa caagatgacc gttgttgacc acatcggtga 2281 caccaagctt gttgcaaccg caatggctct ttgctcggat gctaacctca acgaggaaaa 2341 ccaggcagag ggcgagccca ccgaatgtgc cttggtcaac tttgcatatg ccgaaggcct 2401 ccacaaggct gacctcgaaa agctcactcc ccgtgtggat gaagctccct tcgactcgag 2461 cagaaagatg atgtccaccg ttcacgacct cggcggctcc ttcattcagt acaccaaggg 2521 cggccccgac gttgttctgg caaaatgtaa ctattattat gaagacggtc aggctcttcc 2581 catgaccgaa gaaaagcgcg ccgaaatcat ggcggcaaac aaggcaatgg ccgacaaggc 2641 tttgcgtgtt cttgccgctg caaagcgcga ctgggcatct agacccaccg acaacaccgc 2701 tgaatacctt gagcaggatc ttgttttcct tggtcttaca ggtatgatcg accctgtccg 2761 tcccgaggtt aaggctgcaa tcgaagaatg ccgctccgca ggtatcagag ccgttatgat 2821 caccggtgac cacaaggaca ccgctgttgc tatcgctaag gagttgggca tcatcaccga 2881 tgcttccgaa gctatcacag gtgctgagct tgacgatatt tctgatgatg atatctgcga 2941 attcgtcaag agatatggcg tatatgcccg tgttcagcct gagcataaaa caagaatcgt 3001 caccgcttgg aagaagaacg gtgccatcac cgctatgact ggcgacggcg ttaacgacgc 3061 tccttcaatt aagtccgctg acatcggtgt tggtatgggt atcacaggta ccgacgttac 3121 caagaacgtt gccgatatgg ttttggcaga cgacaacttt gcaaccatcg tttccgcagt 3181 aggcgagggc agaagaattt acgataacat ccgcaaggct atccagttct tgctcgcatc 3241 caatatgtct gaggttttgg gcgtattctt tgcttcactt ctcggattta tacttctcaa 3301 ccctgttcac cttctcttta tcaacctcgt aaccgactgc ttccctgcac tcgctttggg 3361 tatggaagct gctgaacccg acacaatgaa ccgtcctcct cgtaactcca aggaaggtat 3421 attcgcaggc ggactcttct tcgatatcgc atatcagggt attttggtaa ccctcattac 3481 aatcgctgca tacctcatcg gcgcttactt tgaattcggc gcaggcttct ttgcaacctt 3541 gcgcgaagtt ggcgaatcgg gccacggtat gacaatggca ttcttaacaa tgtcaatgtg 3601 tgagatcttc cactccttca accttcgttc acagcgcaag tcgatcttca gcctcaagag 3661 ccataacaag gttctctggg cggcaatgct cggctcactc gtgctcacaa ccctcgttct 3721 ggaagtacct ttcattgcaa acgctttcgg cttcaccacc atcggctggg atgaatatgc 3781 aattgcactc gttcttgcaa tcgtcgttat cccgatcgtt gagatcgtta agctggttca 3841 gcgccttatc aagaagcact aagctcaatt tttaaaacag caggcacagc tccaaaagga 3901 gttgtgcctg ttttttatat ataacacaaa atcgacctac tcgaataacg gttggttttt 3961 ccctgcgatt tatctgcttg ctttaggact tgaatttgcg ctgatcaatt gtttttctat 4021 aaatctttga cacaccgcgc ataacgcatt ataatataag ttgttcaagg tcatattcaa 4081 ataatgtaag cgttgaacgc taaatgatta aaatgagggt ataaaaatga caaagaaact 4141 catattggtg gcattgctga ttgcaatggt atttcaaata actgcttgtt cggcagttgg 4201 aaaggcggag gataatatga caaacagatc gctatacagc ttgggcaatg tttcaagact 4261 caatgggaag ctttgaaata tatgtgaacg gtgtcaaaaa aacaaccatc ttcaccagtc 4321 agaacggcgg ttggggagag gcatacaccg aaagatgcgt ctggttgttc tcgccagaag 4381 aaatggagat tgaaatcaga ccgaccgagg aaagcaaggg caaggaagtt accattgtcg 4441 caatcggatt ggtagacaat acaaaataat agaccaatat gtaaaaaaac accttatctt 4501 taagagcgtc actctaaggg gcggtgttac ctaacaacag gaaaaggacg aagagttgta 4561 aaaaactcct cgtcctcttt tttgtggcaa tatattttct ttcgcaaatg cgatatattt 4621 tcactcacgt tcaaaagcga tataacctcc cttgcggtcg gttgcgatat ggtataaatc 4681 ccactcacgc cctgcagggc atatcgcatc gaagatatat cgcacgctta gcgtatatag 4741 cagatcccgt gagggattta tatcgctgcg tagtgccctt aaggacacta cgcataacga 4801 taaggtgttt ttgtttgtga taaaatctta tttgaaatcg ggaagctcat cccttgtgat 4861 gacgtatttg tgattataaa gcgcattcaa atctttaagg ctgtttccgt cggtgagatg 4921 cgatgtatgc cagatcataa accaagtcca aggggtggtt tcaagctctt cggctgtggg 4981 tgcggttccg cactcgtgga agcaataggg ctttccggca tcgctgattt cggtgagctt 5041 ttcatataat ccgtgctgaa cgccgccggc atagctgtca gcgccgataa cgtcgcaata 5101 ttcatctccc ggataccaca tatcatatgc ttcgccgttg cccgaatagg gaagtaccca 5161 aatcagattg ttaagtcccc aatggtcggt atatcgtgta tacatcagct gccagagctt 5221 tttaaagttt tctgctccgc cttttcccca ccagaaccat ctgccgtcaa actcgtggaa 5281 aggtcgccaa attacaggaa cgccttcttc ctgaagttcc aaaagggcct gtgccgcttt 5341 gtacatacct gcaacaaagg cttcatattc agcggtgcct tcggtcaagg tcttgtccca 5401 atcggcaacc tcggtgttca tgcaatggct ccattcgcca ttgaaatcgg cgcccgtatg 5461 ccacatgatt gtgacgattc cgccctcatt ccaccactcg atggcgcgct tgttgacgcc 5521 cttgaagtca tcgctcatat agtcaagacc tcttattgcg ggatacttgc ctgtgatgtc 5581 gaaaatatag tcgatctcat aatctgccga acccatccag gtggattcct gctgtgcgct 5641 gaggcagttt tatccgctga gcgagcagat ggagtcataa accttttttg cttcatcggt 5701 tgcgttgggg tttgaaagct cgcatacaga aacgtaatca ctgtttgcgg gtgttttgcc 5761 gcagcctgca aaaatcgaaa tgacggtgac aataacaatt aaaactgata atactctttt 5821 catactttag ccctttctgc actattactc acgaatcaaa tgaataagct tcgactggaa 5881 atcgccccac atattatcaa taggcaaacc tgcatacatc agcgcatcgc ctttatatcg 5941 tttgtcggtg ctctcgatga tatatgtcgc agtggcatca agaccctgca agcgaattct 6001 gcgggatttg tggttggctc ttcccaagac ctgaacaaag gtcaaaagcg cctctccgcc 6061 gtcctttgaa accaccatcc aggcatcata gtaacggttt tccgaatatg atgcgagtct 6121 gtaataatcg ccctctctta cgaggtcgtt atatttatga tacattgcaa cctgctcagg 6181 gatcgtgttg cggtcgtttt cgggaattcg tgtaacgtcc agctcatatc cgaacgtacc 6241 tgccaaagca acgtgtccgc gggttctgaa aggtgtaact ctgccggttg tgtggttggg 6301 gcaatcggaa acgtgtgcac ccatcgacga gaggggataa attaaagctg tgccctcctg 6361 aatggacaaa cgttcaagtg catcggtgtc gtccgagcac cagatctgcg ggctgaagta 6421 tagcatcgca gggtcaaatc ttgcgccgcc gcccgagcag ttttcaagca aaatatgcgg 6481 gaattcacgg acaaggcgtt cctgaagctc atataccgcc aaaacgtagc gatggtaaag 6541 ctcgccctgt cggtcggcat caaggcctag tgagccaagg tcagcaagct gacggttcat 6601 atcccacttg acatagtcaa tatttgcgct gttaagaaca gcttttatct gtccccatgt 6661 atattcaagc acttctttgc gggtcagatc caaaacatac tgatttcggc aaagccctgc 6721 aactcttccc ggaacagcaa ttgcccagtc gggatgggca cgatataggt cggagtcggg 6781 agagatcatt tccggctcca gccagatgcc gaacttcatt ccaagcttgt tgatctcttc 6841 tgctaaatat tttaatccgc cgggtagctt ttcctcgttg acaatccagt cgcccaaggc 6901 gcggttgtcg tcaaatcggt tgccgaacca gccgtcatcc aaaacgagca tttcaatgcc 6961 gagctgtgaa gcttcgcggg cgattgcaat gatcttttcc gtgttgaagt taaagtatgt 7021 tgcctcccag ttgttgatca agatcgggcg cttttggttt ctgtaaggac ttctgataag 7081 atgtttgcga taaagctcgt ggtgagttct tgtcatatct cccaaaccgt ttgcggaata 7141 tgtcataacc acctcggggg cttggaaagc ttcgccacca gcgagcttcc acttgaaatt 7201 ataagggctg atgcccataa cggtgcgagc tgtgtcaaac tgattgactt ctgtctcggc 7261 aacaaaattg cccgagtata caaaatgcat cgaatagacc tcgcccgttg tctgggtaat 7321 tccgggtgtg gtcaatgcaa tgaagcaatg gtcctggtgg ctggtctcgc ctcgctcgga 7381 taatacgctc tgtctgccgt aaccgatctt gcgatactga atgtggcgct cgcgtgccca 7441 tgaaccgtgg agcgacataa ggctgaagtc gttgttgtcc atatcaaggc aagcggagag 7501 aacctttgtc aaataaatcg gtgcctgtgc gcggttgata atttttacgc ttcttgtaat 7561 aacatcaagc tcttcaaacg ccgaatatat cagctcaaca tcaagcccca aaatgtcgtc 7621 actaagcaaa actgtcagag ttgtgcattc gttatcgctt gcaaaggttg caggtaatcc 7681 ctcaagtgcg ggcttaccgc ttgtaattgt atgagattta tatgcaagct caacagcgtt 7741 gtgaccctgc tcggtcaaaa tttcaagaca gtggtttctg aaatctccga taccgcctgt 7801 gggatattcc ataggggcgc aatccaaaaa gctcagcttg tcgcgggcgt ttttgtcggg 7861 agtgaagggc ggctcataaa ttctgcccaa atactcaaca tcacaggtcg aaagcttctt 7921 gccatagtaa taatgcaaaa ggtagccaaa cgaatcggca acacccatta tatagctggt 7981 gtttttggta tcaagtttga acaccctgtt tttttcatta taaacaatac ccatatgaaa 8041 ttcctcccaa aggttttttg atttaataat atcatttgtt ttgactgctg acaagttcaa 8101 tatcatatca ttttcaacta aacttttctc tttttccgca aactttcagg cttatccgca 8161 tcacaagaaa agttaaacac aaaagccgac catttaatag acggttggct ttctgaactt 8221 ttaacgattg gaagccaagc cctacctcaa tgagttttta tactccattg gggtcatacc 8281 ctcgtgcttt ttgaaaactg tgctgaagta tcctgcatcg gggaatccgg attgagttgc 8341 gatctcggaa atcggcaggt cgcttgtttc caaaaggtgt tttgattcgc gtatccgcag 8401 aagcgtcaga tattcattcg ggcgcatatt cattgcactt ttaaacacac ggcaaagatg 8461 ctgcgggctg attccaaccg actcggcaag atcggccatt gaaaaattac tgcggaaatt 8521 ttcgtccata tagttcaaaa ccggcatcaa caagttgttg cgtttgctga tgaccttgtt 8581 tgctttgttg ttcatattcc tgtgaaattc aatgacatat tcgtagataa gtcccgagca 8641 aataaggtcg ccgtaaagct tgtcagaggt ttgggctgaa agcatcttgc tgaacatttt 8701 cttcaatgcg tttgggtcat ttggcttaat gaccacaggg cttgtcatat caagcaggct 8761 gataatatgg ttaacggcat atccgtcaaa tgtcacccac ttgacgtccc aattcgcgtt 8821 ttccgaatag tattcgtggg ggtatcccgc aggcagaaag aaaaacgtat tcgcttcaac 8881 gggcatatat gtattgtcat atttcaaaac gccgcttcct ttgtcacaga acaaaatctg 8941 gtgccactga tatccgtgaa ctctcacaac gtgactctgc cactcggttc cgccgatgcc 9001 tgtaaggtga atcggcagtt tcctcgcttc aatattgtaa ggataaatgc tctgattgat 9061 tttcacaata tcatcctccg catcattttc ttatttaagt atagccgttt cgtgaattcc 9121 tgtcaaactt tttttgcttt tatgaacaca caaaatgttc aaaaataaaa agttggttca 9181 taattttcaa ttgaccgttc tcttaaacaa tgttaccatt attataggaa aagtgtattg 9241 ctttgccaaa tttatgaggg agtgcgttgc gaatatgaaa aggtatgtca cattgatatt 9301 ggcaattatg ctggcacttt tgtgcttaac aggttgcgga ctttcaaagg aggaaaggta 9361 tatgaaaaag tatgacggca aaattgttga gcttgcaccc gaggaaatat tcattaagca 9421 agaaggcgtt gaatatgccg agtttgaaaa attcacctac ttttcgacct acgccaacag 9481 agaatcccga gtaaatgttc ttttgcctcc aaacta // LOCUS sequence007 9279 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence007 VERSION sequence007 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..9279 /mol_type="genomic DNA" /organism="" /note="sequence007" CDS 485..1336 /product="AraC family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011263652.1" /transl_table=11 /codon_start=1 /translation="MHSEDRVYGASRPYFGFSANQNPGYFQLNSIGWHRCNDKYCIKRP NGIALHTILVTTKGKGTLEVGKNEYSLIPGTVAFIPRNTANSYYTPKGGNWEFYWIHPN FGTTEQFLDTVAQKRKYIVKFEAEYNCQQKIESIMKLCANKPLNYELLISQELGGLLHH LALCMCKDLEPTSLSERAITYIQMYFSTDITIDEIAKGLFVSTAHLIRAFKKEIGMTPH QYLMQYRLHFAVQLLELSAYRVEEVAAKSGFYSASHFISCFKNKYGLTPLQYREKALIN KG" /locus_tag="LOCUS_0570" /note="WP_011263652.1 AraC family transcriptional regulator (Aliivibrio fischeri) [pid:26.0%, q_cov:81.3%, s_cov:89.2%, Eval:3.1e-14]" /note="MGA_64" CDS complement(1530..2768) /product="GTPase HflX" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009895824.1" /transl_table=11 /codon_start=1 /translation="MTENIQTKPKVMLVSVDTGEYDVERSIAELQELCYTAGADVEAVV TQKRPVYDKSTCIGSGRLEEMAQLCEDLEIDQVIFDCELTATQIRNIEDVIDTHTIDRT MLILDIFAQRATTREGKLQVELAQNKYRLPRLAGMGIKLSRLGGGIGTRGPGETKLETD KRHIRSRIGYLEAELKEIETRRNLMRKRRHKDGVLCAAIVGYTNVGKSTLLNRLTDAGV LAEDKLFATLETTSRSITLPDGRNVMLIDTVGLISRLPHHLVEAFKSTLEEAAEADVIL HICDASSEDIDQQMTVTKDLLGELGCEGIPVVTVLNKCDLLPDAAYANAEGVVRISAKE GRGIDDLLSAIQNALPETAKRMKLLIPFAQAGVLARIRDEGNIFSEEYTADGIEVDALV DIKLVSACEQYQI" /locus_tag="LOCUS_0580" /gene="hflX" /note="WP_009895824.1 GTPase HflX (Clostridioides difficile) [pid:45.9%, q_cov:92.5%, s_cov:91.3%, Eval:4.7e-87]" /note="MGA_65" CDS complement(2906..3379) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDKLRLVITIVFSLILLVGCSPKEEVLNHQEGQPAQTGSTSQATD SAEEYVMDKTPSKFNVDEVKSITVGLIDADVTVQKQAISSVDDAIAYGQLIFDEYNKAE GWSNDNWVMMGIERDEANDAWLTWFSEPPLHPGECISVAFYGNGEIIAVFAGE" /locus_tag="LOCUS_0590" /note="MGA_66" CDS complement(3515..3880) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTYYDYFWPDNNIESIFIEYDKAILTVFNDELRKRVKIVCSGFAG ITNLCIWDDMTIFSTDLRPANQKDTFVKKIYSAYDKNFNYGGRALNDGLLALSIELSNH FVFSIYCLKVEVEEFYQ" /locus_tag="LOCUS_0600" /note="MGA_67" CDS complement(3949..4893) /product="N-acetyl-gamma-glutamyl-phosphate reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010919254.1" /transl_table=11 /codon_start=1 /translation="MKKVLVDGHSGAVSLNIKSLVCKRDDLEVICLEDKTRFTPQQRLA LLNTADIVILCQSSKTVVETIPLIENRQTKVIDTSNAFRLAPNWTYGLPELDIDQRRKI ASSRFVSLPASMVTGAALLINPLMKSRIMPPYHPLYINSVMGYSSGGSNMISLYESSDR PNTYGGVRQYALDQQLLQQKELMHACGVSYRPSINPMIMDYPNGALVTVPLHLRTLAKR LHAKQVWETMARYYEKEKLVKVHDYSSASDDLGGFLDANAMAGSPGIELFVFGDNDICL LAARYDNLGKGGAYACVQCMNLMLGLDEYKGII" /locus_tag="LOCUS_0610" /gene="argC" /EC_number="1.2.1.38" /note="WP_010919254.1 N-acetyl-gamma-glutamyl-phosphate reductase (Caulobacter vibrioides) [pid:35.7%, q_cov:99.0%, s_cov:98.4%, Eval:4.0e-45]" /note="MGA_68" CDS 5312..5680 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MQLCRIRPIFDSDEHEKAWLLRVTINMCKNYNKKIFSHPSVELSE NIPVNDTYSDGTVMDAVMALPQKYRTVVYLFYYEGYQIKEISEILDMNQNTIASLLMRA RAKLKDMLEGEFDDEKSI" /locus_tag="LOCUS_0620" /note="WP_005809864.1 RNA polymerase sigma factor (Desulfitobacterium) [pid:42.6%, q_cov:94.3%, s_cov:68.7%, Eval:1.4e-18, partial hit]" /note="MGA_69" CDS 5664..7370 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNQYKIEVDQISLSESFKQSLKEKMAAEYAAEAANTLKTKKSFN FSKYSKYIATAACLVLIAATVSVVSALNGGFAVEKSADSLFRAEDLAPESNNMGADTES IDSDGLTYGLEEDDDAPVEDTVESEDEAIVVEEPVEDIVVEDALPSVEESESAVTEAEN EEVVEEAVLTEEEEVLKSAFAPENYDGEYFAEDYILSTSAANNENISTVENIVDVLGNK EITYSELCSEIDDMDEVGFAKFRIVEVLSEEDANAVAENDSFADENTMYRAELIYDYLN NTSVDGELYVTAYGNSSIQQEGFPAFAEGDVILAGIDNSDGYSSLLEEMVYMVYRVNGV DIAYHLVYENMDPGDTNMGILDMETEMVTTTENNPAKFTHKAAVKELTRYVRRNFEKRE FTFADLVNVIVNESENEETTLPEETVVSGEVSVNVSAIKLMIGSKSINPAGSGSQIRDF ANYVTATETGEDSCTVKFGQNAVTFEGTSPYVGNIRSIEINSIGSGNMMFTINSSIGIG SSWQHVVSSLGLEIEPAENAVVDVAVMSGDWVSYTMTVTVENGVVTQILFS" /locus_tag="LOCUS_0630" /note="MGA_70" CDS complement(7363..7533) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPTDEVEQLFNFKVCHKLGATPPLRTCNHCLQQKPPLLFQARAVL FIYLYYAKEFS" /locus_tag="LOCUS_0640" /note="MGA_71" CDS 7584..7778 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPQKSENGGDPQCGAMREIRRRLCKQVARRDCKLALTSNKKAPQI RLESEVLGFYYKLSIIGAM" /locus_tag="LOCUS_0650" /note="MGA_72" CDS complement(7748..8368) /product="SGNH/GDSL hydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002288769.1" /transl_table=11 /codon_start=1 /translation="MIRLLFQGDSITDWGRDHNNMYDVGWGYARHAYNELLKRYPDKEF EFINLGIGGNQTIDLVNRLESDFVDIQPDVVSILIGINDIWHHAGDRSWLPDEVFEERY RTVLQALKERTNAKIMLMEPFLIPVEDKLFFREDLYRKIEVVRKLAREYADVYLPTDGL LASAYTNEEPILFAEDGVHPTEKGAKLIGKLYADYIAPIIESL" /locus_tag="LOCUS_0660" /note="WP_002288769.1 SGNH/GDSL hydrolase family protein (Enterococcus) [pid:43.3%, q_cov:97.1%, s_cov:92.0%, Eval:4.4e-37]" /note="MGA_73" misc_feature complement(8391..>9279) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012582688.1:glycosyl hydrolase" /note="WP_012582688.1 glycosyl hydrolase (Dictyoglomus turgidum) [pid:39.3%, q_cov:98.0%, s_cov:62.7%, Eval:5.6e-62, partial hit]" /note="MGA_74" /locus_tag="LOCUS_0670" ORIGIN 1 acgagctgcg accaaaacct cgggaacata aatatcatta ttcttgaact tttcgccaat 61 gatgttcata ccggcaacaa gacccttttc aaggatctcc tgtgcgggaa cgccttcgtc 121 cacagccttc tgcacaagtt ccttaactgc ctttgaatcg ccgatctgaa gttttgctga 181 aatctcgtta aaaatcataa tacaatgtcc tcctgaaaac aaattaatag cacaaaattg 241 atatattgaa aacagcaaac tgagctgtaa ttcaaacttt tagttgaaat tgattgcaaa 301 atattgtata attttgatat ggttctcatt gagcctataa gtacatacta ttgcaaaaag 361 cacatcactt caagaaaatg cttaaaatcg gttcattttt gacaacttaa tatcattttt 421 ttgatatcag cagcattcaa accaatggtt ttttcagcgg tttattatta aaggagataa 481 taagatgcat agcgaagaca gagtatacgg agcgtcaaga ccttacttcg gtttttcagc 541 aaatcagaat ccgggttatt ttcaacttaa ctctatagga tggcacagat gcaacgataa 601 gtattgcatt aagcgcccaa acggcattgc tttacacaca attttggtca caacaaaagg 661 caaaggcact ttggaagtcg gcaaaaacga atatagcctc attcccggaa ctgttgcatt 721 tattcccaga aacaccgcaa acagttacta tactcccaag ggcggaaatt gggaattcta 781 ttggatccat ccgaactttg gcacaacaga gcaatttctt gatactgtcg cacaaaagag 841 aaagtatatt gtgaaatttg aagcggagta taattgtcag cagaagattg aaagcattat 901 gaagctttgc gcgaacaagc ctttaaacta tgagctttta atatcgcagg agcttggcgg 961 tctgttgcat catctggcgc tgtgtatgtg caaggatttg gagcctacaa gtctttcgga 1021 gcgtgcaatt acatatattc aaatgtactt ttcgacagat atcaccattg atgaaattgc 1081 aaaagggttg tttgtttcaa cagcacattt gattcgtgca tttaagaagg agatcggaat 1141 gacaccacat cagtatctga tgcaatatcg gcttcacttt gctgttcagc ttttggagct 1201 gagtgcatat agggttgaag aggtcgcggc gaaatccggg ttctattcgg cgagccattt 1261 tatcagctgt tttaagaata aatatggctt aacgcctttg caatatcgcg agaaagcctt 1321 gataaacaag ggataaaaga agccccacct gctgttgagg tggggctttg tgatttggaa 1381 gatatgatac ggagcgaggc gtgactgaca cggcgccgcg ccgtaggtgc ggcggcttgt 1441 ggcgtgtcgt gccgagcggt gatttggagg ctgctgttca cctcatccgt cagcttcgct 1501 gacaccttcc cctcaagggg aaggctccgc taaatttgat actgttcgca agcggatacc 1561 aacttaatat ctaccaacgc atcaacttcg atgccgtcgg cggtgtattc ttcggaaaag 1621 atgtttcctt cgtctcggat acgcgcaagc acgcctgcct gagcaaatgg aatgagcagc 1681 ttcatacgct tggcggtttc aggaagcgca ttttgaattg ctgaaagcag atcatcaatt 1741 cccctgccct ccttggcgga gattcgcaca acgccctcag catttgcata tgcggcgtcg 1801 ggcaaaaggt cgcatttgtt caaaacggtt acgacgggaa ttccctcaca gccaagttcg 1861 ccaagcagat ccttggtgac ggtcatttgc tgatcgatgt cctcgcttga ggcgtcacag 1921 atatgcaaaa ttacatccgc ctcggcggct tcttcaaggg tagatttgaa agcttcgaca 1981 agatggtgag gaagtcggga aattaagccg actgtatcaa taagcataac gtttctgccg 2041 tcgggcaagg ttatcgaacg agaggttgtt tcaagggttg caaaaagctt atcctcggca 2101 aggacgcctg catctgtcag gcggttgaga agagttgatt ttcccacgtt ggtatagccg 2161 actattgctg cgcaaagcac gccgtcctta tggcggcgct tacgcattaa gtttcggcgg 2221 gtttcaattt ctttaagctc cgcttcgaga tagccgatac gtgaacggat atggcgttta 2281 tcggtctcaa gcttggtttc acccggacct cgggtaccga ttccgccgcc aagacgggaa 2341 agcttaatcc ccatacctgc gagtcggggc aggcggtatt tattctgcgc aagttcaacc 2401 tggagtttgc cctcgcgggt ggtggcgcgc tgtgcaaaga tatcaagaat cagcatggtg 2461 cggtcgatgg tgtgagtgtc gatgacatct tcgatatttc ttatctgtgt ggcggtcagc 2521 tcgcagtcga aaataacctg gtcgatctca aggtcctcac aaagctgagc catttcttcg 2581 agtctgcccg agccgatgca ggttgatttg tcatatacag ggcgtttttg ggtgacaacc 2641 gcttcgacgt ctgcacctgc agtatagcaa agctcctgaa gctcggcaat cgagcgttca 2701 acatcatatt cgcccgtatc gacggatacg agcattacct tcggttttgt ttggatattt 2761 tcagtcataa gtcctcctgt aaattcgtgg ctaagggtta aatggtttgt tgcgtcttat 2821 gactgttcat cataagacat attatcttct gatgcgcatt tcttgatacc tcttttcgag 2881 aaatttatat ttacaggcgg tagggtcatt cgcctgcaaa gacagcgatt atttcgccgt 2941 tgccgtaaaa agcaaccgag atgcattccc ccgggtgcaa cggcggttcg gaaaaccaag 3001 tcagccaagc atcatttgct tcgtcacgct cgattcccat cataacccag ttgtcattgc 3061 tccagccttc ggctttatta tattcatcaa agatcagttg cccataggca atcgcatcgt 3121 caaccgacga aatggcttgc ttttgaacag tcacatcggc atctatcaaa ccgacggtga 3181 tgcttttgac ttcatccaca ttaaacttcg acggggtttt gtccataacg tattcctcgg 3241 cggagtcggt agcttgagag gtggatcctg tctgagcggg ttggccttcc tgatgattga 3301 gaacttcttc cttcggagaa cagccgacaa gaagaatcag cgagaaaaca attgtaataa 3361 ctaagcgtaa tttatccatt tgttcctcct ttggtggtaa gtaagcagtg aagcggggcg 3421 tgaggccaaa aatgttgctc gctttttcga aaaatgtgcg tgaaaaactg aaagttggga 3481 tgcaattggt agaataaatg ttaaggtcgc attattattg ataaaattct tcaacttcaa 3541 ctttcaaaca gtatatggaa aatacgaaat gatttgataa ttcaatgctt aaagcaagca 3601 gtccatcatt taatgctcgc ccgccgtaat tgaagttctt gtcatatgcg gaatatatct 3661 ttttaacaaa agtgtctttc tgattagcag gtcttaagtc tgtgctaaaa atcgtcatat 3721 catcccatat gcacaaattt gtaattccgg caaacccgct gcaaacgatt ttgactctct 3781 ttcgcaattc atcattaaat actgtgagaa ttgctttatc gtattcaata aagatacttt 3841 ctatattgtt gtcaggccaa aaataatcat aataagtcat attatataac ctctctgcaa 3901 acacttaata gtcgatataa agggcgaccg taacgatcgc cccgaaagtt aaatgattcc 3961 tttatattcg tcaagtccga gcataaggtt catacactga acacaggcat atgcgccgcc 4021 cttgcccaga ttgtcatatc ttgcggccaa gaggcagatg tcattatctc cgaagacgaa 4081 cagctcaatg ccgggcgagc ctgccatcgc atttgcatcg aggaagcctc ccaaatcgtc 4141 agaagcagat gaataatcat gaaccttgac gagcttttcc ttttcataat agcgtgccat 4201 ggtctcccag acctgcttgg cgtgaagtct ttttgcaaga gttctcaaat gcaacggaac 4261 agtaaccaat gcgccgttgg gataatccat gatcatcgga tttatcgacg ggcggtagga 4321 tactccgcaa gcatgcataa gctccttttg ctgcaaaagc tgttgatcaa gggcatactg 4381 gcgcacgccg ccgtatgtat tggggcggtc ggaactttcg taaagagaaa tcatatttga 4441 gccgccgctg gaatagccca tgaccgagtt gatatataaa ggatgatatg ggggcataat 4501 tcttgatttc atcaaggggt tgatcaaaag cgccgcgcct gtgaccattg atgcaggcag 4561 ggaaacaaag cgtgaagatg caatttttct gcgctgatca atatcaagct ccggcaaacc 4621 atatgtccag tttggggcaa gtcggaatgc gtttgatgta tcaataacct tggtctggcg 4681 gttttcaatc aatgggatag tttcaacaac ggttttcgag gactgacaga gtatgacgat 4741 gtccgccgtg ttcaaaagag caaggcgctg ttggggagta aatctggttt tatcttcgag 4801 gcatattact tctaaatcat cccgcttgca gacgagagat tttatattca ggctgaccgc 4861 gccgctgtgg ccgtcaacaa gaactttttt catctatgtc acttccctta ctttcagaca 4921 aattcaaaca tatttcaaca tattacattt acacataata agtgtcccat attttttgca 4981 atttgtcaac actttttgtc agttttactg ttttggaaca aaactgtaac catttattta 5041 tttacttttg aaaaaaaact gataaaatga aaatatgatg caatttttat gtgttgcaga 5101 ttgtattata tacgaaacat gatcaaaagc tttcgttgaa cggaaaggag ttctttgctt 5161 ttaacaggca ataaacagga ttatgcagac aaatgatatg aacacctaca tatcttctgt 5221 tgtcgataaa tattccgata tggtctaccg cgcggctcgg catgccgttt gcgattcgca 5281 ctatgcggag gatatcacac aggaggtgtt cttgcagctt tgccgtatcc gccctatctt 5341 tgattcggac gaacacgaaa aggcatggct cttgagagtc acaataaata tgtgcaagaa 5401 ctataacaag aaaattttct cgcatccaag cgttgagctg agcgaaaaca ttcccgtcaa 5461 tgatacatac agcgacggaa ctgttatgga tgcggttatg gcattgcctc aaaaataccg 5521 tacagtagtc tatctgttct attatgaagg ctaccagatc aaggagatat cagaaattct 5581 cgatatgaat caaaatacta ttgcttccct gcttatgaga gcaagggcca agcttaaaga 5641 catgctggag ggagagttcg acgatgaaaa atcaatataa gattgaagtc gatcagattt 5701 ctttaagcga aagctttaag cagagcctta aagagaaaat ggctgctgaa tatgccgcag 5761 aagccgcaaa cacattaaaa actaaaaaat catttaattt cagcaagtat tccaaataca 5821 ttgcaactgc cgcttgcctg gttttaattg cggcaactgt cagtgtcgtt tcggcactta 5881 acggcggttt tgcagttgaa aagtcggctg attcgctgtt tagagccgag gacctcgcac 5941 cggagagcaa caatatgggt gctgacacgg aaagtataga tagcgacgga ttgacatatg 6001 gacttgaaga ggatgacgac gctcccgttg aagacaccgt tgaatcggaa gacgaggcta 6061 tcgttgttga agaacctgtc gaggatattg tggttgaaga cgccctcccc tcagttgaag 6121 agagtgagtc tgcggtaact gaagctgaaa atgaagaagt cgttgaagag gcggttttga 6181 ccgaagagga agaagttctt aaatcggcat tcgctccgga aaactacgat ggcgaatact 6241 tcgcagagga ttatattctt tcgacatccg ctgcaaacaa tgaaaacatt tcgacggttg 6301 agaacatcgt tgatgtttta ggcaataaag agataaccta cagcgagttg tgctcggaga 6361 tcgacgatat ggacgaggtt ggatttgcaa aattcagaat cgttgaggtg ctttcggagg 6421 aagatgcaaa cgctgttgct gaaaatgaca gctttgcaga cgagaacaca atgtatcgtg 6481 cagaactgat atatgactat cttaacaaca cttctgttga tggcgagtta tatgttacgg 6541 catacggtaa ttcaagtatt cagcaggaag gattccccgc atttgccgaa ggcgacgtga 6601 ttctggcagg tatcgacaac tcggatggat atagctccct tttggaagaa atggtctata 6661 tggtataccg agtaaacgga gttgacattg cttaccatct ggtatatgaa aacatggacc 6721 cgggagatac aaatatgggt attctcgata tggagactga gatggtaacc acgaccgaga 6781 acaatcccgc aaagttcacc cacaaggctg cagtcaagga attgacaaga tatgtaagac 6841 gcaactttga aaagcgagag ttcacatttg cagaccttgt aaatgtcatt gtgaatgagt 6901 cggaaaacga agaaaccacc ttgcctgagg aaacagttgt tagcggcgaa gtgagcgtta 6961 atgtgagtgc aatcaagctg atgatcggaa gcaagagcat taaccctgca ggaagcggct 7021 cgcagattcg tgattttgca aactatgtta ccgcaaccga gacgggcgaa gacagttgca 7081 cagttaaatt cggacagaac gcagttacat ttgagggcac atcgccctac gtcggcaata 7141 tacgttcgat tgaaattaac agcatcggct cgggcaacat gatgttcaca atcaactcga 7201 gcatcggaat cggttcatcg tggcagcacg ttgtaagctc gcttggactt gaaattgaac 7261 ctgctgagaa cgcagttgtt gatgttgcgg ttatgagcgg cgattgggtt tcatacacca 7321 tgacagtgac tgttgaaaac ggagttgtta cacagatttt gttcagctaa attccttcgc 7381 ataatagaga tatataaaca aaaccgccct tgcttggaag agcaagggtg gtttttgttg 7441 caagcagtgg ttgcatgtgc gcaaaggcgg ggttgcgccc agcttatggc agactttgaa 7501 gttgaaaagt tgctccacct catccgtcgg cattcgccga cacctttcct caaaaggaag 7561 gctttgggcg gggcggaggc catttgccgc agaagtcgga aaatggaggg gacccgcaat 7621 gtggggcgat gcgcgaaatc aggcgccgtc tgtgcaaaca ggtggcgcgg agggattgca 7681 agcttgccct tacatcgaac aaaaaagcac ctcagatccg cttggaatct gaggtgctgg 7741 gtttttatta caaactttca attatcggtg cgatgtaatc ggcataaagc ttgccgatga 7801 gcttagcgcc cttttcggtg ggatgaacgc cgtcttcggc aaataagata ggttcttcgt 7861 ttgtatatgc agatgccaaa agtccgtcgg taggaagata tacatcggca tattcgcgag 7921 ccaatttgcg gacgacctca atcttgcggt aaaggtcctc gcggaagaag agcttatctt 7981 caacaggaat caagaaaggt tccataagca ttatttttgc gttggttctt tccttgagcg 8041 cctgcaaaac ggtgcgatat ctttcctcga acacttcgtc gggaagccag ctgcggtcgc 8101 cagcgtggtg ccaaatgtca ttgataccga tgagaatgga tacaacgtcg ggctgaatgt 8161 caacaaaatc cgattcaagg cggtttacaa ggtcaattgt ttggtttccg ccgatgccga 8221 ggttgatgaa ctcaaactcc ttatcagggt atcttttgag caattcattg taagcgtgtc 8281 tggcatagcc ccaaccgaca tcatacatat tgttgtggtc tctgccccaa tcggttatag 8341 agtcgccttg aaacagtaat ctgatcataa ttcgtatcct cctaaaattt ttattccaac 8401 cgatactttt taaggttcgg cagttcatct aaggttaatg tatattcgga attatatgcc 8461 ttatatagca tttcatcgga tgtgtacatt gcgctggcat attcaccgcc ccaagttccc 8521 cagaagagcc aacgggcatt atctcggaag cagagctcgg gatccattac aatgccgttc 8581 tcggaaagtg cgataagctt tgtttcacca taactctcag tcaaggtagc aaaagttgat 8641 gaatagcttc cgtattcata tctgtcagca taaatgtccc aagaaacgat gtcaacaacg 8701 tcgtcaccgg ggtaccaatc gaggttctga ccattccacg tccagattag gttggtaagg 8761 ttaaactcgt tggtcatttt gtcatacatc gtgcgccaaa gcttgatata tgactcaggc 8821 tcgcaatcgc cccaccagaa ccatccgcct gcggcttcgt gcaaaggtct ccaaagaatc 8881 ggcacaccgt catcgcggag cttttgaagc tcggtcgcaa tgttatcaat atccttcatt 8941 aaaagctcat aaccgcgctc atcctcgccg ttcataataa ggtcgaggtc tatgtcggaa 9001 ttttcagcgt agaaggagtt ccaataattt gcgccatatg caacataagg cttgggcgaa 9061 ttccaatgcc agcaatactg aacgattccg cctgcgttgt gataccagtc gtgggcatgc 9121 tccatactgt tgccaactgc gccgtggtcc ttgttaatga gggtgtagct catcatatcc 9181 agtcccaaaa cagcaaattc cttgccggtt gtatctaaca cataatcata atgctccgaa 9241 gatcttccgc cgtcagcata ctgacccgtc agagaatag // LOCUS sequence008 8749 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence008 VERSION sequence008 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..8749 /mol_type="genomic DNA" /organism="" /note="sequence008" CDS 190..504 /product="ribosomal-processing cysteine protease Prp" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003438074.1" /transl_table=11 /codon_start=1 /translation="MIVAQFLTTNGRLKGFAVKGHAGYAKSGQDIVCASVSSAVMLTVN TASESFNIETDTYVGDDEIRCTFKGSSPEGEKLLISLKNHLEILSEDYPKFVKVNTSEV " /locus_tag="LOCUS_0680" /note="WP_003438074.1 ribosomal-processing cysteine protease Prp (Clostridioides difficile) [pid:34.8%, q_cov:83.7%, s_cov:84.8%, Eval:3.4e-09]" /note="MGA_76" CDS 508..789 /product="50S ribosomal protein L27" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000944958.1" /transl_table=11 /codon_start=1 /translation="MLRISMQFFAHKKGVSSTKNGRDSESKRLGAKRADGQAVLAGNIL YRQRGTHIHPGNNVGIGSDDTLYAKIDGIVRFERLGRDRKKVSVYPAE" /locus_tag="LOCUS_0690" /gene="rpmA" /note="WP_000944958.1 50S ribosomal protein L27 (Bacillus) [pid:80.2%, q_cov:97.8%, s_cov:94.8%, Eval:5.0e-37]" /note="MGA_77" CDS 868..2142 /product="GTPase ObgE" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964572.1" /transl_table=11 /codon_start=1 /translation="MFVDEVYIPVEAGDGGDGCVSFHREKYVAAGGPDGGDGGKGGDIV FLVDDNCSTLIDFRFKRKYVAQRGNDGGSKNSFGKSAPDLVIKVPRGTVVREKESGRII ADMSGNEPVVIAKGGRGGRGNAHFATPTRQIPRFAKPGFKGQKLELKLELKLLADVGLV GFPNVGKSTLISVVSAAKPKIANYHFTTLTPVLGVVKAYDGKSFVMADIPGLIEGASDG VGLGHEFLRHVERCRLIIHVVDVSGCEGRDPIDDFEIINRELRNFSDDLANAPQIVAAN KSDMATDEQIAEFKEYIESQGLMFFTISAATTMGTKELIDAASLELAKLPPLKVFEPDP VPEWTPEELSSDRKFEITHEDGIYFVEAEWLEGVLRMVNIDDYSSLQHFQLVLKSSGII DKLEEIGSQDGDTVSVCDFEFDYVR" /locus_tag="LOCUS_0700" /gene="obgE" /note="WP_010964572.1 GTPase ObgE (Clostridium) [pid:50.4%, q_cov:100.0%, s_cov:100.0%, Eval:2.3e-116]" /note="MGA_78" CDS 2164..2571 /product="ribonuclease III domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860630.1" /transl_table=11 /codon_start=1 /translation="MFKPLEKREVNQYSPLALAFLGDSVYEQLVREKLTLFANMPANKL HNLAVKYVCCEFQSNAVEVILPILSEDEQDIIRRGRNSSGITEPKHSDIATYRRATGLE TLFGYLDLLDRQERIQELFEKIWETVEIDAK" /locus_tag="LOCUS_0710" /note="WP_011860630.1 ribonuclease III domain-containing protein (Clostridioides difficile) [pid:43.1%, q_cov:95.6%, s_cov:99.2%, Eval:8.6e-21]" /note="MGA_79" CDS 2620..3363 /product="YebC/PmpR family DNA-binding transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048090.1" /transl_table=11 /codon_start=1 /translation="MSGHSKWNNIKRKKEAADGAKAKIFTRIGREIAVAVKEGGADPSS NSKLRDLISKAKANNVPNDNIDRVIKKAAGDTDKNSYETMVYEGYGPGGVAVIVECLTD NKNRTAGDVRHYFDKFGGNMGTTGCVSFMFTRKGVITMEYDGQDEDKVMEDCFEAGAED FNIEDEIIEVNAEPNDVYKVSEALTGLGYKVLSAEAAMVPSTYTELTDETHLKFMNLLL ENLDENDDVQQVWHNWDMPEEPEED" /locus_tag="LOCUS_0720" /note="WP_012048090.1 YebC/PmpR family DNA-binding transcriptional regulator (Clostridium botulinum) [pid:56.3%, q_cov:99.6%, s_cov:100.0%, Eval:1.2e-72]" /note="MGA_80" CDS complement(3522..4187) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNKKLSFIIAVGLMAALCYVGNYLQIKIPNGVLITRVHLGNSMC LLAGILFGGPIGGLASGIGAALYDLFDPVYIISAPFTFLSKFAMGYVAGVIAKSAKRFS NETVHMSIAAVLGQLTYIVLYLSKTYITQIILGYEVETALAAVGTNAITSTINAVLAVI ISVPLYFALKKPLSITYFKELVAARNESKHKWYVKLAVVVIFIAIAVGAAVFYAVKKG" /locus_tag="LOCUS_0730" /note="MGA_81" CDS 4563..4934 /product="metalloregulator ArsR/SmtB family transcription factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005807906.1" /transl_table=11 /codon_start=1 /translation="MEHNHNCANCEHAECCGRNVEKVRLYASKMISEEEAYYISELYKA MSDPTRVRILFSRIPGEMCVCDITELVGVSQSAVSHQLRTLKQAGLVRYRRDGKTMYYS IADSHVSTMLAMGLEHIAE" /locus_tag="LOCUS_0740" /note="WP_005807906.1 metalloregulator ArsR/SmtB family transcription factor (Desulfitobacterium hafniense) [pid:48.4%, q_cov:99.2%, s_cov:94.4%, Eval:2.3e-26]" /note="MGA_82" CDS complement(4956..5120) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAMAATAAVIIVRMARATVTMAMEFETVIVGVLIVMMAMALVIVA GAGICFVVV" /locus_tag="LOCUS_0750" /note="MGA_83" CDS 5319..6980 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSIATFGAIAVGELREAVAVMVFYSIGQILEEVAQNRSKKSIRAL MELHPDVVHIKQDGKIVPVTPEEVNVGDIVMAVAGERISLDGKILSGTTSIDYSALTGE SIPVYAAEGDNVFGGGINLSGSIEIEVTKPYSESSAARIIRLVEDARSKKAKSERFIAR FAKKYTVAVCIIAAMIAFIFPIFTGYADTFSRWLYTGLTFLVVSCPCALVISVPLTFFA GLGCASSHGILIKSTASVETISKLKTIAFDKTGTITKGVLSVTHTELDDESLRFAAYAE SRSNHPAAKAIVSYFGGDIPLDAITETEEIPGRGIKATVSGREVLVGNRQMMIDNGIRE DDLKQRHAFGIYSYVLVDGELKGHIILNDELKSDSIDAIDKLHKSGVEAVMLTGDNQEA ANEVCNRVRIISNYANLSPEQKCLRMMSITQFAKSNQGGTAAFVGDGINDAPVLAMADV GIAMGGLGSDAAIETADAVILNDSLMKLPLLIKISKRTMSIVKQNIVFSLGVKILVMIL SVLNIATMWMAVFADIGVMLLAVLNALRALRYRKRD" /locus_tag="LOCUS_0760" /note="WP_011860727.1 heavy metal translocating P-type ATPase (Clostridioides difficile) [pid:47.4%, q_cov:99.1%, s_cov:68.8%, Eval:2.7e-139, partial hit]" /note="MGA_84" CDS 7076..8044 /product="50S ribosomal protein L11 methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861555.1" /transl_table=11 /codon_start=1 /translation="MEWLCLNIYTTHEGIEPLSAALMDIGISGIVINDPYDIDQFVANK TDEWDYIDDDLADTSDKDTYITVYITNDADGAELLSEINTAIMRLKVFDEAKAYGNLNI ENTSIREEDWENNWKRFFKPVYIGEKLVIKPTWEDLPSDNTRVVIELDPESSFGTGRHY TTQLCLELLEKYVHSGDKVADLGCGSGIISIAAMMLGAESAKCTDIAENAIRIAKENAF KNGIADDKYAVYCGDIASDNTLAEKFGVGYDLVAANIVADVLLSMTDVFKNITREGGIL VVSGIIDDRLDEVMTKITDNGFEVIESAHRDIWNAAALRRV" /locus_tag="LOCUS_0770" /gene="prmA" /note="WP_011861555.1 50S ribosomal protein L11 methyltransferase (Clostridioides difficile) [pid:35.6%, q_cov:97.5%, s_cov:96.8%, Eval:7.6e-55]" /note="MGA_85" CDS 8041..8679 /product="RluA family pseudouridine synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009892161.1" /transl_table=11 /codon_start=1 /translation="MIDILYNDDSIVVCIKPAGIISEDGGLPDLLRAQLGCEIYPIHRL DKPVGGIMVYAKTKPASAKLSADFQNRAVTKEYLCIVKGIPQEHSAVLKDLLYKDSRAN KTFVVTRERKGVKPASLEYELLDTKSSPDGELSLLKVKLHTGRSHQIRVQFASRKLPLL GDSRYGGKKQGIDVCLWSHRLKFSHPIIGSAFDYIACVPDDYPWILFKM" /locus_tag="LOCUS_0780" /note="WP_009892161.1 RluA family pseudouridine synthase (Clostridioides difficile) [pid:41.3%, q_cov:99.1%, s_cov:100.0%, Eval:7.0e-41]" /note="MGA_86" ORIGIN 1 taacggcgaa tccaccaccg taggtgctcc ctatgttgct ggtgctaccg ttgaagctaa 61 ggttcttaag aacggtaagg ctaagaagat cactgttatg acctacaagc ccaagaaggg 121 ttcttcccac aagaagcagg gtcacagaca gccctacact caggtaagaa ttgaagctat 181 caaggcataa tgattgtagc gcagttttta acaactaacg gcagacttaa aggctttgcc 241 gtgaaaggcc acgcaggata tgcaaaatcg ggacaggaca tcgtatgtgc gagtgtttct 301 agcgcggtta tgctgactgt gaacacagca tctgaatcat tcaatatcga aaccgataca 361 tacgtcggtg atgatgagat cagatgcaca tttaaaggaa gttctcccga aggcgaaaag 421 cttttgataa gtcttaagaa tcaccttgag attttaagtg aggactatcc caaattcgta 481 aaagttaata cttcggaggt gtgataaatg ttgagaatca gtatgcagtt cttcgcccat 541 aagaagggtg taagttctac aaagaacggc cgtgactccg aatccaagag acttggtgca 601 aagagagccg acggacaggc tgtattggca ggtaatattc tttaccgtca gcgcggcaca 661 catattcatc ccggcaacaa cgtaggaatc ggttccgatg ataccctcta cgcaaagatt 721 gacggtatcg taagattcga aagactcgga cgcgacagaa agaaagttag cgtatatccg 781 gctgaataat ttttaaagga ctaaatcccg gacttttcag cccgggattt tccattgaat 841 cgagattttt ttataggagg cgaaaaaatg ttcgtcgatg aagtatatat acccgtagaa 901 gcaggcgacg gcggcgacgg ctgtgtgtcg ttccaccgtg aaaaatatgt tgccgcaggc 961 ggacccgacg gcggagacgg aggtaagggc ggagatatcg tttttttggt cgatgataac 1021 tgctcgaccc tgatcgattt tcgcttcaag cgcaaatatg tggctcagcg cggaaatgac 1081 ggcggctcga aaaacagctt cggcaaatcc gctcccgacc tcgtaatcaa ggtgcccaga 1141 ggcacagttg tccgcgagaa ggaatcgggc agaataatcg ccgatatgtc gggaaatgag 1201 cctgtagtaa ttgcaaaagg cggcagaggc ggcaggggaa atgcgcattt cgcgacccct 1261 acccgtcaga ttccccgttt tgcaaagccc ggcttcaagg gtcagaagct tgagttaaag 1321 cttgagctga agctcttggc tgatgtgggt cttgtgggct tccccaacgt cggaaaatca 1381 actctaattt cggttgtttc cgcggcaaag cccaaaattg caaactatca ttttacaact 1441 ttgactcctg ttttgggcgt tgtaaaggca tatgacggca agtcattcgt tatggctgat 1501 attcccggac ttatcgaggg tgccagcgac ggtgttggtt taggacacga attcttgcgc 1561 catgttgagc gttgccgact tattatccac gtcgttgacg tttcgggatg cgaaggcaga 1621 gatcctattg acgattttga gatcatcaac cgcgagcttc gcaatttctc ggatgacctt 1681 gcaaatgctc cgcagatcgt cgccgcaaac aagtcggata tggcgactga tgagcagatc 1741 gcagagttta aggaatatat cgagtcacag ggacttatgt tcttcaccat ttctgcggct 1801 accactatgg gcactaagga gcttatagat gcggcatcgc ttgagcttgc aaagcttccg 1861 cctttaaagg tgtttgaacc cgatcccgtt cccgaatgga ctcccgagga gctttcaagc 1921 gacagaaagt ttgaaattac ccacgaagac ggtatttact ttgttgaagc agaatggctt 1981 gagggcgttt tgcgaatggt caatattgat gactattcat cgcttcagca tttccagttg 2041 gttcttaaat ccagcggtat cattgacaag ctcgaagaaa ttggcagtca ggacggagat 2101 actgtatccg tctgtgattt tgaattcgac tacgttagat aatttcttga aagggtgaca 2161 aaattgttca aaccccttga aaaaagagaa gtaaatcaat acagcccctt ggctcttgct 2221 tttttgggcg actcggtata tgaacagctt gtccgcgaaa agctgacttt gtttgcaaat 2281 atgcctgcaa ataagctcca taatcttgca gttaaatatg tttgctgtga gtttcaatcc 2341 aatgctgtag aggtaattct gccgattctt tcggaagatg agcaggacat tattcgccgc 2401 ggccgcaatt ccagcggaat tacagaaccc aagcattcgg atattgcgac ttatcgcaga 2461 gctacaggtc ttgaaaccct ttttggctat ctcgatcttt tggacagaca ggaaagaatt 2521 caggagcttt tcgagaaaat ctgggaaact gttgaaattg atgccaagta gtattataat 2581 atagaggtat ttgaaaatac tgaaaggaag tttatttata tgtcaggaca ctctaagtgg 2641 aacaatatta agcgtaaaaa agaggctgct gacggcgcaa aggccaagat tttcacaaga 2701 atcggccgtg aaattgcagt tgcagttaag gaaggcggcg ctgacccttc gagcaactcg 2761 aagctccgcg accttatttc taaggcaaag gctaacaatg ttcccaacga caacatcgac 2821 cgcgttatta aaaaagcggc aggggacacc gataagaaca gctacgaaac tatggtatac 2881 gaaggctatg gccccggcgg tgtcgctgta atcgttgagt gcctgaccga taataaaaac 2941 cgcaccgcag gcgatgtcag acactacttt gacaagttcg gcggaaatat gggcactacc 3001 ggctgtgtat cctttatgtt tacccgcaag ggcgtcatca ccatggaata tgatggacag 3061 gatgaggaca aggtaatgga agattgcttt gaagcaggtg ctgaggactt caacattgaa 3121 gacgagatca ttgaagtcaa cgctgagcct aacgatgtgt ataaggttag cgaagcgctc 3181 accggcctgg gatataaggt tctttctgca gaagctgcaa tggttccttc cacctatacc 3241 gagcttacag atgaaaccca tcttaagttt atgaaccttc ttcttgaaaa cctcgatgag 3301 aacgacgacg ttcagcaggt ttggcacaat tgggatatgc ccgaagaacc tgaagaggac 3361 tgatattgca aatatcaaag gcgtgtactg ttcgtacccg ccttttttgt ttgctgtgac 3421 cgctccgcgc cacctgcttg caaagttcct tcggaactca ctgcgcagac gccgctccgc 3481 tgcataaaaa agtccgccga tttacctcga cggactttat tttatccctt tttaactgca 3541 tagaacacag ctgcaccgac agcaatcgca atgaatatga caactacagc taacttaaca 3601 taccatttgt gtttcgattc gtttcttgct gcaactagtt ccttgaaata agtaatagat 3661 aacggctttt tcaaagcaaa gtacagcgga accgagatga ttaccgctaa aaccgcattg 3721 atggtcgatg taattgcgtt tgtgcccaca gccgccaaag ctgtttcaac ctcatatccc 3781 aaaattatct gggtgatgta tgtcttggaa agatacaaaa caatgtatgt tagctgtccc 3841 aaaacagcgg caatgctcat atgtacagtt tcgtttgaaa atcgctttgc cgacttcgca 3901 atcacacctg caacatatcc catggcaaac tttgaaagga aggtaaaagg agcagagata 3961 atgtatacag ggtcgaacag gtcatatagc gcagcaccga tgcctgatgc cagaccaccg 4021 atcggtccgc caaagagtat gcccgccagc aagcacattg agttgccaag gtgaactctt 4081 gtaattaaaa cgccattggg aatcttgatc tgtaaatagt ttccaacata gcaaagtgcc 4141 gccataagtc cgactgcaat gatgaatgat agctttttgt ttttcataat ttttgccccc 4201 tcgggaatgt catatccata ttttattccg aaaaattcta aaatgcaaat ttaaatagtt 4261 gtaaaagcat tcagctttac attgtgcaaa tacaacagta aaattatttc tatatgttac 4321 ttctgatgtt taatattaac aaagaattta gccaagtttt tatcctataa atttcaaacc 4381 tcaaaactgc acaaaaatca atcacttttg cctttgagat taaacaaaaa agtagaaact 4441 caaacttaac aatttttcat tcaacctatt gacaaaatct aaagatacta tataatgaac 4501 atatgaacaa ctgctcatat gttatattga gtgtgaataa atttataaat aggggagtaa 4561 ctatggaaca taaccacaac tgtgcaaact gcgaacacgc tgagtgttgc ggcagaaatg 4621 tcgaaaaggt gcgcctatac gccagcaaaa tgatttccga agaggaagca tattacataa 4681 gcgagctata taaagcaatg tctgacccta cccgtgtgcg aattcttttt tcgcggattc 4741 ccggggaaat gtgcgtttgc gatatcaccg agctcgtcgg tgtcagccag tctgcggttt 4801 ctcatcagct gaggaccctc aaacaagcgg gacttgtccg ctatcgccgc gatggcaaaa 4861 caatgtatta ctctatcgcc gacagccacg tttcaacaat gttggcaatg ggtcttgagc 4921 acatcgcaga gtaaataagg agtcatatac atatgtcaca caaccacgaa acaaattcct 4981 gcacctgcca cgataacgag tgccattgcc atcatcacaa tgagcacacc cacgatcaca 5041 gtctcgaatt ccattgccat ggtgactgtt gctcttgcca ttctcacgat gatgacggct 5101 gcggttgcgg ccattgccat agcgataagc caatcaaaaa ccgcttgttg atgctcattc 5161 cggcggctat agttcttgtt tcatctttta tcttctccga agacctcatc tgggtttcaa 5221 ttttattgct cgcggcatac atcattgtcg gacttgacac cgtaatcagt gccgtaaacg 5281 agcttattcg tgagaaaacg gtcggagaat ctttcttaat gtcaatcgca accttcggcg 5341 caatcgccgt tggcgagctc cgcgaggccg ttgctgtaat ggtattttac tctatcggtc 5401 agattctcga ggaagttgct caaaatcgct ccaaaaagag cattcgcgct ttaatggaac 5461 ttcaccccga tgttgtacac atcaagcaag acggtaaaat cgttcccgta acgcccgaag 5521 aagtcaatgt cggcgatatc gttatggctg ttgccggcga gagaatctct cttgacggaa 5581 aaatcctctc gggaactacc tcgatcgact attccgccct cactggtgag tcgattcccg 5641 tatatgctgc cgaaggtgac aatgttttcg gtggaggaat caaccttagc ggttcgattg 5701 agatcgaggt caccaagcct tattctgaat caagcgccgc aagaataatc cgccttgttg 5761 aggatgcaag aagcaaaaaa gccaagtcag agcgtttcat cgctcgcttc gctaagaaat 5821 ataccgttgc tgtctgcata attgccgcga tgattgcctt tatcttcccg atatttacag 5881 gttacgccga tacatttagc cgctggctat acacaggtct tacattcctt gttgtgtcct 5941 gtccctgcgc tttggtaatc tctgttccgc tgaccttctt tgcaggcttg ggttgtgcat 6001 cctctcacgg aatcttaatc aagagcaccg cctcggtcga aacgatttcc aagctcaaaa 6061 caattgcttt tgacaagacc ggtacaataa caaagggcgt tttgtctgtc acccataccg 6121 aattggatga cgaatctttg cgctttgcgg catatgccga aagccgttca aatcaccccg 6181 ccgctaaagc tatcgtatca tatttcggcg gagatatccc gcttgatgct ataaccgaaa 6241 ccgaagaaat ccccggcaga ggaatcaagg caactgtatc gggtagggaa gtgcttgtcg 6301 gcaatcgaca gatgatgatt gataacggta ttcgtgaaga tgatctcaaa cagcgccacg 6361 ccttcggtat atattcctac gttttggttg atggtgagct taaaggtcac atcattctga 6421 acgatgaact caaatccgat tcaattgatg caatcgacaa gctccacaaa tccggagttg 6481 aagcggttat gcttacaggc gataaccaag aagctgccaa tgaggtttgc aaccgcgtga 6541 gaattattag taactatgcc aacctttcgc ctgagcaaaa atgcttgcga atgatgtcaa 6601 tcactcaatt tgcaaaatca aaccaaggcg gtaccgccgc attcgtcggc gacggaatca 6661 acgatgctcc cgttttggca atggccgatg tgggaattgc aatgggaggt ctcggctccg 6721 atgctgcaat tgaaactgcc gatgccgtaa tcttgaatga tagcttaatg aagcttcctt 6781 tactcattaa aatctctaag cgcacaatgt caatcgtcaa gcaaaatatt gttttctccc 6841 tcggcgttaa aatccttgta atgattttga gcgtattgaa catcgccaca atgtggatgg 6901 ctgtatttgc cgatatcggt gtaatgcttt tggctgtatt gaatgcgctt cgtgctttaa 6961 gataccgcaa acgcgattga ctaatccata ttaaatgtgc taaaatcaaa tagaacaaaa 7021 agctgtcatg attttttgtg acagcttttt atatgaaaga aaggtgaatg ttaaaatgga 7081 atggctttgc ctaaatattt atacgactca cgagggaatt gagcccttaa gcgccgcgct 7141 gatggatatc ggcatttcgg gaattgtcat caacgaccca tatgatatcg accagtttgt 7201 tgcaaacaag actgacgagt gggactatat cgatgacgat ctcgctgaca cctccgataa 7261 ggatacctat atcactgtat atattaccaa cgatgccgat ggtgctgagc ttttaagcga 7321 gattaacacc gcaataatgc gacttaaagt gtttgacgaa gcgaaagcat atggtaacct 7381 caacattgaa aacacatcta tccgcgaaga ggattgggaa aacaactgga agcgtttctt 7441 taaacctgta tatatcggtg aaaagcttgt aatcaagccc acttgggaag atttgccatc 7501 tgataatacc cgcgttgtaa tcgagcttga ccccgaatcc agcttcggca cgggcagaca 7561 ctataccact cagctttgcc ttgagcttct ggaaaagtat gttcattctg gtgataaagt 7621 tgccgacctc ggttgcggca gcggaataat ttcaatcgct gcaatgatgc ttggcgccga 7681 aagcgcaaaa tgtaccgata ttgcagaaaa cgccattcga attgcaaagg aaaacgcctt 7741 caaaaacggt attgctgatg ataaatatgc agtatactgc ggcgatattg cttctgataa 7801 taccctcgca gagaagtttg gcgttggata tgaccttgtt gcggcaaaca tcgttgccga 7861 tgttctgctc tcaatgacag atgttttcaa aaatatcaca cgcgaaggcg gcatacttgt 7921 cgtatcggga atcattgacg accgtttgga cgaagtaatg acaaaaataa cagataatgg 7981 atttgaagtg atcgaatcgg cacacagaga tatctggaac gccgcggcat tgaggcgcgt 8041 atgatagata ttttatacaa cgatgatagc atagttgtct gcatcaagcc tgccgggata 8101 atctccgagg atggcggctt gcccgacctc ttgcgcgccc agcttggttg tgaaatatac 8161 cccatacacc gtttggacaa accggttggt ggcataatgg tatatgcaaa aacaaagcct 8221 gcaagcgcaa agctaagtgc tgatttccaa aaccgtgctg ttacaaaaga atatctctgc 8281 atagttaagg gcattcctca agaacacagc gcagttctca aagatttgct atataaagat 8341 tcccgtgcga acaaaacctt tgttgtcaca cgtgagcgaa aaggcgttaa acctgcaagc 8401 cttgaatatg agcttctcga taccaagtca tcgcctgacg gagaactctc acttctcaaa 8461 gttaaactcc atacaggacg ctcacaccag ataagagtgc agtttgcttc acgcaagctt 8521 ccgcttttgg gcgactcccg atatggcgga aagaaacaag ggattgatgt atgtctgtgg 8581 tcacaccgtc ttaagttttc tcatcctatt atcggcagcg cttttgatta catcgcttgt 8641 gtgcctgatg actatccttg gattttgttc aaaatgtaat gtaaacttgt gaaatttaca 8701 gaatttaata gttaatttac taaataattt tttcaaaaaa aagcttgca // LOCUS sequence009 8736 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence009 VERSION sequence009 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..8736 /mol_type="genomic DNA" /organism="" /note="sequence009" CDS complement(111..1880) /product="DNA primase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964611.1" /transl_table=11 /codon_start=1 /translation="MALPSDFLDRLRDANRIDDVMRSYVTLKRTGRDYKCLCPFHSEKT PSCAVHPDDGYFYCFGCGAGGDVITFTMKIENLDYFEAVKLLADRSGIAMPEDTYDDRA AQEKKRLLEMNRTAAKFFYSNLKTPDGKEGLAYLLEKRKLKPETIKKFGLGVATNHWTS LTNYMTGLGYTHAELERASLISRNQQGRYFDFFVNRIMFPIFDLRGNVIAFSGRSLDAD PKGAKYKNSRETSVYKKSRTLFAMNFAKNTAVKSKRLILCEGNVDVISLHQAGFEEAVA TCGTAITAEHARLMSQYCDEIYICYDADAAGQKATQSAISLLSAAGLTSKVIKVNGEGI KDVDDYINKMGPARFKMLMEGSEGAIVFELNKCKQDLDLDGDLGRVEYIKRAVKVLAGI ENRVEREIYISRVANEIGIKTDILTAEVSAAIRKNQTATRKKDWQQISSGLNKRDDINP EAMKFPKEAKAEEGIIAYILKHPDSAAKVSARVAFDKFVTSFNRRVYEVLVEKSQEMTD ITLTSLSQEFSEAEMGKISGILAKSRDIVIDEDTLGEYIAVLTHSRKEAKNAGEDMSDD EFLAYVTRLSKEK" /locus_tag="LOCUS_0790" /gene="dnaG" /note="WP_010964611.1 DNA primase (Clostridium) [pid:32.0%, q_cov:94.4%, s_cov:90.8%, Eval:1.8e-85]" /note="MGA_88" CDS complement(1917..2924) /product="deoxyguanosinetriphosphate triphosphohydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583673.1" /transl_table=11 /codon_start=1 /translation="MSENLTPREFTELTEKTILSPYACLSSESKGRVKDEEKCPLRTDF QRDRDRIIHCNAFVRLKHKTQVFLNPTGDHYRTRLTHTLEVSQIARTITRALRLNEDLA EAIALGHDLGHTPFGHAGEEVLNAVSSKGFKHYRQSVRVVECIEKDGKGLNLTHEVKDG ILKHTDSIADTREGYIVRLSDVIAFINHDIEDAIRAGVICNEDLPKSAIEILGKTKSER ITTLVNSLIANGAETIRYSDEIGKAKKELVDYMYENVYRNPVCKSEESKAKMMVEKLYY HFLENPEKLPSDYLALADKFDKETAVCDYVAGMTDKYCTNLFMELYVPKGWHIY" /locus_tag="LOCUS_0800" /note="WP_012583673.1 deoxyguanosinetriphosphate triphosphohydrolase (Dictyoglomus turgidum) [pid:52.9%, q_cov:98.8%, s_cov:100.0%, Eval:1.3e-97]" /note="MGA_89" CDS complement(3049..3669) /product="YigZ family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357796.1" /transl_table=11 /codon_start=1 /translation="MPYKTIYDKASDSFIVDKSEFIGQICPVKTNEEAVAFIESVKAEN RKARHNCYAYVLRDENITRYSDDGEPQGTAGPPILDVIVKNGLTDVCVVVTRYFGGILL GKGGLTRAYSQGAAIAVNAAKIMNMCEGYELTITVDYSLYDKINYVLPDFEIKLIDTDY SDVIKIKLIVREEMLSSLEEKLIDISNGKINIAKSDKLYADFA" /locus_tag="LOCUS_0810" /note="WP_003357796.1 YigZ family protein (Clostridium botulinum) [pid:47.3%, q_cov:97.1%, s_cov:93.1%, Eval:4.0e-46]" /note="MGA_90" CDS complement(3741..3947) /product="50S ribosomal protein L31" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002669000.1" /transl_table=11 /codon_start=1 /translation="MAKEGIHPNYVTSVITCACGNVIETKSTKGNMRVEICSKCHPFYT GKQKLVDTGGRVDRFNKRFGLKK" /locus_tag="LOCUS_0820" /gene="rpmE" /note="WP_002669000.1 50S ribosomal protein L31 (Treponema) [pid:64.6%, q_cov:95.6%, s_cov:97.0%, Eval:9.9e-22]" /note="MGA_91" CDS complement(4104..5180) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKQNRIIAIFVTLALAFSLCGCRNNTVPPEPDTTITEPDVTTVST SESETAPTTTEEPIPEGDIKIDSEFVGSYLTMRMDDREAPQYEGSYFMVFSTYDEIAEY YETSCDFFFYGRKFTIQCASYSEGDFMANNDVLILKVDEPSSYITHSATSLRISDGKAV FGIERHMPKDAPLGDTQYHLIYTAPKGTFDALKGLEFEAVFAEINDLDSANAFDSERYL YIYPEFWPFVYKADAISAPGTIVDSIESYNELVEFYERYKTSYDFEDDFKKHIGSLYDE RMFDDYILLMVLAPCDANGKPLEVGQLFVYNLEVFIAVNNSSKAVVSDTTPSYLLVTAV SKKDLKGVNLSMFNISFN" /locus_tag="LOCUS_0830" /note="MGA_92" CDS complement(5495..7213) /product="phospho-sugar mutase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002338467.1" /transl_table=11 /codon_start=1 /translation="MREHELYELWLKNATEDPDLVAELESIKGDDEAIKDRFYRDLEFG TGGLRGVIGAGSYRLNIYTIRRATQGLADYVNGAFENASVAIGYDSRIKSDVFAREAAR VLAGNGIKAYIYPELMPTPMLSWAVRSLGCKAGIVCTASHNPAKYNGYKAYGADGCQMT IEAADIVLAKINGVPMFGGAKLVDFDEGVKSGMIEIISDDVVEAYLEEVKKQQVHPEVC ATSGLKVVYTPLNGSGNKPVRAILKKIGITDVTVVPEQEMPDGNFPTCPFPNPEIKEAL HLGLELCKTVQPDLLLATDPDCDRVGIAVPDGKGDYVLFSGNEVGAMLLEYICKERIAL GTMPEKPVAVKSIVSTDIAMAIAKDYGVELRNVLTGFKFIGEQIGYLEAAGEADRYIFG FEESYGYLIGSYVRDKDAVVGSMMICEMAAYYRSKGISLLEAREAIYKKYGNYFHTVAS FTCEGASGMEQMAKIMNELHTTPYSEIAGFKVVGLLDYLTHEDKDYATGAVNVIDLPKS DVITFKLENGATVVIRPSGTEPKIKAYYTTIAPTREEAVELGATIAADFKAKLGF" /locus_tag="LOCUS_0840" /note="WP_002338467.1 phospho-sugar mutase (Enterococcus faecium) [pid:53.1%, q_cov:97.7%, s_cov:97.8%, Eval:2.4e-159]" /note="MGA_93" ORIGIN 1 ctccgtgatc gccttggtgg tcagcttacc tgttgccttt ccgctttcaa gcaagctttc 61 aattgtaacc tttttttcgc tcatttttgc gtgcctccgt ttatgtcact ttatttttct 121 ttgctaagcc ttgtaacata tgccaaaaac tcatcgtccg acatatcttc tccggcattt 181 tttgcttctt tgcggctatg agttaaaacc gcgatatatt cgcccaaggt atcctcatca 241 atgacgatat cccgcgattt cgccagtatt cccgatatct tgcccatttc agcctcggaa 301 aattcctggc tgagcgaagt caatgtgata tccgtcattt cctgcgattt ttcaaccaaa 361 acttcataga cccgacggtt aaaggatgtg acaaatttgt caaatgcaac tcttgcgctc 421 acctttgccg ccgaatcggg gtgctttaaa atataggcaa ttatgccttc ctcggccttg 481 gcttctttcg ggaatttcat cgcctcgggg ttaatatcgt cccgcttgtt aagacccgat 541 gaaatctgtt gccaatcctt tttgcgggtc gctgtctggt ttttccttat tgcggcgctg 601 acctctgcgg tcaaaatatc ggtcttaatg ccgatctcat tcgccactcg ggaaatatag 661 atctcccgtt caacgcggtt ttcaatacct gccagcacct tgactgcccg cttaatatat 721 tcaactcggc ccaagtcgcc gtcaaggtcc agatcctgct tgcatttgtt cagctcaaag 781 acgattgcgc cttccgagcc ttccatcagc attttgaacc tcgcaggccc cattttgttt 841 atgtaatcgt caacgtcctt aattccctcg ccgttgacct tgatcacctt cgaggtgagt 901 cctgcggccg aaagaaggga tatcgccgat tgtgtcgcct tttgtcccgc agcatcagca 961 tcatagcaga tgtagatctc atcgcaatat tggctcataa gccgcgcgtg ttctgcggta 1021 attgctgttc cgcaggtcgc aaccgcctct tcaaatcccg cctgatgaag ggaaataacg 1081 tccacattgc cctcgcacaa aatcagccgt ttcgatttta cagccgtatt cttcgcaaag 1141 ttcattgcaa agagcgtgcg gctcttttta tatactgacg tttcacgcga gtttttatac 1201 ttcgcgccct tcgggtcggc gtccaatgat ctgcccgaga atgcaatgac attgcctcta 1261 aggtcaaaaa tcgggaacat aatgcggtta acaaagaagt caaagtatcg tccctgctga 1321 ttccgcgaga tcaggctcgc ccgctcaagc tccgcgtggg tatatcccag ccccgtcata 1381 tagttagtca ggcttgtcca atggttggtt gcaacgccaa gcccgaactt tttgattgtt 1441 tcgggtttaa gcttgcgctt ttcaagcaaa tatgcaagcc cctctttgcc atcgggagtc 1501 ttgaggtttg aatagaagaa ctttgccgcg gttctgttca tttccaaaag cctttttttc 1561 tcctgtgccg cgcggtcgtc atatgtgtcc tcgggcatcg caatgcctga cctatccgcc 1621 aaaagcttga ccgcctcgaa atagtcgagg ttttcaatct tcattgtaaa tgtgatgaca 1681 tctccgcctg ctccgcaacc gaaacagtaa aaatatccgt catccgggtg aacagcgcag 1741 gatggggtct tttccgaatg gaacgggcag aggcatttat aatctctgcc ggtgcgttta 1801 agggtgacat aagagcgcat tacatcatca atgcggttgg catctcgcag tctgtccaaa 1861 aaatccgaag gtaaagccac ttatatcact cctttcaata taatcaaact aaaaaatcaa 1921 tatatatgcc agcccttggg aacatacagc tccataaaca ggttggtgca atatttatcg 1981 gtcatacctg caacatagtc gcaaacggcg gtttccttgt cgaacttatc cgccagcgca 2041 agatagtccg aggggagctt ttcggggttt tcaaggaagt gatagtatag cttttcgacc 2101 atcatcttcg cctttgattc ctccgacttg cagacggggt ttctgtatac attttcatac 2161 atataatcaa caagctcttt ctttgcttta ccgatctcat ccgaatagcg gatggtttcg 2221 gcaccgtttg caatcagcga gttgacaagc gttgtaattc tttctgattt tgtcttgccc 2281 aaaatctcaa tcgcagactt cggcaagtct tcgttgcaga tgacacctgc tcgaatagcg 2341 tcctcaatgt catggttgat gaatgcaata acgtcggaca gacgtacaat gtatccctct 2401 ctggtgtcgg caatcgaatc ggtgtgcttc aaaatgccat ccttaacttc gtgggttagg 2461 tttaagccct tgccgtcctt ttcgatgcat tcaacaactc gcacactctg gcgatagtgc 2521 ttaaatccct tggatgatac agcgttcaaa acctcttcac ctgcatggcc aaagggggtg 2581 tgtcccaaat cgtggcctaa agcaatcgct tctgcaaggt cttcgtttaa acgcaaagcc 2641 cttgtaattg ttcttgcaat ctggctgacc tcaagggtgt gggtcagtct tgtgcgatag 2701 tggtcaccgg tggggttcaa aaatacctgt gtcttgtgtt ttaagcggac gaaagcgttg 2761 caatgaataa ttctgtcgcg gtcacgctga aaatcggtgc gaaggggaca tttttcttcg 2821 tctttaactc tgcccttcga ctcgctcgat aagcaggcgt atgggcttaa aattgttttt 2881 tctgtcaatt ccgtaaactc tctgggggtc aaattttcac tcataattcg tccttacttt 2941 ctgaaaatac tgttttaatt ttcgttaaca ctcttatata cataaaaaac aacaaatctc 3001 ctctttttaa aatcgaaaaa tcagagattt gtatgtttgc acaatttatc aagcaaaatc 3061 agcatataat ttatcggatt ttgctatatt tattttgccg ttggagatat caatcaactt 3121 ttcctcgagt gaagaaagca tctcctcacg cacaatcagc ttgattttaa taacatccga 3181 gtaatcggta tcaataagct taatttcaaa gtcgggaaga acgtagttga tcttgtcata 3241 cagcgagtag tcgaccgtta tcgtcagctc atacccctcg cacatattca tgatctttgc 3301 ggcattgacg gcaatagctg caccttggga atatgccctg gtaagtccgc ctttgcccaa 3361 aagtattccg ccgaaatatc tggtgacaac cacgcacaca tccgtcaaac cgtttttaac 3421 aataacatcc aaaatcgggg ggcctgcggt gccttggggt tcgccgtcgt ccgaatatct 3481 ggttatgttt tcatcccgca aaacataggc ataacaattg tggcgcgctt tgcggttttc 3541 cgctttcacc gattcaatga aggcgactgc ctcctcattt gtcttaaccg ggcagatctg 3601 cccgataaac tcggatttgt caacaataaa gctgtcgctc gctttgtcat atatggtttt 3661 atagggcatg gcgcacctcc caaacttaaa gtgaacgaaa aaagagggca caatagccct 3721 ctttcgtttt gaagcgatta ttacttctta agaccgaaac gcttgttgaa gcggtcaaca 3781 cgtccgccgg tatcaacgag cttctgctta cctgtgtaga aggggtggca cttggagcag 3841 atttctactc tcatatttcc cttggtggac ttggtttcga taacgttgcc acatgcacag 3901 gtgataaccg atgtaacgta attaggatgg attccttcct ttgccattaa aatgttccta 3961 ctttccgaac tggtaatatg atacacatag tagcccatca tcctcagttc agacagtagt 4021 actatggaat tatcatcaag atgccgcatc gcggcaaagt gtattataac ataacaaaaa 4081 acaaaatgca agtgtttttt tcatcaatta aatgaaatat tgaacattga aagatttaca 4141 cccttcaggt ccttttttga aaccgccgta accagcagat aactgggtgt tgtatcggat 4201 acaacagcct ttgatgagtt attgacagcg atgaatacct caaggttata tacaaacagc 4261 tgaccaacct cgaggggctt gccgtttgca tcgcatggtg caagaaccat caaaagaatg 4321 taatcatcaa acatccgctc atcatacagc gagccgatat gctttttaaa atcgtcctca 4381 aaatcgtagc ttgttttata tctctcataa aattcgacca gctcattata actctcaatc 4441 gagtcaacga tagttccggg agctgatatc gcatccgcct tatatacaaa aggccagaac 4501 tcggggtaga tatataaata gcgctccgag tcgaaggcgt ttgccgaatc aaggtcgttg 4561 atctccgcaa aaactgcctc aaactcaagt cccttcaaag catcaaatgt gcccttcgga 4621 gcggtataaa taagatgata ctgtgtatcg cccaagggtg catccttggg catatggcgc 4681 tcaattccga aaacggcctt gccgtcggaa attctcaaag aagttgcact gtgggtgata 4741 tatgagcttg gctcatcgac ctttaaaatg agcacatcgt tatttgccat aaagtcgccc 4801 tcactgtatg atgcacactg aatggtgaac tttctgccat agaagaaaaa gtcacagctt 4861 gtttcataat actctgcaat ctcatcgtag gtggaaaaga ccataaagta tgagccctca 4921 tactgaggag cctcgcggtc gtccatacgc atagtaaggt agctacctac aaattccgag 4981 tcaattttaa tgtcgccctc tggaatcggt tcttcggttg tggtgggcgc ggtttcgctt 5041 tccgatgttg aaacggtcgt cacatcgggt tcggttattg tggtgtccgg ctcgggagga 5101 acggtgttat ttctgcaacc gcaaagcgaa aatgcaagcg caagcgttac aaatatggca 5161 attattctgt tttgcttcaa aaaacattcc tcctttcggc gatagtcata ttattatagc 5221 acagtagcat gaattttgca atgcttaggg gcaaaacagt gagtgcgtgc gcctgttcga 5281 cgctttttgt atatgccttc cccttgaggg gttggagcag tggtcgacaa gtcggagcga 5341 aagcgaacgg caagtcggga accgcaaacg ggattggtgt cagcaaatgc tgacggatga 5401 ggtgaacgca aactgccgaa tttcaaatat ctgcactatc cacaaatcat aaaacaagcc 5461 cctcatttta ttgaggggct ttaatgctta tgtattaaaa tccaagctta gccttgaagt 5521 ctgcggcaat agttgcgccg agttcgacag cttcttctct tgtaggagca atggttgtgt 5581 aataagcctt gatcttgggc tctgtacccg aaggacggat tacaacagtt gcaccgtttt 5641 caagcttgaa ggtgataacg tccgacttgg gaagatcgat cacgttaaca gcgcctgttg 5701 cgtagtcctt atcctcgtga gtgagatagt caagcaaacc gacaaccttg aagcctgcaa 5761 tttcgctgta aggagtggtg tgaagctcgt tcataatctt tgccatctgc tccatacccg 5821 aagcgccttc gcaggtgaag ctcgcaacgg tgtgaaaata gttgccgtat ttcttataaa 5881 ttgcttctct tgcttcaaga agggaaattc ccttagagcg gtagtatgct gccatttcgc 5941 agatcatcat cgaaccgaca acagcatcct tatctcttac atatgaaccg atgaggtaac 6001 cgtaggattc ttcaaagccg aagatatatc tgtcagcttc gcctgctgct tcaagatatc 6061 cgatctgctc gccgatgaac ttaaagccgg tcagtacgtt tctgagctca acgccgtagt 6121 ccttcgcgat tgccattgca atgtcggtgg acacgatcga cttaactgca acgggctttt 6181 cgggcattgt gccaagcgcg attctttcct tgcagatgta ttccaaaagc attgcgccga 6241 cttcgttacc gctgaacaaa acatagtcgc ccttgccgtc gggaacagca ataccaacac 6301 ggtcacagtc ggggtctgtt gccaaaagaa ggtcgggctg aacggtcttg caaagctcaa 6361 gacccagatg caaagcttcc ttaatttcgg ggttggggaa ggggcaggtg gggaagttgc 6421 catcgggcat ttcctgttcg ggaactacgg taacatcggt gatgccgatc tttttgagta 6481 tagctcttac aggcttgttg cccgagccgt tgaggggagt atatacaacc ttgaggccac 6541 ttgttgcaca aacctcgggg tgaacctgct gcttcttgac ctcttcgagg taagcttcaa 6601 caacatcgtc agagataatt tcgatcatac cggacttgac gccttcatca aagtcaacca 6661 gcttagctcc gccgaacata ggaacaccgt tgatctttgc caaaacgata tcagccgctt 6721 caatggtcat ctgacagccg tcagcaccgt atgctttata tccattgtac ttagcagggt 6781 tatgtgaagc tgtacaaacg ataccagcct tgcatccgag gcttcttacc gcccaggaaa 6841 gcataggtgt gggcataagc tcaggataga tatatgcctt aatgccgttt cctgccaaaa 6901 ctcttgctgc ttcgcgtgca aaaacatccg acttgattct tgagtcataa ccaattgcaa 6961 cgcttgcatt ttcaaatgca ccgttaacat aatcggcaag gccttgagtt gctctgcgga 7021 tggtgtagat gttcagtctg taagagcctg cgccgataac accgcgcaaa ccgcctgtac 7081 cgaattcaag gtcacggtaa aatctatcct tgattgcttc gtcgtcgccc ttgatggact 7141 cgagctccgc aacaaggtcg gggtcttcgg tggcattttt cagccaaagc tcgtaaagtt 7201 cgtgttctct catttgtggt cctcccatta gattatttca gaatattcca tttataagta 7261 tataacattc accgcaataa ttcaagggga aaataaaata attccacagg gcttaccgcg 7321 ggcacgccgg cgccccaacc gcccccttcg gggcgccgca ggcacctgca cgcccgctgc 7381 ttttgtttgc tcggaatgtg agcgacggcg aagcccatcc caagcaaagc ctgcggcttt 7441 gcttgggaca ccccgcgcct gcggcgcggg gctccgctcg cccgaagggc ggccgaacgg 7501 agagggcttc gccccgaagc aggcgccctt gtcaaaaaca ttgcggcaaa agtgaacaaa 7561 tgttccaaat tgtgttgacg aacttggcac aatgtagtaa aatgtaggaa aagactgctg 7621 gaaggatgag gcaaatgttc tgcaaagttg aaactatcgg attgatggga atgaatgcgt 7681 ttcccgttga tgttgaaatt gagatcagcc gaggaatcga acggttcgat atcgtcggtc 7741 ttgcggatat ttccgtcaag gaatcccgcg agcgaatcaa gtcggctttc cgttcgtcaa 7801 tgtttaaatt tcctgcggcg aatgttgttg taaacctcgc tcctgccgat gtcaaaaaag 7861 ccggctctac ccacgacctt gcaatcgctg ttgccgttct ttctgcatct aacctcatcc 7921 ccgaggattc ttgcgacaat tccgttttca tcggtgagct gtcgctcggc ggcgatgtcc 7981 gcgcggtcag aggcgttctg ccgatgacaa ttcttgcgaa aaagcttggc aaaacaaagg 8041 tgttcgttcc caatgagaat gcctatgaag catccgttgt cagcggggtt gatgtttttg 8101 gcgttgaaac gctttctcag cttgctgacc atctgaacgg tatatcttat attaagaaga 8161 tgcccgaata tgtgcaaaag aagcaggatg aattcacagg gctagacttt gccgatgtca 8221 agggtcagca gtttgccaaa aaggcccttg aaattgccgc ctgcggagga cataacgtca 8281 taatgatcgg cgctcccggc tctggcaaga gcatgcttgc aaaacgcctg ccgtcaattc 8341 tgcccgatat gacctttgag gagtcgattg aaacaacaaa tgtatattcc attgcgggac 8401 ttttggataa ggattcaccg cttgtaacac agcgcccgtt ccgttctcct catcacaccg 8461 tttcaaccgc gggattaaca ggcggcgggg gagtgcctcg cccgggcgag atctcgctgg 8521 cgcataacgg acttttattc cttgatgaac ttgccgaatt caaccgcaca acccttgaag 8581 ttttgcgtca gccgattgag gacagatgcg tgaccatctc ccgcgcatcg ggtacggtca 8641 catacccttg cgacattatg cttgtgggtg cgctcaaccc ttgcccgtgc ggatattacg 8701 gtcaccccac caaaaaatgc gtttgctcaa agaagc // LOCUS sequence010 8120 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence010 VERSION sequence010 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..8120 /mol_type="genomic DNA" /organism="" /note="sequence010" CDS 487..2649 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKISKRLLAAFMCLLMVMSLVSCGNEAVNNPIDDPVVTEDTTVSE PPVTTTEATTTEATTTEATTTTEATTTQVTTTTEATTTAPVTTTEATTTEAEPEWVITP ADEKLYATADLNVRATPEQNGERISHVDKGDLVEVTGWVDNGWARIKFRGEERYVNGKY LSKDKPAEFTVGTTVKPEEIKPVNGEYTVSGSFSSEFLDNDWDTACKIGTVAGDYESVW GTHYPNLTAVIERVCPLSDIAHIEITLTASNIEPCWNGKIPQCELHWNSRADNGAEMTQ SFNTDTVVLDMDVPEGVYAVILNPYAFSSSVGRVHFEYTIKITAKQEEPIVETDNKPDV SSAEKTKWVATWGSAQLKAGGDHLPKKVKLSGSTLRQQIRTTIEGDVIKLTLTNEYGEK DLIIESVHIAHLGNPQSSAIDKKTDTVVTFGGKQAVTVKKGQRLESDEIEFEFDALDDI AVTMYIKQAPSTVTSHTASRCSTWVVSGNHVSDVSTNGGDTTTSWYFLTRADTLATEES GVIVTFGDSLTDGASVTTNAFARWPDELARLLKKDSELSHYGVINMGIGGTLLRWDISR LERDVLNTPGVKAVVVLYGINDIANTTYDKSGDIISLYKQIIKKCEAKGIKVYCGTLTP TKGNTGGYYSSMVNTTRLNINKWIMSDKSGLDGYIDFASAVASATDSDKMQSQYVSVWN DWLHFNDKGYKHLGKTAYEVLKKELD" /locus_tag="LOCUS_0850" /note="WP_012640418.1 SGNH/GDSL hydrolase family protein (Caulobacter vibrioides) [pid:31.4%, q_cov:50.4%, s_cov:82.0%, Eval:1.3e-48, partial hit]" /note="MGA_96" CDS 2665..3891 /product="SGNH/GDSL hydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012640418.1" /transl_table=11 /codon_start=1 /translation="MKAGKIMAIVLSCVLAASAFAGCAAKKSDGGVPKTKWVATWGSGM RKDFTDQLPKQNSFAGSTVRQQIRTTVSGDVMRLTFSNQYGESDLVIESVHIAKLKDPA SSEIKTKTDTVVTFGGSESIIIPAGETAVSDDIAFSFEALEDIAVTTYFSDVPSTITGH TASRCYIWTKSGNHVDEKELTDAEITSAWYFLARIDTLATEDTKIIVTFGDSLTDGASV TDNIFSRWPDELARQLKANEQLCNYGVINMGNGGTLLRWDMARFERDVLNTPGVDTLVV LYGINDLSGKTEDISQNIIGYYEEIIEKCHENGIKVYFGTLTPTKGNTGSHYSKLINEM RHTINDWIMTNDQADGYIDFASAVASVADKDMMDEAYVSKWKDWLHFNDNGYTKLGQTA YDVLKDELK" /locus_tag="LOCUS_0860" /note="WP_012640418.1 SGNH/GDSL hydrolase family protein (Caulobacter vibrioides) [pid:30.6%, q_cov:87.5%, s_cov:80.9%, Eval:3.0e-46]" /note="MGA_97" CDS 3917..5167 /product="SGNH/GDSL hydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_191309483.1" /transl_table=11 /codon_start=1 /translation="MKIGRLLAVVLSLIMIASTVTACDGSSFTPKADEAGWYATWGTAM YDASADETPFNPSLKENTVRQQIRVSIGGDKIKLTFSNIRGDIPVQIEKAHIAKMVEGG ANPAIDTLTDTVITFGGSESVTIEPGKTVTSDEIDFSFDALENLAVTLKMGKYVGGTIT AHRGARANTWVVEGDHVSDETISGGNKMTSWYYLEEVAVWAEAGTKTIVCLGDSITDGA NTTTNKFTRWSDELARQLQANGYENISVVNKGIGGNSIFGGLGTAAKDRFYHDVLEVEG VRYCIVMIGINDIGYTNEDISQSLIDQYKIMIDACHENGIAIYGATLTPIKNSGYYSEL HEQIRVNLNEFIRSEDSGFDGVIDFDAALADPADTEKMSDEYVEGWRDYLHPGDLGYTV MGETAFEALDKIWSAEE" /locus_tag="LOCUS_0870" /note="WP_191309483.1 SGNH/GDSL hydrolase family protein (Amycolatopsis bullii) [pid:33.3%, q_cov:88.2%, s_cov:92.1%, Eval:6.1e-50]" /note="MGA_98" CDS 5693..6706 /product="IS30-like element ISTde2 family transposase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010956682.1" /transl_table=11 /codon_start=1 /translation="MGKQHYLTYEERLKIEAWLRAKAKVAWIASQLGCSRQTIYNEIKR GQYIHTCDYWDEVRYSADIAQQQTDYNQSAKGRPLKIGSDYAYADFLEQIILKKKYSPA AAIAEARKHDFDTSICVTTLYSYIEKRVFAKLTKKDLWEKGKRKKRTYNQVKRIAHPLL PSINNRSDRANDRAELGHWEMDLIVSAKSGRSVLLTLTERTTRQEMIFKLPNRKATTVR SVFDKLESEDTAFRKKFKSITTDNGSEFLQYDKLTESIHGGKRFDIFYCHSYAAWEKGT NENHNRMIRRFFPKGTDFSKVSSDRVKKVEEWMNNYPRAKLGWKTPNELMNQLLAG" /locus_tag="LOCUS_0880" /note="WP_010956682.1 IS30-like element ISTde2 family transposase (Treponema denticola) [pid:41.2%, q_cov:97.3%, s_cov:96.4%, Eval:2.7e-66]" /note="MGA_99" CDS complement(6688..7314) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSVSLYFGLPGCGKTTTLTEIAYNAINKKKSPYKYVYGNVHLALP GYTYIDNFCIGNFLLEDCLILIDEATLYADSRDFKNFSGNRLNYFMTHRHYRADIILFV QKWDAVDIKIRTITDNVYYVYKPLLIGHWFSYIYRIPYGIDFVSQKHDGRRYGDIIQGY GKPSFMTKLFAHKLYRPKFYKYFDSWEIKLLPPLPDKYKPYPASN" /locus_tag="LOCUS_0890" /note="MGA_100" CDS complement(7381..7596) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDGTTTTIANMSLDAITTALGKVMEWVKVVVDGLVGTDGALSELL PLFLVGVAISALLLGVKIIRSFIWGA" /locus_tag="LOCUS_0900" /note="MGA_101" ORIGIN 1 gcttggcgag ccggatgaaa gaggcagacg caagccgatt gaaattcccg acagcgaatt 61 tgttttggat gttgacacag tcataatgtc cattggcacc agcccgaatc cgcttattaa 121 atccaccacc gcagggttgg aagttaaccg ccgcggcgga attattgtca acgaagaaac 181 aggcaagacc acccgcgagg gtgtatatgc aggcggcgat gccgtaaccg gtgcggcaac 241 ggtaatttcc gcgatgggcg caggaaagct cgccgcgaaa gcaattgatg agtacatcag 301 aagtaaataa accaaaatga aagctgccat gcaactatgc gtggcagttt tttgttgatg 361 attgcaagcg agtaaacaaa aggtcaataa aacccacaaa ataggtcacg ttttgatatt 421 tacaaagcag aggcgcggtg gtaaaattaa agtgtatatt tatttatacg aaaggaagat 481 tgtgcaatga agatttccaa acgtttgctt gcggcattta tgtgcttatt aatggtaatg 541 tcgcttgttt cctgcggcaa cgaggcagtt aataatccta ttgacgaccc tgttgtgacc 601 gaggacacaa ccgtttccga gccgcccgtg acaaccaccg aggcgactac tacggaagcc 661 actacaacag aggcaacaac taccaccgaa gccactacca cacaggtcac aactactaca 721 gaagcaacaa ccacagctcc tgtcaccaca actgaagcca caacaaccga agctgagccc 781 gaatgggtga tcactcctgc ggatgagaag ctgtatgcta ccgctgattt gaatgtcaga 841 gccactcccg agcagaatgg cgagcgaatc agccacgttg acaaaggtga cttggtcgag 901 gtcacaggtt gggtagataa cggctgggcg agaattaaat tccgcggcga ggaaagatac 961 gtcaacggaa aatatttaag caaggataag cctgccgagt tcacagtcgg cacaactgta 1021 aaacccgaag aaatcaagcc ggtaaacggt gaatataccg tttcgggaag cttttcaagc 1081 gagttccttg ataacgattg ggatacagca tgcaagatcg gcactgtagc aggtgattat 1141 gaatcggttt ggggaacgca ttatccgaat cttaccgctg taatcgaaag ggtttgtccc 1201 ctttcagata ttgcacatat tgaaattaca cttacggctt caaacattga gccttgttgg 1261 aacggaaaaa taccccagtg tgagcttcat tggaattccc gtgcggataa cggtgcggaa 1321 atgacccaaa gcttcaacac cgacactgtt gttcttgata tggatgttcc cgaaggcgta 1381 tatgctgtaa ttctcaatcc ttatgccttc agctcctctg tcggcagagt tcattttgaa 1441 tatacaatta agataactgc aaaacaggaa gaaccgattg ttgaaacaga caacaagcct 1501 gatgtcagct cggctgaaaa aaccaaatgg gttgcaacct ggggctccgc tcagcttaaa 1561 gccggcggcg accaccttcc caagaaggtt aagctttcgg gaagcacctt gcgtcagcag 1621 ataagaacca ccattgaggg cgatgttatc aagctgacct taacaaatga atacggcgaa 1681 aaggatctca ttattgagag tgtacatatt gctcatcttg gaaatcctca aagctccgct 1741 attgacaaaa agaccgacac ggttgtcacc ttcggcggaa agcaggctgt gaccgttaag 1801 aagggtcagc gccttgaaag tgacgaaatt gaatttgagt tcgacgcact tgatgacatt 1861 gcagtcacaa tgtatattaa gcaggcacct tcaaccgtca ccagccatac agcatcgaga 1921 tgctcgacct gggtcgtttc gggaaatcac gttagcgatg tttcaaccaa cggcggcgac 1981 accaccacat catggtattt ccttacccgt gctgacaccc ttgcgaccga agaatcaggc 2041 gttattgtca cattcggtga ctcgcttacc gacggcgcat ctgttacaac caatgcgttt 2101 gcccgttggc ccgacgaatt ggcaagactt ttgaagaagg acagcgagct ttcgcactat 2161 ggcgttatca atatgggtat cggcggaaca cttttgagat gggatatttc cagacttgag 2221 cgcgacgttt tgaatacccc cggcgttaag gctgttgttg tgctttacgg tatcaatgac 2281 attgcaaaca ccacatacga taaatccggc gatataatca gtctttacaa acagataatt 2341 aaaaagtgcg aagcaaaggg cattaaggta tattgcggta cacttactcc caccaagggc 2401 aatacaggcg gatattactc aagtatggta aacaccacca gacttaacat caacaagtgg 2461 ataatgtcag acaagtcggg tcttgacgga tatattgatt ttgcttctgc tgttgcatct 2521 gccacggaca gcgacaagat gcagtcgcag tatgtttccg tttggaacga ctggctccac 2581 tttaacgaca aaggatataa acatctcgga aagaccgctt atgaggtttt gaagaaagaa 2641 cttgactaaa taagaggatt taatatgaaa gcaggcaaaa taatggctat tgttttatca 2701 tgtgtgttgg cggcttctgc ttttgcggga tgtgcggcca aaaaatctga cggcggagtt 2761 cccaaaacca agtgggtggc aacctggggc tcgggtatga gaaaagattt caccgatcag 2821 ttgcccaagc aaaacagctt tgcaggcagc accgtaagac agcagatcag aacgaccgtc 2881 agcggcgatg ttatgcgctt gacattttca aatcaatacg gcgagtcgga tctggtgatc 2941 gagagtgtac atattgcgaa gcttaaagac cccgcaagct ccgagatcaa aacaaaaacc 3001 gacactgttg tcacattcgg cggaagcgaa agcatcatca tccctgcagg cgaaaccgct 3061 gtgagcgatg acattgcatt cagctttgaa gcgcttgaag acattgcggt gacaacatac 3121 ttctcagatg tgccttcaac cattacaggc catacagcat cgagatgcta catatggaca 3181 aagagcggaa accatgtcga tgaaaaggag cttaccgatg ccgaaattac aagcgcttgg 3241 tatttccttg cccgcatcga cactcttgcg accgaagaca caaaaattat tgtcaccttc 3301 ggcgattcgc tgacagacgg cgcaagcgtc accgacaaca tcttctcccg ttggcccgac 3361 gaattggcaa gacagcttaa agcaaacgaa cagctttgca attacggcgt cataaatatg 3421 ggcaacggcg gaacattgtt gagatgggat atggcaagat ttgaacgcga tgttttgaac 3481 actcccggtg tagacacctt ggtcgtgctc tatggcatca acgatctatc gggcaagacc 3541 gaggatattt cccaaaatat tatcggatat tacgaagaga tcattgaaaa gtgtcacgaa 3601 aacggcatta aggtatattt cggcacactc accccgacta agggaaatac cggcagccat 3661 tattcgaagc ttataaatga aatgcgccac accattaacg attggataat gacaaacgat 3721 caggccgacg gatacattga ctttgcttcg gctgttgcat cggttgccga caaggatatg 3781 atggacgaag cgtatgtatc gaagtggaaa gattggctcc actttaacga caacggctat 3841 acaaagctcg gtcagacagc atatgacgtg ctcaaagacg agttgaaata aattagcgaa 3901 aggaattgtt gaaaaaatga agattggaag acttttggca gttgttttat ctttaattat 3961 gattgcatca acagtaaccg cttgcgacgg cagctcgttc acacccaagg cagacgaagc 4021 cggctggtat gcaacctggg gcacagcgat gtatgatgcc agcgcagatg aaacaccctt 4081 taacccgtca ctcaaggaaa acaccgtccg ccagcagatt cgtgtatcca tcggcggcga 4141 caagatcaag cttaccttct cgaacatcag aggagatatt cccgttcaga ttgaaaaagc 4201 acacatcgca aagatggttg aaggcggagc aaaccccgca attgacaccc tgaccgacac 4261 cgttatcacc ttcggcggaa gcgagagcgt tacaattgag ccgggcaaga ccgttacatc 4321 ggatgagatc gatttcagct ttgacgcttt ggaaaatctc gcagtaaccc ttaaaatggg 4381 caaatatgta ggcggaacga tcactgccca cagaggcgca agagcaaata catgggtagt 4441 tgagggcgac cacgtcagcg acgaaaccat ttccggcggc aacaagatga cctcttggta 4501 ttatcttgaa gaggttgctg tttgggcaga ggcaggcacc aagacaattg tctgcttggg 4561 cgactcgatc accgacggcg caaacaccac cacaaacaag ttcacccgtt ggtcggatga 4621 attggcaaga cagcttcagg caaacggata tgagaatatt tccgttgtca acaagggcat 4681 cggcggaaac tcaattttcg gcggtttggg aactgccgca aaggacagat tctatcacga 4741 tgtgcttgag gttgaaggcg taagatattg catcgttatg atcggtatca acgatatcgg 4801 atatacaaac gaggacattt cccagagcct tattgaccag tataagatta tgattgatgc 4861 ttgccacgaa aacggcatcg caatttacgg cgcgaccttg acacctatta agaacagcgg 4921 atattacagc gagcttcacg aacagataag agttaatctc aacgagttca ttcgttcgga 4981 agattcgggc tttgacggtg ttatcgactt cgacgcggct ttggctgacc ctgccgatac 5041 tgaaaagatg agcgacgaat acgttgaggg ctggagagat tacctccacc cgggcgatct 5101 gggatatacc gttatgggcg aaacagcatt tgaagctttg gataaaattt ggagtgctga 5161 ggaataagat ttgattgaca ggcgaccaca cagggtcgcc tgttttgata ttggcagata 5221 aatttaagca gatctcatag cgggcgaccc tgcgtggtcg cccgctttta acctctcttt 5281 cgcgtacagc cgtctgcttc tccaattaat tgaaaccgag aagaaaacat acagccgtcc 5341 accatcaaca cagattttca ttcacaaaaa tcgggcctat gtacccgccc gtttaactgt 5401 gccccacttt cgggcaccca cataggggcg ccccttttta caatttgtaa atgtcaagag 5461 aaaatttgac aaaatctaag tttctcaata tcatatttat aacctcatag tcaagaagct 5521 ttcgcggcat aagctcgccc ggtgcgagta ccgggcgagt tattccacgg tcatcttgac 5581 aatggtttat aaatatggtt ttggtaatgg tcggcagcga cgcacaagcg tcgttgccga 5641 actttataat tttgagaaac gtattaaact taccggaaag gaagggtacg gaatgggaaa 5701 acaacactac ttgacatatg aggaacggtt aaaaattgaa gcctggcttc gggcaaaagc 5761 aaaggttgcc tggatagctt cacagctcgg ttgcagtaga cagacaatct acaatgaaat 5821 caaaagaggg caatacatac acacttgtga ctattgggat gaagtgagat attccgcaga 5881 cattgcacag caacaaacag actacaatca atccgcaaag ggcagacctt taaaaattgg 5941 gtcggattat gcctatgcgg attttttaga acaaataatc ttaaaaaaga aatactctcc 6001 tgcggcggca atagctgaag caagaaagca tgattttgat acaagtattt gtgtcacaac 6061 attatattca tacattgaaa aacgtgtttt tgcgaagcta acaaaaaaag acctttggga 6121 aaaaggaaaa cgaaaaaaga gaacatataa ccaggttaaa agaatcgctc atccgttgct 6181 accatctatt aacaaccgtt cagatagagc aaatgaccgc gccgagcttg gacattggga 6241 aatggattta attgtttctg caaaaagtgg gcgttccgtt ctgctgacct tgacagaaag 6301 aacaacaagg caggaaatga tattcaagct cccgaaccga aaagcaacta cagtaagaag 6361 tgtatttgat aagttggaga gcgaggatac tgcattccga aagaaattca aatcaataac 6421 aaccgataat ggctcagagt ttttacagta tgataaactg acagaatcaa tacacggcgg 6481 caaacgcttc gacatcttct actgtcactc atatgcagct tgggagaaag gcacaaatga 6541 aaatcacaat agaatgatcc gacgattctt ccctaaaggt acagacttta gtaaagtttc 6601 atcggatcgt gttaaaaaag tggaggaatg gatgaacaat tacccacgag ctaaattagg 6661 ttggaaaaca ccaaatgaat tgatgaatca gttgcttgct gggtaaggtt tatacttatc 6721 cggtaagggt ggaagtaatt taatttccca tgaatcaaag tatttataga acttcggacg 6781 ataaagtttg tgggcaaata atttcgtcat aaaggatggc ttaccatagc cttgaataat 6841 gtcaccatat cggcggccat catgtttctg acttacaaaa tcaatgccgt aagggatacg 6901 gtatatataa ctgaaccaat gaccaataag caagggttta taaacataat aaacattatc 6961 agtaatggtg cgaattttaa tatcaactgc atcccacttt tgcacaaaca aaataatgtc 7021 agctcgatag tgacggtgag tcataaagta attaaggcgg ttaccggaga agtttttaaa 7081 atctctggaa tctgcataaa gagttgcttc atcaatcaaa atcaagcaat cttcaagcaa 7141 gaaattacca atacaaaaat tatcaatata tgtatatccg ggcaaagcca gatgtacatt 7201 accgtatacg tacttatatg gagacttctt tttgttgatt gcattatatg caatttcagt 7261 taaggtagta gttttgccgc aaccgggcaa gccaaaatac aacgatacac tcataacata 7321 aacctttcga aaaatgtgcc ccgcacccgg cacagagtgc cgagggcggg gcatctttta 7381 ttaagcgccc cagataaagg aacggataat cttgacaccg agcaagagtg cagaaattgc 7441 aacacctacc aggaacaaag gaagaagctc agaaagtgcg ccgtcagttc ctacgagacc 7501 gtcaacaaca actttaaccc attccataac cttgccaaga gcagtagtaa tagcatccaa 7561 actcatattt gcaatagttg tagtagtacc atccatgtac taaaactctc ctttcttgaa 7621 gattgcccta aacaggcggt aaaaaatatc tacaaagaac acgacaagca aacatataag 7681 tattccggat atagcatata tgtactgctg agacgagtcc ccagtattcc aagaatgatt 7741 gataatctgc tgaattaaat catacataac aaattacctc cgaactgaaa aaactataat 7801 tcccttgata actttaacca agccgatcaa aagaaaggta caaaaaatcg gaaccatgta 7861 agtgctccaa aaggaggact taacaaaaag ctgaactgcc caaataggat agtaaaacca 7921 ctcaaacatt acttttcaag acctcctaag cgaatgaata tcattatcaa gagaatgatt 7981 ataaataagt agtaaaagaa tgtcatttaa aacctccaaa taatgaataa gcagaaataa 8041 tatcgggtga ccactgaaaa gccatagccg tagctatacc gttaaaagtt ttagatcgaa 8101 cacgcgaaga agaatgaacc // LOCUS sequence011 7961 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence011 VERSION sequence011 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..7961 /mol_type="genomic DNA" /organism="" /note="sequence011" CDS complement(436..792) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSSSFVEKIVKSCPFEVDIYCEGYPDVIYEIILDDQPTQEQIETA VTALEDFVYGYNKTHILRPIHDVSEISGIPGINYHPRGIYVHIDFGLCSLKAPFLAVKA LQETDLPIFRVALR" /locus_tag="LOCUS_0910" /note="MGA_103" CDS complement(943..4140) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKTKTLKSLTMSIISTLLCFSCFIGSTFAWFTDQVTSENNIIASG KLDIEMEWADGSFDPADSATIWTDASVGAIFDYDKWEPGYAQARHIKIKNNGSLAFTYQ LMIQPTGELGVLAEVIDVYFIDPAQTVNRSSLTQERLVGTLKNVVSGLDASRIGNGNLE AGQECEITIVLKMQESATNEYMNQSIGSSFAIQILANQYAFESDSFGNDYDIGALPQIA DNYSASVSLNGMLNNENKTAQSLTIGNSTDDINAHIPADVKIADGASELVLSVARADRS SNILMSDGQVSRSLDVHIEGVSPTNDVPIIVNLGQVLPTGLKNSSISLYHVENGVAHNM SLVDTFTAHNQFTYNRDTGEVSIYISSFSEITAVVSISNPWDGTVDTTWYNDVDTEFII DSAEDLAGLGALVSGGNTFEGKTIKLASDLDLGGVGHNYVFYPIGYQYNESDTADTPHA FKGIFDGQGNRISDLYQNTWNIKGHYDNGYYKKSLGLFALIDGGTVKNLVLENFILEGE FAPTGCVAGLGYGGTFENITLRRCQPATYNTGVAGIIGWDAGVNETYTFNNISVGSSNT IHALWGSWDVACGGIMGFLDETSTATMTNCTVAANMDVYNDVCANYQYYQYRYAGMLIG TIGSDGIPESGNLTCTNCNVYIGSWADYYYCEFEKNSSASYTEDFQFSRVDDKDIVFDL SGNAISCTHDHTLNEDKLAYHLPFSQLYTGYSWGATAVYEHDGVNIMKYIYEVIYVDGT HVLNIDYVTDNTTPYNLNAAPDGFSWINGDVEEVTSIPAGNEHSVVVYLNDISTYYARF VDVNGMEIYSEQFKKGATSVKNEPSVPTISGYYGSWEPYDNLLKNATSDVIIRPVYSLE QNSDILSNVTDIGELFDALSQGHTAIMSQSLSGTISSANKSVMSVITNGVTDKDASLTL NSFDLSYDSSSNANKNWTLFQINGDSKLTVSGGLPGYGTLTFNISKLNSNARPTIFDIK YGGTLILERGVTIEIKCADASDISKITTIVGITDLDSTDANGLSVYPGLNIINEGNSIK IIVTGTTTLVGNDSNNT" /locus_tag="LOCUS_0920" /note="MGA_104" CDS complement(4622..5653) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNFDFGENIKTLRKQKGLTQEQVAELLDVSKQSVSRWENNATYPD ITFLPVLASFYNVTVDFLLGADYETNKSIIEDYEKSRQEAHHRGNISDAYSLSQKVYAS FPNNKSIINNVMVDSYLMGLHNVDKKRKYYLELSISIAERFLKMTEDLEEQCRCINNIS VCNKLLGNCEKAIEWMQKLPSIWSGIETAALGVLEGKDKTDSIQCSLDAVLHLLHRLIF VYATESELPKQDRIKALEKLPYIFGIVFEDGNCGFYHAFLSRVFVELAKLSEENSEQAI AYAKKAVEHAKLYDGLTAQMHTSLLFKGQRISPEEFTSANNQTQTERVAVQLSDDIYKA ILN" /locus_tag="LOCUS_0930" /note="WP_011948545.1 transcriptional regulator (Clostridium botulinum) [pid:28.7%, q_cov:58.9%, s_cov:54.4%, Eval:1.5e-16, partial hit]" /note="MGA_105" CDS 5857..6393 /product="stage V sporulation protein T" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966490.1" /transl_table=11 /codon_start=1 /translation="MKATGIVRRIDDLGRVVIPKEIRRTMRIREGDPLEIYTNADGEVI FKKYSPINELSENAASAAEVIYKLGGQPVVILDRDHVVAVAGVPKREYLERRLSPMLDD ILESRRSWMYDGESRRIQPVEGIDRHALAVTPITAQGDIAGAVCFMATDDQPKGTSLLT TLSQTAAMFLGRQLE" /locus_tag="LOCUS_0940" /gene="spoVT" /note="WP_010966490.1 stage V sporulation protein T (Clostridium) [pid:47.8%, q_cov:100.0%, s_cov:99.5%, Eval:2.4e-40]" /note="MGA_106" CDS complement(6654..7583) /product="1-phosphofructokinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963555.1" /transl_table=11 /codon_start=1 /translation="MILTVTLSPAIDKTAECESFNPSEVNRITPISVDFGGKGINVSRA AKKLGLNTYAIGIGFDKADEINRFLKSEGISADFIKCPAPLRTNLKIFDNETKNTVEIN EPASKVKKDVLSKLIQRFESIVVNCDILVLAGSVPSGVPLDIYKTLCLRAKELNPEVKV IIDASGEALRSGIEAAPYMIKPNLEELCGAFGCALKKYSDIKAVAEQIIDGAGVNTVLI SLGAQGAMIVDKERAYHQDAVKVDVKSAQGAGDAMVAGACLALEDGVSLYKTLVFGVCS AAGAVSQNGTAFCGRDFFDEKVKEILKK" /locus_tag="LOCUS_0950" /gene="pfkB" /EC_number="2.7.1.56" /note="WP_010963555.1 1-phosphofructokinase (Clostridium acetobutylicum) [pid:39.2%, q_cov:99.7%, s_cov:97.7%, Eval:2.2e-48]" /note="MGA_107" ORIGIN 1 aatatttttg cgtcttcgcc ggtccagata tcttttgctg taatggtttt gccgaggctt 61 aaaggcagac ccagctcatc caggttaaag cgtgcggtgg cagctttttc acccatgttg 121 aacagaccga ttcccaagac cagcattacg gcaccaattg taaaacttat aatctcatag 181 cgattaaagg aaaaaccggg caacagcgca accaaataca ctatcaatgt gatgggtaac 241 gccgagacca gcgcttcccg aatttttgcc cataattctt tcaattcgct tcacctgccc 301 gaaaaatttc atatttatta tattatatca taaaacccgc ccattgccaa gggcatttgc 361 ggaacatgtt tcgggaattg ggagataaaa aaataaagcg gaggtgactc cgctttatat 421 tattgaacca tacgtttacc gtaacgctac tctgaaaata ggaaggtctg tttcttgcaa 481 agccttgact gccaaaaacg gcgcttttaa agagcagaga ccgaaatcaa tatgtacgta 541 tatgcctctc gggtgataat tgatgccagg tattccgctg atttccgaaa catcgtgaat 601 aggtctcaaa atgtgtgtct tgttatatcc gtaaacaaaa tcttccaagg cagttactgc 661 agtttcaatt tgctcctgcg tgggttgatc atccaaaatg atttcatata taacatccgg 721 atagccctcg caatagatat caacttcaaa cggacaggat tttacaattt tttcgacaaa 781 agaactcgac ataaaacgac ctcctaatca tcttttgtct tatcatacca cacccacgcc 841 aaaaaatcaa ttcccgcagt ataaatcccc tcaatggaaa taagaaccaa gcaacaaaaa 901 gatcgctgca aatgcttagc atctgcagcg atgttgattt tattaagtgt tattgctgtc 961 gttaccaaca agagttgtcg ttcccgtaac gatgatcttt atggagttgc cttcatttat 1021 gatgttaagt ccgggataaa ccgataaacc gtttgcatct gtggaatcaa ggtcggtgat 1081 gccaacgatg gtggtgattt ttgaaatgtc agatgcatcc gcgcacttga tctcgatggt 1141 tacgccgcgc tcaagaatga gggttccgcc atatttaata tcgaagatcg tgggacgcgc 1201 gttgctgtta agcttgctga tattaaatgt gagcgttcca tatccgggca atcctccgct 1261 tactgtaagc ttggagtcgc cattgatctg gaagagagtc cagttcttgt ttgcgttact 1321 gcttgaatca tatgaaaggt caaacgagtt aagagtaagg cttgcatcct tatcagttac 1381 accgttagtg attacgctca ttacggactt gttagctgag ctaatcgttc cgctaaggct 1441 ttgagacata atggctgtat ggccttgcga aagagcatcg aacaactctc caatgtctgt 1501 gacatttgaa aggatatcag aattttgttc caaagaataa acaggtctga taataacatc 1561 tgacgtagca ttctttaaga gattatcata aggttcccat gagccgtaat aaccgcttat 1621 cgtaggaact gaaggttcgt ttttaaccga agtggcaccc tttttgaact gttccgaata 1681 tatttccata ccgttaacgt ctacaaatct tgcataatag gttgatatgt cgttcaaata 1741 aacaaccacg ctatgctcgt tgcctgcagg gatcgaggtt acctcttcta cgtctccatt 1801 gatccagctg aagccgtcag gtgcagcgtt caaattgtaa ggagttgtat tgtctgttac 1861 ataatcaatg tttaaaacgt gtgttccgtc aacataaata acctcataga tatatttcat 1921 aatgttgaca ccatcgtgct catatactgc ggttgctccc cagctatagc ctgtatagag 1981 ctgactgaag gggaggtgat aagcaagctt atcttcattc aaagtgtggt catgtgtaca 2041 gcttatcgca ttgccgctaa ggtcaaatac aatgtccttg tcgtcaactc ggctgaactg 2101 gaagtcttcg gtataggaag cggaagagtt cttttcaaac tcgcagtagt aatagtctgc 2161 ccagctgcca atataaacgt tgcagtttgt gcaggtgagg ttgccggatt cgggaattcc 2221 atcagatcca atggttccta taagcattcc ggcatatctg tactgataat actgatagtt 2281 ggcacaaacg tcgttataaa catccatatt tgcagcaaca gtgcagtttg tcatagttgc 2341 cgtacttgtt tcatcaagga atcccatgat tcctccgcat gcaacgtccc agctgcccca 2401 cagtgcgtga atggtatttg agctgccaac gctgatgttg ttgaaggtat atgtttcgtt 2461 aactccggcg tcccaaccga taatgcctgc aactccggtg ttataggtgg cgggctgaca 2521 tctgcgaaga gttatgtttt cgaaggtgcc gccgtatccg agtcctgcaa cacatccggt 2581 aggcgcaaat tcgccttcga gaatgaagtt ttcaagaaca agattcttga cggttcctcc 2641 atcgatcaga gcaaacaaac cgagagattt tttataatag ccattgtcgt aatgaccctt 2701 aatgttccag gtgttctgat aaaggtcgga tattctgttt ccctgaccgt cgaagattcc 2761 cttaaatgca tgaggagtat ctgcggtgtc gctttcattg tactgatatc cgataggata 2821 gaacacataa ttatgaccta ctccgccaag gtcaaggtcg cttgcaagct tgatcgtttt 2881 gccttcgaag gtgttgcctc ctgataccaa ggcgccaaga cccgctaaat cttcggcaga 2941 atcaattata aattcggtgt caacatcatt ataccaagtg gtgtctacgg ttccgtccca 3001 agggttgcta atagaaacta cagcagtaat ttcgctgaag gacgaaatat atatgctcac 3061 ttcaccggtg tcgcggttat atgtgaattg gttatgagca gtaaaggtat caaccagact 3121 catattgtga gcgacgccgt tttcaacgtg gtataagctt atcgacgagt tcttgagccc 3181 tgtgggaaga acttgaccta aattaacgat aatgggcacg tcgttcgtcg gtgaaacacc 3241 ttcaatgtga acatcgaggc ttcgggaaac ctgaccgtca gacataagga tattagagga 3301 acggtcagcc ctggctacgc taagaacaag ctcggaagca ccgtcagcaa ttttaacgtc 3361 tgcgggtata tgcgcgttta tatcatctgt ggaatttccg atcgtcaacg attgtgcggt 3421 tttattttcg ttgttgagca tgccgtttaa tgaaacggaa gccgagtaat tatcggcgat 3481 ctgcggcaat gctccaatat catagtcgtt gccaaatgaa tcgctttcaa aggcatactg 3541 atttgcgagg atctggatag caaatgatga gccgatggat tgattcatat attcattagt 3601 ggcactttcc tgcattttaa gaacgatcgt gatctcacat tcttgtcctg cctcaagatt 3661 tccgttaccg atacggcttg cgtcaaggcc ggaaaccacg tttttaagag taccgacaag 3721 gcgttcctgt gtgagcgaag agcgattgac agtttgagcg gggtcgataa agtaaacgtc 3781 gatcacttct gccaaaactc ccagctcgcc ggtgggctgg atcatcaatt ggtatgtaaa 3841 agccaaggat ccgttgttct tgattttaat gtgtcttgcc tgggcatatc cgggctccca 3901 tttatcgtaa tcaaaaatag caccgactga ggcatcggtc cagatcgtag cgctgtcagc 3961 gggatcaaac gaaccgtcgg cccattccat ctcaatatca agctttcccg aagcaatgat 4021 attgttttcg cttgttactt ggtcggtgaa ccaagcgaac gtgcttccga taaaacaaga 4081 aaaacacaac aaggtggaga taatgctcat tgtgagtgat ttcagtgttt tggttttcat 4141 ttgctcttct cctcttaaaa ataatctaac gtttaattat aaaaacgcac aatcccataa 4201 taacaataga attatatcat atatagtgta ttaaatcaat agttacagca tattaacaag 4261 aacaataccc gttataatca aacaaaacgt gttggtctta gagattcttg tcatttttga 4321 gtcaacatta ttgccgttcc ttctaaaaag tgaaccccta gcagtataaa tcccctcgct 4381 ttacaaatac taacatcacg attcaagaaa aaaggagatt tatataatat gaaagcaacc 4441 ggaattgtta gaagaattga ggaatacgtt ataataggac aaaccgcatg aaatccgcat 4501 aaacactaag gttttcgctg gtttgcccca ttgaacgcat tggtgtcaaa acagggcttt 4561 tagcgatttt tatacataac aaaagcgagg tggaattcca cctcgctttt gcttttccga 4621 atcaattcaa aatagcttta taaatgtcgt ctgaaagctg tacagcgaca cgttccgttt 4681 gcgtttggtt attagcgctc gtaaattctt caggtgaaat acgctgccct ttgaaaagta 4741 aagatgtgtg catttgggcg gtcaaaccat cgtatagctt ggcatgctct actgcttttt 4801 tggcgtatgc aatggcttgc tcgctgtttt cctcactgag tttcgccagt tccacaaaca 4861 ctcgagaaag aaaagcgtga taaaatccac aatttccgtc ttcaaagaca atcccaaaga 4921 tataaggtag cttttccaat gcttttatac ggtcttgctt tggcaattcg ctttctgttg 4981 cataaacaaa tatcagacga tgcaataagt gcaatactgc atccaaactg cattgaatgg 5041 aatctgtttt gtctttgccc tctaatacac ccaaagcggc ggtctcaata cctgaccaaa 5101 tgctcggtag tttttgcatc cattcaattg ctttttcaca gtttcccaac agcttgttgc 5161 atacagaaat attatttata caacgacact gctcttccag atcttccgtc attttcaaaa 5221 aacgttctgc gatagatata gacaattcaa gataatattt tctttttttg tctacattgt 5281 gaagccccat aaggtaggaa tcaaccatta cattattgat aattgacttg ttatttggaa 5341 aagaagcata tactttttgc gataagctgt aggcatcaga aatgttgcca cgatgatgag 5401 cctcttgtcg acttttttca taatcctcta taatggactt gttggtctcg tagtctgcac 5461 ctaacagaaa atcgacagtg acattgtaaa acgacgcaag aacgggcagg aacgtaatgt 5521 ctggataggt cgcattattt tcccatctac ttaccgattg ttttgaaaca tctaacaact 5581 ctgcgacctg ttcttgtgtg aggccttttt gttttctcag tgtttttata ttttcaccaa 5641 aatcgaaatt catatatata cctccataaa tgtgttttgt agctacaatc atagtatata 5701 aaataatttc ggtacaatca acatctcggt ttgtgatgac tgtaacgaaa aatgagacag 5761 gatggctttt cgctttttaa gaaagttgca gtataaatcc ccacctttga cagataatag 5821 tatcacgatt caaaacaaaa aggagattta tataatatga aagcaaccgg aattgttaga 5881 agaattgatg atcttggccg tgtcgttata cccaaggaga tccgccgcac catgcgcatc 5941 cgcgagggcg acccattgga aatatatacc aacgccgacg gcgaggtcat tttcaagaaa 6001 tattcgccca tcaacgagct ttccgaaaac gccgcctctg ccgccgaggt tatctataag 6061 ctgggcggcc agcctgttgt aattttagac cgcgaccacg ttgtggctgt ggcaggtgtg 6121 cccaaacggg aatatttgga aagacggctc tcgccgatgc tcgatgacat tctcgaatcc 6181 cgccgcagct ggatgtatga cggcgagtcg cgcagaattc agcctgttga gggcatcgac 6241 cgccacgccc ttgctgtcac acccatcacc gcacagggcg acattgcagg cgctgtctgc 6301 tttatggcga ctgacgacca gccaaagggc acctcgcttt tgactactct ttcccagact 6361 gccgcaatgt tcttgggcag acagttggag tagccctctc cgtcacgcta tgcgcgacac 6421 ctctccctga gggggaagtt tgttagcgga gcgaagaatt gaacagtaat ccccagtcag 6481 cttcgctgac agctcccttt acacaaggag gtcttgcgcg gtgtcgtcat cctctcgctg 6541 aatccacctc atccgtcggc atccgccgac accttcccct caaggggaag gctatccccg 6601 aaagcagcag gccttgcacc aaaaatgcaa gacctgcttt attttttaca tatctacttt 6661 ttgaggatct ctttaacctt ttcgtcgaag aaatcgcggc cacaaaatgc cgttccgttt 6721 tggctgacag ctcccgccgc cgagcaaaca ccaaagacga gggtcttata taggctcacg 6781 ccgtcttcaa gtgccagaca agcccccgcg accattgcat cgcctgcgcc ctgcgcactt 6841 ttaacatcaa ctttgaccgc atcctggtgg taagctcttt ctttatcaac gatcattgcg 6901 ccttgtgcgc ccagcgatat aagcacggtg ttaactcctg cgccgtcaat gatctgctcc 6961 gcaacggctt taatgtcgga atatttttta agtgcacagc caaaagctcc gcaaagctct 7021 tccaaattcg gcttgatcat atatggcgcc gcttcaattc cgcttctcaa cgcttccccg 7081 ctggcatcaa tgatcacctt gacctcggga ttgagttctt ttgccctaag gcagagcgtt 7141 ttgtatatat caagcggaac gcccgatgga acgcttcccg ccaaaacgag aatatcgcaa 7201 ttcacaacaa tgctctcaaa cctttgaatc agctttgaaa gaacgtcttt tttgaccttt 7261 gatgccggct cgtttatctc aacggtgttt tttgtttcgt tgtcaaaaat cttcaggttt 7321 gttcgcaagg gagcagggca tttgatgaaa tccgcgctga tgccctccga tttgagaaaa 7381 cggttgattt catccgcttt atcaaagccg atgccgatgg catatgtatt aagtcccaat 7441 ttttttgccg ctcggctgac atttattcct tttccgccga aatcaacgct tatgggcgta 7501 attctgttca cttcgcttgg gttaaagctc tcgcattcgg cagttttgtc gatcgcgggg 7561 ctgagggtaa cggttaaaat catatatggc aacttcctca tttaggttta tattacgata 7621 gtataccttt cttacaaaaa tgtcaaacat ctacaaagcg tttgaactca tctattatac 7681 gtttacggtc gcaatcggta taataaaaat ggtatgagtc cttcaaaaga tatgccctca 7741 aggtcgggtg gtctttaatc agcctatatg accccggcca aaccagctcg tcttttcccg 7801 attggaacgc aacacccttt attcgcatat tcggcagaat cttccttgtc ttttcaattt 7861 ttacaagcag ttcccaaaac cgcggtatcc agccgatata ttcccacaga taagctcctc 7921 tgtggtcgat actgcaggcg cagaaggttg catcgcaaac g // LOCUS sequence012 7925 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence012 VERSION sequence012 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..7925 /mol_type="genomic DNA" /organism="" /note="sequence012" CDS complement(545..2365) /product="1-deoxy-D-xylulose-5-phosphate synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_033045549.1" /transl_table=11 /codon_start=1 /translation="MEYRLLSSLNLPEDIKSLTSSDKTELCSELRSKIIETVSNNGGHL ASNLGVVELTLACHSVFDSPNDKIIFDVGHQSYVHKLLTGRYDKFDTLRKKDGISGFLR PDESEHDPAISGHSSSSISVALGMAQAMKLRGDNHHAIAIIGDGALTGGLAYEGLNNAG RSDTNIIVILNYNEMSISKNIGGIAKYLAQMRTRPSYRRTKEFAKRTIEAIPFIGKPIK NFIHNVKQSLKEHILHSTIFEDLGFEFIGPVNGHDVKDLESALNVAKSLSKPTLVQVIT SKGMGYEPAEKNPGEYHGVPSFDIATGEKPKSKVSFGDHMGETLALLAKEDERICAITA AMKYATGLNHFDGELKSRLFDVGIAEEHAVSYAAGLAKMGMIPVFSVYSSFLQRSYDEL IHDVCIAGLHVVLCIGNSGFVGEDGETHQGLFDVPMLSTLPNTKIYSPACFKELDICLK KALYEDTGLVCIRYPKGGENSVTVNPCADYEYIQRQSDVLLVSYGRISNDVMSAAEVLV CDCLRLVNIFPICDQVKEIIGKYKEVYVFEESSRSGGIGEKLAEFAENIEIHAVSGFVP HMKVCEALELYSFTTERIVEEIRNSNGQPT" /locus_tag="LOCUS_0960" /gene="dxs" /EC_number="2.2.1.7" /note="WP_033045549.1 1-deoxy-D-xylulose-5-phosphate synthase (Clostridium botulinum) [pid:42.1%, q_cov:96.7%, s_cov:97.6%, Eval:8.9e-136]" /note="MGA_110" CDS complement(2393..3286) /product="(2E,6E)-farnesyl diphosphate synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000150378.1" /transl_table=11 /codon_start=1 /translation="MSDYNARITEDISLINNAIAQIIRKEYSACSANKVIEAEEYSLNA GGKRIRPLLCLEFYKLFGGERDVSKLAACLELVHTFSLIHDDMPEMDNDELRRGKPTTH IAYGSATALLAGDGLAILPYKVISDSALEGDISFETTTKLTNLLACSSGNEGMIAGQMI DIDGETRQLSKDEIVEMYRRKTGALIKCACLFGAVLAGANDEQMQNTETYAENIGVVFQ LVDDILNIKSTAEELGKPVGTDKYRNKSTLISHIGEDAVLMMISQSTDKAINAIESYED AEFLIRFAEEMAKRRN" /locus_tag="LOCUS_0970" /gene="ispA" /EC_number="2.5.1.10" /note="WP_000150378.1 (2E,6E)-farnesyl diphosphate synthase (Bacillus cereus) [pid:42.7%, q_cov:89.2%, s_cov:89.9%, Eval:1.7e-53]" /note="MGA_111" CDS complement(3279..3470) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNFDMSIKRLKEICEKLKDENTSLEETASLYKEGMELAKSCREVL DNIKSELDIEYKKVSENE" /locus_tag="LOCUS_0980" /note="MGA_112" CDS complement(3460..4671) /product="exodeoxyribonuclease VII large subunit" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_041272417.1" /transl_table=11 /codon_start=1 /translation="MSSILTVSQINKYISFKLKNDPKLKGIAIKGEISGFVRNSKSGHC YFSLKDESSLIKAVMFSSNAERLKFVPENGMSVIAFGNIDAYERDGVYQLMAFDLVPSG IGEEAIRLEQLKQELLELGVFAKEKKPIYRYPKNIAVVSSADGAALWDIVSVVKRRYPL TKITVFPTLVQGLAAPKNIASALYQADISGADTIILARGGGSKQDLSAFNTREVAIAIY SCETPVISAVGHEVDFSIADMIADLRAPTPTGAAELATPDISDMKFELDMITNQLIDAV YSKLNIREMILDAVETLLESLSPTHKVQRLYETIDDIDHKLSNALESKLRVCELVLSAQ MDMLKTLDPANILKRGYGLVYSNGEVVTDASKLRTGDAISVKLRGGSITAEVKNIEKDE INEL" /locus_tag="LOCUS_0990" /gene="xseA" /EC_number="3.1.11.6" /note="WP_041272417.1 exodeoxyribonuclease VII large subunit (Desulfitobacterium hafniense) [pid:40.0%, q_cov:98.8%, s_cov:100.0%, Eval:3.8e-73]" /note="MGA_113" CDS complement(4668..5615) /product="O-sialoglycoprotein endopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_041272419.1" /transl_table=11 /codon_start=1 /translation="MPKYLGLDTSNYTTSTALFDSDTGIVRNVKKLLPVKSGELGIRQS DAVFHHTKQLPELLHDLMQDVNGNVQAVGVSTRPRNVDGSYMPCFLVGETCANALSSVS KIEAYKTSHQVGHILAALYSCSRLDLIMDKKPFIAFHVSGGTTDCLLVEPDEEEIIKAT MIGSSLDLKAGQAIDRVGLMLGLDFPCGAELEKLAERSSYKCNIKPTVREGNCSLSGLE NKCQKLFDDGLDPCDIARFCILNIKATIKLMAKYALITYGEMPIICAGGVMSNKIIRSA IEREFDAYFAEPILSCDNACGTALYAAIKDGYLR" /locus_tag="LOCUS_1000" /note="WP_041272419.1 O-sialoglycoprotein endopeptidase (Desulfitobacterium hafniense) [pid:40.6%, q_cov:98.4%, s_cov:98.1%, Eval:2.7e-49]" /note="MGA_114" CDS complement(5617..6024) /product="transcription antitermination factor NusB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965384.1" /transl_table=11 /codon_start=1 /translation="MGVTRHDIRESEFMIIFEKMFRDESVSELLEIALDNEAITVNDEV KETVEGVFANLEQIDTIISSFSEKRNLARMPKINLAILRLAVYEILYKSDIAPIKVVIN EAVGRAKKYALDPDISFVNGVLGAYSRSLEN" /locus_tag="LOCUS_1010" /gene="nusB" /note="WP_010965384.1 transcription antitermination factor NusB (Clostridium) [pid:38.8%, q_cov:97.8%, s_cov:98.5%, Eval:7.5e-17]" /note="MGA_115" CDS complement(6092..6454) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEQSSRNRRGTLKVSENVIITITKNAACEVDGVSAIANKPFSIKS LLNPNLDNSMVNVVMLDGVAKIAISIIAKSGYNIVNVCELVQEKVKAAVQSMTGVTVSK VNISVVGVDFNENVAE" /locus_tag="LOCUS_1020" /note="MGA_116" CDS complement(6573..7130) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRKPKLSINLNKRHIILACLTLMLGIAVYVNYALTGTALKPTDVV EGIDLNDSYGEVRYVNGTEYINYSSEDYFAQARLDKVTSRDEAVETLTMMLGGGDVTEE EIATYTESALTLSALIESESTIESLIKAAGYEDCVVYLDGENASIVVKTDGLSAAQAAD IKDILLSEVSVLAENIRIFEVK" /locus_tag="LOCUS_1030" /note="MGA_117" CDS complement(7144..7635) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDIFTLKDAVIKKLKSSPKIVVYLAATLVCIVLLLIMGRDTTPND AVNDFPKAETEYAAQLERQLEAVISQIDGAGKTRVMVTVESTVSYEYATDDSYSESKYE SEIVIIGSDKALIKKIDNPEVAGVLVICDGGDSAVIKEKILKAVATVLDISSNKVYITK " /locus_tag="LOCUS_1040" /note="MGA_118" ORIGIN 1 cggcttgccg acttcaaact ggggcttaat tagaattaca gcttgtcctc cgtctttaag 61 tattctcgaa gctgctttaa ttgcatattt acaagagata aaggacaagt cagaggctac 121 aaaatcgacc tcacacccaa gggtatcgca gatcaaatcc ttgacgttta agccctcaag 181 gttaactact cttgtatcat caatcaactt ttgcgcaagc tgaccgtgtc caacatcaac 241 agaaaaaact ttaacagcac cattttgaag catacaatcg gtgaaccctc cggtagaggc 301 tccgatatcg caacaaacca ttccgtttaa atcaagagaa aaacttttaa tcgcgccctc 361 aagcttgagt cctcccctgc cgacatattt caacgactcg ccggtgaata aaatatcgtc 421 agcatcactg ataacagcgc cggccttggt cacagcctta ccgttgacca aaaccaaacc 481 gcttttaata tattcctttg cgcgttcacg gcctgttgcg attccgcgtc agacaagttc 541 aaaatcaagt cggttgtcca tttgaattcc ttatttcttc aacaattctc tcagttgtaa 601 agctgtaaag ttctaatgct tcacagactt tcatatgagg tacaaagccg ctaacggcgt 661 gaatctcaat gttttcagcg aattcagcca gcttctcacc gattccgcca cttcgagatg 721 attcctcaaa aacgtaaact tccttatact tgcctataat ttccttaacc tgatcgcaaa 781 tcgggaatat gttcacaaga cgcaggcaat cgcatacaag aacttccgct gcagacatga 841 catcgtttga aattctgcca taggaaacca aaagaacgtc gctttgtctt tggatatatt 901 cataatcagc gcatggatta actgtaacgg aattttctcc gccttttggg tatcttatac 961 acaccaagcc tgtatcttca taaagcgcct ttttaagaca gatatcaagc tctttaaagc 1021 acgccggaga atatattttc gtattgggaa gtgtcgaaag catcggaaca tcaaacaacc 1081 cttgatgtgt ctcaccgtcc tcgccgacaa accctgaatt accgatacat aaaacaacat 1141 gaagtcccgc gatacaaaca tcgtgtatca gctcgtcata tgaacgttga aggaaagatg 1201 aataaacgga gaagacaggt atcataccca tttttgcaag gccggcagca taagaaacag 1261 catgctcctc tgcgatgccg acatcaaaca agcgtgattt caattcaccg tcgaaatggt 1321 ttaagcccgt tgcatatttc attgcagcag taattgcgca aattcgctca tcttcctttg 1381 ccaacaatgc taaggtttcg cccatatggt caccgaacga tactttagac ttgggctttt 1441 cgcccgttgc aatatcaaac gaaggaacac cgtgatattc gcccgggttc ttttctgcag 1501 gctcatatcc catgccctta gaggttatca cctgaacaag tgtaggcttg ctcagcgact 1561 ttgcaacatt aagcgcagat tcaaggtctt taacatcgtg accgtttaca ggaccgataa 1621 attcaaaacc aaggtcctca aaaatcgtgc tgtgaagaat atgctccttt aatgattgct 1681 tcacattatg aataaaattt ttaatcggct taccgataaa tggaattgct tcaatagtgc 1741 gctttgcaaa ttcctttgtt cgtctatatg acgggcgagt gcgcatttgc gcaagatatt 1801 tcgcaattcc gccgatgttt ttagaaatcg acatctcgtt ataattgaga attacgatta 1861 tattagtgtc acttctgccc gcattgttaa gaccttcata tgcaagaccg ccggttaaag 1921 cgccatcgcc aataattgca atcgcatggt gattgtcgcc tcttaacttc atcgcctgcg 1981 ccataccgag tgctacagaa atcgaactgg agctgtgacc gctgattgca gggtcatgtt 2041 ccgattcatc aggcctcaaa aatcctgaaa tgccgtcttt tttgcggagt gtatcaaatt 2101 tatcatatct accggtcaaa agcttgtgaa cgtatgattg gtggccgaca tcaaagatga 2161 tcttatcgtt gggagaatca aaaacgctgt ggcaagcaag tgtcagctca actacgccaa 2221 ggtttgatgc caagtgtccg ccattatttg atacagtttc aatgatcttg cttctaagct 2281 cagagcaaag ctctgtttta tcgcttgatg tgagcgattt aatatcctcg ggcagattta 2341 agctcgaaag aagcctatat tccattttcg ctcacacctt tcatatgtaa gtttagtttc 2401 ttctctttgc catctcttcg gcaaaccgaa ttaagaattc agcatcttcg tatgattcaa 2461 tggcattaat cgctttatcg gttgattggc ttatcatcat caaaacggca tcctcaccga 2521 tgtggctgat aagtgtcgat ttgtttctgt atttgtcggt gccgacaggc ttgccaagct 2581 cttctgcggt gcttttaatg ttcaaaatgt catcaacgag ctggaaaaca acaccgatgt 2641 tctcggcata tgtttcggta ttttgcatct gttcatcatt tgctccagcc aaaactgcgc 2701 caaacaagca tgcacattta atcagagcac ctgttttgcg gcgatacatc tcaacgattt 2761 catcttttga aagctgtctt gtttcaccgt caatatcaat catctggcct gcaatcatac 2821 cctcgttgcc ggatgagcaa gccaaaaggt ttgtcagctt cgttgtagtt tcaaaagaaa 2881 tgtcaccttc gagcgcagaa tcggatatga ccttatatgg caaaattgca aggccgtcac 2941 ccgcaagcaa agcggttgcg gaaccgtatg caatatgtgt cgtgggtttg cctcggcgaa 3001 gctcgtcatt atccatttcg ggcatatcat cgtgaatcag cgaaaaggta tgcacaagct 3061 ctaagcatgc tgcgagcttt gaaacatctc tctcaccgcc aaatagctta taaaactcaa 3121 ggcaaagaag cggtcttatc cgctttccgc ctgcgttaag tgaatattct tccgcttcga 3181 taaccttatt tgccgagcaa gcggaatatt ccttacgaat aatttgggca attgcattgt 3241 ttatgagcga gatatcctca gttatgcgag cattataatc actcattctc gctcaccttc 3301 ttatattcaa tatcaagctc cgacttaatg ttatccaaaa cctctctgca agattttgca 3361 agctccatgc cttccttata gagcgaagca gtttcttcta aagatgtgtt ttcatcttta 3421 agcttttcgc aaatttcttt aagccgtttt atcgacatat caaagttcat tgatttcatc 3481 cttttcgata tttttaactt ccgctgtaat gcttccacca cggagcttga cgcttattgc 3541 atcgcccgtg cgaagcttgc ttgcatcagt tacaacttcg ccgttcgaat ataccaaacc 3601 gtatccacgt ttcaaaatgt tagctgggtc gagcgttttg agcatatcca tttgcgcgct 3661 caaaaccaat tcgcaaacac gaagtttaga ttcaagcgca tttgagagtt tatgatcaat 3721 atcgtcgatt gtttcatata gtctttgcac cttatgagtc ggcgaaagag attcaagcaa 3781 ggtttcaacc gcatcaagga tcatttcgcg gatgttcagt tttgaatata ccgcatctat 3841 tagctgattt gtaatcatat caagttcaaa tttcatatcc gatatatcag gcgttgcaag 3901 ctcggcggca cctgttggtg tcggagcacg caaatctgca atcatatcgg caattgaaaa 3961 atccacctcg tggccgacag ctgaaatcac aggtgtttca cagctatata tcgcaatcgc 4021 gacttctctt gtattaaatg ccgataaatc ttgttttgat ccgccgccac gtgcaagaat 4081 aatcgtatca gcacccgaaa tatctgcttg gtataatgcc gatgcgatgt tcttcggggc 4141 agctaatcct tgaacaagtg ttgggaaaac agtgatcttt gtcagcggat atcgtctctt 4201 gacaacactg acaatatccc acagagccgc gccgtcggca gacgacacaa ctgctatgtt 4261 cttaggatat cggtatatgg gcttcttctc ctttgcgaaa actccaagct ccaaaagctc 4321 ttgtttgagc tgttcaagtc gtatagcttc ttcaccaatt ccggaaggca ccaaatcaaa 4381 tgccataagc tgatatacac cgtcacgctc gtaagcatca atattgccaa aggcaataac 4441 gctcattccg ttttcaggga caaacttcaa acgctcggca tttgatgaaa acatcacagc 4501 tttaatcagc gaagattcat ctttaagcga aaaatagcaa tgacccgatt ttgaattgcg 4561 aacaaagccc gatatttcgc ctttaattgc aatgcccttg agcttggggt cgtttttcag 4621 cttgaaggaa atatatttat ttatctgaga aacggtcaga attgaactca tcttaaataa 4681 ccgtccttaa ttgcggcata taaagctgtg ccgcaagcat tatcgcaaga aagtatcggc 4741 tcggcaaaat atgcatcaaa ttcgcgttca atcgctgagc gaatgatctt atttgacatt 4801 acaccgcccg cgcaaattat tggcatttca ccgtatgtaa tcaaagcata cttagccatt 4861 agtttgatcg ttgctttaat atttaaaata caaaatcttg caatgtcgca aggatctaat 4921 ccgtcatcaa aaagcttttg acacttattt tcaagcccgg acaaactgca attgccttct 4981 cttacagtcg gcttaatgtt gcatttatag cttgatcttt cagccaactt ttcaagctcc 5041 gctccgcagg gaaaatcaag accaagcatt aaaccaacgc ggtcgattgc ttgtcccgct 5101 ttcaagtcaa gcgatgaacc gatcattgtc gccttgatga tttcttcttc atcaggttca 5161 acgagcaaac agtcggtagt gccgccgcta acgtgaaacg caatgaaagg ctttttatcc 5221 ataatcaaat caagccttga gcaggaataa agtgccgcga gaatatgtcc gacctggtgt 5281 gaggtcttat atgcctcaat ttttgaaaca cttgaaagag cattcgcaca ggtttcaccg 5341 actaagaagc aaggcatata tgagccatca acgtttctcg gtctggttga aacgccgaca 5401 gcttgaacat tgccgttaac atcctgcatt aagtcgtgca atagttcggg aagctgtttt 5461 gtgtgatgaa aaacagcatc cgattgtctt attccaagct caccgctttt aaccggcaaa 5521 agctttttaa catttcttac tatacctgtg tcgctgtcaa acaatgcagt cgatgtggta 5581 tagttgcttg tatcaagtcc taaatattta ggcattttag ttttccaaac ttcttgaata 5641 tgcgcccaaa acgccgttga caaatgaaat gtcggggtca agcgcatatt tcttcgcacg 5701 accgacagcc tcgttaatta cgaccttgat cggagcgata tctgacttgt aaagaatctc 5761 atatacagca aggcgcaaaa ttgcaaggtt aattttcggc atacgggcaa ggtttctctt 5821 ttcactgaag cttgaaataa ttgtgtcaat ctgttcaagg tttgcaaaca caccctcaac 5881 agtttcctta acttcatcgt taacggtaat tgcttcattg tccaatgcaa tttccaaaag 5941 ctcggaaaca gattcatctc tgaacatctt ttcaaagatg atcataaact cagattctct 6001 gatgtcatgt cttgttacac ccattgtttt tccatcctta ataatttatc aagcaagata 6061 tgccaagaga atttatccct tggcacaaac tctattctgc tacgttttcg ttgaagtcaa 6121 cgcccacaac ggaaatgttg acctttgaaa cggttacacc ggtcatcgac tgcacagcag 6181 ccttaacctt ctcctgaacc agttcgcaaa cattaacaat gttgtatccg ctctttgcaa 6241 taatggatat tgcgattttg gcaacaccgt caagcattac gacatttacc atgctgttat 6301 ccagattggg gttgagcagg ctcttaatgc tgaaaggctt gtttgcaata gcggatacac 6361 cgtcaacctc gcaagcggcg tttttggtga ttgtgatgat tacattttcg gaaactttaa 6421 gtgttcctct gcgatttctt gatgactgtt ccatacagat tagtcctcct tttatacgtc 6481 ttatgcaggt aatttcttat cctgcgaaaa atatacagat tctatgcaca gttatacgaa 6541 tatagtatat catgttttga tgaattgtac aactacttta cttcaaaaat tcttatattt 6601 tccgctaaaa cactgacttc cgaaagcaaa atatctttga tgtctgccgc ctgcgccgca 6661 ctcaggccat ccgtcttaac aacaatgctt gcattctctc catccaggta tacaacgcag 6721 tcttcatagc ctgcagcctt aatcagactc tcaattgtag attcactttc aataagtgca 6781 gaaagcgtta atgctgattc ggtatatgta gcaatttcct cttctgttac atctcccccg 6841 cccagcatca ttgtgagtgt ctcaacagct tcatcgcgtg atgtaacttt atcaagacgt 6901 gcctgagcga aataatcttc cgaagagtag ttgatatatt cggttccatt gacatatctg 6961 acttcaccgt acgaatcatt taagtcaatg ccttcaacaa catctgttgg ctttaaagca 7021 gttccggtaa gagcataatt cacatataca gcaattccca acatgagcgt taggcaagct 7081 aaaataatat gtcttttgtt aaggttaatg ctgagtttgg gttttctcat tatctttctc 7141 tccttatttg gtaatataaa ccttatttga tgatatatcc aaaacagttg caacagcttt 7201 aagaatcttt tctttaatta ccgcgctgtc gccaccgtca cagatcacta atacacccgc 7261 cacctcggga ttatctattt ttttaattag agctttatcc gaaccgatta taacgatctc 7321 tgattcgtac ttagattcgg aatatgaatc atccgttgca tattcatagg ataccgtgct 7381 ttcaactgta accataactc ttgtttttcc tgcaccgtca atttgagata ttactgcttc 7441 aagctgtctt tcaagctgcg cggcatattc cgtttcggct tttgggaaat cgtttactgc 7501 atcgttcggg gtcgtatctc tgcccataat gagcagcaaa acaatgcaga caagtgttgc 7561 agctaaataa acaactattt tcggcgagga tttcagtttt ttaattacgg catccttcag 7621 agtgaatata tccatttata cctccacgaa ggatagtgaa acctcgatat caccgatctt 7681 gcttttaatc aagttgatga caattatttc gtccttctca tattcacttc caagctcaat 7741 gcttgccttt gtaatagata tgcacctgtt ttcgtcaata gtcgtatcaa ccgatacttt 7801 ttcgctgaca atgccttcgt cctcgtagct gttgtaggtg tcaaagagtt tgtgcatgta 7861 gatatactga ttatgcacct ctgtggacca cttgtcgaag gtttcctgat ccttggcaaa 7921 gccga // LOCUS sequence013 7571 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence013 VERSION sequence013 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..7571 /mol_type="genomic DNA" /organism="" /note="sequence013" CDS complement(2178..2633) /product="thioredoxin-dependent thiol peroxidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003439443.1" /transl_table=11 /codon_start=1 /translation="MLTVGQKAPDFTLFDTAGNEVSLSGFLGKKVVLYFYPKDNTPGCT RQACAFASHYDDFKAKDIVVIGISRDSVASHVKFAEKYSLPFVLLSDPERKAIEAYGVW QEKKLYGKVSFGVVRTTFIIDEQGNIVSIMPKVKPDTNSVEILEYLA" /locus_tag="LOCUS_1050" /gene="bcp" /EC_number="1.11.1.24" /note="WP_003439443.1 thioredoxin-dependent thiol peroxidase (Clostridioides difficile) [pid:67.3%, q_cov:99.3%, s_cov:97.4%, Eval:2.3e-55]" /note="MGA_121" CDS complement(2646..3701) /product="FAD:protein FMN transferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011071622.1" /transl_table=11 /codon_start=1 /translation="MIKRMISLLLALLMALSLCACKKEKQKFSAYYFDWFDTATSIIGY EYTEAEFNATCDIIEGLMTEYHQLANIYIQYDGLNNLVTVNSIANGEHSAVKVDEKLID LLLYAKDMYALTGGEMNIALGSVLSIWHDYRTLGLDDPKNAKLPPMDKLTDAAEHTDID DLIIDEENSTVYLNDPETRLDVGAIAKGYAVEMVARHLEEKGITGYLINAGGNIRTIGT RGDGTPWQIGIENPDTSATDKPHIEYLKLSGQSLVTSGSYQRYYTVNGINYHHIIDPDT LMPGERFLSVSVLCDHSGMGDAISTALFNMDLDEGKALVESLENVSAMWVLPDGTQIYS QGFEAFTFDYE" /locus_tag="LOCUS_1060" /note="WP_011071622.1 FAD:protein FMN transferase (Shewanella oneidensis) [pid:34.3%, q_cov:92.0%, s_cov:88.5%, Eval:1.0e-44]" /note="MGA_122" CDS complement(3774..4790) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKITAILLAMLMIVSCVAMTGCGAKTLNFGMGVYAYHKTVSNAD GETNGAGELVATAAAVLVDADGKIVKCVVDTADSTVNWTSAGEAVAKNEFKTKYELGTN YNMAAYGSDLNGDGIVKEWFEQIDIFCAAVEGKTIDEVKAMLADGYYGTEELTTAGCTM GVADYVKAVEKAVANAVASGATANDTLKLGVVTTAESANATEEAEGKQEVASTFVAAAV AADGKVNAMSTDVATVTYKFDAAGATTADASAAVTTKKELGANYNMAAYGADLNGDGVV KEWFEQAAAFDAACVGLTASEIAALMVDGYGVESLQTAGCTIAIADMVNAAVKAATL" /locus_tag="LOCUS_1070" /note="MGA_123" CDS complement(4898..5398) /product="Gx transporter family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005817206.1" /transl_table=11 /codon_start=1 /translation="MTNKAKKVAYLGLMAAVALILSYVEALFPPIYAAVPGIKVGLPNI VIIFMLYRFGLKEAAAVSLVRLAAVALLFGSVMTLAYSLAGAVLSLTLMALCKRFNIFT TVGVSVVGGVSHNLGQIIVAMIVMETAQIGYYMVVLAITGTIAGVFIGLAGNLLLKYMK NVK" /locus_tag="LOCUS_1080" /note="WP_005817206.1 Gx transporter family protein (Desulfitobacterium) [pid:35.2%, q_cov:94.6%, s_cov:75.6%, Eval:1.2e-19]" /note="MGA_124" CDS complement(5429..5815) /product="NusG domain II-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003416526.1" /transl_table=11 /codon_start=1 /translation="MSKASKPNNKIRNDLILVAALLVIAAAGFILMNSFKQAGDWAVVT VDGVETARFLLSEDTGYVIEVGDGGNILVISDGKAMVSDASCPDLICVHHRPISNVGET IVCLPNKVVISIEKSSSDGLDASA" /locus_tag="LOCUS_1090" /note="WP_003416526.1 NusG domain II-containing protein (Clostridioides) [pid:31.9%, q_cov:86.7%, s_cov:91.1%, Eval:3.4e-09]" /note="MGA_125" CDS complement(5812..6612) /product="Fe-S cluster domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012869100.1" /transl_table=11 /codon_start=1 /translation="MTQILTALLVVGGVGLVMAIVLVVASIVFKVEEEEKTKTIRECLP GANCGACGYTGCDGYAKALALGEAEPNLCIPGSVSVAEKLSEILGVEIKVGEPVVAFVG CNGTCEATSKKALYDGISSCCAASMIYGGPNACRFGCVGCGDCAGVCPTNAICIDDGIA RVDPRVCIGCGMCVKECPKDIIKLLPKDAKVAVMCNSLDKGAVARKNCKNACIGCHKCE KECPSGAIKIVDNLSVIDYEKCIACGRCAEVCPTKCIHNVMLEV" /locus_tag="LOCUS_1100" /note="WP_012869100.1 Fe-S cluster domain-containing protein (Thermanaerovibrio acidaminovorans) [pid:45.5%, q_cov:92.1%, s_cov:91.4%, Eval:2.3e-64]" /note="MGA_126" CDS complement(6628..7227) /product="electron transport complex subunit RsxA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005904083.1" /transl_table=11 /codon_start=1 /translation="MDTVKNLIVILMSSVLVNNYVLSRFLGICPFLGVSKKLNQATGMG IAVTFVMLMATAVTWPIQIYILDPNGLGYMQTIVFILVIAALVQFTEIFLKKYIPALHK SLGVYLPLITTNCAVLGVTINNINDGFNFVESIVSSLGCGVGFLLAMVLFSGIRSRIDE TNIPKALRGLPATLIAASFLSLAFFGFAGIVDNLFA" /locus_tag="LOCUS_1110" /gene="rsxA" /note="WP_005904083.1 electron transport complex subunit RsxA (Fusobacterium nucleatum) [pid:52.9%, q_cov:96.0%, s_cov:98.5%, Eval:8.0e-57]" /note="MGA_127" ORIGIN 1 aagagcaaat aaagaggaat caagaacgct caaatcgctt tccggcttaa ttccgtatac 61 cttttccttg aagtattcgg tcatatactg catatcctct tcaattacag cgtgacccga 121 agtgtgaata tttatcttga tgttgtcttc aagtcccaag aatgtgtata tttcctttgc 181 gccgaggtag gtataccaca ttgcgggggc gtttacccag tcttcccata cgcaggagcc 241 gatgatgaag agcattctgt ctttgcttgc gggaagcgat gccaacatat actgatcaaa 301 aggcagatgt gttgccgact tgaacttctt aaagttgtcg cagaaccagc caacctcgcc 361 ggatgactgc aagcttccca aaggctcgtt atcgccatat gtatacgcgc ccgattcacc 421 ctttgaggtg aagtcatagg tcttgccctt ggaagtatag cggaagagcg caagaccgcc 481 cgcgcccgag caggaaggag caaccattgt gaatctatca tcaaatgcgc ccgcaacaga 541 agctgccttg ccccaacggg aaacaccggt aactaccgag ttgtgagggt cgattccaag 601 ttcttcgcca agacctgctt ccaaagcgtc caaaatcttt gagcagcccc aagaccaagc 661 catcaatacg cctgtctgat cctgccagtt cttgccgtag ggataaaggt catagaacgc 721 acctgtgtgc ttggtgtcat cagatgcgat gccgtatgca aaccaatcga gagtgatggt 781 tgcaaaaccg cccgcatttg cggtctgttc gctgatgccc atatgcatac cgacaacaac 841 ggggtatccc gcatcggaag gtgccttaac agattcctcg ggcatcataa cagttgcggt 901 gaactgagtt tttgcgccgg ttgaaattct ttcaatataa acggtaagtg ttccgttatt 961 atagtcatat gtaacgatct catcggttcc gtcacgccat acgccgtaca tatagtactg 1021 atacatatcg ctgatttcct tgcgacgagc ttcccaatcg gccttagatt tcatttcgct 1081 gccgtcaagg aatacaaacg gatcgggata ttcgtcattc cactcgatat cggcgacatc 1141 gggaaatgcg gatgcatcga caaggttttc tcttacttcg tgtgcctttt ccatagccat 1201 aacaacatcc tctactgtaa ggtcggtctt atttaacaac tctcggagct tgattgcagt 1261 tgcagtgata ttttcatatc cgccgtatga ggtatagtcg gtagtttcat atcgttcgat 1321 catcttttcg atgccatcgg tgcaaacttt aacgggagtt tccctctcac cttcaaatat 1381 gatctcgccc caatcgcagg gagccgattc aagatcgggt gtagagaaaa gaccgagttc 1441 gccgacctcg gcgcccgaag catcgtaatc gcttacaata acttcaaagc ctgcgaccca 1501 gccgtcggtc atgatcgagg ctatatcaac agaagcctca accgcatatc ctttgtcggt 1561 tacgcttgca ttaaacgaaa agcttccatc gcccgacatc atatctgatg tgcagttcgg 1621 aagaatggtg aaattccaat cgtcgccgtc aagttcaccg cttttatccc aaagagtgtc 1681 gatattaacg gtcacaacgt ccttttcggg gttaacgtca gcatcagtga cctcaaccaa 1741 aatatagaag aattcgtcat cccaaagagt cttgacggtt gccttggtcg gtacatagaa 1801 tctgtccttg aaggtcaatt cggttgcttc aacctttttc caagccttgt cgatttttcc 1861 gttaacggag gaggtggttg gtgtgcctct tcttgcaatc aatctgccct tttcgtcaac 1921 acatccgccg aggctggcga tatcttcatc gccgccgaca gcaggacctg cacagcctgc 1981 aagcatcgac aagcaaagaa tgagtgccaa aacgagcgat aatagccgtt tcatatatga 2041 tctcctttcg cattcgcaaa atttactttc acataataaa gtatatcaat cagatgagtt 2101 taagtcaagg gagtgtgcag attcggtcaa tagaaaaagc acttccgttt ttggcgaaag 2161 tgcttaaaat aatcagttta tgcaagatat tcgagtatct caacagaatt ggtgtccggc 2221 ttgacctttg gcataatact aacgatgttg ccctgttcat caattatgaa ggtcgtcctc 2281 acaacaccga agctgacctt tccgtatagc tttttctcct gccagacgcc gtaggcttca 2341 attgccttgc gttcggggtc agagagcaaa acaaacggca acgagtattt ctcggcaaat 2401 ttaacgtgcg aagctacgct gtcacggctg atgccgatga cgacgatatc ctttgccttg 2461 aaatcatcat agtgagatgc aaatgcgcac gcctgacgtg tacatccggg ggtattgtcc 2521 ttggggtaaa agtacaaaac gacctttttg ccgaggaaac cgctaagcga cacctcgttt 2581 ccagcggtat caaataatgt gaaatcgggc gctttctgtc ctacagtcaa cattttcatc 2641 gctccttatt cataatcaaa tgtaaaagct tcaaagcctt gggaatatat ctgtgtgccg 2701 tcgggcaaga cccacatcgc gctaacgttt tcgaggcttt caacaagcgc cttaccctcg 2761 tcaaggtcca tattgaacag cgcagttgat atggcatcgc ccattccaga atggtcgcac 2821 aaaacggaaa cgctcaaaaa tctctcgccc ggcataaggg tgtcggggtc gattatgtgg 2881 tgataattga tgccgttaac ggtgtaatat ctctgatatg aaccgctggt gaccagcgac 2941 tgtcccgaga gctttaaata ttcgatatgt ggcttgtcgg tagcgcttgt gtcggggttt 3001 tcaatgccta tctgccaagg tgtgccgtct ccgcgggtgc caattgtgcg gatatttccg 3061 cccgcattga taagatatcc tgttatcccc ttttcttcca gatgacgagc aaccatttca 3121 acggcatagc cctttgcaat tgcgccgaca tcaagccttg tttcgggatc attaagatat 3181 actgtcgagt tttcttcgtc gatgatgaga tcgtcaatgt cggtgtgctc agcagcatca 3241 gtcagcttat ccatcggcgg aagctttgca tttttggggt catcaagacc caaggtgcgg 3301 tagtcgtgcc agattgataa aacacttccg agagcgatgt tcatctcccc acccgtgagg 3361 gcatacatat ccttggcata taacaaaaga tcgatcagct tttcatctac cttaaccgca 3421 ctgtgctcgc cgtttgcgat tgaattcacc gtcacaaggt tgttaagacc gtcatactga 3481 atgtatatat tcgcaagctg atgatactcg gtcatcaaac cctcgataat gtcgcaggtg 3541 gcattgaatt cggcttctgt gtactcatat ccgatgattg atgtcgcggt gtcaaaccaa 3601 tcgaagtaat atgccgagaa cttctgcttt tcttttttgc aggcgcaaag gctcaaagcc 3661 attaaaagcg caagcaaaag cgaaatcatt cttttaatca atcttatcac ctaccttgtg 3721 taaaataaaa gggatgccgt atgacatccc tttttgcgct tagttcctta aaattagagg 3781 gttgcagcct taacagcagc gtttaccata tcagcaatag caatggtgca gcctgcggtc 3841 tggagggatt caacaccgta gccgtcaacc ataagagcag cgatttcgga agcggtaagc 3901 cctacgcaag cagcgtcgaa tgcagcggcc tgttcgaacc attccttaac aacgccgtcg 3961 ccgttgaggt cagcgccgta tgcagccatg ttgtagttgg cgccaagttc cttcttggtg 4021 gttacagcag cagaagcatc agcggtggta gcaccggcag catcgaactt gtaggtaacg 4081 gtagcaacgt cggtggacat tgcgttaacc ttgccgtcag cagcaactgc agcagctaca 4141 aatgtggaag caacttcctg cttgccttca gcttcttcgg ttgcattagc actttcagcg 4201 gtggtaacaa cgccgagctt gagggtgtcg ttagcggtag cgcccgatgc aacagcgttt 4261 gcaacagcct tttcaactgc cttaacatag tcagcaacgc ccatggtgca gcctgcggtg 4321 gtgagctctt cggtgccata gtagccatca gcgagcatag cctttacttc gtcaatggtc 4381 ttaccttcaa cagcagcaca gaagatgtcg atctgctcga accattcctt aacaatgccg 4441 tcgccgttga ggtcggagcc gtaagcagcc atgttgtagt tggtgccgag ttcatacttg 4501 gtcttgaatt cgttctttgc aactgcttcg cctgcggaag tccagttaac ggtgctgtca 4561 gcggtgtcaa caacacactt aacgatcttg ccgtcagcat caaccaatac agcagcagcg 4621 gtagcaacaa gctcgcctgc gccgttggtt tcgccgtcag cgttggaaac agtcttatgg 4681 taagcataaa cgcccatacc gaagttgagg gtctttgctc cgcatccggt cattgcaacg 4741 caggatacga tcataagcat agcaagtaaa attgcggtga tcttcttcat gattttatct 4801 cctttgaaac attattttga tttgcgtagt ttgcaagtta gattatgaca taaaattatc 4861 aatctgtcaa ctgaaatttt cgacaaaatg aacattatta tttaacattt ttcatatatt 4921 tcaacaatag gtttcccgcc aacccgatga acactccggc tatggttccg gtgatagcca 4981 aaaccaccat ataatagcct atttgcgcag tttccatcac tatcatagcg acgattatct 5041 gacccaaatt atgggataca ccgcccacca cgctgacacc tacggtagtg aaaatattaa 5101 accgtttgca aagcgccata agcgtaaggc ttaaaactgc tcccgcaaga ctgtatgcca 5161 gcgtcatcac gcttccgaaa agaagcgcaa cagccgctaa tcgaaccagc gacaccgccg 5221 ccgcttcctt taagccgaag cgatagagca taaaaattat gacaatattg ggcagaccca 5281 ccttgattcc cggtaccgcc gcatagatcg gagggaagag cgcctcgaca tatgaaagaa 5341 tcagcgccac ggccgccatc aagcctaagt atgccacttt ttttgctttg ttagtcatgt 5401 atttctccaa agaaacgaag cctattcatc aagcggaggc gtcaagtcca tcgctcgatg 5461 atttttcaat gctgattacg accttgttcg gcaggcaaac gattgtttcg ccgacgtttg 5521 aaatcggtcg gtgatgaacg caaatcaaat cggggcagga tgcatcgctg accattgctt 5581 taccgtcgga aatgaccaaa atgtttccgc cgtcaccaac ctcgatcaca tatcccgtat 5641 cctcactcaa gagaaaacgc gcggtttcaa caccgtcaac agtcacaact gcccaatccc 5701 ctgcctgttt aaaggaattc attaggataa agcctgccgc cgcaatgaca agcagtgcgg 5761 cgacaagaat aaggtcgttt cttattttgt tgtttggttt gctcgcttta ctcatacttc 5821 aagcataaca ttatggatgc acttggtggg gcaaacctct gcacatcttc cgcaggcgat 5881 gcacttttca tagtcgataa cggaaaggtt gtcaacaatt ttaattgcgc ccgaaggaca 5941 ttccttttcg cacttatggc atccgataca agcgtttttg cagttctttc ttgcaactgc 6001 gcccttatca agggagttgc acataactgc aaccttggca tctttgggaa gaagcttaat 6061 gatgtccttg ggacattcct taacgcacat tccgcagccg atacaaactc tggggtcaac 6121 tcttgcaatg ccgtcgtcaa tgcagatcgc attggtgggg caaacgcctg cacagtcgcc 6181 gcatcccaca cagccgaaac ggcaagcgtt ggggccgcca tatatcattg aagcggcgca 6241 gcagctgctg atgccgtcat aaagcgcctt tttcgatgtt gcttcgcaag tgccgttgca 6301 tccgacaaag gcaaccacag gctcgccaac cttgatttca acacccaaaa tttccgagag 6361 cttttcggca acggaaactg agccgggaat acaaaggttc ggctcggctt cgcccaaagc 6421 aagcgctttt gcatatccgt cacagcctgt atatccgcag gcaccgcagt ttgcgccggg 6481 cagacactca cggatggttt ttgttttttc ttcttcttca accttgaata ctatcgatgc 6541 cacaacaagg actatcgcca taacaagtcc aacgccaccg acaaccaaaa gggcggtcaa 6601 tatctgagtc atatataata gccctcctta tgcaaacagg ttatcaacga ttccggcaaa 6661 gccgaagaac gccaaagata ggaatgatgc agcgataagc gttgcaggca aacctcttaa 6721 tgcctttgga atgtttgtct cgtcgattct tgagcgtatg cccgagaaca ataccattgc 6781 caaaaggaag cccacaccgc aacccagcga gctgacaatt gattcaacaa agttgaaacc 6841 atcgttgata ttgttgatgg taacacccaa aactgcacag ttggttgtga taagcggcag 6901 atatacaccc aagctcttat gaagcgcggg aatatacttt ttgaggaaga tctcggtaaa 6961 ctgtaccaaa gcggcaatta ccaagataaa tacgatcgtc tgcatatagc caagaccgtt 7021 ggggtcgagg atatagatct ggataggcca tgtaacagcg gtagccatga gcattacgaa 7081 tgtaacggcg atacccattc ccgttgcctg attaagcttt ttggaaactc ccaagaaggg 7141 gcagatgccc aagaatcggc tcaaaacata gttatttacc aaaaccgagg acatcaggat 7201 tacaataaga ttctttacag tatccattag cactcctcct ttgcttcagc ggcttcacag 7261 cttgccttgt tgcaaactgc cgcattggga catcctgcac agccaaagct ctttttcttg 7321 ggatacttgc ccttggtgat aacgcttaca acggcgatga gaagaccgta cacaagcata 7381 ccgccgggag ccttggtcag atagctgatg gtgtagtttg aaagaacggg aatctggatg 7441 ccggcaaagc tgcctgcacc gaaaacttcg cggatcgttg ccatagccaa aagcgcgata 7501 gtaaagccca agcccatacc gataccgtca agggcagatt tgccgacggt gtttttgctt 7561 gcaaacatct c // LOCUS sequence014 7516 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence014 VERSION sequence014 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..7516 /mol_type="genomic DNA" /organism="" /note="sequence014" CDS complement(1799..4165) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRRLLVFALALMTMATSVMFSSCSIGKAEENAVKTVYVSPDGDDT NGNGTKEAPFATIGKAQEFVKTLKKKDGDITIEIADGFYFLENTLVFDETDSGSEDCTV IYRAAEGANPIISGGRILDGEWVVAEEVNWLKDGLVAYKTTLERDAKLRAIYVDGKRAA MTRRSATPLRAGGFYTIQKGMADWAWISSSSDLKTYNVFAANFDLPVNTPNPENIELES GSTWVKATICAESLDTTKDGDIRVNFQMPYAAIAQNLGWNCNYNPTAKNDVINVFEWLE HEGEFYFDQAGSTLYYIPYADEDINEAQVIIPELERLIDIRSTEPDKKQVEYITFDGIT FAYSDWNLYEVDGSFGNATTQNCTIYTKFSDINWHNDLYRAFDVAPAAVLVNSANHVNF INGGFESTGYCGLHLENAVSDCLVEGNFVAYTGGAGIVVGHLQHIYENDTEKQKVSETS IGPEFEKFPKGTEAVPKNITLKNNYLLENCYFFPGNSPITTFFTYNLTVEHNFVYKCSY SGMSIGWGWCNFDGTEGSQLPGQPTSTSRFNHVNFNRVEEICSVLQDAGGIYTLGQQGN EDWSEMTEMTYNYINCFRKPTVANGSRMVNGFHPDEGSAYILFDHNVVTNVIRNVYELN EWMRKHDCTVTNGFSNTSRSETTAPNCTLEQYVNEDYIWPVEGYDIVLYSGLEDEYVHM VSADVMPDDYYELAANVSIKCGESLNRRGLLDGADTVWLAPVGTETFAEGENMTKAAGN EKTITVPATPGEYKLYIIYADGTVSQASTFTVYAE" /locus_tag="LOCUS_1120" /note="WP_197444080.1 right-handed parallel beta-helix repeat-containing protein (Maioricimonas rarisocia) [pid:22.3%, q_cov:75.4%, s_cov:65.5%, Eval:5.1e-17, partial hit]" /note="MGA_130" CDS complement(4331..6517) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRRIFSLILAITMTFSMVLTVSADEVTTYGLVDTLTDGKEYVMVW NSSATDNAGDKHALAIDDEGVFGNNKLPSSHFNGDNYKLNAYFSFYVWIAHQDGDGWRF ENKDTGLYLGYDTSDEDGLTLVSDNTGKDTLWAFKKSTGGCTIHASSNSSYRIRYSTGN EYIRLQSGSSSNSYVYLYELGTLGCPKHTYNGCLDTICANCGKTTRLNSGLSHKYADKN DATCGACGFERYIFPEEEVGENSAVKCFSAVFYPQSSSTKAATNFEYLFDITGLVASVA PLEYVTHADITVEVSNIEGNGNKVPSCKMYVNQPGQKQLGLEKFDGVSKVSFSADIDDS VSKIWLVPENFVSQTEISFKITATVTYDELNEPDYGEPLATVVTFSDYQHWDINGLHSQ LDGIFSAMHKRVNPDYIIFGGDYTTEMHVTYASDEGRKEVLGFIGDWWPHINAENGNYI QIQGNHDPDDMAGMLETGPLEFDELIVYNIQEQDFPCGMGSDSARETVEATAQALEKYL NKCIRSGEQRPIIIASHLGLHYEAREGSNTQYIYILFDVINEAATNLDIIYIHGHFHST GDPESGGAIVYFPVGSTLNVADESCFDAEGKALQDRAGHGRPSVLNFTYMNYGYVGYVL ESLIKLEPFAHLEPEYVLTGGALNIYDEFITLDRYASTGKIGKFSQVIPRAHADAKPKL LPQDYIYVVGVGAILIVIILAVVIIAKTSKSKKK" /locus_tag="LOCUS_1130" /note="MGA_131" misc_feature complement(6661..>7516) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_207285076.1:glycoside hydrolase family 11 protein" /note="WP_207285076.1 glycoside hydrolase family 11 protein (Dictyoglomus turgidum) [pid:54.5%, q_cov:39.4%, s_cov:31.7%, Eval:6.1e-34, partial hit]" /note="MGA_132" /locus_tag="LOCUS_1140" ORIGIN 1 caaatttaac tccatcgccg tttgcggtgt taacggtgac tcgtgaagta tcgccgtcgg 61 ggcgtggtga accctgtgtc agtttaacgc ccaaatcatt ccacttaagc tcagagctga 121 tatactgtgc aacataaagc tcacgctcgg tcttatagta tacgctgtcg cacagcttgg 181 taaagttttc aagaccgctt cccgtacagc accagaactg gttcttttca acatcgggat 241 ggcagtaaac tttgaaatat cccgttgcca taggctggaa ataggtggtc atacctgttt 301 tagggttgat tgaggaaatt atcgcgttaa taagcgtgct ttcatagtag tcggcatact 361 tggtattctt cgtgatctta taaagctcgc gggtgatctt gagcatattg taagtgttgc 421 aggtctcgca gttgcattgg gttctttcgg catccaaaat gttgtcaatt ccgaaatgct 481 cccattggct gtttccgcct gtgatatagg tgtgtttgtt aacgaccata ttccagaacg 541 cttcaacata ttcaagatat ttgcttgcat caacagtttc gccgttaagt tccttgccgt 601 gaagtgtgcg atatcggttg attgcgccca catacttagg aatttgggtg tttgcgtgtc 661 ggccgttcaa aacgttgtcc ttgccctcca aaaccatttc aaacagccaa tcctcgtcaa 721 actgcgaagc ggcaaatgca tgctcgggct tgcctgtgca tttataaagc tcatataaag 781 cgtcgttcat tgcgccatat tcaattccca aaacgcggcg ctttaagtca taatcccact 841 ttgaaacgcg gttatatacc cagtcgccca gtcttgagcc aacttcgaga gcttcttcgt 901 ttcctgtgtg cttatataca tccacaatac ccgacatgat cttgtgcata ttataccagg 961 gcacccagtt agggccttga gccttgcctt ccataatgtc gaactgcttt tcaatattgg 1021 ttttatcctc aatctgtgcg ccgaaaacaa atcctgtgcc caaagaatcc tgacattcct 1081 tgaggcctga aatcagctca tcaagctgag ccttcatcca tattctgtcg ctttcgtttg 1141 gtgcagtcaa ataggcctga gcgcaagcgg tcaaatagtg acccaaggtg tgtccgccga 1201 tatagctgtt ttcccaaccg ttataagggc cgacaccacg ggtgtcaacg cccgcagttt 1261 cgcggaaacg ggcaagaagc ctgtcggcat caaaggtctt caaaaagtca atatcctttt 1321 gcgataccgt tgcataatag ccgtcggtga tgacaacatc ccgaagggag aaatcttcga 1381 gatttttaag ggtgttcatt ttgtttttgc acatagaaag tcctcctttt ggcgaaatgt 1441 tctttcaagt taatgataca atatgtgcgc attaaaatca atgatggata tgaagaaaat 1501 ttttgactaa ataaacgaaa gctgcaagtt ttgctttgtc ggggcaggcc gggagagagc 1561 cgcggcagcc gcaccgtcgg tcagggggct tcgcccccga cggtgcctcc cgcgcctgcg 1621 gcgcggggca tccgtgccct ccttgcgggg gcacggatga gctgccgccc aactcttgcg 1681 tacacctgca gtctttgcat tatatcgcac tcacttgtgc cccgacatct cgccaagcag 1741 tatcgcgtag tcaataaaac accccctgca ttctctgcag ggggctatgc tttatcagtt 1801 attccgcata aacggtgaag gtgcttgcct gggaaactgt gccgtcggca tatatgatat 1861 atagcttata ttctccgggt gttgcgggaa cagtgatggt cttttcgttg cccgcagctt 1921 ttgtcatatt ttcaccctcg gcaaaggtct ctgtgcctac gggtgccagc caaacggtgt 1981 ctgctccatc aagcaggcct cgacggttaa gcgactcgcc gcatttaatt gatacatttg 2041 ctgccaactc atagtagtcg tcgggcataa cgtctgcgct taccatatgg acatattcat 2101 cttcaagtcc cgagtaaaga acaatatcat atccctcaac aggccagata tagtcctcgt 2161 ttacatactg ctcaagggta cagttggggg ctgttgtttc cgatcttgat gtattggaga 2221 agccgttggt aacggtgcaa tcgtgctttc gcatccattc gttcagctca tatacatttc 2281 tgattacgtt tgttacaacg ttgtggtcaa acagaatgta tgcacttccc tcgtcgggat 2341 ggaaaccgtt gaccattcgc gaaccgttag caactgtcgg cttgcggaaa cagttgatgt 2401 agttataggt catctcggtc atttccgacc aatcctcgtt gccctgctga ccgagggtat 2461 aaattccgcc tgcatcctgc aaaacagagc agatttcttc aacacggtta aagttaacat 2521 ggttgaatct ggatgttgag gtgggctggc cgggaagctg agagccttcg gtgccgtcaa 2581 aattacacca tccccagccg atactcattc cgctgtatga gcacttataa acgaagttgt 2641 gctcaacagt taagttatat gtaaagaatg tagtgattgg cgagttgccg gggaagaaat 2701 agcagttttc caagagatag ttgtttttaa gcgttatatt tttcggaaca gcctcggtgc 2761 ctttggggaa cttttcaaac tcgggaccga tacttgtctc actaaccttt tgcttttcgg 2821 tgtcgttctc ataaatatgc tgcagatgtc ccacaacgat tcccgcaccg cctgtatatg 2881 caacaaagtt accctcaacc agacagtcgg aaacagcgtt ttcaaggtgg agtccgcaat 2941 atcctgtcga ttcaaatccg ccgttgataa agttaacatg gtttgccgaa ttcaccaaaa 3001 ccgccgcggg agcaacatca aatgcgcggt aaaggtcgtt gtgccagtta atgtcagaga 3061 acttggtata tatggtgcaa ttctgggtgg tggcgtttcc aaacgatcca tcaacctcat 3121 agaggttcca gtcggaatat gcaaaggtaa ttccgtcaaa tgtgatgtat tcaacctgtt 3181 tcttatccgg ctcggtactc ctaatatcaa tgagtctttc cagctcggga attatcacct 3241 gagcttcatt gatgtcctca tctgcatagg gaatataata gagggtgctt cctgcctggt 3301 caaaatagaa ttcgccttcg tgttccaacc attcaaacac gttgataacg tcatttttag 3361 cagtggggtt atagttacag ttccagccta aattctgagc aatagctgca tatggcatct 3421 ggaaattgac tcttatgtcg ccgtccttgg tggtatccaa agattcggca caaatggtcg 3481 ccttaaccca ggttgagcct gattcaagct caatattttc agggttggga gtattaacag 3541 gcaggtcgaa atttgccgca aaaacgttgt atgttttaag atcggaactg cttgagatcc 3601 aagcccaatc ggccataccc ttctgaatcg tatagaatcc gcctgcgcgc aagggagttg 3661 cacttcttct tgtcatcgca gcgcgcttgc cgtcaacata aattgctctg agctttgcat 3721 ctctttcaag ggtggtctta tatgctacaa ggccgtcctt gagccagttg acctcttctg 3781 caacgaccca ttcgccatcg aggattctgc cgccgcttat aatcgggttt gcgccctctg 3841 ccgcgcggta aataactgtg cagtcctcac tgcccgagtc ggtttcatcg aaaaccaagg 3901 tgttctcgag aaaatagaat ccgtcggcaa tttcaattgt aatgtcgccg tccttttttt 3961 tgagtgtttt aacaaactcc tgcgccttgc cgattgtggc aaatggggct tccttggttc 4021 cgttgccgtt agtgtcgtcg ccgtcagggg aaacatacac cgttttaact gcattttctt 4081 cggcttttcc gatactgcag gaagaaaaca taaccgaggt tgccatcgtc attaatgcaa 4141 gagcaaaaac aagtaatctt ctcataatta aaatgttcct ttctcagtaa ttgttaagaa 4201 atgttccacc taaaattata gcagatgcct aatttcagtc aagcaaatat tagaaatgtt 4261 caaccccaag tgtccgaata atcaaaaaca aagccatatg ggccgaacgg ctcatatggc 4321 tctaaacaat ttatttcttt ttcgactttg atgtttttgc aatgattacg actgccagaa 4381 tgattacaat caaaatcgct ccgacaccga caacataaat ataatcctgt ggcagaagct 4441 tcggctttgc gtctgcgtgc gcgcggggga taacctggga aaatttgccg atttttcctg 4501 tcgaggcata tctgtccaag gtgatgaact cgtcatatat gttcaaagcg ccgcctgtca 4561 aaacatactc aggctcgaga tgggcaaaag gttcaagctt tatgagactt tcaaggacat 4621 agcccacata tccatagttc atatatgtga agttcaaaac tgacggcctg ccgtgtcctg 4681 ctctgtcctg aagagccttg ccctcagcat caaaacagct ctcatccgca acgtttaagg 4741 ttgaaccgac agggaagtaa acaattgcgc cgcccgattc agggtcacct gttgagtgga 4801 agtggccgtg tatatagata atatccagat tcgttgccgc ctcgttgatg acatcaaaga 4861 gaatatagat atactgtgtg ttgcttcctt cgcgcgcttc atagtgaagc ccaaggtggg 4921 atgcaattat aatcggtctt tgctcgcccg aacggatgca cttgttaaga tatttttcca 4981 aagcttgggc ggttgcttca accgtttctc tggcgctgtc gcttcccatt ccgcagggga 5041 aatcctgctc ttggatgtta taaacaatca gctcgtcaaa ttcaagcggg cctgtttcaa 5101 gcattcctgc catatcatcg gggtcgtggt taccttgaat ctgaatataa ttgccatttt 5161 ctgcatttat atgtggccac cagtcgccta tgaagcccaa aacttccttt cttccttcat 5221 cggaagcata tgtcacatgc atttctgtgg tatagtcgcc gccgaatatt atataatcgg 5281 gattgacacg cttatgcatc gcgctaaaga tgccgtcaag ctgcgaatgc aagccgttaa 5341 tatcccaatg ctgataatcg gagaatgtga caaccgttgc aagcggctcg ccgtaatcag 5401 gctcattaag ctcgtcatat gtaaccgtgg cggtgatttt aaagctgatt tctgtttgag 5461 aaacaaagtt ttcaggaacc agccatattt tactgaccga gtcatcaata tcggctgaga 5521 agctgacctt gcttacaccg tcaaactttt ccaatcccag ctgcttttgt ccaggctggt 5581 tcacatacat tttgcaggaa ggaactttat ttccgttccc ttcaatattt gatacttcaa 5641 cagtaatgtc tgcgtgggtg acatattcaa ggggcgcaac agatgccacc aagcctgtga 5701 tatcaaacag atattcaaag tttgttgccg cctttgttga actcgactgg ggataaaaca 5761 ccgcgctgaa gcatttaacg gcagagtttt cgccgacctc ctcctcgggg aagatatatc 5821 gttcgaaacc gcaggcgccg caggttgcat cgtttttgtc ggcatattta tgcgaaagcc 5881 ccgaatttaa tcttgtggtt tttccgcagt tggcgcatat ggtatccaga cagccgttat 5941 aggtgtgctt gggacaacca agggtaccca gctcataaag ataaacgtag ctgttgcttg 6001 aagagcccga ctgcaatctg atatattcat tgccggtgct gtatcttatg cggtaagatg 6061 aattcgacga ggcatgaata gtgcatccac ctgtgctttt tttgaaagcc caaagggtgt 6121 ccttacctgt gttgtcactt accaacgtta agccgtcttc atcggaggtg tcatatccca 6181 aataaagccc ggtatccttg ttttcaaagc gccaaccgtc gccgtcttga tgggctatcc 6241 aaacgtagaa ggagaagtat gcattgagct tatagttatc gccgttaaaa tggctggatg 6301 gcagcttgtt gttgccgaaa acgccttcat cgtcaatcgc caaggcgtgc ttatcgcctg 6361 cgttatcggt tgcggaactg ttccaaacca taacatattc cttgccatcg gtcagcgtgt 6421 caacaagacc gtaggtggtg acctcgtctg cgctaacggt caaaaccatt gaaaatgtca 6481 ttgtaatcgc aagtattaac gaaaaaattc tcctcataaa tatccatcct tgcttttctg 6541 atttatacaa tgaattatag cataccaaag tcacgaccgc aatatgtttt tatgtttaat 6601 aactatacta aaccgcgtcg ggcttgtttt tcccaacgcg gtttgcattt aaaatgtatg 6661 ctattttccc acaacggcat cgtcgatata gaaattgtga gttcccgagt ctgtttcaac 6721 atataaaagt atgttccagg ctccctcggg aagggtatat gcctcgtttt taagttcaac 6781 ccattcgccc tttgcgcctg tggcttgcgc aatgcaatca tagcttgttc cgccgtaggc 6841 atcaatatac tgaatggtca gcttaaactc ggttgtatca acagcttcct gcatagccat 6901 aacgctgaag cggaaggtct cgcctgcctt gaaaacggac gaattcaaat catgctccgt 6961 gccgttccaa gcgtctgctc tgccggatac tgccagcgat tttgaaccgc tatatgccgc 7021 actgccgtcg gatgatacct tcgatgagcc tcttgaaccc cagccgtctt tgcccgattc 7081 aaagtctgcg cagatgtagt ttccgttttc atccggctcg attggctttg gcaggtcgtc 7141 tgggttgggc tcaattatct cgccgccgac agtcagcttg tttttcttga caactgcgct 7201 gccttggctc tgatatccct cgacagtcag cgatgcttca tacatcttgc ccataggcag 7261 tcctaaagcc tcccaagcgg caaagtgggt cgaaagatta acctctcctt ttgtcttttt 7321 ctcttgtctt acgctccaat attgaacaaa ggttgtgttt ccgtcaattg aaggctgatt 7381 tacgcggacg gatttatata catcatatag tccgccgtca acggtgatgg ttgcaattgg 7441 gtttcctccc ggcgggcgcc agtttcccca gttttcaaca acatagtatt caaccaaagg 7501 ttctcttgtc cagccg // LOCUS sequence015 7112 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence015 VERSION sequence015 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..7112 /mol_type="genomic DNA" /organism="" /note="sequence015" CDS complement(1269..2786) /product="DUF5605 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004080612.1" /transl_table=11 /codon_start=1 /translation="MHVERWGLFEVSFNGKTQGNPFTDYGIKGKFVGDNEEVTVDGFYD GDGVYKVRFMPSFEGKYTYTVSGSFSDETFSGEFEAISPSENNRGKVEVANKYHFKYAD GSNYFSIGTTCYVWNLQSDELVKQTIETLSKSAFNKIRFCIFPKHYAYNVNEPRSYPFE GTPIDSTGMNMSNLWGYNADSQGNSWDFSRFNPKHFEHIEYCVNELMKLGIEADIILFH TYDRWGFSKMTHEQDLFYLKYVIARLSAFRNVWWSLANEYDLLKKTHEDWQDIGNFIKE NDKYGHLRSIHNCIPFYDYTEDWVTHCSIQRQDLYKTAEFTNEWRDKFAKPVVLDEIAY EGNISAAWGNITGEEMTRRFWEAFCRGGYPGHGETYESPDSVLWWSHDGILKGTSPERF AFLKKIADEVPGGQMKYSPECWGGVSGIPEDDDIAQKTGFRIHYYSFMRPINQGYHFDD ENDYTVEIIDTWDMTVTPAGTYRGWFSVDLPGKQYIAVRIQKAVQSK" /locus_tag="LOCUS_1150" /note="WP_004080612.1 DUF5605 domain-containing protein (Thermotoga) [pid:43.5%, q_cov:98.8%, s_cov:96.0%, Eval:8.2e-124]" /note="MGA_134" CDS 3007..4152 /product="glycoside hydrolase family 5 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964144.1" /transl_table=11 /codon_start=1 /translation="MIKRIFCLALVFVLAMSLISCKKDDYSPKPFDDSQNIECETSWEA VSNMALGWNLGNTLDACGEWINSEDPSAYETAWGNPVTTKEMIAAVKDEGFNAIRVPIT WADHIDEKGIIDEPWLDRVEEVVDYIMSLDMYCVINVHHDAGADGWVRASTANYAKNGD RYAKIWEQVATRFKDYGEKLIYESVNEILDEYSTWNTPSDDAVEGLALYVQRFVDTVRA CGGYNETRNLIVMTYSGASGGAISSFVLPKDSVEDHLILEIHNYDPVDFCWRDSWMNSL DFWGTDQDIAEMDAFFADTYSRMQNLNVPLVIGEWGSEAKDDNEDERAKHAAHFVEKAT EYGFATFWWDCGHFALMDRPNACVLRTKIVDAMVSAYESAQ" /locus_tag="LOCUS_1160" /note="WP_010964144.1 glycoside hydrolase family 5 protein (Clostridium) [pid:34.5%, q_cov:88.2%, s_cov:88.9%, Eval:3.1e-53]" /note="MGA_135" CDS complement(4352..5926) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKVNYDNEYQGNPFLPLWEYIPDGEPYVFEDPDNPGKYRVYIYG SHDMLKTEYCGKDLVVWSAPVEDLSAWRYDGVIFESIVNGNADVLYAPDVAMVKDPING KVTYYLYPNNMGWKRNSMVCKSDRPDGPFEACNWKPNSTTETYGVMGFDPAVFVDDDGQ VYGYWGFQNSWWGKLNSENMADLIPGEASHKNIPSYDEMMAEDYDPTQFNIVQDENTKK WGFFEASSIRKVGNKYVFIYSRNGLPEEPTGKNYSQLAYGYSDSPEGPWKWGGIIVDAA GEVIPNDHGGYDRTFNGGNTHGSICNIDGQWYIFYHRNLHAYARQAMVEPITVEWDEKP VSDGGEVRISMAEVTSNGFYVEGMNPYVKRSAGNVCYLTGGAKIVPAYTTDTTTLPITD IYYDVVAGFKYFNFDIDAPEGKSTSLEIEIIPGGINATIDVYIRPTSAVNTPVERTDGV ITSVGKGSKKIGTFTLTKDMPMEWTTLKIETPQIDRLSGEWGVFFVFQSKRTKNTCDFY SMQFVAE" /locus_tag="LOCUS_1170" /note="WP_011068727.1 family 43 glycosylhydrolase (Bifidobacterium longum) [pid:28.1%, q_cov:65.6%, s_cov:40.1%, Eval:2.4e-17, partial hit]" /note="MGA_136" ORIGIN 1 atcaagagcc tttatctgct ttacgccctc ttttgatgct gcagtcatag gaaaactttg 61 ggtctcggga tccattggca gatagtctac catcatactt ctgaatccgt cgggagaacc 121 gttaagatcc tcaaggagat ttgtatggtg aagaatatag tttgtgcctt caaattccaa 181 gaaatgagtg tggttattcg accatttcat tcccgaagct ccttgtgcat tctgtcctgc 241 gttatagaaa tatgcgccct tatattccca gctatcagca acaagcgggg tggttgtggt 301 catatatgcc attgcgcaag cgggagggac atcaaatcct tcatattcct cccaacccac 361 agagtgatcc acccagtcgt tgcagtatgt atagtagtat acaccgtcga taaagttaag 421 ctcgcttgcc tcgttaaaat atggtgcatc aattgaaaca aactcactgt ctatggatat 481 catatcctcg ccgagtcgtg caattttcgg aacgagagaa tggataatac ctgaatttcc 541 tccgccaaag gatagccaac ccacaccgtc atcgtcaata caaacaccgg gatcaaacgg 601 agcgggacag tttgtaagtc cgggcatatt ctgataaatc aaaggcttac ccaaggggtc 661 tgtccaacct gttacggggt ctgtcgatgt aagaacacca acaccggttc cgctgttggt 721 gaaatagaga tagaagtgtg taagtccgtc ttcttcaact ctcgatacga tcgaaggtgc 781 ccaggaattg aatatccaag gtgctatttc accgacattt attatgccct catataccca 841 gtttgccata tcatctgttg agaagatgac aagagattta atgtgctcat atcctgagcc 901 gtttccgtgt cccttaacct caagctgctg ctggtcactt gtgccgtata cgtaaagtct 961 gccgttgtga acaacacctg tggggtctgc acaataaatg tttgaagata ttggatttgc 1021 atttgcttct gttttataca cttttatact cacctcatca atagttatgc cgttttcaag 1081 actcgcaatt gcatcttcgg gaattaatga ttctttttca gcgttatcat ccgttgaaat 1141 cgtctcatca ttatccactt gcgattcatc ctttaaattc gatgcgccct gacatccgct 1201 aagcaacatc gcgcctataa ttaacagtgc caataaagat ttaaatctca taaatgcctc 1261 ccttggtctc atttgctttg aactgccttt tgtatcctta cggcaatata ttgcttgccg 1321 ggaaggtcaa cactaaacca gcctctatac gttcctgcag gggtaaccgt catatcccag 1381 gtatcaatta tttcaacggt atagtcattt tcatcgtcaa aatgatatcc ttggtttatc 1441 ggacgcataa agctgtaata atggatcctg aatcctgttt tctgggcaat atcatcatcc 1501 tcgggaatac cgctgacacc gccccagcat tcgggactat atttcatctg tccgccggga 1561 acctcgtcgg cgatcttttt aaggaatgca aatctttcgg gagatgtgcc tttaaggata 1621 ccgtcgtgtg accaccaaag aacgctgtcg ggactttcat atgtctcgcc gtgtcccgga 1681 tatccaccgc ggcaaaatgc ctcccaaaat cttcttgtca tctcttcacc ggtaatattt 1741 ccccaagcag cagatatgtt tccttcatat gcaatctcat caagaacaac cggctttgca 1801 aatttatcgc gccattcgtt cgtaaactct gcagttttat ataaatcctg acgctgaata 1861 ctgcaatgag taacccaatc ctcggtatag tcataaaagg ggatacagtt gtgtatcgag 1921 cgaaggtgac cgtatttatc gttttctttt atgaagtttc caatatcctg ccaatcctca 1981 tgagttttct taaggagatc atattcgttt gcaaggctcc accatacgtt tctgaatgcg 2041 gaaagtcttg caattacata tttaagataa aacagatcct gctcgtgagt catcttcgag 2101 aagccccaac ggtcatatgt gtggaaaaga attatatcgg cttcaattcc gagcttcata 2161 agctcgttaa cgcaatattc aatatgttca aaatgcttcg gattaaaacg gctgaaatcc 2221 cagctgttgc cctgcgaatc ggcgttatat ccccaaaggt ttgacatatt cattccggtt 2281 gaatctatcg gtgttccttc aaagggatat gatctcggtt cgtttacgtt ataagcataa 2341 tgcttcggga atatgcagaa gcggatcttg ttgaatgcag acttactaag cgtttcaata 2401 gtctgtttaa caagctcatc cgattgaaga ttccaaacat aacaagttgt tccaatgctg 2461 aaataatttg aaccgtccgc atacttaaaa tgatatttat ttgcaacttc aacctttccg 2521 cggttgtttt cagaaggaga aatcgcctcg aattcgcccg agaaggtttc atctgaaaag 2581 cttcccgaaa cagtatacgt atatttcccc tcgaaagaag gcataaatct tactttataa 2641 actccgtcgc cgtcataaaa tccgtcaacg gtcacctctt cgttgtcgcc aacaaatttt 2701 cctttaatgc catagtcggt aaagggattg ccctgtgttt taccgttaaa agagacctca 2761 aaaagccccc atctttcaac atgcattaac ctcatctcct tgatcgctat atatgttttt 2821 ggcaagatac caaataaata atatcgtgaa atttaaggac tgtcaacaag ttttcgacat 2881 caaattgtta attcttgaaa tcgaaaaaag ataatatgat aacactttgc tttcttgaca 2941 gccatatata tagcttgtat aatcaaggta taataatcgg aattcgatta aaaataggag 3001 gacaatatga tcaaacggat tttttgttta gctttggttt ttgttttggc aatgagcctt 3061 atatcttgca aaaaggatga ttacagccct aaaccgttcg atgattcgca gaacattgaa 3121 tgtgaaactt cttgggaagc ggtttcaaat atggccttgg gttggaacct tggaaacacc 3181 ttggacgcct gcggagagtg gatcaacagc gaagatcctt ctgcttatga aacagcttgg 3241 ggcaatcccg tcacaacaaa ggaaatgatc gccgccgtta aggatgaagg cttcaacgcc 3301 atccgtgttc ctataacttg ggcagaccat attgacgaaa aaggcattat tgacgagcct 3361 tggcttgaca gagttgaaga ggtcgttgac tatataatgt cgcttgatat gtattgcgtc 3421 atcaatgttc atcacgatgc cggtgccgac ggttgggtgc gcgcctcgac agcaaactat 3481 gccaaaaacg gcgacagata tgcaaagatc tgggaacagg tagcaacccg cttcaaggac 3541 tatggcgaaa aacttatcta cgagtcggta aacgagatac ttgatgaata cagcacctgg 3601 aacactcctt cggatgacgc cgttgaaggt cttgcgcttt acgttcagcg atttgttgac 3661 acagtcagag cgtgtggcgg ctataacgaa acaagaaatc ttatcgttat gacttattca 3721 ggtgcatccg gcggtgcaat ttcgagcttt gtattgccga aggacagcgt tgaagaccat 3781 ctgattcttg aaatacataa ctatgatccc gtcgatttct gctggcgtga cagttggatg 3841 aattctcttg atttctgggg aaccgatcaa gacatcgcag aaatggatgc tttctttgcc 3901 gatacatatt caagaatgca aaatcttaac gtacccttgg ttatcggcga atggggttct 3961 gaagccaaag acgacaacga ggacgaaaga gcaaagcatg ctgctcactt tgttgaaaag 4021 gcaacggaat acggctttgc aacgttctgg tgggattgcg gacactttgc tttaatggac 4081 agaccaaacg cctgcgtctt gcgcactaaa atcgtggacg caatggtttc agcttatgaa 4141 tccgcacaat agaataagac aaacgatgaa caggcaagct aaaaagcttg cctgttttga 4201 tatattgctt actgggtatg aaaaccgaat agcatatttg atattcgaat atttaaccgt 4261 cgaattgcaa gattatcagc ccaatatata caagattatc tgatcaaaaa aataagcctc 4321 cttaaacaaa ggaggcttat ttaatgtgtg tttattcagc aacaaactgc atcgaataga 4381 aatcacatgt atttttggtt ctcttgcttt ggaaaacaaa gaagactccc cattctccgc 4441 taagccggtc aatctgcggg gtttcaattt taagcgttgt ccattccata ggcatatcct 4501 tggttaatgt aaaggttcca atctttttgc ttcccttgcc gacggatgtg ataacgccgt 4561 cggtgcgttc cacaggtgtg tttacagccg aagtaggtcg aatataaacg tcgatggttg 4621 catttattcc gccgggaata atttcaatct caaggcttgt ggatttgccc tcgggagcat 4681 caatatcaaa attgaaatac ttaaatccgg caaccacgtc ataataaata tccgtgattg 4741 gaagagtcgt agtatcggtg gtatatgcag gaacgatttt tgcaccgccc gtaagatagc 4801 atacgtttcc ggcagaacgc ttaacataag ggttcattcc ttcaacatag aagccgttcg 4861 aggtaacctc tgccatagat attctaacct ctccgccatc ggaaaccggc ttttcgtccc 4921 attcaaccgt tataggctca accattgcct gccttgcata tgcgtgaagg tttctgtgat 4981 agaagatata ccactgtccg tcaatattgc aaatacttcc gtgagtattt ccgccgttaa 5041 aggtgcggtc atatccgcca tggtcgttgg gaatgacttc gcctgcagcg tcaacaatga 5101 ttccgcccca tttccatgga ccctcggggc tgtcgctata tccatatgcg agctggctat 5161 agttctttcc ggtcggctct tctggcaaac cgttacggct atagatgaag acgtatttat 5221 taccgacttt tcttattgat gatgcttcaa agaagcccca ttttttcgta ttttcatcct 5281 gaacgatgtt aaactgtgtg ggatcgtaat cctctgccat catttcgtca tagctgggga 5341 tattcttgtg gcttgcttca ccgggtatca aatcagccat attttcgctg ttaagcttgc 5401 cccaccaaga gttttggaaa ccccaatatc cgtaaacctg tccgtcgtca tcaacaaaaa 5461 ctgcagggtc aaatcccatg acaccatagg tttcggtagt actgtttggc ttccagttgc 5521 aagcctcaaa aggcccgtcg gggcggtctg atttacatac catcgaattt cttttccaac 5581 ccatattgtt ggggtaaaga taataggtga cctttccgtt aatcgggtct ttaaccatag 5641 caacgtcggg cgcataaaga acgtctgcgt ttccatttac tatcgattcg aaaataactc 5701 cgtcatatct ccaggccgac aggtcctcaa cgggggccga ccaaacaacg aggtcttttc 5761 cgcaatactc agttttaagc atatcgtgtg agccatatat ataaactctg tattttccgg 5821 gattatcggg atcctcaaaa acatagggtt caccgtcggg aatatattcc caaaggggga 5881 gaaatggatt tccctgatat tcgttgtcat aatttacttt tgccacatag tcatctcctt 5941 tatcaaaaat ggatattgca tccgcgcagg atgtgaatag catcataacg gatatcagcg 6001 ctattgtaaa agataaaatt cgtttattca taagcatctc caatcgtcat actttaagac 6061 aataatatat taattcgcaa aatattacaa tatgttagat gtaatttttt tatatttcac 6121 agtaacaaag tacaggatac tctttcaaaa tctaaaatat cctttttcaa taactgcgac 6181 tggcttatac ggctattttt tatgccgtaa aatgcgattc atagcttaat aatttgtatg 6241 cataaactaa aaccacgtga taaacacgtg gtcttaattt gaatatttac tacttctttg 6301 gtccgtaatg gaaggttatg taaacggttt caatcctact cattgaagga ccgttaggat 6361 caagaacgca aggagaaatt ccgttcgagc ttccggttgc tgtacgtgtg gtattcggag 6421 catccgtgat ccaagcgtta tagaggttaa ctcttgtaca gttgttgcca tcgcttgtcg 6481 tataaggcac tgcggtgagc ttaacgatct ttccgttgat gacgacctct ttaatgtcga 6541 taacatagcc ggggaagagc ttttcgccgt ttgcaatacc aatggctgag aacccaatgc 6601 tgttagaata gccaaccggt gtgcctgtga aatcaagtcc aacagtatag gtgcctgcgc 6661 cggtaatttc gacgtcggtg ttcttaattc ctgcagcaat atcgttagga tcatactcgt 6721 ttccggggtg gttaattgcg ttccagtctc ccgatatcca cataagccat gcagcagcgt 6781 tattgcccgt aaggttaatt gcgttttcat tataggttgt gggcgcgttt tcaacctttt 6841 tatccattct gtctcttgcg gcagccttga cctcttttct tgtcatatca gattcagact 6901 cgtaattgcg gtttgaatac aaatttgcaa gatcagggtg catcatctta agctctctgc 6961 ggatgaaaat actgctgcaa tcccaaagac aagatgtcaa atcataataa tcgcatacat 7021 caaggaaatg ttcaagatat tcaacctgat ttttctttaa ctttccgtca cttgtggcat 7081 atgcgccgta ttctccgata acaacaccat ag // LOCUS sequence016 6803 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence016 VERSION sequence016 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6803 /mol_type="genomic DNA" /organism="" /note="sequence016" CDS 332..964 /product="histidine phosphatase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861969.1" /transl_table=11 /codon_start=1 /translation="MTGYRIHFIRHALTEANEEGRYIGITDSPVSKKGKLELAEKKQNY IYPEVDKVYVSPLKRCIATAAFIYPEGYARVVPEIREMNFGDFEGKLLVDIKDTPEYKQ FIKGGLDNPAPNGESLRKVIERCYEGISFIIEDMMKNGYHSAAVVTHGGIIMNMLSCFG MPKYNPNEFACDFGEGFTVLATAQFWQSSGCFEILGMCPYEKEDDEA" /locus_tag="LOCUS_1180" /note="WP_011861969.1 histidine phosphatase family protein (Clostridioides difficile) [pid:31.8%, q_cov:79.0%, s_cov:84.8%, Eval:1.2e-13]" /note="MGA_139" CDS 954..2264 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRLKFTVSESDSGMTVGEFLKNRCGLSRRLIISLKQVANGITKNG EHIRTVDRIGAGDIIEIADESDTPLEPNGELFAPLVYEDEFVAIFNKPANMPAHPSHKH RSDTLGNYFAYLYPDLTFRIINRLDRDTSGLCVCAKSAYAANALQGKVEKTYFAAVCGK ISESGTVDAPIARERESIITRCVRADGQRAVTHYDVIDRTLEHTLLKIHLETGRTHQIR VHMAYIGHPLAGDDLYGGDTSIKRQALHCGEVSFVHPATGEKITVSVPLPDDIKSLFER KKRMEKIASFQVDHRKFGVGMYISRIDGDIVTYDVRMVKPNGGHYISNPSLHTIEHLFA TYARSSFMGKDVIYVGPMGCRTGFYLLVRNVQHENAIKLVKESFEFVKNFEGTIPGYSE IECGNWLEHDLESAKKDVVPLLEVLENYTPEQLRYPE" /locus_tag="LOCUS_1190" /note="WP_001079134.1 RluA family pseudouridine synthase (Bacillus cereus) [pid:41.5%, q_cov:63.3%, s_cov:97.0%, Eval:8.5e-50, partial hit]" /note="MGA_140" CDS 2419..4140 /product="M23 family metallopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005811628.1" /transl_table=11 /codon_start=1 /translation="MDFKSIMLNLASFLGFVGDCTMNAVKGILKFVLGGTAKVLGKIFG TVFGWMKKKLKQPFLDILCYVLTPIAHAWGTLAHSKIHFKKASKEGFWRGVKVFFATLW KCLGGLGEVTRWLFNHVAPVVCIVFLISLIKYAGTIQYAISVEYNGSNIGIIENQATYN QAQALVQDKLTYTENDQSLIVTPKFSVQMLLNEGETVDSDNLSEIMIDSGDVAVTYAYG LYINDELVGVYNEEEMQKIKAVLEHQLGRYYTANTADVSFVDDVVLTQGRYIESNLTTA DGAIELIQSERTVEAYYVVQKGDSVSLIASKLDISKDELLEHNSFLEDGTHTGDLITYY FTEPYLPVMTTHYETYDRTVERQVVYQYNPKTEIGCETLKQSGSDGFENVTALVTEING VESDRVIVSRTVIEEMVPRIFITGTKVNTYIDDMWVIEKLGTFCWPVAKENYISSLYGY RRWDHSNHKGLDIAAKRGTDIYAAAAGKVIHAGTYSTYGKLVIIDHGDDILTYYAHQSK IYVSKGDYVQKGDVIGAVGMTGSALGNHLHFELRVDDDRINPMYCLGGVGDHIVNE" /locus_tag="LOCUS_1200" /note="WP_005811628.1 M23 family metallopeptidase (Desulfitobacterium hafniense) [pid:27.5%, q_cov:82.9%, s_cov:98.3%, Eval:3.0e-37]" /note="MGA_141" tRNA 4296..4379 /product="tRNA-Leu" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0040" /note="Aragorn_4" CDS complement(4583..5011) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MADNNNNINVDEVVENIKNLNNTADTTGAYDTQDINDNKLMAILA YIGILVLIPLFAAKKSKFARFHTNQGLVFFLANLALGLVYNIVVQILGGIPVISILVVA LGYLVSLVLFVVMIIGIVNAVQGRAKELPVIGKIRILK" /locus_tag="LOCUS_1210" /note="MGA_142" CDS 5257..6276 /product="SDR family oxidoreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008765598.1" /transl_table=11 /codon_start=1 /translation="MKVLFIGGTGTISTSISRKLIREGHELWLLNRGSRNDIFPEGLVN YITCDINNEADATKKLEGMSFDVVCDFIGFVKPQLERDYRLFKGKTKQFMYISSASAYQ KPLAEPYIDEATPLCNPYWGYSRNKIECEEYLMELYRKEGFPITIVRPSHTYCERSVPI GVHGNGGAWQVVKRMLEGKPVIIHGDGTSLWTLTHADDFAKGFVGLMGNVHAIGQAYQI TSDESLTWTQIHKIIADTLGVEFKPYYVPSDFLAAVSNYDFEGGLIGDKANSVIFDNSK LKRAVPDYCATIRFDQGAKQALDYMLTHPECQTPDPEFDEWCDRVIDALENAKKEILK" /locus_tag="LOCUS_1220" /note="WP_008765598.1 SDR family oxidoreductase (Bacteroides thetaiotaomicron) [pid:58.3%, q_cov:98.8%, s_cov:98.5%, Eval:2.2e-108]" /note="MGA_143" ORIGIN 1 aatcaagtcc gcattcgcgc ttgccctttt cataatggga caatagaccc tgggacacac 61 ccaagtcatg cgccgcctgc ttctgggaaa ctttgcgttc ctttctgagc aaggtcatta 121 ttctcgagaa gtctgttgcc acaaagatca cctacgtctt atgaattcgt cgaaatatgg 181 gagtttgtcc gatatttgac gtagtgctta ttatactcca aattttacaa attgtaaagc 241 caaaacatcg gcgtcattat caatgaaatt caacgggaat ttttgtgtaa aatgttgatt 301 ttacgccgtt ttcaaagaaa ggatgattct tttgacaggt tatcgcatcc attttatccg 361 ccacgcgctc accgaagcta acgaagaggg tagatatatc ggcatcaccg attcgcctgt 421 ttcaaaaaaa ggcaagctcg aattggcgga aaagaagcaa aactacattt atcccgaggt 481 tgacaaggta tatgtcagcc ccctcaagcg ttgcattgca acggcggcat tcatctatcc 541 cgaaggatac gcaagagttg tccccgagat ccgcgagatg aacttcggcg actttgaggg 601 caagcttttg gtggatatca aggacacccc cgaatataag cagttcatta agggcggact 661 tgacaacccc gcacctaacg gtgaaagctt aagaaaggtt atcgagcgtt gctatgaggg 721 tatcagcttt atcatcgagg atatgatgaa aaacggctac cactcggcgg cggttgtcac 781 ccacggcggt atcattatga atatgctttc ctgcttcgga atgcccaagt ataaccccaa 841 cgagtttgct tgcgattttg gcgagggctt caccgttttg gcaactgcac agttctggca 901 gtcgtccggc tgctttgaga tcttgggcat gtgcccttac gaaaaagaag acgatgaggc 961 ttaaatttac cgtttcggaa tcggacagcg gcatgaccgt cggtgagttt ttaaaaaacc 1021 gttgcgggct gtcccgacgg ctgatcatca gcctcaagca ggttgccaac ggcatcacca 1081 aaaacggcga gcatatccgc acagttgacc gaatcggggc aggggatatc attgaaatcg 1141 ctgacgagag cgacacccct ttggagccca acggcgagct ttttgcgccg ttggtatatg 1201 aggacgagtt tgttgcaatt ttcaacaagc ccgcaaatat gcccgcacac ccgtcgcata 1261 agcaccgaag tgacaccttg ggaaactatt ttgcatattt atatcccgat ctgacatttc 1321 gcatcatcaa ccgacttgac cgcgacacct cggggctgtg cgtctgcgct aaaagcgcat 1381 atgccgcaaa cgctttgcag ggaaaggttg aaaagacata ttttgcagcg gtctgcggga 1441 aaatatctga aagcggaaca gttgacgcac ccattgcaag ggagcgcgag tcgataatca 1501 cccgttgcgt gcgggcagat ggtcagcgcg ccgtgactca ttatgatgtc attgacagga 1561 ctttagagca cacgcttttg aaaattcacc ttgaaacggg aagaactcac caaattcgtg 1621 tgcatatggc atatatcggg caccctttgg cgggggatga cctttacggc ggggacactt 1681 caattaaaag gcaggcactc cattgcggtg aggtcagctt tgttcatccc gcaacgggcg 1741 agaaaataac ggtaagtgtg cccttgcccg acgatattaa atcacttttc gaaaggaaga 1801 aaagaatgga aaaaattgca agctttcagg tagaccaccg caaattcggc gtgggaatgt 1861 atatttcccg aattgacggc gatattgtga cctatgacgt gagaatggtt aagcccaacg 1921 gcggtcatta catatctaac ccctcgttgc acacaattga gcatcttttt gcaacatacg 1981 ccagaagctc gtttatgggt aaagatgtaa tatatgtcgg cccgatggga tgcagaacgg 2041 gattttatct gcttgtcaga aacgttcagc acgaaaacgc aattaagctg gttaaggaaa 2101 gctttgagtt tgttaaaaac ttcgaaggaa caattcccgg atattcggaa atcgagtgcg 2161 gaaactggtt ggagcatgac cttgaatcgg caaagaaaga tgttgttcct ttgcttgagg 2221 tcttggaaaa ttacaccccc gagcagctcc gttaccccga ataggcggaa aatcattccg 2281 cttttcatcg ttaaaatcac caaaaatcag cggttttgag ccatttcaca gcttttgccg 2341 ttgatttttt tcaaaataat gttataatag ttaaactgcc gagtgtcggc aaaaattcgt 2401 gatgaaagga gcgtgccgat ggattttaaa agtataatgc tgaacttagc ctcgtttttg 2461 ggctttgtcg gcgattgcac aatgaatgcg gtcaagggca ttttgaagtt tgttcttggc 2521 ggaacagcaa aagttttggg caaaatattc ggcacggtct tcggctggat gaagaaaaag 2581 ctcaaacagc cttttttgga tatcttatgc tatgtgctca ctccgattgc tcacgcttgg 2641 ggcacgttgg cacattctaa aatacacttc aagaaagcct cgaaagaggg cttctggcgc 2701 ggtgtgaagg tgttctttgc aaccctttgg aaatgtcttg gagggcttgg cgaggtcaca 2761 aggtggctct ttaaccatgt tgcacccgtt gtgtgcattg tgttcttaat ttcgctcatt 2821 aagtatgcgg gcacaattca gtatgcgatc tccgttgaat ataacggaag caatatcggt 2881 attattgaaa accaggctac atataatcag gcacaggcat tggtgcagga caagctgaca 2941 tataccgaaa acgaccaaag cttaattgtt acaccgaagt tctcggtgca gatgctctta 3001 aacgagggcg aaactgttga cagcgacaat ctttcggaaa ttatgatcga ttcgggcgat 3061 gtggctgtaa cttatgccta cggtttatat atcaacgacg agcttgtcgg ggtatataat 3121 gaagaggaaa tgcaaaaaat caaagcggtg cttgagcatc agcttggaag atattacact 3181 gcaaataccg cagatgtcag ttttgttgat gacgttgtat tgacccaggg ccgttacatt 3241 gaatcgaatc tgaccaccgc tgacggggcg atcgagctga ttcaaagcga aagaacggtt 3301 gaagcgtatt atgttgtgca gaagggagac tcggtctcct tgatcgcgtc gaagctggac 3361 atttcaaagg acgagctttt ggagcataac tccttccttg aggacggcac ccacacaggt 3421 gatctgatca catattactt caccgagcct tatctgccgg ttatgaccac ccactatgaa 3481 acatatgacc gcacagttga gcgtcaggtc gtatatcaat ataatcccaa gacggagatc 3541 ggctgcgaaa ccttgaagca gagcggttcg gacggctttg aaaatgtcac cgcacttgtc 3601 accgagatca acggcgttga atcggacaga gttattgttt caaggactgt aattgaggaa 3661 atggtaccca gaatcttcat tacgggaaca aaggtcaaca catatattga tgatatgtgg 3721 gtgattgaaa aactcggtac cttctgctgg cctgttgcca aagagaacta tatcagctcg 3781 ctttacggct accgcagatg ggatcactcc aaccacaagg gccttgacat tgcggctaag 3841 cgcggaacag atatatatgc cgctgccgca ggaaaggtta tccacgcggg aacatattca 3901 acatatggca agctggtaat aattgatcac ggcgacgata ttctgacata ttatgcacat 3961 cagtcgaaga tatatgtttc aaagggcgat tatgttcaaa agggcgacgt catcggtgct 4021 gtcggtatga ccggctcggc attgggcaac catttgcact ttgagctgcg agtggatgat 4081 gacagaatca atcccatgta ttgcctcggc ggcgtgggcg accatattgt caatgaataa 4141 aataaaagca ggctgtatgg cctgcttttt tgttttgcga atgagtgatc acgccacttg 4201 ctgttttttc gaaaaaattt taattagggt attgacaagc cgcaaactcg gtgctataat 4261 gtaaaagctg tcagcaagac agcttaattt catatgcggc agtgctggaa taggcagaca 4321 ggcacgtttg aggggcgtgt gtccttgacg tatgggttca agtcccattt gccgcaccaa 4381 cttaacagtc caaggcttta gcctcgggct gttaagtttt ttactgacat attgacgaag 4441 aaccgagaac acgaagtgtt ctctgatttt gcgcttcgga atctttcgga cacaacaaaa 4501 gtttggcgcg aaattgagga gcagtcccat ttgccgcaaa aacaaaaccc gagcaacttt 4561 ctgctcgggt tatttttatt atttacttca aaattcttat cttgccgata acgggaagct 4621 ctttagctct gccctgaaca gcgttgacaa tgccgatgat cattacgaca aataaaacaa 4681 ggcttacaag atagccgagt gccacaacga gaatgctgat tacggggatg ccgccgagaa 4741 tctgaacgac gatgttataa acaaggccca aggcgaggtt cgcaaggaag aagaccaagc 4801 cctggttggt gtggaaacgg gcgaacttgg acttctttgc agcgaacagg ggaatgagca 4861 ccaaaattcc gatgtatgct aaaattgcca tcagcttgtt gtcgttaatg tcctgggtgt 4921 catatgcgcc ggtggtgtcg gcggtgttgt taaggttctt gatgttttca actacttcat 4981 caacattgat gttattgttg ttgtctgcca tttttgttgg ctcctttcgg tgatatgtat 5041 ttcgccgatc cttcggcttc aaaaaatatt ttatcacata ctcgccttta atgcaatagt 5101 gtaagatgat atgatttgaa atatttgtcc gattatacaa aaatgtcccg ttattttcta 5161 cgatttccca atatcatttt tggcaaacgt ttgatatact ttgtgtaaga atatgaaaca 5221 caaatcaata tgtttatttt gcaaaaggag gacaatatga aagtattatt catcggcgga 5281 acaggaacca taagcacctc gatctcccgc aagctcattc gcgaaggtca cgagctttgg 5341 cttttaaacc gtggctcgcg caacgacatc ttccccgagg ggctggtcaa ttacatcacc 5401 tgcgacatca acaacgaggc ggatgcaaca aagaagcttg agggaatgag ctttgatgtt 5461 gtctgcgatt ttatcggctt tgtcaagcct cagcttgagc gtgattaccg cctgtttaag 5521 ggcaaaacca agcagtttat gtatatcagc tccgcatcgg catatcagaa gccccttgcc 5581 gagccgtata tcgacgaggc aacacccctt tgcaatccat attggggata ttcccgcaac 5641 aagatcgagt gtgaggaata tttaatggag ctttaccgca aggaaggctt ccccatcacc 5701 attgtaagac ccagccatac ctattgcgaa cgcagtgtgc ccattggtgt tcacggcaac 5761 ggcggagcat ggcaggttgt taagcgtatg cttgagggca agcctgtaat catccacggc 5821 gacggcacca gcctttggac acttacccac gccgacgatt ttgccaaggg ctttgtcgga 5881 cttatgggga atgttcacgc aatcggtcag gcatatcaga taacatcgga cgagtcgctg 5941 acctggacac agattcataa gattattgct gacaccttgg gagttgaatt taagccatat 6001 tatgttccct ccgacttctt ggctgcggtt tcaaactatg acttcgaggg cggacttatc 6061 ggcgacaagg caaattcagt tatctttgac aattcaaagc taaagcgcgc tgtacccgac 6121 tattgcgcga ctatccgttt tgaccaaggc gcaaagcagg cgcttgacta tatgctcacc 6181 caccctgaat gtcagacacc cgaccccgag tttgatgagt ggtgcgatag ggtgatcgat 6241 gcacttgaaa acgcgaaaaa ggagattttg aaatgatcag cattaaagga aaatgggcac 6301 ttgtgacagg tgcatcgaga ggtatcggat atttggcagc aaaatgcctg gcagagcacg 6361 gcgcaaacct tgttttgcac gcaagaaagg ttgagcattg cgacaaggtc ttggcagagg 6421 tcaaggcttt gggcgtcgag gcatatgttg ttgcggcaga gctgagcgac cttgcacagg 6481 ttgaaaaaat gatggtcgag atcgacgaaa agggaacgcc catcgacata attttaaaca 6541 atgcaggcgt gcagatcgcc tacagaaacg aatacctcaa gacccctgca agcgattatg 6601 aaaagagctt tttaatcaac accatcgctc cgatgatgat atgttatcac tatattcctg 6661 cgatgatcga gcgcggattc ggaagaattt tgaataccac cagcggcatt agctttgatc 6721 ctcagcaggc aggctattct gcatccaagg cggcactgga taaggtcacc atcgacctcg 6781 gctcgaagct tcagggaagc aat // LOCUS sequence017 6706 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence017 VERSION sequence017 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6706 /mol_type="genomic DNA" /organism="" /note="sequence017" CDS 773..2053 /product="MATE family efflux transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003437109.1" /transl_table=11 /codon_start=1 /translation="MLYNIVDRIYIGHMPGDGSLALTGVGVCMPIIMIISAFAALIASG GAPKASISMGKGDNDSAEKIMGGCFSLQLIISAVLTTVLLIWNKDLLLMFGASENTIGY ANDYMNIYAIGTVFVQLTLGMGAFITAQGYTKISMLTVLIGAVSNIILDPIFIFGFKMG VKGAALATILSQAISCVWVLMFLCGKKTYLKLKKHNLHIDGKLIFPCIALGTATFIMQS SESVISVCFNSSLLKYGGDIAVGAMTILTSVMQFAMLPMQGIAQGAQPILSYNFGAKNA ERVKKTYRLLLISCLSYSFIIWGAIMLFPQVFAGIFTPDTALIEFTATALRIYCGVLCI FGIQIACQMTFVSIGNAPCSIIVAIVRKFVLLLPLIYIMPQLIADKTMGVYTAEPVADL IAVTFTAILFTVQFKKALKSLTTANPR" /locus_tag="LOCUS_1230" /note="WP_003437109.1 MATE family efflux transporter (Clostridioides difficile) [pid:53.4%, q_cov:97.2%, s_cov:90.8%, Eval:1.7e-124]" /note="MGA_146" CDS 2328..2921 /product="sugar O-acetyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011203642.1" /transl_table=11 /codon_start=1 /translation="MTEKKKRDLGYLYNANYDNELLSEIAKCNDLCHEFNQIKPSDRES QQQILQKIFCKMGENVTVNTPFWCDYGYNTEVGDYFFANHNCQILDGGKVTFGNHVFIA PNCLFTTAEHALDVEQRNEGLEVALPITIGNNVWIGAGTTVLGGVTIGDNTVIGAGSVV TKDIPSGVIAVGVPCRVIRKISDADKNKYSHYQG" /locus_tag="LOCUS_1240" /note="WP_011203642.1 sugar O-acetyltransferase (Bacteroides fragilis) [pid:59.7%, q_cov:97.0%, s_cov:97.9%, Eval:2.5e-63]" /note="MGA_147" CDS complement(3300..5240) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRFAILVLTVVMIFNLCVPVSAAKVGVMRDLTSAELLDKIRIGW NLGNTFDAYSGDGNYTNGWIELYSDRSPSAYEKAWTGGVLVTPELIKAVKDMGFKAIRM PVTWGPHMDEEGNIDKAWLDRIEEVVNYILDEGLYCLINSHHDCGGKGWLAADAQEYPE ISARFKTMWTQIAERFKDYSDYLMFEAYNEILDRQDNWGGTTPANFEAANKLNQDFVDV VRATGGNNAKRHLSVNVYACSSGSDSALNSFKLPEDTIEDRLFVQIHCYDPQRFCWTPS YIPNPTDQWVANRKEFTDGLNSTFAKIERIFVDKGIPVIIGEFSADNKNNTPEREAYAT DFVTIAREHGISALFYWDVNFTEDHVDDDPPYAPCGLIDRGQVKWLYPTVAKALIEAAG VAHNYSGWTEYNADDHIRHCTDLNCDSFERQPHVWSNSSDSTCDLCNYVRFSPSGLPSL TINDKIAYRGSKVLLDVSLKSCGLADTVKLTYRYDPNFFTPDIQNSEWLVDNSVTATFG DGIATLTTEAPLNPNYTLAQLGFTVSENAPLGQTAIEFEASLSNGSTSVASIPASVTIT VSEILRGDTDGNCSVDKGDAIYLLYSVLFGESQYHLNQPCDFNGSGSVDKDDAIYLLYH VLFGSSIYPLS" /locus_tag="LOCUS_1250" /note="WP_010964144.1 glycoside hydrolase family 5 protein (Clostridium) [pid:32.3%, q_cov:57.0%, s_cov:89.7%, Eval:1.0e-52, partial hit]" /note="MGA_148" CDS 5614..6150 /product="sigma-70 family RNA polymerase sigma factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393839.1" /transl_table=11 /codon_start=1 /translation="MLSFYLSQLELNSQSEKFAKLYTKHRDKMMSAAFAVLKNHHDAEE AVQNALFAIAKNINSLPDPDTRYGANYAVKAAKNHALNMAKKRKTEPLFIDIHAADIDI ADDYISRDEAKSVVEAICAMKPIYRDVLTAKYLYGMTAKEIASVYGLTLQTVKSRLNRG TKILEEAFERSDIDV" /locus_tag="LOCUS_1260" /note="WP_011393839.1 sigma-70 family RNA polymerase sigma factor (Moorella thermoacetica) [pid:25.1%, q_cov:85.4%, s_cov:82.0%, Eval:1.2e-07]" /note="MGA_149" ORIGIN 1 attcacgatc ttgccgtttt caattaccac cagagtagga atgctcataa tgccgaactg 61 acttgccagc tctacttctt catccacgtt gatctttccg accttgatgt cggagcgctc 121 atcggcgatt tcctcaacaa tcggtactac cattcggcag gggccgcacc aaggagccca 181 aaagtccaga aggactttct tatcggaatt taatacttca ttttgaaaat tatttttatt 241 gatattgata gcagacattt ttacgtcctc cttttttctt tgtgaactaa ttatatcacg 301 gcttttgaca cagttctgtg atgacatcac atttctgctt ttactttaat gtagacaata 361 tcataagtca atatgcactt tcggatattt tgcgtattta cgcatcattc ccagctgcat 421 acaatattcc aatcggcgtt tcctttgttt actgcaaacc aatttttgaa gttttgcctt 481 ttctcccgcg atctcggggt tcttctcggc gatcatttcg ctgccatacc gacacaagtc 541 tccttgtgag ctatcagcgt atccggcaag tcctgtgcgg cctgcagatc atctttcgtt 601 gcaatttccg acggcttgaa ttctgaggtg aaatgttata taatatacgt tgcaaattat 661 gattttacgg ggtgaaaata tgagcgataa caaagaactg ctcggcacgg cgccaattgg 721 aaagttgcta ttcaaattgt cagttccaac ggtggttgcc cagcttatca atatgctata 781 caacattgtt gaccgcattt atatcggtca catgccgggt gacggaagtc ttgcacttac 841 gggtgtgggt gtatgtatgc ctatcattat gatcatctcg gcttttgcgg cgctgatcgc 901 ttcgggcgga gcacccaagg catctatctc catgggtaag ggcgacaacg actctgccga 961 aaaaattatg ggcggatgct tttccttgca gctgattatt tctgccgttc tgaccaccgt 1021 tttgctaatc tggaacaaag atttgctttt gatgtttggt gcaagtgaaa acaccatcgg 1081 ttatgccaac gattatatga atatctatgc cattggtacg gtttttgttc aactaactct 1141 tggtatgggc gcgtttatta cggcacaggg ctacaccaaa atcagtatgc tcacggtact 1201 cataggtgcc gtcagcaata tcatccttga tccgattttt attttcggct ttaaaatggg 1261 cgttaaaggt gcggcgcttg ctactattct ttctcaagca atctcttgcg tttgggttct 1321 tatgttcctt tgcggaaaga agacttatct taagctcaaa aagcataatc ttcatataga 1381 cggaaagctc attttccctt gtatcgcact gggaacggca acctttatta tgcagagtag 1441 tgaaagtgtc atttcggtct gctttaattc ttcgctctta aaatacggcg gtgatattgc 1501 tgtaggcgct atgacaatac ttacaagcgt gatgcagttt gcaatgctcc caatgcaagg 1561 tatcgcgcag ggcgcacaac cgattttgag ctataacttt ggtgctaaaa acgctgagcg 1621 tgtaaagaaa acatataggc tgttgcttat atcctgtctt tcatattcct ttatcatttg 1681 gggcgctatt atgctgttcc cgcaagtttt tgcagggata ttcacacccg atactgcact 1741 cattgaattt accgcaacgg cacttcgcat ttattgtggt gtgttatgta ttttcggtat 1801 tcagatcgct tgccagatga cttttgtttc tatcggcaac gcaccttgtt ccattattgt 1861 tgccatcgtt cgcaagttcg ttttactttt gccgctgatc tacattatgc cgcaacttat 1921 tgcagacaaa acaatgggag tttatacggc ggagcctgtt gcagacttga tagccgtaac 1981 ctttaccgct atccttttca ccgtacagtt taagaaggca ctaaagtctt taacaacagc 2041 aaatccgagg tagacagcac agtaaaaatt gcagtaacat atgagaacgg acagatcttt 2101 catcacttcg gccgtaccga actgtttagg gtttataccg caggagacgg aaaaattatc 2161 aacagcgaag tgcttcttac gacgcatcgt tgtaagaaag tgctcggcga gtttgatttc 2221 gcattggccg cggggttcgg cgtagacctt ggatttttac gtttaccgtt tggcagaggc 2281 tatgaagcag tattgactat ttgtatcact tttttatgga ggatcgtatg actgagaaga 2341 aaaaaagaga tttgggatat ttatataacg ccaattacga taacgagttg ctttctgaga 2401 ttgctaaatg caatgacctg tgtcacgagt tcaatcagat caagccatcc gaccgcgaga 2461 gtcaacaaca gatcttacaa aaaatatttt gtaaaatggg tgaaaatgtc actgtaaata 2521 cacctttttg gtgcgattac ggatataata ctgaggtcgg agattacttc tttgcaaatc 2581 ataattgtca gattctcgat ggcggaaaag taacattcgg taatcatgtt tttattgccc 2641 ccaattgctt gtttacaacg gcggagcatg cgcttgatgt tgagcaacgc aacgagggac 2701 ttgaggttgc attgccgata accatcggaa ataatgtctg gataggtgca ggaactaccg 2761 ttcttggcgg tgtaacaatt ggtgataata cggttatagg tgccggcagt gtcgtaacaa 2821 aggatattcc ttcgggtgtc attgcggttg gtgttccttg ccgtgtcatc agaaaaattt 2881 ccgatgcgga taaaaacaaa tattcgcatt atcaggggta aacacatgaa caaaaagcag 2941 gaggctaatg cttttgtcaa gaaatgcatc gcaaccgccc ttattcagct actcaaagaa 3001 aaaactttga agatatatct ataactgagc ttgttaaaaa agccgatgtc ggcagaactt 3061 cgttttatcg caattttgaa tgcaagaaac gactgaggaa ttgacaaggc tttgggagat 3121 agctcaacag gagcaataaa aatcctgtct gaaatgcaaa ttttgagggc accttaaacg 3181 gcccttttcg ttgctatctc cgacattttt tcaaggaaca aattaaagtc tccttcccgc 3241 ttttgcagga aggagacttt ttatattatt taattgcgca tatttagctg ctgaatgcgt 3301 cagctcaacg gatagatcga ggaaccgaag agcacatgat ataggagata aattgcgtca 3361 tccttgtcga ccgagccgct gccgttaaag tcgcacggct ggtttaaatg atattgcgat 3421 tcaccgaaca gcacgctgta aagcaggtaa atagcgtcac ccttatcgac agaacagttg 3481 ccgtcagtat ctccgcgaag tatctcagat acggttatgg ttacagatgc gggaatgctt 3541 gccaccgatg tgcttccgtt gctcagcgat gcctcaaatt cgattgctgt ctgacccaaa 3601 ggcgcattct cgctgacggt gaagcccaac tgcgcaagag tataattcgg attgagtggg 3661 gcttctgttg tcaacgttgc gattccgtcg ccaaatgtcg ccgtaacgct attatcgaca 3721 agccactccg aattttgaat atcgggggta aaaaaatttg gatcatatct atatgtcagc 3781 ttaaccgtat cggccaaacc gcagctcttt aaggatacat ctaacagcac ctttgatcca 3841 cggtaagcga ttttgtcatt gatagtcagc gacggcaagc ctgacggtga gaatctgaca 3901 taattgcaca agtcgcaagt ggaatcggag ctgttgctcc aaacgtgtgg ctggcgttca 3961 aacgaatcgc agtttaaatc tgtgcaatgg cgaatatggt catccgcatt gtattccgtc 4021 catccgctgt aattgtgtgc aactcctgcc gcttcgatca atgccttggc aactgtcgga 4081 tacagccact tcacctgacc gcggtcgatg agtccgcagg gcgcataagg cggatcgtca 4141 tcaacatgat cctcggtgaa gttgacatcc caatagaaca gggcggaaat tccgtgctct 4201 cttgctattg tgacgaaatc tgtggcatat gcctcacgct cgggtgtgtt gtttttattg 4261 tcagccgaga actcgccgat aatgacgggg attcccttgt ctacgaaaat tctttcaatc 4321 tttgcaaatg tgctgttaag tccgtctgtg aattccttac ggtttgcgac ccactggtcg 4381 gtggggttgg gaatatagct cggtgtccag cagaaacgct gagggtcata acagtgtatc 4441 tgcacaaaca gtctgtcctc aattgtatcc tcgggaagct tgaagctgtt aagcgcagaa 4501 tcggagcctg acgaacaagc atatacgttg acgctaagat ggcgctttgc attgtttccg 4561 cctgttgctc ttacaacgtc tacaaagtcc tgattgagtt tgttggcggc ttcaaaattc 4621 gcaggagttg ttccgcccca gttgtcttgt ctatccaaaa tttcattata tgcttcaaac 4681 atgagataat cgctatagtc tttaaatctt tcggcaatct gagtccacat tgttttgaag 4741 cgggcgctga tttcgggata ttcctgcgca tctgctgcaa gccatccctt gccaccgcaa 4801 tcgtgatggg agttaataag acaataaagg ccctcgtcga gaatatagtt tacaacctct 4861 tcgattctgt caagccaggc cttgtcgata tttccctctt cgtccatatg aggaccccag 4921 gtaacaggca tacggatcgc tttaaatccc atatccttga cagctttaat aagctcgggt 4981 gtaacaagaa ctccgcctgt ccacgccttt tcataagcgg aaggtgaacg gtcggaatac 5041 aattcgatcc atccgttggt atagttgccg tcgcccgaat aggcatcaaa tgtgttgccc 5101 aggttccagc cgatcctaat cttatcaagc agctccgcag aggtgagatc tctcatcact 5161 ccgaccttag ccgcgctgac aggcacgcaa aggttaaaaa tcattacaac cgtcagaacc 5221 aatatggcaa atcttttcat ttctgttgcc tccctattca ttatacttca aaccgcattt 5281 attcttaaat ctttcggtga gcgtatgcag tcgtcagcct gcccgaccgt gatttgcaat 5341 gccatttatt atatcttagc atatcttcca tttcaggaca acagttttta tcataaaaac 5401 cttcgatttt ttcatcaaat gtgcgatctg agcggaggag atcgtgcgtt agtgcacagg 5461 ttcttcgatt gtttccacaa cgcagaccgg ctctcccttg acacacttga taaaatatcc 5521 gagaatattt tttgaaaagt tgcacccttt ttgctttgga tgttgtatat ataggtgaaa 5581 ggcaatgaaa gacgatccac cggaggaaaa gaaatgctgt cattttatct ttctcagctt 5641 gagctaaaca gtcaatctga aaaatttgca aaactataca ctaagcaccg cgacaaaatg 5701 atgtcggcgg cattcgctgt gcttaaaaac catcacgatg ccgaggaagc ggttcaaaac 5761 gccctcttcg ccatcgcaaa aaacataaat tcccttcccg atcccgacac ccgttacggc 5821 gctaactatg ccgttaaagc agcaaagaac catgccctca atatggcgaa aaagcgcaag 5881 accgagcctt tgtttattga tattcacgcc gccgacatcg acattgcgga cgattacatc 5941 agccgagatg aagcaaagag cgtggttgaa gcgatatgtg ccatgaagcc gatataccgc 6001 gatgttttaa cggcaaagta tctttacggt atgaccgcga aggagatcgc atccgtttac 6061 ggtttgacct tacagacggt taaaagccga ttgaaccgcg gaacaaagat tttggaggaa 6121 gcatttgaaa ggagcgatat tgatgtttga cgagaaacag accgcaatta tcaagcgtgc 6181 gctggcagaa tatgatgacc gcgaaagtac gatgattgtc ggcgacgagc aggttaaata 6241 tgaatttaca aaccattttg aagagcaggc ggaagccctt aaaaagcggg tgctgatggg 6301 cgttaaggta tccgttaaaa aggtgctttt gctggcggcg gcagttgttt tggtgctcag 6361 tgtgaccgtt gcaatggtcg caggaaacga tatgcacgtt atccgctttg gcaatgatat 6421 caattacaat gagtattccg agattgatga tgccgaaaaa gctgattatt tcgatgtgta 6481 tttaaggata ccctcgacaa atgaaaaaac gttggatatc ccagcaatga ttatcgaagc 6541 agacctgccc atccccgagg gatataagtg cagtatgttc gacccgcttc acccaataac 6601 ttacagcatc catttcagca aggacagcga aaaggttgca tacagacacg catctttgac 6661 catccacatt tatgagattt atgaaaacac aggcgtgcgc cttgac // LOCUS sequence018 6631 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence018 VERSION sequence018 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6631 /mol_type="genomic DNA" /organism="" /note="sequence018" misc_feature <1..671 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003357393.1:cell division ATP-binding protein FtsE" /note="WP_003357393.1 cell division ATP-binding protein FtsE (Clostridium) [pid:56.4%, q_cov:95.0%, s_cov:92.5%, Eval:3.5e-62]" /note="MGA_151" /locus_tag="LOCUS_1270" CDS 661..1566 /product="permease-like cell division protein FtsX" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963820.1" /transl_table=11 /codon_start=1 /translation="MRLNSFKYLCGQGVKSLWFNRVNSFASLCIVTVSLVMVGISVLVA TNITKMIGSIESKNELIVVINDGTPDNNIALIGDSITHMDNISEVSFYSKEEAWEEMQQ DMTEDEKALFKYMDSNPLPDSYKVRVTDISELDETVNAISALEFVEMVKAPNDFASILT SIRNICTILFSAVTLALVIVCFVIISNTTRTSVYARRREINIMRYVGATKAFIEIPFFV DGLIIGVLSSGIAFGLTWFAYTEIYNMMASDFNLWSIFGISGLIPFETIALRTGLAYLA CGVVLSSFGAVISTRKHLNV" /locus_tag="LOCUS_1280" /gene="ftsX" /note="WP_010963820.1 permease-like cell division protein FtsX (Clostridium) [pid:28.3%, q_cov:100.0%, s_cov:100.0%, Eval:1.5e-33]" /note="MGA_152" CDS 1685..2983 /product="peptidoglycan DD-metalloendopeptidase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011391790.1" /transl_table=11 /codon_start=1 /translation="MAKTLIKRILSLLTALILVMTMIGYTDTTVITHADKQADLEKELA DLKEQQDKYEDLLKSAKDDLYEERQYQKTITAQIETTEEYIRTLVELMNEYDAEIAGIE AEIALIELDILETQQLINEQKIEIDENIDLYEQRLRALYLSGNDSVASIILGATDFFDM LMKIELVTRVARYNDTLIQGLIDLKDSYENNRLMLEGKIAERELAIAEVDNKKADTALL KADWESQLADLNALYEQSDERIEELKDERDAYEENLEEIEKEAEKLEEEIQKIIAEKAR ANYMGDLPEGSFLWPVPGYYYVSSEYGYRWGKLHKGLDIAGSGIKGEPITAANSGEVIF VINNCKHNYGKKKSCGCGGGYGRYCIIDHGGGYTTLYAHATDIIVKEGDHVTTGDVLGY VGSTGYSTVWHLHFEIRIDGKAKDPRKFDLIIK" /locus_tag="LOCUS_1290" /note="WP_011391790.1 peptidoglycan DD-metalloendopeptidase family protein (Moorella thermoacetica) [pid:27.5%, q_cov:95.8%, s_cov:98.4%, Eval:3.5e-32]" /note="MGA_153" CDS 3140..4198 /product="S41 family peptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003437815.1" /transl_table=11 /codon_start=1 /translation="MYTKLEQIDTYVRAYYDGEIDEDALIEALAEGYISVLGRDESKYL DETEYSIYKEHLSGTHLGIGVYCEEVGGYPTVTSVLANSPASLAGLQVGESVVSINGES VLNLGYDRAYELLRSDAGTPLVITVRSAGVDRSVNLTTAQMTVPSVSAKIIGDFGYIKV FEFNDKSYQQFTAAYSMLTTSGVKGIVVDLRNNEGLSFDAATNILNAYLPIDSVVAITT DLSGNQSILARASGTHVITVPVTVLTNAKTAGPAELFAAALRDNLNAQIVGAYTKGEGT FTENYSLYDGACIILPVASLQSSDTAFNGTGVKPSYDVAVEGDTNEYLATLDENTDPCL KKAIELLTQAMG" /locus_tag="LOCUS_1300" /note="WP_003437815.1 S41 family peptidase (Clostridioides difficile) [pid:27.0%, q_cov:93.2%, s_cov:84.2%, Eval:2.1e-29]" /note="MGA_154" CDS complement(4798..5295) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRKLLTVIILTLIICTLVACSDEKKNNGGDNSESANSSDVSTNEP IVTDAPESENEVTTTTPAPVEDPATTTTTEATTEATTTEATTTEQTTTEQTTTEATTTT EATTTKKEETTPATEDEDEEEIPVVEAEDGEEEEEEDIVWEDVNIDEILADLEENGFDI DL" /locus_tag="LOCUS_1310" /note="MGA_155" CDS complement(5437..5682) /product="30S ribosomal protein S20" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964586.1" /transl_table=11 /codon_start=1 /translation="MANIKSAKKRVRVIEAKTLRNKAKKSALKTAIKKANAAEEANKEV AVREAIKKVDQACAAGILHKNAAARKKSQLAKKLNG" /locus_tag="LOCUS_1320" /gene="rpsT" /note="WP_010964586.1 30S ribosomal protein S20 (Clostridium) [pid:53.6%, q_cov:98.8%, s_cov:95.5%, Eval:3.4e-14]" /note="MGA_156" ORIGIN 1 acgtttccta tacatatccc cacagcggcc agcaagcctt gagccacgtt aaccttaaaa 61 ttaacgacgg tgagtttgct tttgttgtcg gaacctccgg cgcaggtaaa tccaccctca 121 ttaagcttct tttgaaagag cttaccgcca ccgaaggcga ggtatatgtt aacggatata 181 gccttaacaa gctcaaaagc cgcaagattc cccagttaag acgcaccatc ggcgttgttt 241 ttcaggattt ccgacttatt cccaacttaa ccgtatatga caacattgca tttgcacttc 301 gtgcaatcga tgctccgata aaatacatcc gtacccgtgt gccttatgtt atcagccttg 361 tgggactcac cagcaaggca aagtcatatc caagcgatct ttcgggcggc gaacagcagc 421 gcgttgcgct ggcaagagct ttggtaaatg acccccagct tattattgcg gacgagccta 481 ccggcaacgt tgaccccgca agaagttatg agatcgttga cctgcttaaa gcaattaacg 541 aatgcggcac caccgttttg atggtcacac accagcacga ccttgtaaga tatttcggcg 601 gacgaattat caatatcaac aagggctctg tcgtcttcga cgaggcaata ggaggcgcag 661 atgaggctta acagttttaa atatctttgc ggtcagggcg ttaaaagcct ttggtttaac 721 cgcgttaatt cttttgcatc tttgtgcatc gtcaccgttt cgttggtgat ggtcggcata 781 tctgttttgg ttgcaacgaa catcacaaag atgatcggct cgattgaatc gaaaaacgag 841 cttatcgtcg tcatcaacga cggcaccccc gacaacaata tcgccttgat cggtgacagc 901 attacgcata tggataatat ttccgaggtg agcttctatt caaaggaaga ggcttgggag 961 gaaatgcagc aggatatgac cgaggacgag aaggcgttgt tcaaatatat ggactcaaac 1021 cctttgcccg attcatataa ggtcagagtt accgacatca gcgagcttga tgaaaccgtt 1081 aatgcaattt cggcgcttga atttgtcgag atggtcaagg cgcccaacga ctttgcgagc 1141 attttgacaa gtataagaaa tatctgcaca attttgttct ctgctgtgac cttggcgctt 1201 gtaattgttt gctttgtaat tatttcaaac accacccgca caagtgtata tgcccgtcgc 1261 agggaaatta acatcatgag atatgtcggc gcgaccaagg cattcatcga gattcccttc 1321 tttgttgatg gacttatcat cggtgtgctt tcaagcggaa ttgcctttgg actaacctgg 1381 tttgcatata ccgagatata caatatgatg gcaagcgatt ttaacctttg gtcgatattc 1441 ggcatttcgg gacttatccc ctttgaaaca attgctttgc gtaccggctt ggcttatctt 1501 gcctgcggag ttgttttaag ctccttcggc gctgtaattt caacaagaaa gcatttgaat 1561 gtttaaaaaa ttgcgtgcaa atcgcgctcc ggggcacctg ttcggacggc tccgccaccc 1621 ttcacagacg cccctccgct accctataac tccctttttc taatcaagaa aggaaacccc 1681 ataaatggca aaaacactca ttaaaagaat attgtccctg ctgaccgcgc tgatattggt 1741 gatgacaatg atcggatata ccgacaccac cgttatcacc cacgctgaca agcaggccga 1801 ccttgaaaaa gagctggccg acctaaagga acagcaggat aaatatgaag accttttgaa 1861 atctgctaaa gacgaccttt acgaagagcg tcagtatcag aagaccataa ccgcgcagat 1921 cgaaaccacc gaggaatata tccgcacgct cgttgagctg atgaacgaat acgatgccga 1981 aattgcaggc atcgaagcgg aaatcgccct tatcgagctt gatattcttg aaacccagca 2041 gctcatcaat gagcagaaga tcgagatcga tgaaaacatt gatctgtatg agcaacgctt 2101 gcgcgcgctt tatctttcgg gcaacgactc tgttgcgtca ataattttgg gcgctaccga 2161 ctttttcgat atgctcatga agatcgagct tgtaacccgc gttgcgcgtt ataatgacac 2221 gcttattcaa gggctgattg acctcaagga ttcatatgaa aacaaccggc ttatgcttga 2281 gggcaaaatt gccgagcgcg agcttgcaat cgcagaggta gataataaaa aggctgatac 2341 cgccctttta aaggcggatt gggaaagcca gcttgccgat ttgaacgctt tgtatgagca 2401 gagcgatgag cgaattgaag agctcaagga cgagcgtgac gcttatgagg aaaacctcga 2461 ggagattgaa aaggaagccg aaaagctcga ggaagaaatt cagaagataa ttgccgaaaa 2521 ggcaagagca aactatatgg gcgacctgcc cgagggcagc ttcctctggc ccgttccggg 2581 atactactat gtatccagtg aatacggata ccgttggggc aagctccaca agggccttga 2641 tattgcaggc tcgggaatta aaggcgaacc gattaccgct gccaactcgg gcgaagtaat 2701 ctttgtaatc aacaactgca agcataatta cggcaagaag aagtcctgcg gctgcggagg 2761 cggctacggc agatattgca tcatcgacca cggcggagga tataccaccc tttatgctca 2821 cgccaccgac attatcgtta aagaaggcga ccatgttaca acgggcgatg tgctgggata 2881 tgtcggctcc accggctatt caacagtttg gcatttgcac tttgaaataa gaatcgacgg 2941 taaggcaaag gacccccgca agtttgacct tatcatcaaa taaatcccga agggacgagc 3001 gattataaac aagaaaattt cagtcggcct cgccattgct ttaatggcga tttccgccgc 3061 cataaccttt ataatctcaa cgagctattc gctgaatata tataacgatc tggttgcgga 3121 cgttcaacag agagccgaaa tgtatacaaa gcttgaacag attgatacct atgtcagagc 3181 atattatgac ggcgaaattg acgaggacgc tttaattgaa gcccttgccg aggggtatat 3241 ctccgttttg ggcagggacg agtcgaaata tttagacgaa accgaatatt cgatatataa 3301 agagcacctc agcggaactc atctgggcat cggcgtatat tgcgaagagg tgggcggata 3361 ccccaccgtt acaagcgttt tggcaaacag ccctgcatcc ttggcgggac ttcaagtcgg 3421 cgaaagcgtt gtttcgatca acggcgaaag cgttttaaat ctcggatatg accgtgcata 3481 tgagcttttg cgaagcgatg caggcacccc tctggttatt accgtcagaa gcgcaggcgt 3541 tgacagaagc gttaatctta caactgcaca gatgaccgtt ccgagcgttt ccgcaaagat 3601 tatcggagat tttggatata tcaaggtctt tgaattcaac gacaagtcat atcagcagtt 3661 caccgccgca tattcgatgc tgacgacttc aggagtcaag ggaattgttg ttgaccttag 3721 aaataacgaa ggcctcagct ttgatgctgc aaccaacata ttgaatgcat acttgcccat 3781 cgactctgtt gttgcaatta caaccgatct ttcgggcaac cagtcgattt tggcaagagc 3841 atcaggcaca cacgtaataa ccgttcctgt gaccgttctg acaaatgcca agaccgcagg 3901 ccctgcggag cttttcgccg cagcactgag agataactta aacgcacaga tagtgggcgc 3961 atatacaaag ggagagggaa ccttcaccga aaactattcc ctttatgacg gcgcttgcat 4021 cattttgcct gtggcatcgc tgcagtcgag cgataccgcg tttaacggca caggtgtcaa 4081 gcccagctat gacgtagctg ttgagggaga tacaaacgag tatctcgcaa cgcttgacga 4141 aaacaccgac ccctgcctta agaaagcgat tgagcttttg acacaggcga tgggataaaa 4201 aattaaggcg cccaagcagg gtgcctgttt tttacaacgt cgattgtagc gcatccaaaa 4261 atgttgcttc ctacgatcgc aaagttttga caagaatccg cgaaacagat tcttgaatgt 4321 gctttcgttc aaacactaaa tcatcctccc aattaggcac acacgcctct attacaatag 4381 gagggtggtg agggcaacgc ctgtgaccgc cgccggtggc ggatgaaggg agcaggggtt 4441 ggaacagcgg tcgacaagcc ggaacgttag tgaacggcga gtcggttacc gcaagcgggg 4501 cttttgtcgg aagagtctaa tggataattc cgaccgcaag gctttcacaa atctgcgacc 4561 tcctcggcaa aacattaatg cttgtcggtg ccctcctaaa ggtttcccct ttggcgagaa 4621 cttcaaggta caaaatgaat tgtgcttcgc gcatgaatag tcaaaaccat tttgtcaaaa 4681 tgattttaac atgaattgat gcaacaagtt gcatcgtgaa tagcagaaac aagtttctac 4741 cggaaacaag tttctgcatt taaaaaggca ccccttttcg ggtgcctttt tagtttatca 4801 aagatcgata tcaaatccgt tttcttcaag gtctgccaaa atctcgtcga tattgacatc 4861 ctcccaaacg atatcctctt cttcctcttc ttcgccgtcc tcagcttcaa caacaggaat 4921 ttcctcttcg tcctcatctt cggttgcggg tgtggtttct tccttcttgg tcgtggtggc 4981 ttcggtggtg gttgtagctt cggttgtagt ctgttcggtg gtagtctgct cagttgtggt 5041 tgcttctgtg gtggtagctt cggttgttgc ctcggtcgta gtggtggttg ccggatcctc 5101 aacaggtgca ggcgttgtgg tggtcacttc attttccgac tcgggagcat cggtcacgat 5161 cggctcgttg gtggaaacat ccgagctgtt agcagattcg gaattgtcgc cgccgttatt 5221 tttcttttca tcactgcagg caacaagagt gcagataata agagtgagta tgataacagt 5281 caaaagtttt ctcattatgt ataatccttt caaaacaggt taattatatt ttacgacata 5341 tgtgcctaaa tttcaacagg caaatgtcgg aaattgcgga aaacaaaagc tccgcttatt 5401 gaactaagcg gagcccaaag cctttggttt cagaaattag ccgttaagct tctttgcaag 5461 ctgggacttc tttcttgcag cagcattctt atgaagaata ccggcagcac aagcctgatc 5521 taccttcttg atagcttctc taactgcaac ttccttgtta gcttcttcag cagcgttagc 5581 cttcttgata gcggtcttga gcgcagactt cttagccttg tttctgagag tcttagcttc 5641 gataactctg actctcttct tagcagactt aatgttagcc attaagacac ctcctatgtc 5701 atgtttaaaa tccacttatt tggataagct acttgcacga ctgagagaaa gtgcaaaagg 5761 ttaatgactc cttacttatt caacaagtat cttagttaat atatcaccat ttttcaaaaa 5821 atgcaatagg tttttcgcaa attctttgaa aatttataaa aaatttttcc caaaatcctt 5881 tattttagga ggtttgacat gatttcacgt tcagacttgg cgcttgaagc tgccgactcg 5941 ctgttaacag gtgaaaagct acccgacggg gtgagcctta aaagctatgt gagaggcgca 6001 ttcaacataa ccgacgttaa gatatatggc gacgatgccg caaaaaagct cggaaaatcc 6061 aaggggagat atttgaccct tgaaacaaaa aacagcttcg acacccatcc cggcgacttc 6121 gcaaaggaca gccttgccct tgccgacgag cttcgctcga tgattggcaa ccccgagagg 6181 gtgctggttg ttgggcttgg aaatttcgat gttaccccag acagcctcgg cgcacgggtt 6241 gccgacagaa taattgccac acggcatatt aaagacaact tccccgagct ggataagatg 6301 tttcaggcaa acgtaagcgt tttaaaaacg ggagtaatgg gcaaaacagg tatggaatcg 6361 gcagaggcgg ttaaggcgac agcaaaaacg gttaagcctg attgcataat cgtctgcgat 6421 gcgctggcct gctcgggggt gtcaaggctc ggacacgcaa ttcagatgac cgatacaggt 6481 atatcgcccg gatcgggagt gatgaactcg cgcaaggaaa tttcaaagcg aacggtcggc 6541 gtgccatgcg ttgcaatcgg tgtgccgacg atggcggact cgaaggagct tgaaatgatg 6601 gtgacaccga aaaatatcga caagctgata c // LOCUS sequence019 6622 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence019 VERSION sequence019 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6622 /mol_type="genomic DNA" /organism="" /note="sequence019" misc_feature <1..547 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_026468327.1:glycosyl hydrolase" /note="WP_026468327.1 glycosyl hydrolase (Amycolatopsis balhimycina) [pid:38.1%, q_cov:94.5%, s_cov:39.1%, Eval:6.2e-31, partial hit]" /note="MGA_158" /locus_tag="LOCUS_1330" CDS 808..1425 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKIILIMLVLAMALSMVACGNNNNADNGNNDAVVDDTNNNENNV EETPAEPVAALDVLNAAWEKYTEDEKVYFMGGDYDNFTQGPGVFNHENAEYLAGLLIVP ADAVQYISETASLLHNMNLNSFTCGSYVIEDAANVDTFVSLMTDAIKNNQWMCGFPEVL SVVKVGDNNVVITFGNTDLVNLIETRLVEVYPDAVTTQEPLV" /locus_tag="LOCUS_1340" /note="MGA_159" CDS 1517..2917 /product="MBOAT family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964872.1" /transl_table=11 /codon_start=1 /translation="MLFSSIPFLYYFFPIVLIAYFAVPKFLKNSVILLSSLVFYAWGEP RFVILMAITIAVGFAAGLLMEKAKTSALKRTAMIVSVAICLAFLGYFKYVDFFIENFNA VTGLSVKLLNVALPIGISFYTFQIISYIVDVYRGSVGAQHNVINFAAYVAMFPQLIAGP IVRYSDIARQLESRNHSIEQISYGIRRFVIGLGKKVLIANTLGELCDIFKASDDKTVLF YWVYAIAFSLHIYFDFSGYSDMAIGIGHIFAFKFIENFDHPFISSSITEFWRRWHMSLG SWFRDYVYIPLGGNRVSKLRWFFNIFVVWALTGFWHGAEWNFIIWGLMFGILLVIEKVV LLDKLKKTKVINHIYVMFFVLISFVIFNASSMSEAFSYIGGMFGAGGIKFASVECFYYL RSYGIMLIIGIIGSTPLIKNVCLKLEAGQKSSKIINVLEPVALAAILILCTAFLVDGSF NPFLYFRF" /locus_tag="LOCUS_1350" /note="WP_010964872.1 MBOAT family protein (Clostridium) [pid:42.7%, q_cov:100.0%, s_cov:100.0%, Eval:4.1e-114]" /note="MGA_160" CDS 2932..4035 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKKIKSIVTVALASLVVSGFFIICLIKPATEYSDSERRYLDQFP ELSIETLLNGKFMTGFEDYTLDQFPLRDTFRSIKSFTAFYLMGQLDNNDIYVHDGYIAK LEYPMNTDSIQTAGDKFSAIYDKYFADKDMNVYMTVVPDKNAYLHDEAGRLSMDYDKFV SLMKESAPNFEYIDIFPLLDYTDYYRTDTHWKQEEIFDVAQHIASTMGVTLDAEYEKVL ATDDFKGVYMGQVSLPIDSDEMYYMTNDNLEGCTVINGEIGEQMPMYVSDKLTDRDPYE MFLGGSLSLITIENPNAETDRELIIFRDSFGSSIAPYFAEAYSKITVVDIRYIHSAMLG NFINYEKQDVLFLYSTLVLNNSSTIKG" /locus_tag="LOCUS_1360" /note="MGA_161" CDS complement(4554..5084) /product="inorganic diphosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000233562.1" /transl_table=11 /codon_start=1 /translation="MNIWHNINPKRISSDSFEAVIEIEKGSKCKYELDKETGSLMLDRI LYTSTHYPANYGFIPRTYADDLDPLDVLVLCAESIRPMTLVKCYPIGVISMLDNGRHDE KIIAIPFNDPNYNVYKDISDLPKHIYDEMCHFFKVYKEREGKEPVVNDVADAQRAKEII RSAMDGYIENYCK" /locus_tag="LOCUS_1370" /note="WP_000233562.1 inorganic diphosphatase (Leptospira) [pid:46.2%, q_cov:98.3%, s_cov:97.2%, Eval:4.0e-40]" /note="MGA_162" ORIGIN 1 acacaaaaat atgatcgcca actgggatct tgccgcaaac gcccttgccg agcttcgcga 61 tgcaggcgtt cccgttttgt ggcgcccatt ccacgagttt gacggcggct ggttctggtg 121 gggtaaggga agccctgagg actttatcaa gctttggcgt ttgatgtatg accgttacac 181 aaatatgttt aacttaacca acctcatctg ggttcttggc tatgccgact atgtccgcga 241 cggttggtat gttggcgatg attattgcga tatcatcggc tccgacacct ataaattcgg 301 gcttcacgaa gcagcttatc agaagctttg gatagatttc ggcagatccc gcaaaccctt 361 cactctgcac gaatgcggca acctgccgga catcaccgat ttcgttcgca agcgcacaat 421 gtggagctgg ttcctgatct ggcatacaag ctgggcgacc aacaacgatg ttgaaaacct 481 caaaaagatg tacaactccg agttcgcttt aaccctcgat aagcttccga agtttgagtg 541 gaattgattt atcgctttaa actgaatacg taattgcaaa aaaattgcat acgaatcggt 601 ataatttttt aacttttttg ccaaaaactt tgtaataaaa aacaagccga aatcacgtaa 661 aatcgaggtt ttacggcttg acttatgcat acaaccgtgg tataatcacg gtgttacatc 721 acaaatctcg gttgatacag aaatgtaccg accgattttt atgtaaagcg taacacatat 781 ttttcgattc taaggagaaa ctaaaaaatg aagaagatca ttcttatcat gctcgttctt 841 gcaatggcat tgtctatggt tgcttgcgga aacaataata atgctgataa cggcaacaac 901 gacgcagtag ttgatgacac aaataataac gaaaacaatg ttgaggaaac ccctgccgag 961 cctgtggcag ctttggatgt tcttaacgca gcttgggaaa agtatacaga agatgaaaag 1021 gtatacttca tgggcggcga ctatgacaac ttcacccagg gtcccggcgt attcaaccac 1081 gaaaatgctg aatacctcgc aggacttctc attgttcccg cagatgctgt acagtacatc 1141 tctgaaaccg catccctttt gcacaatatg aacctcaaca gcttcacctg cggttcttat 1201 gtaattgaag atgctgcaaa cgttgacacc tttgtttctt tgatgactga tgcaatcaag 1261 aacaaccagt ggatgtgcgg cttccccgaa gttctttccg ttgttaaggt tggcgataac 1321 aacgttgtta tcaccttcgg taacaccgac ctcgttaacc tcatcgaaac cagactcgtt 1381 gaagtatatc ccgacgctgt tacaacacag gaaccccttg tctaattaaa cggcaaacca 1441 aaaaagcaaa acaaatgaaa gtgagtttgc ccgcgcggca aactcacttt tgcgttcata 1501 atttcaggag gtcaaaatgc tattttccag catacctttc ctttactatt tcttccccat 1561 agtcttaatt gcatattttg ccgtgcctaa gtttttgaaa aactcggtga tcttgctttc 1621 aagcttagtt ttctatgctt ggggagagcc cagattcgtc attttaatgg caattaccat 1681 tgccgtgggc tttgctgcag gccttttaat ggaaaaggca aaaacatctg ccttaaagcg 1741 aaccgcaatg atagtttccg ttgcaatctg tctggcattt ctcggctact tcaaatatgt 1801 cgactttttc attgaaaact tcaatgccgt aacgggtctt tctgtgaagc ttttgaatgt 1861 tgcattgcct atcggcatca gcttctatac cttccagata attagctaca ttgtcgacgt 1921 ttatcgagga agtgtcggtg cgcagcataa tgtaattaac tttgccgcat atgttgcgat 1981 gttcccgcag ctcattgcag gccctatcgt gcgctattcg gacattgctc gccagcttga 2041 atcaagaaat cactctattg agcagatatc ttacggcatc cgcagattcg ttattggctt 2101 gggcaaaaag gttttaattg caaacacctt gggcgagctt tgcgatattt tcaaagcatc 2161 ggacgacaag accgttttgt tctattgggt atatgccatt gccttctcgc ttcacatcta 2221 tttcgacttc tccggctact cggatatggc gatcggtatc ggccacattt ttgccttcaa 2281 gtttattgaa aacttcgacc accccttcat ttcttccagc ataaccgaat tctggcgccg 2341 ttggcatatg tccctcggct catggttccg cgattatgta tatattccct tgggcggcaa 2401 ccgagtttca aagcttcgct ggttcttcaa tatcttcgtg gtttgggcgc ttacaggctt 2461 ctggcacggt gctgagtgga acttcataat ctggggcttg atgttcggaa ttctgctggt 2521 tatcgaaaag gtagtgctgc tggataagct taaaaagaca aaggtaataa atcatattta 2581 cgttatgttc ttcgttctta tcagctttgt aatcttcaat gcaagttcaa tgagcgaagc 2641 gttcagctat atcggcggaa tgttcggcgc aggcggaatc aagtttgcat cagttgagtg 2701 cttctattac ctaagaagct acggaattat gctcatcatc ggcatcatcg gctcaacacc 2761 gcttataaag aatgtttgct tgaagcttga agcaggtcag aagtcatcaa aaatcatcaa 2821 cgtgctcgaa cctgtggctc ttgctgcaat attgattctt tgcacagcat tcctggttga 2881 cggttccttc aacccgttcc tatacttcag attctaaagg agggactaag catgaacaaa 2941 aaaattaaaa gcattgtcac agttgcgctt gcgtcccttg ttgtctctgg attcttcatt 3001 atctgcctta tcaagcccgc aacggaatat tccgacagcg aacgcagata tttggaccag 3061 ttccccgagc tgagcattga aactctcttg aacggcaagt ttatgaccgg ttttgaggat 3121 tatacccttg accagttccc ccttcgcgac actttccgtt caattaaaag ctttaccgcg 3181 ttctatctta tgggacagct cgacaataac gacatctacg ttcacgacgg atatatcgca 3241 aagcttgaat acccgatgaa taccgactca attcaaactg caggcgacaa gttttctgca 3301 atttatgata aatatttcgc agacaaggac atgaacgtct atatgaccgt tgtccccgac 3361 aaaaacgcat atcttcacga cgaagcgggc agactgtcaa tggattacga taagttcgtt 3421 tcgttaatga aagaaagcgc acctaacttt gaatatatcg acattttccc gcttttggat 3481 tataccgact actatcgcac cgacacccac tggaagcagg aggaaatctt tgatgttgca 3541 cagcacatcg catcaacaat gggtgttact ctcgatgcgg aatatgaaaa ggttcttgca 3601 accgacgatt tcaagggtgt atatatgggt caggtttccc ttcccatcga ctcggacgag 3661 atgtattata tgaccaacga caatcttgag ggctgcacag ttatcaacgg agaaatcggc 3721 gagcaaatgc ctatgtatgt ttccgacaag ctcaccgacc gtgacccata tgagatgttc 3781 ctcggcggaa gcctttcgct catcaccatc gaaaacccca acgcagaaac cgacagagag 3841 cttataatct tccgcgattc cttcggctca agcatcgcgc cttattttgc tgaggcttac 3901 tcaaagatca ccgttgtaga tatcagatat atccattcgg caatgcttgg aaacttcatc 3961 aactatgaga aacaggacgt tttgttccta tattccacct tggtgctcaa caattcctcg 4021 acaattaagg gataaaaaag aaagcaggct tcgtgcctgc ttttttaatg cgtaaacttg 4081 tttctgatat tcattctcaa aagggggaaa ccgcagaaag acaagaaagg cgctcaaaag 4141 gaggaagggc gcaaccgccg ccctctcttt tctttctgag gtttccccct ttgtaacccc 4201 catcctgact atcttttctc tcccggctgc gctatgctct tcgatatccc atgcgcttac 4261 agagctaata attgtaacaa aggagcaact gatagagagt gatcttttca aagacagtag 4321 tgcaatacgt tgagagcctt aatcttgaag caaaatgtgt aaagatatag tagcaaaaga 4381 ggtcgcgcat gggattcaag tgtgagttct aagcttttgc gcgttgcaat agcggtgtcg 4441 cctgcggcga atatccccac ccccgatccc ggctttgccg aaataacccc ctcccacggg 4501 gagggggatt tctaccacac aaaaaagcca ccgtactgcg gtggcttttg tcgttatttg 4561 caataatttt caatatatcc atccattgcc gagcggatta tctcctttgc tcgctgggca 4621 tctgcgacat cattaacaac tggttccttg ccctcacgct ccttatatac cttgaagaag 4681 tggcacattt catcgtaaat gtgcttgggc agatcggaaa tatctttata tacgttgtaa 4741 ttgggatcgt taaagggaat agcaatgatc ttctcgtcgt gtctgccgtt gtcaagcatc 4801 gaaataacac cgattggata gcattttacc agtgtcatag gtctgatgct ctctgcacaa 4861 agcactaaaa cgtccaatgg atcaaggtcg tcggcatatg tgcgcggaat gaagccgtag 4921 ttggcggggt agtgggtcga ggtataaaga attcggtcaa gcatcaaaga tcctgtttct 4981 ttgtccaatt catatttaca ctttgagccc ttttcaatct cgataaccgc ttcaaagcta 5041 tcgcttgaaa tacgttttgg attaatgtta tgccatatat tcatagtttt tcctccttca 5101 atgatgttta acaaattata acttatcgga tttgctttgt caatttgatt tttttcaaaa 5161 attctaatta tgttgcattt tgctattgct ttttgaaatt gcctaatata taatcatagt 5221 ataagtaact atgcgcgttt tcatattgaa acatcgttcg ggattttgta taataaatta 5281 ttattatatc cgattgtgag gtacacggct atgaaaaaag aattcattaa aggcgcaaac 5341 ccctatatgc ccctttggga acacgttccg gacggagaac ccagagtatt tgaatataac 5401 ggcgagaaga gggtatatgt ttacggctct cacgaccttg aaaagaatgt atattgcggc 5461 cgtgatcagg tgtgctggtc ggcacccatc gatgacttga caaattggac ctgccacggt 5521 gtatgctata ccgccactga cggatcaatt ctctacgccc ccgactgtgt gcagaagggc 5581 gacaccttct atatgtacgg tgctgaaggc tgcggctcaa gaattatggt tgcaagctca 5641 aagacccctt ggggaccttt caccaaccct gttaagaccg accttggctt cgaccccggc 5701 gttttggtgg atgacgatgg caaggtatat gcatactggg gcttctgcgg cacacattgg 5761 gcagagctta acgacgatat ggcaactata aagcccggta cctatgttgc caacggcatc 5821 ggccattgcg atgcttcttg ggcacaagaa accgaacata tcgaccttaa agacgctttc 5881 tttgaagcat cttcccccag aaaggttatg ggcaagtatg tctatgtata ttccaagaga 5941 tacagcaccc ccgtccccga actcggcgta tttgacaagt gcaacggctt cctgtcctat 6001 atgtacagcg acaagccttt agagggttat gttcatggtg gggatatctc cttcaacggc 6061 ggcgaaattt tgcctcagcc ggacggcaca ggcaagcaga cctataagtg gggcaataac 6121 cacggcggtc tttgcgaaat caacggcaag tggtatatct tctatcaccg ccagacgggt 6181 gtaaacgaat tctcacgcca ggcaatgctt gaacctgtcg acgttgctct cagctcggac 6241 ggaaagctct tcatcggcga tattacatat gacgaaaacg gcgagccgat aagctctaag 6301 cctgttgaaa tgacctccca gggagcgcac atcaacggtc tcgatgcata taagctcatc 6361 tccgcaggat atacctgcca tatcagcaac accaatttgg catatgatac atatgttaaa 6421 cccgtatatg atcagattga ctctatcagc gctcccgttg tgggaatcac cgacaaggct 6481 gttattggat ttaagtatct tcagtttggt actatctctc ccaagactgt caccgtttac 6541 gccaccgatg ccaagcagat aaaagtaagg ctcgataagc acaacggcaa ggtgatcggc 6601 acagtcagct ttgaaaacgg tg // LOCUS sequence020 6446 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence020 VERSION sequence020 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6446 /mol_type="genomic DNA" /organism="" /note="sequence020" CDS complement(232..1605) /product="rhamnulokinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003243094.1" /transl_table=11 /codon_start=1 /translation="MAYCLAIDIGASGGRHILGEIADGKLVMTEVYRFENGMKELSGSL VWDIDELFENVVKGLEKCKELGKIPATVSIDTWGVDYVLLDEKGKEILPCYAYRDSRTV GVPEEAYKIIPQTELFKRTGIPKQNYNTVFQLWCDKKSGRLDNASHMLLLPDYLKYKLT GKMASEYTICTTTGLVNADTKNWDDSIIDALGFDRSLFVEISAPCTLLGNLCEEIKSRV GFDCLVLHCPAHDTASAVAACPVDDSSVFISSGTWSLVGTENLEAVTDERAMLAGLANE GGINYRYRFLKNIMGMWLFQSIRKELDKKYTYDEMMEMAMVSSFAEKIDPTDDLFLAPE SMINAVRTYLGKPDLPLGDVLSSIYHSLAQSYDKTVREIENISGKKVTHISIVGGGSRD RYLNRLTREYTGKTVSAGPVECTATGNIISQLMYLNENLSLGDARALVKHSFNIEEVK" /locus_tag="LOCUS_1380" /gene="rhaB" /EC_number="2.7.1.5" /note="WP_003243094.1 rhamnulokinase (Bacillus) [pid:39.0%, q_cov:98.2%, s_cov:93.8%, Eval:4.9e-88]" /note="MGA_165" CDS complement(1620..2306) /product="class II aldolase/adducin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392225.1" /transl_table=11 /codon_start=1 /translation="MEYMELREQLCDVCHKMWQLGWVAANDGNVSVKLPDGNFLATPTG ISKSFITPEKLVIINDKGEVISGEPGYKPSSEIKMHLRCYKERDDVGAVVHAHPPTATG YAVAGKSLDEYSMIETVIAIGSIPLTPYGTPSTNEVPEAIAPYLKEHDVFLLQNHGALT VGADLITAYYRMETLELYAKISLTAHLLGGAKEIEKPQIDKLLDLRENYYHVTGKHPGY KHYNDK" /locus_tag="LOCUS_1390" /note="WP_011392225.1 class II aldolase/adducin family protein (Moorella thermoacetica) [pid:46.8%, q_cov:89.9%, s_cov:98.1%, Eval:1.6e-49]" /note="MGA_166" CDS complement(2319..4118) /product="L-fucose isomerase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011107686.1" /transl_table=11 /codon_start=1 /translation="MALSRLIGDYPVIGIRPTIDGRRGVLKVRESLEEQTMNMAKSAAK LFEENLKYSNGEPVKVVIADTTIGRVAEAAACADKFRKEGVDITLTVTPCWCYGAETMD MDPNTIKAVWGFNGTERPGAVYLASVLATHAQKGLPAFGIYGHDVQDATDTEIPEDVKE KLLRFGRAAVAAATMRGKSYLQIGSICMGIGGSIISTDFIEDYLGMRVESVDEVEIIRR MTEGIYDKAEYEKALAWAKQYCIEGFDKNPEELQKTRAEKDADWEFVVKMMVIIKDLMN GNPNLPEGCEEEMVGHNAIAAGFQGQRQWTDFYPNCDFPEAMLNTSFDWNGAREPYILA TENDVLNGIGMLFMKLLTNRPQMFADVRTYWSGDSVKRVTGYDIDGKAKAADGFIHLIN SGACCLDANGRAKDENGNGVMKPWYEVTEEDQKAIMANSTWNYADLGYFRGGGYSSRFV TKAEMPATMIRLNLVKGLGPVLQIAEGWTVSLPDDVTDTLWKRTDYTWPCTWFAPRCTG EGAFKSAYDVMNNWGANHGAISYGHIGADLITLCSMLRIPVCMHNVPEEKIFRPAAWNA FGMDKEGADYRACQNFGPLFKKC" /locus_tag="LOCUS_1400" /gene="fucI" /EC_number="5.3.1.25" /note="WP_011107686.1 L-fucose isomerase (Bacteroides thetaiotaomicron) [pid:67.4%, q_cov:98.2%, s_cov:99.5%, Eval:1.8e-234]" /note="MGA_167" CDS 4334..5209 /product="AraC family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005775503.1" /transl_table=11 /codon_start=1 /translation="MIYQKTFQADELPSKAHISCFRYKTRDFDYYPIHSHSYYEISFIV SGERYFYFNGEQLKIDKNTLLFVPPLAAHGNKNITAVDDIVLQISANLFNCISELFDSK MFFALKNDSCAGIALEDGSEISAVINRLYDLCDRIDGSYDDKGTTDNAVMRELERDSLV LKLVSLMIEFGLITVKSGVSSLSKLGLIDELINRLIANPHDKIDMTEAAKFVGMSYSHF SRLFKALTGTNYAEYCNILRIRHAEELLRDTNLSIAQVAYAIGIDTPSYFTRLFKNING ISPAEYRAKR" /locus_tag="LOCUS_1410" /note="WP_005775503.1 AraC family transcriptional regulator (Bacteroides) [pid:26.2%, q_cov:91.8%, s_cov:88.2%, Eval:1.9e-14]" /note="MGA_168" ORIGIN 1 attacctgcg caggacgaaa gatgcaacag gtttgcaacg gttgccagaa cgagtattaa 61 ggacagtgct tttttgaaca taaaaacgcc tcccaaacaa cattgttata ctataattat 121 agtagtttgt tagcttaccg gcaatgatga aagcatattt tttcattgat aaatgcgcga 181 gcacacattg ataaaagcaa aagccccgaa aaaaatcgga gctttttgcg tttatttaac 241 ctcttcgatg ttgaatgaat gcttgaccaa cgctcttgca tcgccaaggg acaaattctc 301 attgagatac atcagctgtg agattatgtt tcccgttgcg gtacattcaa cagggcctgc 361 gctgacagtt ttgcctgtat attcgcgtgt taagcggttg aggtatctgt cgcggcttcc 421 tccgccgaca atgctgatat gagtgacctt tttgccggag atattttcta tttctctaac 481 agtcttgtca taactctgcg caagggagtg atagatactg cttaaaacat caccaagagg 541 caggtcgggc ttgcccagat atgtacgcac agcgtttatc atactctcgg gtgccaagaa 601 caggtcgtcg gtggggtcga tcttctcggc aaatgagctt accatcgcca tttccatcat 661 ttcgtcatag gtgtattttt tatccagctc ttttcttatg ctctggaaga gccacatacc 721 cattatattt ttgaggaaac gatagcgata gttgattcca ccctcgtttg caaggcccgc 781 aagcattgcg cgctcatcgg tgacggcctc gaggttttcg gtgccgacaa gactccatgt 841 gccggatgag atgaaaacgg agctgtcatc aactgggcag gcggcaaccg ctgaggcggt 901 atcgtgggca ggacaatgca aaacaaggca gtcgaacccg actcttgact tgatttcctc 961 gcacaaattg cccaaaaggg tgcagggcgc ggaaatttcg acgaacagcg agcggtcaaa 1021 gccaagcgca tcaataatac tgtcatccca gtttttggta tcggcattta caagccctgt 1081 ggtggtgcaa atggtatatt cactcgccat tttccccgtc agcttatatt tgagataatc 1141 gggtaaaagg agcatatggg aggcattatc cagcctaccc gattttttat cgcaccaaag 1201 ctggaagacg gtattgtaat tctgcttcgg gatgccggtt cttttgaaaa gctccgtctg 1261 cggtatgatt ttgtacgcct cttcgggcac gccgacagtt cgcgagtcgc ggtaagcata 1321 gcaaggaaga atctctttgc ccttttcatc cagcaaaaca taatcaacac cccaagtgtc 1381 aattgaaact gtcgcaggaa tcttgccaag ctctttgcac ttttcaagac ccttgaccac 1441 attttcaaaa agctcgtcaa tatcccaaac aagcgagcca ctaagctcct tcatcccgtt 1501 ttcaaagcga tatacctcgg tcataaccag cttgccgtcg gcaatctcgc ccaaaatatg 1561 acgtccgccg gaagctccga tatcaattgc caaacaatat gccataggtt tatcccctat 1621 catttatcgt tatagtgctt atatcccggg tgctttcccg taacgtggta ataattctcg 1681 cgcagatcca aaagcttgtc aatttggggc ttttcaatct ccttggcgcc gcccaaaaga 1741 tgtgcagtga gggaaatttt ggcgtaaagc tcaagagttt ccattcggta atatgccgtt 1801 atcagatcgg caccgacagt taatgcaccg tgattttgca aaaggaaaac atcgtgctct 1861 ttaaggtaag gtgcgatcgc ttcgggcacc tcgttggtcg agggggtgcc atagggcgtt 1921 aaaggaatcg agccgatggc gatgaccgtt tcgatcatcg aatattcatc caggctcttt 1981 cccgcaacgg catagcccgt tgcagtcgga ggatgtgcgt gtacaactgc gccaacatca 2041 tcgcgctctt tatagcagcg aaggtgcatt ttgatctcgc tggagggctt gtatcccggt 2101 tcgcccgaga tcacctcgcc cttgtcgttg attattacca gcttttcggg ggttatgaag 2161 cttttgctga tgcctgtggg ggtggcaagg aagttgccgt cgggcaactt gacggaaacg 2221 ttgccgtcat tcgccgcaac ccagccaagc tgccacattt tgtggcagac atcgcaaagc 2281 tgttctctta attccatata ttccataagc taaactcctc agcacttttt gaacagaggg 2341 ccgaagtttt ggcatgctct gtaatcggca ccctctttat ccattccgaa ggcattccaa 2401 gccgcggggc ggaagatctt ttcttcgggg acgttgtgca tacaaacggg gatgcgaagc 2461 attgagcaaa gggtgataag atctgcgccg atatggccat aggagatcgc gccgtggtta 2521 gcgccccagt tattcataac gtcatatgcc gacttgaatg cgccctcacc tgtgcatctg 2581 ggagcaaacc atgtgcaagg ccatgtatag tcggtgcgtt tccaaagggt gtcggttaca 2641 tcgtcgggaa gtgaaactgt ccagccttct gcaatctgca aaacggggcc caagccctta 2701 acaaggttga ggcgaatcat tgttgcaggc atttcagcct ttgtaacaaa gcgcgacgaa 2761 tatccgccgc cgcggaaata accaaggtcg gcatagttcc aggtggagtt tgccataatt 2821 gccttctgat cttcctcggt tacctcatac caaggcttca ttacgccgtt gccgttttca 2881 tccttggccc gaccgttggc atccaaacag caagcgcccg aattgataag atggataaat 2941 ccgtcggcag ccttggcctt gccgtcgata tcatagcctg ttacgcgctt aacggagtcg 3001 ccgctccaat atgtacgcac atcggcaaac atctggggac ggttggttaa aagcttcata 3061 aacagcattc cgatgccgtt taaaacgtcg ttttcggtgg caagaatata aggctcgcgg 3121 gcaccgttcc agtcgaacga tgtattgagc atcgcttcgg ggaagtcgca gttgggataa 3181 aagtcggtcc actggcgctg accctggaag cctgcggcga tggcattgtg gccaaccatt 3241 tcttcttcac agccctcggg caaattcggg ttgccgttca taaggtcctt aataatgacc 3301 atcattttga caacaaattc ccaatcggca tccttttcag ctcttgtctt ctgaagctct 3361 tcggggttct tgtcaaagcc ttcaatgcaa tattgcttcg cccaggccaa agccttttca 3421 tattcggctt tgtcgtaaat accttcggtc attcggcgga tgatctcaac ctcgtcgaca 3481 gattcaacgc gcataccgag gtaatcctca ataaaatcgg tgctgatgat cgagccgccg 3541 atacccatac agatcgaacc gatctgtagg tatgattttc ctctcattgt cgcagcagcg 3601 acagcggcac ggccgaagcg aaggagcttt tccttgacgt cctcgggaat ttcggtgtcg 3661 gttgcgtcct gaacatcgtg gccgtagatg ccgaatgcag gcaagccctt ttgagcgtga 3721 gtcgccaaaa cggaagcaag atatacagcg ccgggacgtt cggtgccgtt gaagccccag 3781 actgccttga tggtgttagg gtccatatcc atggtttctg cgccgtagca ccagcaggga 3841 gtgactgtta aggtgatatc gactccctct ttgcggaatt tatccgcaca ggcggcggct 3901 tcggcaactc tgccgatggt ggtatctgca atgacgacct tgacaggttc gccattggaa 3961 tatttaaggt tttcttcaaa aagcttagcg gcacttttag ccatattcat agtctgctct 4021 tccaatgatt cgcgaacctt caatacgcct cttctgccgt caattgtggg tctgattccg 4081 attacgggat aatcgccgat aagtcttgac aatgccataa aaaaactacc tccggaatta 4141 tattttcaat ctgaaattgc tgatcgggtg tctatatttt gattttatca ctattttcca 4201 aataaatcaa taacattagc aatcggatac caaaaaaggt gaatacacat gtgtggaaat 4261 ttaattatcc ttttttgctt tttataattg acaatcagag taaaacagta taaattgtaa 4321 atgaggtgat actgtgatat atcagaagac ttttcaggcg gatgaactgc cgtcaaaggc 4381 gcatataagc tgttttaggt ataaaacaag ggatttcgac tattatccga tccattccca 4441 ctcatactat gagatatcat ttattgtcag cggcgaaaga tatttctatt ttaacggcga 4501 acaattaaaa atagataaaa atactctttt gttcgttcct ccgctggcgg cacacggcaa 4561 caaaaatatc accgcggtgg atgacattgt tttacagata tccgccaatc tttttaattg 4621 catatccgag ctttttgatt caaagatgtt cttcgcattg aaaaacgact cttgtgccgg 4681 catcgccctt gaggacggaa gcgaaatatc tgcagttatc aacagattgt atgatttgtg 4741 tgaccgaatt gacggaagct atgacgacaa gggcaccacc gataatgcgg ttatgcggga 4801 gcttgagcgc gactcgctgg ttttaaagct agtgtcgctg atgattgaat tcggattgat 4861 aaccgttaaa tcgggagtgt caagcctttc aaagctggga cttattgacg aactgatcaa 4921 ccgtttgatt gcaaaccctc acgataagat tgacatgacc gaagcagcga agtttgtggg 4981 tatgagctat agccatttca gtcggctctt taaagcgctt acaggcacaa actatgcaga 5041 atattgcaat attctgcgga ttcgccacgc agaagagctt ttgcgcgata caaatttgtc 5101 catcgcacag gtagcatatg ccattggtat tgatacgccc agctatttca cacgcctttt 5161 caagaacatc aacggtatct cccctgcgga atacagagca aagagatgat aaatcaaagc 5221 aaaaagagat aatacccaag caaattgttt tattgtgttc cctatggcaa tattatatca 5281 ttgttatagg gacattttat tttcccgaaa ccgtttccga aaggggcaat ggtaatgaaa 5341 aaagtgcttt taatactgtg catactggta ttttccctca cttgtctgtg ctcctgcgca 5401 ggagctaacc cgactgtaat gcgggatatt tccaccatga aattggtggc agagatgggt 5461 gtgggaataa atttaggcaa tacttttgac tgctcgggcg actggataag caaaaatgtt 5521 gaatcggtcg aaactgcctg gggcagtccc gttattacaa aagaaatgat tgaatgctgt 5581 gccgaggcgg gattcggagt aatgcgcttg cctgtaacgt ggggcacgct cgctgatgaa 5641 aattataacg ttgataagga ttttatgaaa cgcattaaag aggtcgttga ttggatcctt 5701 gacagcggaa tgtactgcat tttaaatacc caccacgacg gctggccgga aaagttcacc 5761 gaggactatg aaggcgcaat gaaaaagtat gaaaaccttt ggaagcagat tgcaaaggaa 5821 ttcaaaaact atgacgacaa gctgatattt gagtcgatga acgaggtcgg ctttgatgat 5881 atatggaatt cctatgcagg aaacgagggc aaggacgaag cattccgaat gttcaatgga 5941 atcaatcaga cctttgtcga tgttgttaga agctcgggcg gtaacaattc tcagcgccat 6001 cttttgattg cggcatattg gacatcaatc gagcgcgctt gcgacgattt gtttattctg 6061 cctgatgacc ctgcgggacg atttgcggtc tccgttcatt attacggtcc ctcaacgctg 6121 acgcttatca gcgaggatgt gagctgggga aaagccaaga ctacttgggg aagcgaagcg 6181 gattatgctg agcttactat gtggatgaat atgattgaag aagagctgat cgacaatggc 6241 attcccgttt tcatcgggga atacggctgc ttcggaaata ataaaacaag agaaacaaga 6301 acacaatata tgtatgacgt tgcaagctat gcatatttaa gaggcatctg cccgattctt 6361 tgggacaccc caggcggaga actcaaccgc gatcttgcaa ggtttatgga cgaagaattc 6421 attgaaaaac ttacagggat tcccta // LOCUS sequence021 6416 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence021 VERSION sequence021 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6416 /mol_type="genomic DNA" /organism="" /note="sequence021" CDS 3..800 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFTSAEVGFTKDASPASISETKGSFVFVKSADFEFGASAFMASVK GKGRIEVRLDDLANEPCAYIEFDNDEYTNVFSNNFAEFDGRMHHIYFVFSDENICLSDW SFIKAEDTPRAEENIREYINLDVNIEDYEEISLSEAVVTGSTPWNNGKDVAQKAVDGNV DTFFDGIEQGWLEIDLLAETEISVIGFAPRKGFIDRMVGGHFYGSNDGENWNEITSVKI LPKVGMNYVRLLRTEKYRYIRYSMPEGNNTMCNIAEIKLYKNK" /locus_tag="LOCUS_1420" /note="MGA_170" CDS complement(869..1963) /product="glycoside hydrolase family 5 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_086845922.1" /transl_table=11 /codon_start=1 /translation="MKNEKANGLTAAEVAREMGLGISLGNTFDAYSCTDCDKIYYEWIP TVGDNKPQDYETCWGAVPTTQKVINGMRDCGFNTIRIPVFWGNMMENDGTWTINEDFIE RVKEVVDYCEKAGVYSVINIHHFDEFIIRRNDLESCKEIFTTVWTQIAEYFKDYPHTVV FEGFNEYIGGNQFNEEGKLVEQGDSNAYLMAEVLNQAFVDAVRATGSNNADRVLIVSGY WTNIDKTTSDRFVMPTDTVEDRLMVSVHYVDNSMYWAKRIGTQEWLDYIDDQCDKLDRA FTEKGIPVFMGETSGGYPRENFGRNAIHTTSSECLEIVLNELFERGYVPVIWDTNNHFY SRTEYVINDKDNEAVIKRIVSNLK" /locus_tag="LOCUS_1430" /note="WP_086845922.1 glycoside hydrolase family 5 protein (Amycolatopsis kentuckyensis) [pid:28.3%, q_cov:98.4%, s_cov:92.2%, Eval:1.3e-32]" /note="MGA_171" CDS 2314..2916 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRKLIVKGRYLSFDDGEPFFYFGDTAWELFHVLDKDEAKHYFTER SRQGFNVAQAVALAEQGGLTVENAYGRLPLHFTDGTPDPTRPDTDGEYSYWDHVETIVL LGRKDIHERIKFDVNVEDLHGRASATATYPEIKAYVLEKFGLKVSNLYIAQIKEKCGLD KRENFNIGAGKSRPLICPPEKEQAIMDAFRHFGMIDT" /locus_tag="LOCUS_1440" /note="WP_000914581.1 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD (Streptococcus pneumoniae) [pid:50.0%, q_cov:50.5%, s_cov:19.0%, Eval:9.3e-21, partial hit]" /note="MGA_172" CDS complement(3025..3462) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTLSEKIVSLRKAHGWSQEDFAEKLYVSRQAISRWENGTALPDAQ NVLQISKLFGVTTDYLLNDDYESDKDIPAVQDATQKTECLISKKKRGHLIAAICFTVAT FCWLMVVSSNPGGIELGLSCFSLALCASSAVAQFVLFFKKK" /locus_tag="LOCUS_1450" /note="WP_011459857.1 helix-turn-helix transcriptional regulator (Desulfitobacterium hafniense) [pid:55.4%, q_cov:57.2%, s_cov:24.2%, Eval:9.8e-21, partial hit]" /note="MGA_173" CDS complement(3654..3917) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSEKGFILKEKLTYFKNYGVDIMPFDDFYPSGHRLCVTIIMHGNR VATCGDIRFEQTPGKWKPIPKQIDKKIDPAEPTLQITPRQIA" /locus_tag="LOCUS_1460" /note="MGA_174" ORIGIN 1 ctatgtttac aagcgcagag gttggattca caaaggatgc ttctcccgcc tcgataagcg 61 aaacaaaggg atcgtttgtt ttcgttaaga gcgctgactt tgaattcggt gcaagcgctt 121 tcatggcttc tgtcaagggc aagggtcgaa ttgaagttcg ccttgatgat ttggcaaatg 181 agccttgtgc ttatattgaa ttcgacaacg atgaatatac aaacgttttc tctaataatt 241 ttgccgagtt cgacggaaga atgcaccaca tttatttcgt cttctctgat gagaatattt 301 gtctttcgga ttggtcgttt attaaggcag aagacacccc cagagcagag gaaaatatca 361 gagaatatat caaccttgat gtcaacattg aggattatga agagatttct ctttcagaag 421 cggtcgtaac aggttctact ccttggaaca acggcaagga cgttgcccaa aaagcagttg 481 acggcaatgt ggacaccttc ttcgacggaa ttgaacaggg ttggcttgaa attgacttgt 541 tggcagaaac agagatcagc gttattggct tcgctccgag aaaaggcttt atcgacagaa 601 tggtcggtgg acacttctac ggttcgaacg acggtgaaaa ctggaacgag atcacttctg 661 taaaaattct tcccaaggtt ggaatgaatt atgttagact tctcagaact gaaaaatatc 721 gctatatccg ttactcgatg cctgaaggaa acaacacaat gtgcaacatt gccgagatca 781 aactttataa aaataaataa agtcttttgg ccaaattgga aaaaataata aaacagaccc 841 gatctctcgg gtctgtttta ttttgatatt atttcaaatt acttacgatt cgcttgatta 901 ctgcttcatt atccttgtcg ttgatgacat attcggttct cgaatagaag tggttgtttg 961 tatcccaaat aacgggaacg tatccgcgtt cgaacagctc attcaaaacg atctcaagac 1021 attcgcttga ggttgtgtga atagcgttac gtccgaagtt ttctctggga tatccaccgg 1081 aggtttcacc cataaatacg ggaattccct tttcggtgaa cgcgcggtca agcttgtcac 1141 actgatcgtc aatataatca agccattcct gtgttccgat tctttttgcc caatacattg 1201 agttgtcgac gtagtgaaca gaaaccataa gtctgtcttc aacagtgtcg gtgggcatta 1261 cgaacctgtc agatgtggtc ttgtcgatat ttgtccaata tcccgaaacg ataagtacac 1321 ggtcagcatt gtttgagcct gttgctctga cagcgtcaac aaaagcctga tttaaaacct 1381 ctgccatcaa atatgcatta gagtcgccct gttcaacaag ctttccttct tcgttaaact 1441 gatttccgcc gatatactcg ttaaagcctt cgaacacaac ggtatgagga taatccttga 1501 aatattctgc aatctgagtc caaaccgttg taaagatctc tttacagctt tcaagatcgt 1561 ttcttctgat gataaattcg tcaaaatgat gaatgttgat tacggaataa actcctgcct 1621 tttcgcaata atcaactacc tctttaactc tttcgatgaa gtcctcattg atggtccatg 1681 tgccgtcgtt ttccatcata ttgccccaga aaacagggat tctgatggtg ttaaatccgc 1741 agtcacgcat tccgttgatg accttctgag tggtaggaac agcaccccaa caggtctcat 1801 aatcctgtgg cttattgtcg ccgacagtgg gtatccattc atagtaaatc ttgtcacagt 1861 cggtacagct ataggcatca aaggtgttgc caagactgat tccaagaccc atttcacgtg 1921 ccacttctgc tgctgtcaat ccgtttgctt tttcattctt catagcaaca tcacccttcg 1981 cttcacaccc gacagataat aacatgcaac aaatcaaaac aaataaaagt attcttttca 2041 tttatgcctc caaattgatt attagaccaa cgtctacggt tattttacca tattacgtga 2101 agctgtcaag cacatgatgt gtagctttta ctgaaaattc caaaatttgt tttgcgaaat 2161 atagcaaatt gcaggacgtt gttttacgcg ctgatcttaa ttgatactat tctgtactcc 2221 cccgatgggt actgattcta tcgtaatatt ggggataacg gaaatgttaa ttaagaatca 2281 aataaaagaa aaatgattat ggagggattc cgaatgagaa aactgatagt taaaggcaga 2341 tatctttcat ttgatgacgg tgagccgttc ttctatttcg gcgacaccgc ttgggaactg 2401 tttcacgttt tggataaaga cgaggcaaag cattatttta ccgaacgctc ccgccaaggt 2461 tttaatgttg ctcaggcagt agcattagca gaacagggcg gtttaacagt tgaaaatgca 2521 tacggaagac ttcctcttca tttcaccgac ggtacgcccg acccgacaag acctgatacc 2581 gacggagaat attcctattg ggatcacgtc gaaactattg ttcttttagg tcggaaagat 2641 attcacgagc gaataaagtt tgatgtaaat gtggaagacc tgcacggtag agcatccgct 2701 accgctactt atcccgaaat taaggcatat gtcttggaaa agtttggtct aaaagtttcc 2761 aatttgtata ttgctcaaat caaggaaaag tgcgggttag acaagaggga aaactttaat 2821 attggagcgg gcaaaagcag accgcttatt tgtccacccg agaaagaaca agcaatcatg 2881 gatgcattcc gccattttgg tatgattgac acctaattcc tttgtttctt ttggatgaat 2941 tctatattcc taaaatgctt aaagcagggg cgaaagcccc tgctttaact gttcgacata 3001 ttgggatttg ttgtgcagaa agttttattt tttcttaaaa aacaaaacaa actgtgcaac 3061 cgcactactt gcacaaagtg ctagggaaaa gcaggaaagc cccaactcga taccgcctgg 3121 attagatgat acaaccatca gccagcaaaa tgtcgctact gtaaaacaaa ttgcagcaat 3181 caaatgtcct cgtttctttt ttgaaattaa acactctgtt ttctgtgttg catcttggac 3241 agcgggaata tccttgtcac tttcataatc atcatttagc agataatctg ttgtaactcc 3301 gaacagcttg ctaatctgca atacattctg tgcatcaggc agtgctgttc cattttccca 3361 acggctgatt gcctgccgtg aaacatacag tttttccgca aagtcttcct gtgaccatcc 3421 atgtgccttc ctaaggctaa ctattttttc tgacaatgtc atcgtaaaac ctccttggtt 3481 gtgatgcatt catgataaga aaaagcactc acgaacacca ccacatcaac tttacatttc 3541 cgcaacatga ctttacatgc tgtcaaattt aagtttgtcg aactgattat atcacagaca 3601 caacaaattt tcaatcatcc agcactaatt ctgccaaggc actaaaaaag tggtcaggca 3661 atctgtcttg gggtgatttg gagtgttggt tcggcagggt caatcttttt atctatctgc 3721 ttcggtatag gcttccattt ccccggggtc tgctcaaagc gaatgtcacc gcaggttgca 3781 acacggttgc cgtgcataat tattgttaca cacaaccggt gccccgaagg atagaaatcg 3841 tcaaacggca ttatatcaac accgtaattc ttaaaatagg taagtttttc tttcaaaatg 3901 aaaccttttt cagacacgat tcatcgctca ttttatcaca agtgtatcat ttcatcatgc 3961 ataaatcagt attttattat tgtttcatat ttttatattg cctaccgcaa aaaagattga 4021 tatatcttga ttttaagacg atatatgccc tttttgttct atagttaggc ctttcactat 4081 tgactacaaa aatttataat gttataatta tgacatataa aggaggtatg gcaaatgctt 4141 agcagagatt ttaataaagg gtggcaattt ttaattgacg gtaaaaccga agaggttacc 4201 cttcctcacg actttatgat tgggaccgat aggacagcca attcgcctac aggtgccgac 4261 tacggcttct tccagccttg caaaggtacg tatattaagc acatcgaaaa agatccttct 4321 gcctcgaaac attttattaa gttcgacggc gttatgggac ttaccgaggt gttcgttaac 4381 ggcgaccttg ttaaattcca tccttatggt tacaccgcat ttatttgcga tatcagcgat 4441 tttttgcatg atggtgttaa cgagctgaag gtcaatgtcg atgctaccgc acagcccgca 4501 tcacgttggt ataccggcgc aggtatatat agagatgttg agcttttaac ctctgacagt 4561 gactatattc agccttggtg cgttgtaata actgttgata agatcgacaa caacaatgct 4621 tatgtaacag ttgacgttga catttttgca tctgcacgca gcgaagctga aataagcata 4681 aacgttcctg aaataaatca tatcacttct cgcagcacct ggcttgaaga gggcgataac 4741 catttcagct ttaagacaat acttcacaat attgagcgtt ggacattgga atcccctgtt 4801 ctttattccg cagaagtaat actgaagact gagaactctt tggacaagga aactattaac 4861 atcggtatca gagagattgc ttgtgaccct gaaaaaggct tcttgcttaa cggcgaaccg 4921 gttaagcttt acggtacctg caatcaccac gacaacggaa ttgtcggtgc gtcatcatac 4981 cgctctgcag aagaaagacg tgtaagaata cttaaggaaa acggctttaa tgcaatcaga 5041 tgcgctcata atccgccgtc aaaaatgctt ttggatgtct gtgacagaat gggtatgctt 5101 gtaattgacg agatttttga ctgctgggtt gcaggaaagc gtcctcatga ctatcacctt 5161 tggtttaatc aatatgccga agaggatatc acagcaatgg tcaagcgtga cagatgtcat 5221 ccctctgttg ttatgtggtc aacaggtaac gagatttatg aacgcggcgg aatgaacaac 5281 ggatactatc ttggaaagat gatcgcagtt accatccgca agcatgacaa aacaagattc 5341 cttactcatg cgttctgcca cttctgggac aactgggaat ttagcaagaa aatggaagaa 5401 acagcagact atcccgctga caagcttgac ttctggtgtg aaaagattgg tcctcaagca 5461 ggaaatcttg atgtcttggg atataactac ctcacccatc gaatggaaaa ggatgtacga 5521 cgtttccctg agcacttgtt tgcagtaaca gaatcatatc ctttggatgc cgtttggaca 5581 aagcatttga tggatgctct gcctcagctc gttggtgaat ttgtatggac aggttgggac 5641 tatttcggcg aaacgggtat cggtcacatt acttatgaca ccgattcggc acccggttgg 5701 ggacttacac ctcatccgaa ccacatttcc gactgcggag actttgacat ttgcggattt 5761 aagaaggctc cttcatatta ccgcgatgca gcttggtatg aaggttctgt acatattctt 5821 tctgccgacc ccgacaacta tggcagaaaa tacagcattt cttcctgggg attctataat 5881 gttgaccgca cctggacata ttcgggcaag gaaggcaaaa tgacaaccgt tcatctatat 5941 accacagcgc ccgaatgtga gcttttgcaa gacggaatat cgcttggcaa aaaggctcct 6001 aactataaag gtgttgctga attcgaggtt gaatataagc ccggtaagtt agaggctttg 6061 tcatatgaaa atggcttagt cgttggaaag gatgagcttt taacagtcgg aagtgcaacc 6121 aatatgacaa ttgaagttga cctcacaggc gaaagcggaa aggctgaccg tgtctatgcc 6181 gaaatcaccc tgcgtgacga aaacggaaac cccgcttggg aagcaaacga tgaagttact 6241 gttacggtta agggcggcaa ggtattggga acaggctcgg gcagagttga tgacgagcac 6301 atttatacct ccaatgtctg ctccgtttat cacggcaagc tcctcgcagc aattattcct 6361 ttggaaaatg acattcagat atttgcatcc actgaaaacc tgaacgctga atgcaa // LOCUS sequence022 6300 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence022 VERSION sequence022 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6300 /mol_type="genomic DNA" /organism="" /note="sequence022" CDS 472..1317 /product="16S rRNA (cytidine(1402)-2'-O)-methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963630.1" /transl_table=11 /codon_start=1 /translation="MASKLYVVGTPIGNLGDMTYRAVETLKNVDFIAAEDTRVSVKLLN YFDIKKPLVSYHEHNHKYSGENIINRIIAGESCAVITDAGMPCISDPGEDLVRLCAENN IPVEVVPGPSALISALAVSGLDTSKFAFEGFPSTAKRSRYEMFATCVNDPRTLIFYEAP HKLVATLNDLLKFFGDRKITLCRELTKIHEEIIRTTLAEAVNLYDDDKHQPRGEYVLVV EGAKETVEEVTEESALEQVKSLVAKGMRGADACREIAKTSGISKSELYAMLLESQKGEK " /locus_tag="LOCUS_1470" /gene="rsmI" /EC_number="2.1.1.198" /note="WP_010963630.1 16S rRNA (cytidine(1402)-2'-O)-methyltransferase (Clostridium) [pid:50.2%, q_cov:95.0%, s_cov:96.1%, Eval:2.6e-69]" /note="MGA_177" CDS 1314..1754 /product="ribosomal protein S18-alanine N-acetyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010880336.1" /transl_table=11 /codon_start=1 /translation="MIIREMRVPDVGAVLDIEKTCFTADAWCEEDFEYRFDDDGFVNLV CEDMGKVVGYITTGYVLGELSIDSVAISPEYRRKGIAKKLIERAIQKTDPDVVLLEVRK SNVPAISLYESLGFEKVGLRRDYYQCPTEDAILMTLSIRELK" /locus_tag="LOCUS_1480" /gene="rimI" /EC_number="2.3.1.266" /note="WP_010880336.1 ribosomal protein S18-alanine N-acetyltransferase (Aquifex aeolicus) [pid:43.7%, q_cov:95.9%, s_cov:91.6%, Eval:9.1e-22]" /note="MGA_178" CDS 1770..2780 /product="tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex transferase subunit TsaD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357496.1" /transl_table=11 /codon_start=1 /translation="MRILAIESSCDETAASVVEDGVKVLSNIVASQIEEHKLYGGVVPE IASRRHTENICGVVKEALEVAQCSMDDIDAVAVTYAPGLIGALLVGVSYAKGLAYASNK PLVPVHHIAGHIAANYISHPELKPPYLCLVVSGGHSHIVEVLDYTRFNVIGRTRDDAAG ECFDKVARTLGFPYPGGKYIDDAAKKGNKSAYKFPHPKLSGNEYDFSFSGIKTAVINLV HNSAQKSEEINKEDVAASFQKTVADILVEKLMTAASNLGYTEIALAGGVSANSGVRNKL KKECDKRGYNLYMPEFKYCGDNAAMIGAQGYHDYMAGKRADASLNAVATLSLEEI" /locus_tag="LOCUS_1490" /gene="tsaD" /EC_number="2.3.1.234" /note="WP_003357496.1 tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex transferase subunit TsaD (Clostridium botulinum) [pid:56.7%, q_cov:99.7%, s_cov:98.5%, Eval:6.9e-107]" /note="MGA_179" CDS 2786..3676 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKFAKLLSLLLALVLMLGLCACDEIGDNTPVDTTDKTDTPPVKEP YPISFGNETFESCPESVVSLSPALTDILMHIGVTDKVVGISEYCSLPGLDVETIGSPAN PDLEAIIALKPELIITLSPIASTDKITLEKAGIRTLEMSSPKSYGELCEIYINLSMVFY GAVDSKDIAYDALSPLDAALMEAKNLAFNKSFICIEGTYRDGLVVSGMDTLEDDLFSVF GTNLLADYDSHFIHEEICGELEPDVVFLYDNVDNDGIEELFEDADIVYISASALERPTA ELYSVIISSIEDIKG" /locus_tag="LOCUS_1500" /note="WP_004082604.1 cobalamin-binding protein (Thermotoga maritima) [pid:30.1%, q_cov:45.9%, s_cov:43.1%, Eval:5.4e-12, partial hit]" /note="MGA_180" CDS 3813..5057 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLLCIFLALTMVLSLVGCGKQIDDNPPPVSDDNPGVSDTDTPT EDETPDQPIENQWNYDFDGAFIEENGLEYIWAQLDEQTRIALGEVMNAIKNVEIYCSLS RGIPTEGSEEFLKLVSFCSMAYTYESNVFRRHTDENGKVIGITLNYNVNYEEEAHTRTQ ELDSAINEIISGMPDGSDYDKIKYLHDALILKCDYSENAVSPFTAYGALVEGRATCQGY ADAMHLLLSRAGYETCFATGIGESEAVTHKWNYVLVGDDWYIIDPTWNDPEGEEDKSYI NYDYLFISEEVLLTDHKETFDSPYYDFPLADSMELNYHIVNGYYAEDYEQLKEIVKGQV EACVANGTKYIYVRCANQEVFDLANSKLFSGDCEMQKILIEVKDATDANIRTNSWVKVT DEGPKTLTITLKYED" /locus_tag="LOCUS_1510" /note="WP_011948155.1 DUF5050 domain-containing protein (Clostridium botulinum) [pid:33.2%, q_cov:45.2%, s_cov:37.2%, Eval:1.0e-20, partial hit]" /note="MGA_181" ORIGIN 1 cgtcgaatgc cgatgagata attcccgttc acgcagattt gaaaacttgg cgcgcaccca 61 agcaggtgga tttaatcacc tgcaacccgc catataaaat tgacaacacg ggcgcaaaga 121 acgatacgga agcggtatcc atcgcgcggc acgaaatgct ttgcacgatt tatgacgttt 181 gcgaggcggc aaagaaaaat ctcaaattcg gcggcagact ttgcatttgc aaccgccccg 241 aacgcctggc cgactgcatt gatgccatgc gcaaaaacgg aatcgagccg aagcgtctgc 301 gctcggtgca taaggataaa caaagcgatg catggcttat tctcattgag ggaatgatgg 361 gcggtgcgaa gtttatgaag gttgaaaagc cccttattgt taaaggcgaa aacggcgaaa 421 gctattcgga tgaaatgaag aggatatata aactttaatt tggaggatat aatggcaagc 481 aagctttatg ttgtgggaac acccatcgga aatctgggag atatgaccta ccgcgcggtt 541 gaaaccctta aaaatgtaga tttcatcgcc gcggaggaca caagagtttc cgtcaagctc 601 ctcaattatt ttgatattaa gaagcccctt gtgagctatc acgagcacaa ccacaaatat 661 tcgggagaaa atatcatcaa ccgaattata gcaggggaaa gctgcgctgt tatcactgat 721 gcgggaatgc cctgcatctc cgacccgggc gaggacttgg tgcgcctttg cgcggaaaac 781 aacattcccg ttgaagttgt gcccggaccc agcgcgctga tttcagccct tgctgtttcg 841 ggacttgata catcgaagtt tgcatttgag ggcttcccct caaccgcaaa gcgctcgcga 901 tatgagatgt ttgccacgtg tgtcaacgac cccagaacgc ttatattcta tgaggcaccc 961 cacaagctgg tggcaaccct taacgacctt ttgaaattct ttggcgacag aaaaatcacc 1021 ctttgccgtg agctgactaa gattcacgag gagattattc gcacgaccct tgcagaagcc 1081 gtcaatttat atgatgatga caagcatcag ccgagagggg aatatgtttt ggtggttgaa 1141 ggcgcgaagg aaactgttga agaggtcaca gaagaatcgg cccttgagca ggtcaagagc 1201 cttgttgcaa agggaatgag aggcgccgat gcctgcagag agattgcaaa gacctcgggg 1261 atttcaaaga gcgagctata tgcgatgctg cttgaatcgc agaaaggcga aaaatgatta 1321 taagagagat gcgtgtcccc gatgtggggg cagttctgga tattgaaaaa acctgcttca 1381 cagcggatgc ctggtgtgag gaggattttg aatatcgttt cgatgatgac ggatttgtta 1441 accttgtctg cgaggatatg ggcaaggtcg tcggatacat caccacggga tatgttttgg 1501 gggagcttag catcgacagc gttgcaatca gccccgaata ccgccgaaaa ggcattgcca 1561 aaaagctgat tgaaagggca attcaaaaaa ccgatcccga tgtggtgctt ttggaggtgc 1621 gaaaatcaaa tgtgcctgca atatcgcttt atgaatccct cggatttgaa aaggtcggat 1681 taagaaggga ctattatcag tgcccaaccg aggatgcaat acttatgacg ctgagcataa 1741 gagaactgaa ataagaaggt agattaaaaa tgagaattct tgccattgaa agctcctgcg 1801 acgaaactgc cgcttcggta gttgaggacg gagtcaaggt attatcaaat atagttgctt 1861 cgcagatcga ggagcataag ctatacggcg gagttgtccc cgaaatcgct tcccgcagac 1921 ataccgaaaa catctgcgga gttgttaaag aggcgctcga agttgcacag tgctcgatgg 1981 atgacattga tgctgtcgct gtgacatatg ctcccgggct tatcggcgcg cttttagtgg 2041 gtgtcagcta tgcaaagggc ttggcatatg cttcaaacaa gccgcttgtg cctgttcacc 2101 acattgcggg acatattgcc gcaaactata tcagccaccc cgagctgaaa ccgccttatt 2161 tgtgccttgt tgtcagcgga ggacacagcc acattgtcga ggtgcttgat tacacccgtt 2221 tcaatgtgat cggccgtacc cgtgacgatg cggcgggcga gtgcttcgac aaagttgcgc 2281 gcaccctcgg cttcccttat ccgggaggca agtatattga cgatgccgcg aagaagggca 2341 acaaatcggc atataaattc ccccacccga agctgtcggg aaacgaatat gatttcagct 2401 tctcgggaat caagactgcg gtcataaatc ttgtccacaa ttccgcgcaa aaaagcgagg 2461 agattaacaa ggaagatgtt gcggcatcct tccaaaagac cgttgccgac attttggttg 2521 aaaagctgat gacggcggca tccaacctcg gttacaccga aattgccctt gcgggcggtg 2581 tttccgccaa ctcgggagtg agaaacaagc tcaaaaaaga gtgcgataag cgggggtata 2641 atctttatat gcccgagttc aaatattgcg gcgacaatgc cgcaatgatc ggcgcacaag 2701 gctatcacga ttacatggcg ggcaagcgtg cggatgcttc gcttaacgcc gttgcgacac 2761 tttccttgga ggaaatataa aaacaatgaa atttgcaaaa ctattatcac ttttgctggc 2821 gcttgtgctt atgctcggcc tttgcgcctg cgatgagatc ggcgacaaca cccctgttga 2881 caccaccgac aagacggaca cgccccctgt caaggagccg tatcccataa gcttcggaaa 2941 tgaaaccttt gaatcatgcc ccgaaagcgt tgtcagcctt tctcctgcgc tgaccgatat 3001 tttaatgcat atcggcgtga ccgataaggt cgtgggcatc agcgaatatt gctcgcttcc 3061 gggactggat gttgaaacta tcggaagccc tgcgaatccc gaccttgagg cgataatcgc 3121 cttaaagccg gagctgatta tcaccctttc gcccattgcc tcgacagaca agataaccct 3181 tgagaaggcg gggatcagaa cccttgaaat gtcttcgccc aagagctatg gcgagctttg 3241 cgagatatac ataaatctct cgatggtctt ttacggcgcg gttgattcaa aggacattgc 3301 atatgatgcg ctttcgcctt tggatgccgc acttatggag gctaaaaatc tggcatttaa 3361 caagagcttc atttgcattg aggggacata tcgggacgga ttggtcgttt cgggcatgga 3421 caccctggag gatgacctgt tttctgtatt tggcacaaac cttttggcgg actatgacag 3481 ccatttcatc cacgaggaaa tatgcggtga gcttgagccg gacgttgtgt tcttatatga 3541 caacgttgac aacgacggaa ttgaagagct tttcgaggat gcggacatcg tttatatatc 3601 agcatctgcc cttgagcgac ccaccgccga actttattct gtcattatta gcagtataga 3661 ggatataaaa gggtaaataa gggaattttg taattattct gttattaaca ttggatgttt 3721 ttcaaagtat tatttaatag tgcaatattt acgacagcaa agttgtttta tataaggtaa 3781 gaatgttttt gtttatgaaa ggaataatgc cgatgaaaaa gcttttatgt attttcttag 3841 cgctgacaat ggttttgagt cttgtcggat gcggcaagca gatcgacgac aacccgccgc 3901 ccgtaagcga tgataacccc ggcgtcagcg acaccgatac cccaacggag gatgaaaccc 3961 ccgatcagcc gatagaaaat cagtggaact atgattttga cggcgcattt attgaagaaa 4021 acggccttga atatatttgg gcacagcttg acgagcagac cagaatcgcc ttgggcgaag 4081 ttatgaacgc aattaagaac gttgaaattt attgctcgct cagccgcgga attcccaccg 4141 aaggctcgga ggaatttttg aagctcgttt ccttctgctc aatggcttat acatatgaga 4201 gcaacgtttt ccgcagacat accgatgaaa acggcaaggt aatcggaatt actcttaact 4261 ataacgtcaa ctatgaggaa gaagctcaca caagaaccca agagcttgat tccgcaatca 4321 acgaaataat ttcgggtatg cccgacggca gcgattacga taagatcaag tatctgcacg 4381 acgctctgat cttgaaatgt gattacagcg aaaacgctgt cagccccttc accgcctacg 4441 gcgcattggt tgagggcaga gcaacctgcc agggatatgc agacgctatg catcttttgc 4501 tttccagagc gggatatgaa acctgctttg caacgggtat cggcgaaagc gaagcggtga 4561 cccacaagtg gaactatgta cttgtaggtg atgattggta tatcatcgac cccacctgga 4621 acgaccctga gggcgaagag gacaagtcat acatcaacta tgactacctg ttcatcagcg 4681 aagaagttct gttgaccgac cacaaggaaa cctttgacag cccttattac gattttcctt 4741 tggcagacag tatggagctc aactaccata ttgtaaacgg ctactatgcc gaggattatg 4801 aacagctgaa ggaaattgtt aagggacagg ttgaagcttg cgttgcaaac ggcaccaagt 4861 atatctatgt cagatgtgct aaccaggaag tgtttgacct tgcaaactcc aagctcttca 4921 gcggcgactg tgagatgcaa aagatcctca ttgaggtcaa ggacgcaaca gacgcaaaca 4981 tccgcacgaa ttcatgggtc aaggtgactg acgaaggacc taagactctc accatcaccc 5041 ttaaatatga agactgacaa tattaaatcg gaggttatac agtaatgaac aagttcagaa 5101 gaatttcggc tttgcttttg gcaatgctga tgaccgtcac aatgctcgct tcctgcggaa 5161 acatcgagga aaagccccct gttgatgatg tacccggtat cgtaacagag gatcccgttg 5221 ttaccgagcc ccctgtgacc accacagagc ctactaccga ggcaaccacg gagcctacta 5281 ccgaggcaac aacagaagct accactgagg caacaacaga agctaccacc gaagctacaa 5341 ccacagaagc taccacaact gaggataaga atgcatatac cgttgaagaa atgaacgagc 5401 ttatgtatgc tacaacctct gttaacgtaa gaaaaggccc ctctgttgat ttcgacagaa 5461 tcggccattt ggatgaaggc gaagctgtaa ccgttacagg cagagcatcc accggatggt 5521 atagaatcgt tcttgacggt gaggaaggct ttgtttccaa cctttacctc tctgacgaaa 5581 agcctgaaga ggaagctacc aagcctgctg aggatgaaga ggacattgta attgaagaac 5641 ccgatgatga agacattgta attgacgacg atgtcaccgt taccgccggt gactgggttg 5701 aagaaaacgg ctggagctat atgtataatg ccctctataa ggatgaatat cgacaggctc 5761 tcaacgaaat tatgacaggt attcagaatt tggatgaaga gatttatctg acacctctta 5821 ttgaaaaaaa tgaaattagc gatttcatta acttgatcat gcctattttg acagtgaaat 5881 attgttatta cgacaatctg gatacaaaaa ctaatgatca gggtcaaaaa gtgctcaatt 5941 tcacaacata cagcacaggt catctcagat cgattagagt gacctactat gttgacacca 6001 aggctgaggc tgtgaagatg atgaatgagc ttgatgacgc agcaaacaag gttgtaaaga 6061 agctttcaag ctctatgtcc gattacgaaa agatccttta cttgcacgac tggatcgttg 6121 taaactccgt tcccgacaag gaaaatgtcg gcggcaagtg ggcaaacacc gcttacggct 6181 ctatcgttga cggcgagcct acatgcttgg gctatgcaaa gggtctcttc tacttgctcc 6241 acaaggcagg ctttgaagat atcaccatgg caattggcga aggctccaag aaaaacgtaa // LOCUS sequence023 5973 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence023 VERSION sequence023 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5973 /mol_type="genomic DNA" /organism="" /note="sequence023" CDS 349..1416 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKDYGFGNFLNELRKRRGLSQYQLGMLVGVSDKAVSKWENGTSKP QSSILFKLSEVLGVSVDELLACKYRSEDIRKTKGVFAMKKEIYKQVHQRLHNQYGETPP IEVINRYLSEMQELDGTDMIIWFDFLGKLREYAKSFGEHIRLGGGIGSSFAAYVCGATE INPLMPHYYCPKCKKVEFDRSVDDGWDLAEYKCVCDEKMLHDGHNIPFETYRHVFVKNA SFDIAVSPDFIEQAKEFAKKHFKDCKLIKIKRDMKKEMYSFVVMPKSESIADDVVLTIH EYYDRFCDYPLFNICVNGDMKRLKQIESLTNVSCEHVDFCEPAIVDEFKKGNTDGIPEF RIDFFKDMISQAQQN" /locus_tag="LOCUS_1520" /note="WP_002382781.1 PolC-type DNA polymerase III (Enterococcus) [pid:33.9%, q_cov:45.4%, s_cov:11.4%, Eval:2.2e-18, partial hit]" /note="internal stop codon at [1414:1416](+)" /note="MGA_183" CDS 1606..1908 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEDTRRGVYARKGVSDELRKQLADIGMDEWFADSIAKIKYLFPKA HGVLYVKYAAMLMWYKVHYPKEFEKCMKYSVPCPNLDRGCFLWVKKCCIAIQTLI" /locus_tag="LOCUS_1530" /note="WP_004081285.1 DNA polymerase III subunit alpha (Thermotoga maritima) [pid:44.1%, q_cov:68.0%, s_cov:4.7%, Eval:4.2e-12, partial hit]" /note="internal stop codon at [1414:1416](+)" /note="MGA_184" CDS 1944..2534 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEQCFDKVKIRGLKKSDIDDIVRWNTFETKWMTLTRPWYKPEPID DKAFREYLLDLAKNEPMIDFQPEVEYNGVNIGRCRAHFIDGKGKFSVLEDVGVKQIYIA LEIFICEPAYMNEDVCAKATAAYAEYLAGKVHGTIFAQTWSGNGIMMDACKRVGFSEHC VTVKESDTSDESFEIVTFKLDLDKFARFKEEYR" /locus_tag="LOCUS_1540" /note="MGA_185" CDS 2531..3502 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRIIALVLACVMVGAMLCACSIDLSDYDIEFGSYYRYENANKYT AGNGSAKNVSEIDIDWISGDVTIEYSSDVSEVEFSESYEKDIDSELKMRWWVDGETLKI KFAESNAKLIGELRKTLTVEVPYELAGISITTVSANITTEVITAEEAEFDTVSGNITTP MCFYKEVDADSVSGDIHIQTNADADIDIDTVSGHVTVLSGIKDLSVSTVSGNAEVYSYS ADYDAEFDTTSGDVIIHVMENTGLELEFETVSGDFESDIEISYKDGKYKRGDKGAKFDV DTVSGNCTVRLYDPSQEEGPIAAPSAPNFGEADESSAGAGRN" /locus_tag="LOCUS_1550" /note="MGA_186" CDS 3732..4133 /product="RNHCP domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003436247.1" /transl_table=11 /codon_start=1 /translation="MSNYKDKRNFISTPCNDSFTCRFCGAKVTPENAGTTQRNHCPVCL MSVHLDNEPGDREADCGGLMEPIAVWVRNGGEWAIVHRCKRCGKLSSNRVAADDSPLKL MSVALKPLSEPPFPIESIRELNELLSDSK" /locus_tag="LOCUS_1560" /note="WP_003436247.1 RNHCP domain-containing protein (Clostridioides difficile) [pid:61.3%, q_cov:91.7%, s_cov:93.2%, Eval:5.1e-42]" /note="MGA_187" CDS complement(4181..4846) /product="nitroreductase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003813444.1" /transl_table=11 /codon_start=1 /translation="MTQLEAIRSRHSVRQYKDQPIEPELRALLCEEIEEINAESRLNIQ LICDEPKAFDSFMAHYGNFTGVRNYFAIAYKKGEDAQEKIGYYGERLVLFAQMLGLHTC WVALTYKRMPDVIKISKDEKLSLVISVGHGRNRGVAHKSKPISTLAPNYDSSPEWFKNG VDAALLAPTATNQQKFTLTLEGDKVKAKAGLGFYSKMDLGIVKYHFEIGSGKDSSIWA" /locus_tag="LOCUS_1570" /note="WP_003813444.1 nitroreductase family protein (Bifidobacterium bifidum) [pid:36.6%, q_cov:96.8%, s_cov:97.0%, Eval:2.3e-34]" /note="MGA_188" misc_feature complement(5080..>5973) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011861512.1:sensor histidine kinase" /note="WP_011861512.1 sensor histidine kinase (Clostridioides difficile) [pid:44.4%, q_cov:99.3%, s_cov:43.0%, Eval:3.1e-68, partial hit]" /note="MGA_189" /locus_tag="LOCUS_1580" ORIGIN 1 atacagctca gcgcccgctt gtggcggggc gtctcattga cggtcgtttc ggtcctagct 61 atgtcatcct ttcccaatgg gcctgtatca gcgccccaga aattcaccgg caaaccggcc 121 taactgtgcc agtccctttt ccatcgccgc gtcagtgggg gtggagaaat tcagccggaa 181 ggccaggtca gcgcaagaga aattgcaaag gcaaatatgg cgaagtgaat atgacattgt 241 cccccacacg tatggatggg ggattttttc taccgcaggt agatatctta catattgaac 301 atccacgtaa aaatgctata atgtaattag caagcaacgg aggatgttat gaaggactat 361 ggttttggta attttctgaa tgagctgaga aagcgtcgtg gcctgtcgca atatcagctt 421 ggtatgctcg tcggcgtttc cgacaaagct gtttccaaat gggaaaacgg cacatctaaa 481 ccgcaaagca gtattctgtt taagttgagc gaggttttgg gagtatcagt cgatgagctt 541 ttggcttgca aataccgttc cgaggatatc agaaagacaa aaggagtatt tgctatgaaa 601 aaagagatat acaaacaagt ccatcagcgg ttacacaatc agtacggcga aactccgccg 661 attgaggtta taaaccgata tttaagtgag atgcaggagc ttgacggcac ggatatgatc 721 atctggtttg attttctggg caagctcaga gaatatgcaa aaagttttgg cgaacacatc 781 cgccttggcg gcggaatcgg ttcgtcgttt gcggcatatg tctgcggtgc aacggagatc 841 aaccctctta tgccccatta ctactgcccg aaatgcaaaa aggttgagtt tgaccgcagt 901 gttgacgacg gttgggactt agctgaatac aaatgtgttt gcgacgaaaa aatgcttcat 961 gatgggcata acataccatt tgaaacatac cggcacgttt tcgtcaagaa cgcaagcttt 1021 gatattgccg tatcacccga tttcattgaa caagcaaagg agtttgccaa aaagcacttc 1081 aaagattgca agctgattaa aataaagcgg gatatgaaaa aggagatgta ttctttcgtg 1141 gtgatgccga aatcggaaag tattgcagac gatgttgtgc tgacgattca cgaatactat 1201 gacagattct gtgattatcc gttgtttaat atatgtgtta acggagatat gaagcgatta 1261 aaacaaattg aatcgctgac gaatgttagc tgtgaacacg ttgatttttg cgagcctgct 1321 attgttgatg aattcaaaaa aggaaatacc gacggcattc ccgaattcag aattgacttc 1381 tttaaggata tgatttcgca agcacagcag aactaattcc gcgacctgat taagctttcg 1441 ggattatccc acggcacggg cgtttggacg gataatgcgc aagagttaat tgagagcggc 1501 attgaagtcg gtaaggttat agcatatcgt gatgatgttt ttaactacat acaggaaaaa 1561 ctcacgcaaa ggggcatttc aaacacggga tatgcctgca aaattatgga agatacacgg 1621 cgaggtgttt atgcaagaaa aggcgtgtcg gatgagttga gaaaacaact tgccgatatc 1681 ggaatggacg aatggtttgc cgattccatc gcgaagatca agtatctgtt cccaaaggca 1741 cacggcgtgc tgtatgtgaa atatgccgcg atgttgatgt ggtacaaagt acactatccg 1801 aaagagtttg aaaagtgtat gaagtacagt gtcccctgtc cgaatttgga cagggggtgt 1861 tttttgtggg tcaaaaaatg ttgcatcgca atacaaacgc tgatataata tagttagtgg 1921 ctttgaagga gatgattacg gatatggaac agtgctttga caaagtaaaa atcagaggtt 1981 tgaaaaagtc tgatattgac gacattgtgc gttggaatac atttgaaacc aagtggatga 2041 cgcttacacg tccgtggtat aagcctgagc cgattgacga taaagctttt cgcgaatacc 2101 tgcttgattt ggcaaaaaac gaaccgatga tcgactttca gccggaagtt gaatacaatg 2161 gagtgaatat cggcagatgc cgcgcacatt tcattgacgg aaaaggaaag ttttcagttc 2221 ttgaggatgt cggagttaag cagatataca tagcgttgga aatattcatc tgtgagcctg 2281 cttatatgaa tgaagatgtc tgcgctaaag cgacggcggc atatgcggag tatctggcag 2341 gcaaagtaca cggcacaata tttgcccaaa cttggtcggg caatggaata atgatggatg 2401 cttgcaagcg ggtcggattt tcggagcatt gcgtgacggt gaaagaatca gatacaagcg 2461 atgagtcatt tgaaattgtg acattcaagc ttgatttgga taagtttgca aggtttaagg 2521 aggaataccg atgaaaagaa ttattgcttt agttttggcg tgtgttatgg tcggagcgat 2581 gctttgcgct tgctcgattg atttgagcga ttatgacatc gaattcggat cctattacag 2641 gtatgaaaat gcgaataaat acaccgcagg aaacggttcg gcaaagaatg tttccgaaat 2701 tgacattgac tggataagcg gagatgttac gattgaatat tcgtcggatg tgagcgaagt 2761 tgagttttcc gagagctatg aaaaagatat tgacagcgag cttaaaatgc gctggtgggt 2821 tgacggcgaa acgcttaaaa tcaagtttgc agagtcgaac gcaaaattga tcggtgagct 2881 tagaaaaacg cttacggttg aagtgcctta tgaacttgcg ggaataagca ttaccacagt 2941 atccgctaat attacaacag aagtgataac tgcggaagaa gcggaatttg acactgtttc 3001 gggtaacatc actacaccga tgtgcttcta taaggaagtt gatgctgaca gcgtttcggg 3061 cgatattcac attcagacaa atgctgacgc cgacattgac atcgacacag tttcgggaca 3121 tgtaaccgtt ttgtcgggca tcaaggatct gtcggtcagc acagtcagcg gaaatgcaga 3181 ggtttattca tacagcgctg attatgacgc ggaatttgac actacttccg gcgatgttat 3241 aattcacgta atggagaata caggtcttga gcttgagttt gaaacggtca gcggcgattt 3301 tgaatcggac attgagatta gctataagga cggaaaatat aagcgtggcg ataagggtgc 3361 aaagtttgat gttgacaccg tttcgggcaa ctgcacggta aggctttacg acccgtcaca 3421 ggaagaaggg cctatcgctg ccccgagcgc acccaatttc ggcgaagccg atgaatcaag 3481 tgcaggcgcg ggcagaaatt gatagatatt ccaatgagaa aggaagtatg atgttatgat 3541 tgagtcaagg aggaggagca ctcggatttg atttcaggct tgacctgaac atttcattta 3601 agaaaggaga attgttttat gactaaattc aatacgagga aggacattgt ataactgcgg 3661 gaggtttgct taaaatcttt tcgcaaatcc tcccataggt ttacaaatga aactacggag 3721 gataacacaa tatgtcaaat tataaagata aaagaaactt catttcaaca ccctgcaacg 3781 acagctttac atgccgattt tgcggagcaa aggtaactcc cgaaaacgca ggaacgacac 3841 aaagaaacca ctgccccgtt tgccttatga gtgttcattt agacaacgaa ccgggagata 3901 gagaagctga ctgcggaggg cttatggagc cgattgcagt gtgggtcaga aacggcggtg 3961 agtgggcaat cgtgcacagg tgcaaaaggt gcggaaagct ttcatccaac agagttgccg 4021 cagatgacag ccctttgaaa ctgatgtcgg tggcgctgaa gcctttgagt gagccgccat 4081 tccccattga gagtatcaga gagctgaacg agcttttatc tgatagtaaa taacattaaa 4141 accccgacag aaaactgtcg gggtctcttt ttaaaattat tcacgcccag atggaggagt 4201 ctttgcccga gcctatctca aagtgatact tgacgatgcc gagatccatt tttgaataga 4261 aaccaaggcc cgcctttgct tttaccttat ctccttcgag agttaaggta aatttttgct 4321 gattggtggc ggtgggcgcc aaaagtgcgg catctacacc gtttttgaac cactcgggtg 4381 atgagtcata atttggcgca agggtggaaa tcggctttga tttatgcgca acgcctcgat 4441 ttctgccatg tccgacggaa ataaccagcg agagcttctc atcttttgag attttgatca 4501 catcgggcat acgcttatag gtcagagcga cccagcaggt gtgaagcccg agcatttgag 4561 caaacagaac aaggcgctcg ccatagtagc cgatcttctc ctgggcatcc tcgccttttt 4621 tatatgcgat cgcgaagtag ttgcgaacgc ccgtgaagtt gccgtagtga gccataaagc 4681 tgtcgaaagc cttaggttca tcgcagatga gctggatatt cagcctgctt tctgcgttga 4741 tctcttctat ctcctcgcaa agaagtgcgc gaagctcagg ctcgatgggt tggtctttat 4801 attgccgaac ggaatgacgg gatctgattg cttcgagttg ggtcatttta tgcctccgag 4861 tgtggtgatg ttggggtgat tatagcacaa gacgaggcgt ttggcaagag cggagcgccg 4921 tctgcgaggg tggcggagcc gtccgagcag gtggcgcgga gcggtatttg atgcaggcag 4981 cttggctgaa cgacatcaga aaggaaaaag accgccctgt caagcggtct tttcctattg 5041 aagacactat atgaaaatgc ggaaattatg gaccaaagat taaatatact tcttgaattt 5101 caaaattgcc ttgaacatat caccgtcggt gatgatttca aaggttccgt tgcatatttc 5161 ggtataactc tttgcgatcg caagaccgag accgtttcct tcggcggttc tcgattcgtc 5221 accgcggaca aagcgctgag ttatctcatc cacgttgaaa tccaacggat atgcggaaat 5281 gttcttgaat tcgatctcga tattatcgtt cttttccttt gcggttatga atacacgcgt 5341 attcttcagt gtatatttga ggatattatt gatcagattg ttgacaacgc gggacatctt 5401 acggccgtca gcaaagatat aaagctcctt gggggcgtca acgcagaatg gcagacccga 5461 gctttgaatc tcattatcct gttcggcgag agcctgattg atgaggagtg atacatcgag 5521 tttttcaaga gtaatgcttt cgttgccgct ctgcaccttt gagatgtcaa acaggtcttg 5581 tgtaagcttt tttagtctgt cgctcttttt ggcgattact gcgacgtaat cctttgcctc 5641 ctcgggaagg ccgtcaattt tggacaacag ctctgtatag ctgataatgg atgttatcgg 5701 tgttttcaaa tcgtgcgata cgtttgtaat cagctcagac ttcaatcttt cagccttcac 5761 ctgtgcagac accgattcgt cgaggccttt tgcaatatca ttgatatttt cagccagctt 5821 tttcatatct tcgaatttca gctcgggaat cttatgggat acgttgccgt tgcgaacctg 5881 acgtgcgcca tttttgatcc ggtcaatatc gcttgctctg cgggcaagaa caaagcatgc 5941 aaaaccgagc agcatgattc ctatgaacag cca // LOCUS sequence024 5880 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence024 VERSION sequence024 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5880 /mol_type="genomic DNA" /organism="" /note="sequence024" CDS 804..2372 /product="M18 family aminopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963927.1" /transl_table=11 /codon_start=1 /translation="MLTFGERLRKARKRKGLSQVDVFDAIGLNNKSLSRYEKGETTPNP ETLQKLIRLYDVSSEYILGLTDVMGSSAEGETSSDADGNLIEMIDHKSSARKLINFISS SPSRFHVVANIARKLAHDGFIELKEANDWNIEAGGKYYVTRNQSSIIAFKVGADAKGFN IMASHSDSPTFKFKPNAEMETLGKYVRINTEKYGGMIMSTWLDRPLSVAGRVTVMTGGK VKSSLVNIDEDTLLIPNVAIHMNRNANDGMTYNPQVDTIPLMGSEAAKGKLMGLVAASA GVKESDIISSDLYLYCRTPATVWGNDGEFVSCPKLDDLQCAYATMQGFLAGDNAETVSV LAVFDNEEVGSGTKQGADSDFLRAVTDRIANALGKEKSAMLANSFMVSADNAHAVHPNH PEYADPTNKPFMNGGIVIKHNGNQRYATDAISETIFKRICAAIGVPTQTYANRSDIAGG STLGNISTAQVSLNTVDIGLAQLAMHSSYETAGSMDTLYLERAAAEFYRTAIISLGDGE YELRG" /locus_tag="LOCUS_1590" /note="WP_010963927.1 M18 family aminopeptidase (Clostridium) [pid:46.5%, q_cov:78.9%, s_cov:97.9%, Eval:2.6e-104]" /note="MGA_191" CDS complement(2474..2737) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKVTVKNGTLDQREIDAYVTRAVNLYHPKRIEEMTLTLDGEYVDI EYKFAPVNFDRIRRITGYLVGTLDRFNNAKRAEVEQRVKHSL" /locus_tag="LOCUS_1600" /note="WP_003436320.1 anaerobic ribonucleoside triphosphate reductase (Clostridioides difficile) [pid:79.4%, q_cov:39.1%, s_cov:4.3%, Eval:1.1e-09, partial hit]" /note="MGA_192" CDS complement(2828..3907) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MADNRLLEQETREDVFEEINELYRKTQESRENIVTKTYRTVLTVL VGVTAMLCITVVVLAIGWAHEQGTIVPEIVEVEKEVTVTVPEYIIIDPSEEYDHSLTND SFELWDTNYGPIWMPAMANVSKNEYINEKFIKDEVTGYLTYEDENLDILQGIDVSIYQG DIEWDKVKEAGFDFVIIRCGFRGYVTASVNADANFRSNIQGALDAGLKVGVYFFSQAID TEEALEEANFVLDLIDGYEISFPVIYDWEVVIDKDGDPVRTAEIEPEQLTANALVFCER VEMAGYTPMIYCNKKTAIWKYDLSMLEDIDIWLAEYSDTPTYFYDFAMWQYSSKGQVPG IEGNVDLNIAFKDYSKKEK" /locus_tag="LOCUS_1610" /note="WP_013389345.1 RICIN domain-containing protein (Bifidobacterium bifidum) [pid:29.5%, q_cov:61.8%, s_cov:26.0%, Eval:8.4e-13, partial hit]" /note="MGA_193" CDS 4171..5448 /product="aminotransferase class I/II-fold pyridoxal phosphate-dependent enzyme" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005083681.1" /transl_table=11 /codon_start=1 /translation="MSIFDYSKEQLKSFYDEQVKLLAEYKARGLKLDMSRGKPSPEQLD LTNDMLTHCLDGDHISERGVDCRNYGVLDGIYEAKRLFMPMLGIGRYEIIIGGNSSLQL MYDTIAKCMLLGTKDSDKPWCKLEKVKWLCPAPGYDRHFAICEGFGIEMIPVPMNSDGP DMDMVEKLVAEDDAIKGIWCVPKYANPSGITYSDEVVRRFAALNPKAKDFRIFWDNAYC VHDLYDDHDQLINILDECKKTGKQDMVLISGSTSKISFPGGGIAAIGASEENINFLKDQ MSNQTIGYDKLNQLRHARFFKNFDGLMEHMKKHRDIIRPKFDVVLEALDNEIAPLGIGD WTKPKGGYFIAFDAEEGTAKRIVSLCADTGVVMTKAGATYPYGNDPKDSNIRIAPTYPS VSELKLAMEIFCVAVKLATAEKLLSE" /locus_tag="LOCUS_1620" /note="WP_005083681.1 aminotransferase class I/II-fold pyridoxal phosphate-dependent enzyme (Mycobacteroides abscessus) [pid:46.3%, q_cov:99.5%, s_cov:99.1%, Eval:1.3e-111]" /note="MGA_194" ORIGIN 1 agcgggggag atttccgctg ccgcggcaac tcagatgctc ataagtgtat atcaggtttc 61 gctcatcgtc aactttggcg ttgtgggcgg tcttgtgccc gaaatgagtt tgaccagcac 121 agcggttgtt gaaaaggcgg tgcattatga ctttgacacc tcggcaatag acggctatga 181 gattggaaga tattcggaat atcctgatgt atacattccc gcaagcgaag agcttgttaa 241 aatggcgctt gagatcgaac cgagccttaa aaaggtcata tgtgcttctg ctgacaagtt 301 tgtggcatcg gcagaggcaa agactgcttt aaacgagcag tttggggcgc acatctgcga 361 tatggaaact gcgggcattt tgctcacagc taaccgcaac ggcattcccg cgcttttgat 421 aaaagcagta tcggacagcg ttgacggggg agctgaggag ttttcaaaga tgatctcaaa 481 cgccgcctat gtctgcatca gcgttatgat gaaaattttg gcgaagctgt aacaaacagc 541 ggcgctcgct gcccgaaccg cccttgggac ggttcgggca ttttaacgcc cctttcccca 601 tatatgctcg gggaaagggg cgttaaaaca gcccgcgggg gcttttgccc ccgtgggcgg 661 cgagcgcgtc gcacaaactt tctcggcggc gggcgatggg tgagaaatct cacgatcggg 721 gctgtacaaa ttctcgcaga tgtgttataa ttaaagaaaa gcacgtccaa agcgggcgaa 781 tttcttaaaa ggtgggaatt taaatgttga cattcggcga aagattaaga aaggcaagaa 841 agagaaaggg cctttctcag gtagatgttt tcgatgcaat cgggcttaac aacaagagcc 901 tctcgcgata tgaaaaaggc gaaaccacgc ccaaccccga gactttgcag aagcttatca 961 gactttatga cgtttcaagt gagtatattt tgggacttac cgacgttatg ggctcttctg 1021 ccgagggtga aacctcgtcg gatgccgacg gaaacctaat cgagatgatc gaccataagt 1081 caagcgcaag aaagcttatc aacttcattt cttcaagccc cagccgtttc catgttgtgg 1141 caaatattgc aagaaagctc gctcacgatg gctttatcga gcttaaagag gcaaatgact 1201 ggaatattga agcaggcggg aaatactatg tcacccgcaa tcagtcatcc atcatcgcct 1261 tcaaggttgg tgccgatgcc aagggcttca acattatggc atcccacagc gacagcccca 1321 ccttcaagtt caagcccaat gccgaaatgg aaaccttggg caaatatgtc cgcatcaata 1381 ctgagaagta cggcggaatg ataatgtcca catggcttga cagacctctt tccgttgcgg 1441 gcagagtcac cgttatgacc ggcggcaagg tgaaatccag ccttgtcaat attgacgagg 1501 acaccctgct gattcccaat gttgcgatcc atatgaaccg caacgcaaac gacggtatga 1561 cctataaccc gcaggtggat accattcctc ttatgggctc agaagccgca aagggcaagc 1621 tcatgggtct tgttgcagcc tctgcaggcg tcaaggagag cgacattatt tcaagcgatc 1681 tatatctata ttgccgtacc cctgcaactg tctggggcaa cgacggcgag tttgtttcct 1741 gtcccaagct tgatgacttg cagtgcgcat atgccacaat gcagggattc ttggcagggg 1801 ataatgccga aactgtttcc gttttggcgg tgtttgataa cgaagaggtt ggctcgggca 1861 ctaagcaggg cgcagattcc gatttcttga gagcagttac cgacagaatt gcaaacgctt 1921 tgggcaagga aaagagcgcg atgcttgcaa acagctttat ggtttccgcc gacaacgctc 1981 acgctgttca ccccaaccac cccgaatatg cggatcctac caataagccg tttatgaacg 2041 gcggtatcgt catcaagcac aacggcaacc agcgctatgc aacagatgca atcagcgaga 2101 ccattttcaa gcgcatctgc gccgcgatcg gtgtgcccac ccagacatat gccaacagaa 2161 gcgacattgc cggcggctca accttgggca atatttcaac tgcacaggtt tcgctcaata 2221 ccgttgatat cggattggct cagcttgcga tgcactcaag ctatgaaacc gcaggaagta 2281 tggacaccct ttatttggag cgtgccgctg cggaattcta tcgcacagca atcatcagcc 2341 tcggtgacgg ggaatatgag ctaagaggat aagactttag aataactttg ctcatctgac 2401 atataaaaaa tcagacccaa aggttttcct tcgggtctgt ttttttatgg ctgatggagc 2461 atggagtgga agatcaaagc gaatgcttaa ctctttgttc aacctcggcg cgcttggcgt 2521 tgttgaagcg gtcaagtgta ccaacaagat accctgtgat gcgtctgatg cggtcgaaat 2581 taacaggagc gaacttatat tcaatgtcaa catattcgcc gtctagtgtc aaggtcatct 2641 cctcgatcct cttgggatga taaagattta ctgcgcgggt gacatatgca tcaatttccc 2701 gctggtcaag tgtgccgttt ttaactgtta ccttcatata tgtatacctc ctgcgttgat 2761 attttgggct tgcaaagaga taatatcaca atatattgtg tttgtcaata ctttttaaga 2821 attattctca tttttctttt ttgctgtaat ccttaaacgc aatattaagg tcaacatttc 2881 cctcaattcc gggcacctgt cccttcgagg aatattgcca cattgcaaaa tcgtagaaat 2941 atgtaggcgt atcggaatat tccgccagcc aaatgtcgat atcctcgagc attgaaaggt 3001 catatttcca gattgcggtc ttcttgttgc aatagatcat cggggtatag cctgccattt 3061 caactcgctc acaaaagacg agggcattgg ctgttagctg ttccggctcg atttcagctg 3121 tgcggacagg gtcgccgtcc ttatcgatca caacctccca gtcgtatata acggggaaac 3181 tgatttcata gccgtcgatg aggtccaaaa caaagttggc ttcttcaagg gcttcttccg 3241 tatcaatcgc ttgcgagaag aaatatacac cgactttaag acctgcatcc aaagcgccct 3301 gaatatttga acggaagttt gcgtctgcat tcacagaagc ggtcacatat ccgcggaatc 3361 cgcaacgaat aattacaaaa tcaaatcccg cttccttaac cttgtcccat tcaatatcgc 3421 cctgatatat tgaaacgtcg ataccttgaa gaatgtcgag gttttcatcc tcatatgtca 3481 aatatcccgt aacttcatcc ttgatgaact tctcgtttat gtattcgttc tttgaaacat 3541 tcgccatcgc aggcatccaa atcggaccgt agttggtgtc ccaaagctca aagctgtcgt 3601 ttgtcagcga gtggtcatat tcttcagatg ggtcgatgat tatatattcg ggcaccgtga 3661 cggtgacttc cttttcaacc tcgacaattt cggggacgat agtgccctgt tcgtgtgccc 3721 agccgattgc gagcactaca acggttatgc aaagcattgc cgttaccccg acaagcaccg 3781 ttaaaacggt gcgataggtt tttgtcacga tgttttcgcg gctttcctgc gttttgcggt 3841 aaagctcgtt gatctcttca aaaacatctt ctcttgtttc ctgctccaaa agcctgttgt 3901 cagccatttt caaaatcctc cgccgaaaaa taatctcata cgacaagttt agcatatttt 3961 cgacagatag taaacaggta tgcttttcct tttttcggag gtcgtttttg cataaatttt 4021 gcataaatag ctctgcgagg tctgcaaaaa tggcgaaatt taatgaaatt tggcatattt 4081 ttgcaagatt ttgtgaaatg acttgcaatt ttcttcgtac tgtaatataa taaagcacaa 4141 tgacactaat ttttgcggag gttgcgcgct atgtccatat tcgattattc aaaggaacag 4201 cttaaaagct tttacgatga gcaggtcaaa ttgcttgctg agtataaggc aagaggttta 4261 aagcttgata tgtcaagagg taagccctcg cccgaacagc tcgatttaac caacgatatg 4321 ctcacccact gtcttgacgg cgaccacatt tccgagcgcg gagttgactg ccgaaactac 4381 ggcgttctgg acggaattta tgaagcgaag cgccttttta tgcccatgct cggcatcggc 4441 agatatgaaa ttataatcgg cggcaactca agcctgcagc tgatgtatga caccatcgca 4501 aaatgtatgc ttttgggcac aaaggacagc gataagccct ggtgcaagct tgagaaggtg 4561 aagtggcttt gcccggcgcc gggatatgac agacactttg caatttgcga aggatttgga 4621 attgaaatga tacccgtgcc gatgaattcg gacggccccg atatggatat ggttgaaaaa 4681 ttggtcgcgg aagatgatgc aattaagggt atctggtgtg tgccgaaata tgccaacccc 4741 tcgggaatca cctattcgga tgaggtcgta agacgttttg ctgcactcaa tcccaaggca 4801 aaggacttca ggatcttctg ggataatgca tattgcgttc acgaccttta tgatgaccac 4861 gaccagctca tcaacatctt ggatgaatgc aaaaagacag gcaagcagga tatggtgctc 4921 atatccggct ccacatcgaa gatatccttc cccggcggag gaatcgcggc gatcggtgcc 4981 agcgaggaaa acatcaactt cttaaaagac cagatgtcca accagaccat cggatatgat 5041 aagctgaatc agcttcgcca cgcaagattt ttcaagaact tcgacggact tatggaacat 5101 atgaagaagc atcgcgacat tatcaggccc aagtttgatg ttgttcttga ggcattggat 5161 aacgagatcg cgcctctggg aatcggtgat tggaccaagc cgaagggcgg atatttcatc 5221 gcgtttgacg cagaagaggg cactgccaag agaatcgttt cactttgcgc cgacacaggc 5281 gttgtaatga ccaaggcagg tgcaacttat ccttacggaa acgaccccaa ggattcaaac 5341 atccgcattg cacccacata tccctctgta tccgagctga agcttgcaat ggagatattc 5401 tgcgttgcag ttaagcttgc aacagctgag aagcttttga gcgaataagc aatatatgcg 5461 ccctgatttc ggggcgcatt ttttgtgcac agcaagagaa aagtattgct ttttgtccga 5521 ttgtgtgcta tccttttagc aacaccattg aagggagatt ccaatatgaa ttgtaaaaaa 5581 tgcggaaatg aagtaactga aaatatgacc gcttgcccta tgtgcggtga gcccatcgta 5641 actgaaacaa caaccgaaac cgccgcaaaa acctcggcaa cgagtctgga tgaagctcgc 5701 aagaagagag cgaaaagcaa agcgatctct accgttatcg gcattgtgct ggcagttatc 5761 atcgctgttg tcaaggcgct gacaggcgga ggcggagata ttgaaaagac tccgaacaaa 5821 ctcgactata gcacctatgt atatgatgac ggcacaggcg tagtcaacac aaaggtatac // LOCUS sequence025 5758 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence025 VERSION sequence025 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5758 /mol_type="genomic DNA" /organism="" /note="sequence025" CDS 137..571 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIEQDTIKLLRECDAGIKMGVDSIDDVLEYADDEALKKALTSCKN EHIKLKDEIQGYLDEYHDEGKDPALMAKGMSWMKTNIMLAFKESDKTIADLMTDGCNMG VKSLSKYLNQYEAADERSKDITKRLIKLEEKLAKDVRQFL" /locus_tag="LOCUS_1630" /note="MGA_196" CDS complement(618..1712) /product="redox-regulated ATPase YchF" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003427022.1" /transl_table=11 /codon_start=1 /translation="MKLGMVGLPNVGKSTLFNALTNAGAESANYPFCTIEPNVGIVSVP DERLDALAKMYQPTKFTPATLEFVDIAGLVKGASKGEGLGNKFLANIRECDAIIHVVRC FESDDIIHVEGSVDPKRDIETIDLELIFADMEVLERRLDKAKKMIKGDKKYQADIDLCE GLLAHLEAGKPARSYAYSDEEREMIKTTPLLSMKPVIYAANMSDSDFTSDIETNPHYQV VKEIGADEGSSVLPICAQIEQEIGDMDEEDKQMFLADLGLEISGLNRVIKEGYALLGLI SFLTAGKDECRAWTITKGTKAPQAAGKIHTDFERGFIRAEVIAFDDLMACGTMVAAKEK GLIRSEGKEYVMRDGDVVLFRFNV" /locus_tag="LOCUS_1640" /gene="ychF" /note="WP_003427022.1 redox-regulated ATPase YchF (Clostridioides difficile) [pid:61.4%, q_cov:100.0%, s_cov:100.0%, Eval:3.6e-128]" /note="MGA_197" CDS complement(1743..1904) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDGKGTVAACGITMGSCLAMIISFSINHSIFWAIVHGCMSWVYVI FRLIVGGY" /locus_tag="LOCUS_1650" /note="WP_003427864.1 hypothetical protein (Clostridioides difficile) [pid:63.9%, q_cov:67.9%, s_cov:64.3%, Eval:2.4e-07, partial hit]" /note="MGA_198" CDS complement(1935..2939) /product="tryptophan--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004454934.1" /transl_table=11 /codon_start=1 /translation="MSDVKKKVIFSGIQPTGTFTLGNYIGAVRNWGPLQDEYDCIYSIV DMHALTVKRDPVKFRQQTMESYALLLACGIDPKKSIAFIQSHNPSHAQLNWLLCCATQF GELTRMTQFKDKSQKHPDDINAGLFTYPTLMAADILAYNADLVPIGADQKQHLELARNI AVRFNQRFGDMFVVPEGYIPKVGARVMSLQEPTKKMSKSDENQNAVVLILDDKDTIIRK FKRAVTDSDTVVRYAEGKDGINNLMSIYSAVTGKTNDEIEREFEGKGYGDFKLAVGETV ADHLAPVRGEFARLMADKNYLKECYTDGAQRAFKLSNKIITKAYRKVGFVDYR" /locus_tag="LOCUS_1660" /gene="trpS" /EC_number="6.1.1.2" /note="WP_004454934.1 tryptophan--tRNA ligase (Clostridioides difficile) [pid:58.8%, q_cov:98.8%, s_cov:99.1%, Eval:2.5e-109]" /note="MGA_199" CDS 3090..3284 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKLFRIICVIIAAFGAVALGVVYFAVGTEPLWPLYVCTMVTLGGL LGNAVGSVIQLILEEKRKT" /locus_tag="LOCUS_1670" /note="MGA_200" CDS 3802..5439 /product="polysaccharide biosynthesis protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048381.1" /transl_table=11 /codon_start=1 /translation="MKKQGLLVGSFVLLLAVFIAKAAGLLFKIPLTNILGGTGMGYYSA AYTVFTPIFALCAASLPSAITQLVSESEALGKYRSIKSIKRVSLIVFSAISLVVSIVMA LLSDLIARRIIGSPESAWAIAAIAPCVFISTITAIYRGYFEGLRNMTPTAISQIIEAIC RLVFGLGFAYLADIYSPALGISNRLPFIAATAVLGVTVSNLAGLIYLMLCSKFSGRIGQ ELSELDTSDERYRAVLKRIVLLMIPMSLASLASSLMGAVDLSTIILGIKSSLGKNPQVY MEKYEEVIASGVSLDELPNFLYGSFTGLAMTVFSLAPSLCSAFGKSALPTITECWAKGD SRRVRFEIKRIITIVMYISIPAGLGLCAMSDNILGLLFSSRAVEAMVSVKPLQILSLGT PLLAVSGAAFAMLQAVGRQDLPVKITVVGAIIKLLGNTLLIPLPEMELSGAALSTVISY GVICIWSVCALYKITKTKTTPFVSVVFPILAGGVASVGAKTASIYLFKDLSKLLNSLFS VCFAVIIYIIAVVLLDITTKNALKSKIF" /locus_tag="LOCUS_1680" /note="WP_012048381.1 polysaccharide biosynthesis protein (Clostridium botulinum) [pid:26.8%, q_cov:99.8%, s_cov:99.4%, Eval:3.0e-50]" /note="MGA_201" ORIGIN 1 cacggcgctg cgccgcaggt gcggcggttc gtggcctgcc gtgccgagcg gagcggtcgg 61 ttggcataaa cttccagcat tacacaacta aaaatcagcc ataatatatc aaatgattat 121 gtttggagtg ttgcagatga ttgagcagga cacaattaag cttttaagag aatgcgatgc 181 aggaattaag atgggcgttg attcgattga cgatgttttg gaatatgctg acgatgaggc 241 tttgaaaaag gcacttacaa gttgcaaaaa cgagcatatt aagcttaaag atgagattca 301 gggatacctc gatgaatacc acgatgaggg caaagacccc gcgcttatgg caaagggaat 361 gtcctggatg aagacaaaca ttatgctggc gttcaaagaa tcggacaaga ccattgccga 421 cctgatgaca gacggatgca atatgggtgt gaaatcgctg agcaagtatt tgaatcaata 481 tgaagcagca gatgaacgct caaaggacat cacaaaacgt ttgatcaagc ttgaagagaa 541 gctagcaaag gacgtaaggc agtttttata atgaaaaaac aaccgttggg ggttaccaac 601 ggttgcttgt ttttttatta tacattaaat ctgaaaagaa caacgtcgcc gtcacgcatg 661 acatattcct tgccttcgga acgaatcaag cccttttcct ttgcggcaac cattgtgccg 721 cacgccataa ggtcgtcgaa tgcgatgacc tctgcacgga tgaagccgcg ttcaaagtcg 781 gtatggatct tgcctgcagc ctggggtgcc ttggtgccct tggtgatcgt ccatgcgcgg 841 cactcgtcct tacctgcggt gaggaaggaa atgaggccta aaagtgcata gccttctttt 901 atgactcggt taaggccgga aatttcaaga cccaaatcag ccaagaacat ctgcttatct 961 tcctcgtcca tatcccctat ctcctgctcg atctgagcac agatgggcaa aacagaggag 1021 ccttcgtcgg cgcctatctc ctttaccacc tgatagtggg ggttggtttc gatgtcggag 1081 gtgaagtcag aatcggacat attcgcagca tagattacag gtttcattga aagaagcgga 1141 gtggttttga tcatctcgcg ttcttcatcg ctgtaagcat atgaacgggc gggcttgcct 1201 gcttcaaggt gagccaaaag tccctcgcaa aggtcgatgt ctgcctgata tttcttgtca 1261 cccttgatca tcttctttgc tttatcaaga cggcgctcaa gcacttccat atcggcaaag 1321 ataagctcaa ggtcgatggt ttcaatatca cgcttggggt cgaccgagcc ttcaacgtgg 1381 ataatatcat ccgactcgaa gcatcttaca acgtgaataa ttgcgtcgca ctcgcgaatg 1441 ttagccaaga atttatttcc caagccttcg cccttggatg caccctttac aagacctgcg 1501 atatcaacaa attcgagggt tgcaggggtg aactttgtgg gctgatacat ttttgcaagg 1561 gcatcaagcc tttcgtcggg cacggaaacg attccgacgt tcggttcgat ggtgcaaaaa 1621 ggatagtttg cagattcagc tcccgcgttg gtcaaagcgt tgaaaagagt gctctttccg 1681 acgttgggaa gtcctaccat accaagtttc atgttattat taagtccttt cggtttgtgt 1741 tattaatatc cgccgacaat aaggcgaaag attacatata cccagctcat acagccgtgt 1801 acgattgccc agaagatcga atggttgatt gagaaggaaa ttatcattgc aaggcaggag 1861 cccattgtga ttccgcaagc ggcaactgtt ccctttccgt ccattttaaa tccctcctgt 1921 cggaattatg tcatttatct gtaatcgaca aagccgacct tgcggtatgc cttggtgatt 1981 atcttgtttg aaagcttgaa tgcgcgctga gcgccatcgg tatagcattc cttgaggtag 2041 ttcttgtctg ccatcaagcg tgcgaattcg cctctgacgg gcgcaagatg gtcggcaacg 2101 gtttcaccga cagcaagctt aaagtcgcca tagcccttac cctcaaactc acgctcgatc 2161 tcatcgtttg tcttacctgt aacggcagag tagatgctca taaggttatt gatgccgtcc 2221 ttgccctcgg catagcgaac aacggtgtcg gagtcggtaa ctgcacgctt aaacttgcgg 2281 atgatagtgt ccttatcgtc aagaatgaga acaactgcgt tctggttttc atccgacttg 2341 gacatcttct tggtgggttc ctgcaagctc ataacacggg cgccaacctt gggaatatat 2401 ccttcaggga caacgaacat atcgccaaag cgctggttga agcggacagc gatgtttctt 2461 gcaagctcaa gatgctgttt ctggtcggca ccgatgggca caaggtcggc attatatgcc 2521 aaaatatccg ccgccataag ggtgggatat gtgaaaagtc ctgcgttgat gtcgtcaggg 2581 tgcttttgag atttatcctt aaactgagtc attctggtca gctcgccgaa ctgggtcgca 2641 cagcaaagaa gccagttgag ctgagcgtgg ctggggttat ggctctgaat aaaagcgatg 2701 gactttttag ggtcaattcc gcaggcgagg agcaaagcat aagactccat agtctgctgg 2761 cggaacttga cggggtcgcg cttaacggtt agcgcgtgca tatcaacaat tgagtagatg 2821 cagtcatact catcctgcaa agggccccag ttgcggacag caccaatata gttacccagg 2881 gtgaatgtac ctgtgggctg gatacctgag aatatgacct ttttctttac atcagacata 2941 tataaaacct ccaaaaataa ggatttaaac tattaaatca gtatatcaca taattaagcg 3001 gatgtcaatt taaatggcga aacgagcact tgcaaagaga ggatttttgt ggtaatatat 3061 agaaaaaaga gccgaggagg caatgtgtta tgaaactttt cagaattatc tgtgttataa 3121 ttgcggcttt tggcgcagtc gcgctgggtg tggtatactt tgccgttgga accgagcccc 3181 tttggccgtt atatgtttgc actatggtaa ccttgggcgg acttttggga aatgcggtcg 3241 gctcggttat tcaactgatt ttggaagaga agcgcaaaac gtaaagagaa tgaatgattt 3301 tgttccccgc ttgcagtgat gcaggcgggg ttttacacct catccgcctc attcctcggc 3361 accagtcccg tttgcggtgc ccgactcgcc gttcactaac gttccggctt gtcgaccgct 3421 gctccaaccc cttctccctt cttccgccac cggcggcggc cacaggcgtt gcccctcaag 3481 gggaatgctt gcatacccgc ttgcacttag gtgtaggcgg ggttttgttt gcgcggacgc 3541 ggcagcccgc ggggcgaagc cccgcgccgt gcgccgaagg cgcacgaaag gcattttgca 3601 aaaaatgcct tggttgccgc aaggcggttc aagtgtgctt cgcctaaatt ttgcaaccga 3661 tggggcgatt attcagcctc tccctatggg agaggtgtca cgcacagcgt gacggagagg 3721 gctttacaca gtaccttgtg aatatttgta ccctctgcca aatacaaatg tacaagaccc 3781 tttgttgaga ggacggttgc tttgaaaaaa cagggcttgt tggttggttc atttgtattg 3841 ctattagcgg tatttattgc aaaagccgcg gggcttttgt ttaaaattcc gcttacaaac 3901 atcttgggcg gaacgggaat gggatattac tcggcggcgt atacggtttt tacgccaata 3961 tttgcacttt gtgcggcaag cttgccatca gctatcacac agcttgtatc ggaaagcgaa 4021 gcactcggga aataccgaag cattaaaagc atcaagcgag tttcgctgat cgttttcagc 4081 gcaataagcc ttgttgtcag cattgtaatg gcacttttgt ccgacttgat tgcgcggcga 4141 atcatcggca gtcccgaatc tgcttgggcg attgccgcga ttgcgccctg cgttttcatt 4201 tcgactatca cggcgatata tcgaggctac tttgaaggac ttagaaatat gactccgacg 4261 gcaatttcgc agatcattga agcgatatgc cgtctggttt tcgggctggg atttgcatat 4321 ttggcggata tctattcccc tgccttggga ataagtaatc ggttgccgtt tattgccgca 4381 acggcagttt tgggcgttac cgtttcaaac ctcgcggggc ttatatattt gatgctctgc 4441 tcaaaattct cgggcagaat cggccaagag ctttcggagc ttgatacatc tgacgaacga 4501 taccgcgcag tacttaaacg cattgttctt ttgatgattc caatgtcgtt ggcatcgctg 4561 gcatcaagcc ttatgggcgc ggtggattta tctacaatta tactgggaat aaagtcgtcg 4621 ctgggcaaaa atccgcaggt atatatggaa aaatatgaag aggttatcgc ttcgggtgtg 4681 agcctcgatg aattgcccaa cttcctttat ggctcgttca caggacttgc gatgacggtg 4741 ttttcgctgg cgccgtcgct atgctcggct ttcggaaaat ctgcactgcc gacgataact 4801 gaatgttggg caaagggcga tagccgacgt gttcgctttg aaatcaagag aataattacc 4861 attgtaatgt atatctcaat tcccgcggga ttggggcttt gcgcgatgag tgataacatt 4921 ttgggattgt tattttcctc acgcgcggtt gaggcgatgg tatcggttaa gcccttgcag 4981 attttaagcc tcggcactcc ccttttggcg gtcagcggag cggcatttgc aatgcttcag 5041 gcggttggaa gacaagacct gcccgttaaa ataaccgttg ttggggcaat cattaagctg 5101 ttgggaaata cgcttttgat ccccctgccg gaaatggagc tttcaggcgc ggcattatca 5161 actgtaatca gctatggcgt tatatgcata tggtcagtct gtgcgctata caaaatcact 5221 aaaacaaaaa ctacaccatt cgtgtctgta gtcttcccaa ttttagcggg aggtgttgca 5281 tctgtaggtg caaaaaccgc atcaatttat cttttcaaag acctctcaaa gctcctaaat 5341 tcgttgtttt ctgtatgttt tgctgtcata atctacataa tagcagtagt gttgttggac 5401 ataacaacta aaaatgcatt gaagagtaaa attttttgat tttttacttg cattttgcgt 5461 ttttaatgtg tataataagc aatgcgctgt tctgccgcga catttattgg aggctatcga 5521 gcagaacaat tatctctatt aaaaatacag gaggaaaata aaaatgacaa aagttgaatt 5581 ggtaaacaat atcgccctca aggctgattg ctccaagaag gatgcagaaa aggctctcaa 5641 cgctgtaatc ggttctatct ctgatgcact cgtaaacggt gaaaaggtaa ctctcgttgg 5701 cttcggtact ttcgaagtta gagaacgtgc tgctaaggaa ggcatcaacc ccaagagc // LOCUS sequence026 5751 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence026 VERSION sequence026 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5751 /mol_type="genomic DNA" /organism="" /note="sequence026" misc_feature <1..632 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_009888359.1:threonine--tRNA ligase" /note="WP_009888359.1 threonine--tRNA ligase (Clostridioides difficile) [pid:46.4%, q_cov:99.0%, s_cov:32.4%, Eval:1.3e-52, partial hit]" /note="MGA_203" /locus_tag="LOCUS_1690" CDS 926..2422 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNMKKVLAVVMAVMLAISAMAISVFAAEYEIKLSSAGSKGNGAAY STVEFTIPVWAQYGYAVAGDSIKLSLPAAEGASYVVVANGVSYALGLNADGVYEIVFGT LAHGWNDRDLNTVIPQSTVVGDNAALTVIGTFKILKDADGKETYRVSAYDFTLPGAGNW TMTKFTAASWNWSNGSIGDIKYDVKAVSNDNPNSVSYCWDWNPVNGADIAASDSTWNAG LTNLHWDATLINKAQVIGAETAKVVVKLDKAIVGNYYFGLLAKYANGYYYNLPGANFPG LGNETKNYAAYIEIEAPTDTITFEVPKEVLYSTNYGAFNESFDVVCVDATHEDMLWNIK GYELVQRTDSVGTTVLKKDKGFMGGNATKTAWENNENVTYTLVQTVAGYRATAQNGTLG DYSWTKDTISYCGQEVNIYWNQWYNVAPQSVTLVLGYTDVETPADDIVVEDPVESTEEE SEDITVEEPVEEDTNPGTGLALAVVPMVLAAAAVVASKRR" /locus_tag="LOCUS_1700" /note="MGA_204" CDS 2826..3503 /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003973151.1" /transl_table=11 /codon_start=1 /translation="MGYIIATNGLCRDFTIGDGSVIHALKDINITVTEGKLTILKGRSG SGKTTLINLLGALDRPTKGEVLFDGQDITKLSDAKRDELRRYQMAFVFQSVALMSSMTA YENVDFGLRLSKFPFDQREERVKKCLEEVGLGKRMYHRPGELSGGEQQRVAIARALAHE PKIIFADEPTAELDSGTSHHIVELFKKLVEEEHMTIVMTTHDPSLLEIADRVYTLEDGE IIE" /locus_tag="LOCUS_1710" /note="WP_003973151.1 ABC transporter ATP-binding protein (Streptomyces) [pid:49.5%, q_cov:92.4%, s_cov:90.4%, Eval:3.4e-52]" /note="MGA_205" CDS 3496..3756 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSKKKQKLAEHLAEILVPGGDESEYAIECENLVKIYKTDQIEVVA LQGLDLTIKKGELVAIVGSSGSGNRPCSICWADLINPVQVH" /locus_tag="LOCUS_1720" /note="WP_011028504.1 ABC transporter ATP-binding protein (Streptomyces) [pid:50.0%, q_cov:65.1%, s_cov:17.6%, Eval:1.7e-08, partial hit]" /note="frameshifted, insertion/deletion at around 3702" /note="MGA_206" CDS 3717..4478 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLGGLDKPSAGALTICGRNLLKFTEDDYMVYKRNVVGFVWQNNAR NLVPYLTAVQNVELPMLLQGKKERRAKALDLLEAVGLSHRVNSRLDQMSGGEQQRVAIA IALANDPMLLLADEPTGSVDTKTSDQILNVFKKLNEERGITIVIVTHDLRLAKKIDRVI AIRDGRTSSEIIKKSHAEILKESKGLADGEISQEQISEEEYVSEELVVLDRTGRLQLPK EYLEALNIKGGERVKADLDLEAERIYIHKAQ" /locus_tag="LOCUS_1730" /note="WP_011028504.1 ABC transporter ATP-binding protein (Streptomyces) [pid:47.0%, q_cov:98.4%, s_cov:73.4%, Eval:4.7e-56, partial hit]" /note="frameshifted, insertion/deletion at around 3702" /note="MGA_207" ORIGIN 1 agggcacagc agagcagtgg aacgaagctc agcgcgtaat gggtgagatt ttggatgcca 61 tcggaatcga ctatgagatc ggtattgatg aagctgcatt ctatggcccg aagctcgaca 121 ttcagtgcaa aaacgttttt ggcaaggaag ataccatcgt aaccatccag atagatatgc 181 ttttggctca gaagttcggc atggaatatg ttgacaccga cggcgagaag aagacacctt 241 acatcatcca ccgcacatcc atgggctgct atgaaagaac acttgctctc ttgcttgaaa 301 aatatgcagg tgcgttgcct ctctggctct cacccttgca ggttaaaatt atgcccatct 361 ccgacagaca gcttgaattc gctgaaaagc tggcacaaaa gatggatgac ctcgtaatca 421 gatgcgaaat tgataacaga agcgaaaaaa tcggttataa gatccgccag gctcagcttg 481 ataagactcc ttatatggta attatcggcg acaaggaagt tgaaaataac gaagtttctg 541 taagaaatcg ccgcgaaggc gagcttggct caatgagtcc tgatgctttg gttgcacgtc 601 ttttggaaga aatcgcgtcg aaagcaaagt aaaattgcaa atataatggt aaaactgctc 661 aaacgccctg ccaaattcgg cggggcattt gtaatttctt acaaatcaaa aattttttga 721 aaaagtttga aacaaaatgc gacttattca acacttaatt aacagcgaaa ggcaagacgg 781 atgaaactaa aatcggcaaa aagtaagaaa tgcttgacaa aagccgacga tagtgttata 841 atgaccccgt ccgaaccttt cggacaacac aacaaaagat ctctataccc gtatagggat 901 gaaaatttta aaggaggaat ttttcatgaa catgaaaaag gttttggcag ttgtaatggc 961 tgtcatgctc gccatctctg caatggcaat ttctgtattc gctgctgaat acgaaatcaa 1021 gctttcttct gctggttcta agggcaacgg tgctgcttac tccacagttg aattcacaat 1081 ccccgtttgg gctcagtatg gttacgctgt agcaggcgat tccatcaagc tctctctccc 1141 cgctgctgaa ggcgcttcct acgttgtagt agctaacggc gtttcttacg ctcttggtct 1201 caacgctgac ggcgtttacg aaatcgtttt cggtactttg gctcacggct ggaacgacag 1261 agacttgaac actgttattc ctcagtctac cgttgttggc gataacgctg ctcttaccgt 1321 tatcggtacc ttcaagatcc tcaaggatgc tgacggcaaa gaaacctaca gagtttctgc 1381 ttacgacttc acccttcccg gtgctggcaa ctggactatg actaagttca ctgctgcttc 1441 ctggaactgg agcaacggtt ctatcggcga catcaagtat gatgttaagg ctgtttctaa 1501 cgataacccc aactccgttt cttactgctg ggactggaac cctgtaaacg gtgctgacat 1561 cgctgcttcc gattccactt ggaacgctgg cttgaccaac ctccactggg atgctaccct 1621 catcaacaag gcacaggtta tcggtgctga aaccgctaag gttgttgtta agcttgacaa 1681 ggctatcgta ggtaactact acttcggcct ccttgctaag tatgctaatg gttactacta 1741 caacctccct ggtgcaaact tccctggtct tggcaacgaa accaagaact atgctgctta 1801 catcgaaatc gaagctccta ccgacaccat caccttcgaa gttcctaagg aagttctcta 1861 ctccaccaac tacggtgctt tcaacgaaag ctttgacgtt gtttgcgtag atgctactca 1921 cgaagatatg ttgtggaaca tcaagggcta cgagctcgtt cagagaactg attccgtagg 1981 caccactgtc ctcaagaagg ataagggctt tatgggcggc aatgctacca agactgcttg 2041 ggaaaacaat gaaaatgtaa cttacaccct cgttcagaca gttgctggtt acagagctac 2101 cgctcagaac ggtactctcg gcgattactc ttggactaag gacactatct cttactgcgg 2161 ccaggaagtt aacatctact ggaaccagtg gtacaacgta gctcctcagt ctgtaaccct 2221 cgttcttggt tacactgacg ttgagactcc tgctgacgat atcgtagtag aagatcccgt 2281 tgaatctact gaagaagaat ccgaagacat cactgttgaa gagcccgttg aagaagatac 2341 caaccccggt accggcctcg ctctcgcagt agttcccatg gttcttgctg cagctgcagt 2401 agtagcttct aagagaagat aattcctcct ttatgaagga aataaactga cttagtcagt 2461 aatattgata ccacccgatg cagacgggtg gtatcttttt ttatgcccgg aaactatatg 2521 ttgtaggaca ttttcgaagg cggtttttct gtgaaaattt ttcgatatat attgacacat 2581 aaccgtcact ttggtataat atattaacaa cgcaaagggc gaattgcgcc ctcgcgtcgg 2641 aagaaactga atatctgcat ttaatcaaag caaatggctt ttgttggtga aaattccaag 2701 aaaagtgttt gcttattcgt gtttatagag gtaactaccc caaaattgtg caagatgcac 2761 aaacttccaa ggtaacattt aactctgaca cgttttcgga ttagacattt ttcttggagg 2821 tgcaaatggg atacataatt gcaaccaacg ggctctgccg tgatttcacc atcggcgacg 2881 gcagcgtcat ccacgccctg aaagacatta acattactgt cacagagggc aagcttacaa 2941 ttttgaaagg acgttccggt tcgggcaaaa caacgctcat aaatcttttg ggcgcacttg 3001 accgccccac aaagggcgaa gtcctctttg acggtcagga catcacaaag ctctcggacg 3061 ccaagcgcga cgagctcaga cgctatcaga tggcatttgt attccagtct gttgcgctga 3121 tgtcaagtat gacagcatat gaaaatgtcg acttcggtct gcgtctttca aaattcccct 3181 ttgatcagag agaggaaaga gttaaaaagt gccttgaaga ggttggcctc ggaaagagaa 3241 tgtatcaccg tcccggcgag ctctccggcg gtgaacagca gcgtgttgct attgcaagag 3301 ctttggcaca tgagcccaag atcatctttg ccgacgaacc tacagctgag cttgactcgg 3361 gcacctcaca tcatatcgtc gagcttttca aaaagcttgt cgaagaagaa catatgacaa 3421 ttgtcatgac gacccacgac cccagtttgc ttgagattgc agacagggta tatacgcttg 3481 aggacggtga gatcattgag taagaaaaaa cagaagcttg ccgaacacct cgcggagatt 3541 ttggtccccg gcggcgatga atcggaatac gcaatcgaat gtgaaaactt agttaagatc 3601 tataaaaccg accagattga ggttgtcgcc cttcagggct tggatcttac aattaaaaag 3661 ggtgagttgg tcgcaattgt cggctcctcc ggctcgggta atcgaccctg ctcaatatgc 3721 tgggcggact tgataaaccc agtgcaggtg cattaaccat ctgcggcaga aaccttttga 3781 aatttaccga ggacgactac atggtatata aacgcaatgt cgtcggcttc gtttggcaga 3841 ataacgcgcg aaatcttgtg ccctatttga cagcggttca gaacgttgaa cttccgatgc 3901 ttctgcaggg caaaaaggaa cgccgagcca aagcacttga ccttttggag gctgtgggac 3961 tttctcacag agtcaactcc cggttagatc agatgtcggg cggtgaacag caaagagttg 4021 cgattgcaat cgctcttgca aatgacccga tgcttcttct ggcggacgaa cccaccggtt 4081 cggttgacac caagacctcc gaccagatac ttaatgtatt caaaaagctg aacgaggaga 4141 ggggaatcac gatcgtgatc gtaacccacg accttcgctt ggccaagaag atagaccgtg 4201 taatagccat tcgtgacgga cgtacctcaa gtgagatcat taaaaaatcc cacgctgaga 4261 tactcaaaga atcgaaggga cttgcagacg gcgaaatttc tcaggaacag atttccgaag 4321 aggagtatgt ttctgaagag ctggtggttc ttgacagaac gggacggctt cagcttccca 4381 aggaatatct tgaggcgctc aatattaagg gcggcgaaag agtcaaggca gaccttgatc 4441 tggaagctga gaggatctat atccacaagg ctcagtaaac ttctttttta ccctatgagg 4501 aaaaaatata cgctatattg cgaattttaa gaaaggtgga ctttacagtg aaagacacaa 4561 tgtttaggcg cataatttca cttttgctcg cattagtgat gatcgtgcct acattatctg 4621 tttcggtttt cgctgaaggc ttggtgatca catcgcccgc gcccgtaacc gaagatgacg 4681 aaacagaaat caaggaaacc tccgcgcagg tcattgatga acagaacaga gcatacacat 4741 attcaacata ttacgatgct cacatcgacg acccccgccc cgatgcagaa gttgtcatcg 4801 actattccac atacttcaac cccagcgatg attcgggcat ttacaccgac accattgacg 4861 gcgttgactg tttggtatgg cctgaggcaa gcggcgaagt aagtttcccc gttaccgttg 4921 acaaagccgg tctttataat atggagatca tgtactacgc tttggcaagc tctgctaacg 4981 atatcgaaat taccgttgct atcgacggca agagccctta tgctaccgca gaacgtatcg 5041 ttctcgacaa gctttgggta gatgctgaaa aatcttattt ggtaaatgac cagggcgtta 5101 agacctttaa gctggacgtt cacggcaacc agatcagacc tactttggct gaaagccttg 5161 cttggcaggt aacctccttt gaagataccg acggtttgtt caacgaccct cttcgtttct 5221 acttctccga aggcgaacac gttgtaacaa tcaagtctga aaaggcaaga atggctattg 5281 cttacgttaa gctttataac gaaaaggcat tggctcccac cgctgaagca aagaatgtca 5341 ccaccgatgc ttccgttgca ggcaagacca ccggtgtcag catcgtcctc gaaggcgaag 5401 ctgcagaata taagtctgac atcacccttt atgctacata tgaccgtaca acctatttga 5461 cctctcccgc cagccccacc aagatgatct acaacaccat cggtgctcag aactggaagg 5521 acgcaggcca gtcggtaacc tggaagttca atatggacga agcaggctgg gtcaagatcg 5581 gtatcagagg taagcaggac cagatgagag gtctttactc caacagacgt ctttatatcg 5641 acggcgttgt tccctgtgct gatgcagacc aggtcaagtt ctactactcc acatcttggc 5701 agtgtgtaac tcccaccgat gctgacggca acaccatcta cttctggctt g // LOCUS sequence027 5740 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence027 VERSION sequence027 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5740 /mol_type="genomic DNA" /organism="" /note="sequence027" CDS 95..337 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MCTLTKCAGEAPPRQQGASRAHRGAPRLRRGVWVLRFAQNPQGFA PRGSLAMSKQAPTLRKVPAKGGRFSGGEAKKQPPK" /locus_tag="LOCUS_1740" /note="MGA_209" CDS complement(356..1345) /product="ornithine carbamoyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002682235.1" /transl_table=11 /codon_start=1 /translation="MNEFKNRSFLKLLDYTPEEIGKLIDLAADLKAKKKAGISHRLCEG KSIALVFEKTSTRTRCAFEVAAADLGMHPVYLDPKSSQMGKKESIADTARVLGRMFDGI EYRGFGQEIVEDLAKYAGVPVWNGLTNEFHPTQILADFLTIKEHFGTLAGKKLVYMGDA RYNMGNSLMVGCAKMGMHFVACAPEKYFPNAELVAECQKVANETGAKLEFITNPEDAVK NADVIYTDVWVSMGEPDEVWKERIEELLPYQVNKKLMDTAGKQCRFMHCMPAFHDLNTT TGMEIYEKFGIDCMEVTDEVFESEQSIVFDEAENRMHTIKAVMAATLG" /locus_tag="LOCUS_1750" /gene="argF" /EC_number="2.1.3.3" /note="WP_002682235.1 ornithine carbamoyltransferase (Treponema denticola) [pid:64.8%, q_cov:98.5%, s_cov:95.9%, Eval:1.1e-120]" /note="MGA_210" CDS complement(1347..2522) /product="acetylornithine transaminase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393770.1" /transl_table=11 /codon_start=1 /translation="MSITQLDKQYVAPTYGRFPLELVSGKGSIAYDSDGKEYIDLGSGI GVTAFGYCDDEWQKAVNKQISTLQHTSNLYYTEPCAKLAEALCLKTGLKKVFFSNSGAE ANECAIKVARKYSAEKKGEEYYTIITLINSFHGRTLTTLSATGQDKFHALFNPLTPGFA HCKANDCDELIALVNEVKPAGIMLECVQGEGGVIALDEKFIKCAYELARENDIPLIIDE VQTGNGRTGYMYAYQSFGICPDIVSTAKGLGGGLPIGATMLSEKVQNVLGAGDHGSTYG GNPVCCAGALSVVERLTDDFLAEVKAKSEYIFKALENAEGVESVSGKGLMIGIKTVKPA GDVVNACIEKGVLCLTAKDKVRLLPALNIPIETLAKAIEIIKEVCAEKGEI" /locus_tag="LOCUS_1760" /EC_number="2.6.1.11" /note="WP_011393770.1 acetylornithine transaminase (Moorella thermoacetica) [pid:44.1%, q_cov:98.7%, s_cov:97.3%, Eval:2.0e-87]" /note="MGA_211" CDS complement(2530..3393) /product="acetylglutamate kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435171.1" /transl_table=11 /codon_start=1 /translation="MQGLFSNAERAEVLTQALPYIKRYNGKTVVVKYGGNAMINPQLKE QVMEDIVLLWLIGVKVVLVHGGGPEISETMQKLGKKAEFVDGLRVTDKETVDIVQMVLA GKINKTLVNLLEMKGGKAMGISGIDGRLIEAQIKDERLGYVGEITKIHINPVKDLLEKG YIPVVSTVACDKQGNTYNINGDTAAAHIAGALNAERLIMMTDIAGILRDKDDPSTLIPK VTVAEAHELNRLGVISGGMIPKVDCCIEALNHGVNNVIIMDGRIPHSILMELLTDEGAG TMVTKG" /locus_tag="LOCUS_1770" /gene="argB" /EC_number="2.7.2.8" /note="WP_003435171.1 acetylglutamate kinase (Clostridioides difficile) [pid:52.0%, q_cov:97.6%, s_cov:98.3%, Eval:7.2e-83]" /note="MGA_212" CDS complement(3415..4629) /product="bifunctional glutamate N-acetyltransferase/amino-acid acetyltransferase ArgJ" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435168.1" /transl_table=11 /codon_start=1 /translation="MKIINGGVCAAKGFKANGIHCGIRKNHSKKDLALILSEVQANAAA VYTTNLVKGAPLILNKKNLADGKAQAVICNSGNANTCNANGLEIAQDMCDLVAKELGVK AGDVVVASTGVIGQPLNIEPIANGIKPLADGLSADGGNACAQAIMTTDTISKEVAVEFE IGGKTCHIGGIAKGSGMIHPNMATMLVFITTDCAISSEMLQGALSSDIQNTFNMLSVDG DTSTNDMVVVLANGMAGNDEISVDGEDFKQFMLALNTVNVTLCRMIAGDGEGATKLLEC KVTGADKLETAKIAAKSVICSSLLKAAMFGADANWGRVLCALGYSGADLDVSKIGVSFK SPKGEIEVCRNGAGVDFSEDIAKEILLEKEIEILVTLGGGEYSANAWGCDLTYDYVKIN GDYRT" /locus_tag="LOCUS_1780" /gene="argJ" /EC_number="2.3.1.1; 2.3.1.35" /note="WP_003435168.1 bifunctional glutamate N-acetyltransferase/amino-acid acetyltransferase ArgJ (Clostridioides difficile) [pid:53.7%, q_cov:99.8%, s_cov:99.8%, Eval:4.7e-116]" /note="MGA_213" CDS complement(4647..5570) /product="N-acetyl-gamma-glutamyl-phosphate reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004197909.1" /transl_table=11 /codon_start=1 /translation="MTKVFIDGSAGTTGLRIHERLSLRDDITLITLSDDLRKDPAAKKQ AINSADIVFLCLPDDAARESVALCDNPNTKIIDTSTAHRTNDDWAYGMPELSGQREKIR SSNRIANPGCHASGFVALVAPLVEKGILKPDALLSCFSLTGYSGGGKKMIADYESDARN GLLDAPRQYALGQTHKHLKEMAKISGLENVPVFCPVVADFYSGMEVTIPLHKAQICGTL DDIKSAYAEYYTDGLIKYCPDADTDGMLSSNAFSGRDDMQVGAYGNDDRIILVARFDNL GKGASGAAIQNMNILIGADESAGLNI" /locus_tag="LOCUS_1790" /gene="argC" /EC_number="1.2.1.38" /note="WP_004197909.1 N-acetyl-gamma-glutamyl-phosphate reductase (pseudomallei group) [pid:48.7%, q_cov:99.0%, s_cov:98.7%, Eval:3.6e-75]" /note="MGA_214" ORIGIN 1 caacacaatg tagaatattt ttgtccctat tgtagcacaa ccatatcaaa agtgcggtgg 61 tttggcaacc gcaaaaatga ggttttaatc gggcatgtgt accttgacaa agtgtgcggg 121 cgaagccccg ccccgacagc agggcgcctc acgcgcccat cggggcgccc cgcgcctgcg 181 gcgcggggtg tgggttttgc gctttgcgca aaacccacag ggcttcgccc ctcgcggcag 241 tttggcgatg agcaaacaag cgccgacgtt gcgaaaagtg cccgccaaag gcgggcgatt 301 cagcggtgga gaagcgaaaa agcagccacc aaagtgactg cctttgtttt atatattatc 361 ccagcgttgc cgccataact gctttgatgg tgtgcattct gttctccgct tcgtcaaaga 421 cgattgactg ctcgctttca aacacctcat cggtgacttc catgcagtcg atgccgaact 481 tttcatatat ctccatgcct gtagtggtgt tcaggtcgtg gaatgcgggc atacaatgca 541 taaatctgca ctgcttacct gctgtatcca tcagtttctt gttcacctga taaggcaaca 601 gttcttcaat gcgctctttc caaacttcat ccggctcgcc cattgatacc caaacgtcgg 661 tataaataac gtcggcattt ttaaccgcat cttcggggtt ggtgataaat tcaagcttcg 721 cgcctgtttc atttgcaact ttttgacact cagccacaag ctccgcattg gggaaatact 781 tctcgggagc gcaggcaaca aagtgcatac ccatcttcgc acatccgacc atcagagaat 841 tgcccatgtt gtatcttgca tcacccatat atacaagctt cttgcccgca agggtgccga 901 aatgctcctt aattgtgagg aaatccgcaa gaatctgagt ggggtggaac tcatttgtca 961 gaccattcca tacaggcaca cctgcatact ttgccaagtc ctcaacaatt tcctgtccga 1021 atccgcgata ttcaatgccg tcaaacattc tgcccaaaac gcgggcggtg tcggcaatgc 1081 tctccttttt gcccatctgt gagctcttgg gatcgaggta aacggggtgc atacccaaat 1141 ctgccgccgc gacctcaaat gcacatctcg ttctggtgct ggtcttttca aacaccaagg 1201 caatgctctt gccctcgcaa agacggtggg aaattcccgc ctttttcttt gccttcaagt 1261 ctgccgcaag atcgatcagc ttgccgatct cctcgggagt ataatccaaa agcttcaaaa 1321 agcttctgtt tttaaattcg ttcatctcag atctctccct tctcggcgca aacttctttg 1381 attatctcaa tcgctttcgc gagcgtttca ataggaatat tcagcgccgg caaaagtctt 1441 accttatcct tagccgtcaa gcacaaaacg cccttttcaa tgcaagcatt aacaacatct 1501 ccggcaggct taacagtttt tattccgatc atcaggccct tgccgctgac cgattcaacg 1561 ccttcggcat tttcaagtgc tttaaaaata tattcgctct tggctttaac ttctgctaaa 1621 aaatcgtccg tgagcctttc aacaacgctc aacgctcccg cacagcaaac agggtttccg 1681 ccatatgtgg aaccgtggtc gcctgcgccc agaacgtttt gaaccttttc gctgagcata 1741 gttgcaccga tcggcaagcc gccgcccaag ccctttgcag ttgaaacaat gtcggggcat 1801 ataccaaacg actgatatgc atacatatat cccgttctgc cgttgcctgt ctgcacctcg 1861 tcgatgatga ggggaatatc gttttcccgt gccagctcat aagcacactt gatgaatttt 1921 tcatccaacg cgataactcc gccctcgccc tgaacacatt ccagcataat tcctgcgggc 1981 ttgacctcat taacaagcgc aattagctca tcgcagtcgt tcgccttgca gtgggcaaat 2041 ccgggagtta aggggttaaa cagcgcgtgg aatttatcct gtcccgtggc ggaaagggtg 2101 gttaaagttc tgccgtggaa gctgttaata agggtgataa tggtatagta ttcctcgccc 2161 tttttctcgg cggaatattt tcttgcaacc ttaattgcgc actcgttcgc ttcagcgccc 2221 gagttggaga aaaacacctt tttcagccct gttttaaggc acaaagcttc ggccagcttc 2281 gcgcaaggct cggtataata taaattcgag gtgtgctgaa gtgttgagat ctgcttattt 2341 accgcctttt gccactcatc gtcgcaatat ccgaacgcgg ttacaccgat tcccgatccg 2401 aggtcaatat attccttgcc gtccgaatca taagctatgc ttcccttgcc cgaaacaagc 2461 tcaagcggga aacggccgta tgtaggggcg acatattgtt tgtcaagttg tgtaatgctc 2521 atttataaat cagcctttcg taaccatggt acctgcgccc tcgtcggtca aaagctccat 2581 aagtatggag tgagggattc gtccgtccat gataatgacg ttgttgacac cgtggttaag 2641 cgcttcaatg caacagtcaa cctttggaat cattccgccc gaaataacgc ccaatcggtt 2701 aagctcgtgg gcctcagcaa cggtgacctt tggaataagg gtcgaggggt cgtccttatc 2761 tctgagtatg cccgcaatgt cagtcatcat aatcagtctt tcggcgttca atgcgcccgc 2821 aatgtgcgcc gcagcagtgt cgccgttgat gttatatgta tttccctgct tatcgcaagc 2881 aacagttgaa acaacgggga tatatccctt ttcgagaaga tccttaacag gattgatgtg 2941 aatttttgtg atctctccga cgtagcccaa gcgttcatcc tttatctgcg cttcaatgag 3001 tctgccgtcg atgcccgaga ttcccattgc cttgccgccc ttcatttcaa gcaggttgac 3061 aagtgtctta ttgatctttc ctgccaaaac catctggacg atatcgacag tttccttgtc 3121 ggtaactcga aggccgtcaa caaactccgc ctttttgccg agcttttgca tcgtttcgct 3181 tatctcgggg ccgccgccgt gtaccaaaac gaccttgaca ccgataagcc acagcaaaac 3241 aatatcctcc atgacctgtt ctttaagctg agggtttatc attgcattgc cgccatattt 3301 gacaacgaca gttttgccgt tatagcgctt gatatatgga agcgcctgtg ttaaaacttc 3361 cgccctttcg gcgtttgaaa aaagtccctg cattattttt acctcttcaa aaaatcaagt 3421 gcgataatcg ccgttgatct taacgtagtc atatgtcaag tcgcatcccc aagcgttggc 3481 ggaatattcg ccgccgccca aggtgaccaa aatttcaatt tccttttcaa ggagaatttc 3541 ctttgcaata tcttctgaga agtcgacgcc tgcgccgttg cggcaaactt caatttcacc 3601 cttgggagat ttaaagctca cgccgatctt tgaaacatcg aggtctgcac cgctatatcc 3661 caaagcgcaa agaactcgtc cccagtttgc gtctgcgccg aacatcgccg cctttaaaag 3721 gcttgagcaa atgacgctct ttgcggcaat tttagcggtt tcaagcttat cggcaccggt 3781 gaccttgcac tctaagagtt ttgttgcgcc ctcgccgtcg ccggcgatca ttcggcacaa 3841 ggttacgtta actgtattaa gtgcaagcat aaactgctta aagtcctcgc cgtcgacaga 3901 aatctcatcg tttcctgcca ttccgtttgc caaaacaacg accatatcgt tggtcgaggt 3961 gtcgccgtca acgctgagca tattgaaggt gttctgaata tcgcttgaaa gcgccccttg 4021 gagcatttcg gaggatattg cacagtcggt ggtgatgaat acaagcatcg tcgccatatt 4081 gggatggatc attccgctgc ccttggcgat accgccgata tgacaggtct tgcccccgat 4141 ctcaaactca actgcaactt ccttggatat cgtgtcggtg gtcataattg cctgagcgca 4201 agcgttgccg ccgtcggctg aaagtccatc tgccaaaggc ttaatgccgt ttgcaatcgg 4261 ttcaatgtta agaggctgac cgattacacc tgtcgatgca acgacaacat cgccagcctt 4321 tacgccaagc tcctttgcaa caagatcaca catatcctga gcgatctcaa ggccgtttgc 4381 gttgcaggta tttgcgtttc cgctgttgca aataaccgcc tgtgccttgc cgtctgccaa 4441 attcttttta ttcaaaatta atggcgcacc cttaaccaga tttgtcgtat atacagccgc 4501 cgcattcgct tgaacctcgc tcaaaatgag ggctaagtct tttttggagt ggtttttgcg 4561 gattccgcag tgtattccgt tggctttaaa gccctttgcg gcacaaacac cgccgttaat 4621 gatcttcatc tgttctttct cctgttttat atattaagtc ctgccgattc atcggcaccg 4681 attagtatgt tcatgttctg aattgccgcg ccggatgcgc ccttgccaag gttatcaaac 4741 cgcgcaacca aaatgattct atcatcattt ccgtatgcgc ccacctgcat atcgtccctg 4801 ccggagaagg cgtttgatga aagcattccg tcagtatctg catcggggca atatttaatc 4861 agcccgtcgg tataatattc ggcgtatgcc gatttgatgt catcaagtgt gccgcaaatc 4921 tgcgccttgt gcaaaggtat ggtcacttcc attccgctgt aaaaatcagc aacaacggga 4981 caaaagacgg gaacgttttc aagtcccgaa attttcgcca tttctttaag gtgcttgtgt 5041 gtctgaccca aagcatactg acggggagca tccaaaagcc cgtttcttgc gtctgattca 5101 taatcagcga tcattttctt gccgccgccc gaatatcccg ttagtgagaa gcaggataaa 5161 agcgcatcgg gcttcaaaat tcctttttca accaagggtg ccacaagggc aacaaatccg 5221 ctggcgtggc aaccggggtt tgcaattcgg ttggatgatc ttattttctc acgctgtccc 5281 gaaagctcgg gcattccata tgcccaatca tcgttggttc ggtgtgcggt ggaggtatca 5341 atgatcttgg tgttgggatt atcgcacagc gcgaccgatt cacgcgccgc atcatcgggc 5401 aggcagagaa agacaatatc cgccgaattt atcgcctgct tttttgcggc ggggtctttt 5461 cttaaatcgt ccgagagggt gatgagggtg atatcatccc tgagtgataa cctctcgtga 5521 atacgaaggc ctgtggtgcc tgcgcttccg tcaataaaaa cttttgtcat tattttaaaa 5581 tctctttcac atattttatc tgcgtttcaa ccgacttgac cgaggttccg ccctcggaaa 5641 ctctcttttc aacgcaggtc aaaaggtcga tctcgccgta tagatcagca tcgaaaagct 5701 cgctgtgggc tttatatgct tcgagcggca actcttcaag // LOCUS sequence028 5382 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence028 VERSION sequence028 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5382 /mol_type="genomic DNA" /organism="" /note="sequence028" CDS complement(762..1364) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIYLNPSQSELLNDPKTTACFTGHRPEGIPFDIKFSDVNRGIVFS SIYLEIYEAYHRGYRTFITGMADGIDLLAGEAVEKLRDVYMNVRLVAVLPFKNQSGHYD DHYSTFRFTNLLHSANEVISISDDYYSGCFYARNRYMVDNSSLLIAAVATREGGSAYTV DYARSKGIDIKTVNLKALKKDLGLKNKELPDQTSIIF" /locus_tag="LOCUS_1800" /note="MGA_217" CDS 1487..2278 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MQKKLLKRAWAVTHTDRLKRNIEKLKAYFGEKTELMCVVKANCYG HGIEKLIPCMQDECDINWFAVSNLVEAQELRDLGVTGEILILGYTPPENAPELIEYDII QAITCEEYAKKLARYCPVGEKIRAHIAIDTGMTRIGIRAKDIDKCADEVERIVRTERIG VEGMFTHLAVADSEEATDKTYTDNQIETLMSLKKMLNKRLVVLEQVHFLNSAGSAYHFD ERSSLARVGIMLYGLSPNPEVKLPFELEPVMELKACVSQVK" /locus_tag="LOCUS_1810" /note="WP_009893196.1 serine racemase VanT catalytic subunit (Clostridioides difficile) [pid:34.9%, q_cov:97.3%, s_cov:35.1%, Eval:3.7e-35, partial hit]" /note="internal stop codon at [2276:2278](+)" /note="MGA_218" CDS 2402..2623 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLIKGKRVPVIGRVCMDQLMIDVTDVENVCEGDEVTLIGRDGEDE ITADELAALYGTIGYEIVCGISPRVPRV" /locus_tag="LOCUS_1820" /note="WP_071542276.1 alanine racemase (Moorella thermoacetica) [pid:57.5%, q_cov:100.0%, s_cov:19.6%, Eval:1.0e-18, partial hit]" /note="internal stop codon at [2276:2278](+)" /note="MGA_219" CDS 2812..3291 /product="ribosome maturation factor RimP" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003732818.1" /transl_table=11 /codon_start=1 /translation="MADNSTVAKVRALAEPLCDELGLFLWDVRFEKEGATWYLRVFIDK DGGINMDDCEALHRPLNLLLDEHDPIPQNYIFEVGSCGLARSLTRPEHFEVCIGDEVRI RFIRPHNGEKEIIRTLTGYNKNLIAVSDGETEETIELSETAFVKLYDDGDLFGGL" /locus_tag="LOCUS_1830" /gene="rimP" /note="WP_003732818.1 ribosome maturation factor RimP (Listeria) [pid:37.4%, q_cov:91.2%, s_cov:94.8%, Eval:2.7e-23]" /note="MGA_220" CDS 3344..4390 /product="transcription termination factor NusA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003231912.1" /transl_table=11 /codon_start=1 /translation="MNTKDLFEALKSIQQTSGIGGEELIEKIKQGILKAVKRDYPDTEN VYINIDPEKQKFEMNLLKLVVEEVNDPANEITLDEAKTYHKRIALGQMCEIPLSPATFG RVAASSAKQSIRSDIKQFERDRLVAQYQDKEHELVSATVQKVEPATGNAIVTIGSDEIY FPRNEQIPGEELKAGDIIKVYVVGVINPDKKPSVKVSRTHRDFVRRLFELEVPEIYDGT VEVKAISREAGSRSKIAVVSNNPDVDAIGACIGTRRARITAIVDELGGEKIDIINYSED DAEFIAKALAPAEVINVTLADDGTRSCTVVVPNNQLSLAIGNKGQNAKLAARLTGYKID IVPLNKEQ" /locus_tag="LOCUS_1840" /gene="nusA" /note="WP_003231912.1 transcription termination factor NusA (Bacillus) [pid:43.4%, q_cov:97.4%, s_cov:90.6%, Eval:9.3e-78]" /note="MGA_221" CDS 4391..4672 /product="YlxR family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003388362.1" /transl_table=11 /codon_start=1 /translation="MQKKKIPVRTCLGCGEPKEKKSLIRVVRSPEGEISMDLTGKKSGR GAYICPDANCLKKAKKAKRLEKSFECAIPEEVYEKLEAELLGREEQNG" /locus_tag="LOCUS_1850" /note="WP_003388362.1 YlxR family protein (Clostridium) [pid:60.0%, q_cov:91.4%, s_cov:94.4%, Eval:1.3e-24]" /note="MGA_222" CDS 4665..4988 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MADITGSLTMCRRAGKLVLGMDEVKNACRSKKAMGVIVAKDLSER SLGEIAYTCATEGIKLYRTDCTMDDIGYALGKVYGIMAVTDAGFMKSMAKKSQELDAES IGY" /locus_tag="LOCUS_1860" /note="MGA_223" ORIGIN 1 aacattttga atgtttgaaa cgagcgcgga tgagtttgta tagcaagcgg aattgatgag 61 gcatacggca atttcgcctg taacgctatt ctgatccttt gctccgtttt cgtaaagagg 121 ataattgatg atcttgttaa tgtcgtcgcc ccagagggtt ctggttgcgg ggccgtggga 181 gaagctggtc agcgagccac tgacctcgtc cttataataa aggtcgtggg ggaagacata 241 tgtgctggtg ccgcccaaat attcaacaag ccttgtccag ccctcgttat ttatcttgat 301 atatttctcg ggggtgatgc cgaaggcatc ttcaatgccc ttgtaaagat atgtaaaacc 361 gcctgcttcg aaaagctgtg caagtgtgcc gcctgtatct ccgaccgttg cgagagtctg 421 gggagatatg ggtaccacct tgacggtgag cgtgtcgggc agaattcgca aaagagccat 481 actgttaatt gtttcgccct cggcgcagac aaacaaagcg gttcttcttg ccgaagcata 541 gtcattttca ttgtcaacaa cagtttgctg cgaattttcc ttctgattaa gcttgtcttg 601 cttcggttgg gtgacaaatt tatccagcag agccacagcc gcgcttccga aaattacaaa 661 acagatcagc attgtcacaa catatacaat taagacaggc gcttgtgaag catgttttct 721 tgacatggtt aactccttga tgtaaaatag atacggaaat atcagaatat gatagaagtc 781 tggtcgggta gttctttgtt tttgagcccc agatcttttt tgagggcttt aagatttaca 841 gttttaatat caattccctt tgatcttgca taatcaacgg tatatgccga gccgccttcg 901 cgggttgcaa ccgcggcgat caatagggat gaattatcca ccatataacg gttgcgggca 961 taaaaacagc ccgaataata atcatcgctg atgctgatga cctcgtttgc cgagtgcaaa 1021 agatttgtga agcggaaggt tgaatagtgg tcgtcataat ggcctgactg gtttttgaag 1081 ggcaacaccg ccaccaagcg cacattcata tatacatcgc gcagtttttc aacggcttcg 1141 cctgccaaaa ggtcgattcc gtcggccatg ccggtgatga aggtgcggta tccgcgatgg 1201 tatgcttcgt agatctcaag atatatcgag ctgaaaacga ttccgcggtt gacatcggaa 1261 aacttgatgt caaagggtat gccctcgggg cggtgacctg taaaacaagc ggttgttttg 1321 ggatcattta acagctccga ttggctggga tttaaatata tcacttgttc ttcggcgcct 1381 ccttcgggag aattttcaca acacatcgaa tatatattat aagaatatca catcgggctc 1441 aatttttcaa gcccattgag ttacattaaa ggacggaggg accctcttgc aaaaaaagct 1501 ccttaaaaga gcgtgggcag tgacccacac ggacagactt aaaagaaata tagagaaact 1561 caaggcatat ttcggcgaaa aaaccgagct tatgtgcgtt gttaaagcaa attgttatgg 1621 ccacggaatt gaaaagctga ttccatgtat gcaggacgag tgcgatatca actggtttgc 1681 ggtttcaaat ttggttgaag cccaggaatt gagagatttg ggagttaccg gggagatact 1741 cattttgggc tataccccgc cggaaaatgc ccccgaactg atcgaatatg acattattca 1801 ggcgatcacc tgcgaggaat atgccaaaaa actggcaaga tattgccccg ttggcgaaaa 1861 gatcagagcg cacattgcaa ttgacacagg tatgaccaga atcggaataa gagcgaagga 1921 tattgataag tgcgccgacg aggttgaaag aattgtacgc accgagcgaa ttggtgttga 1981 gggaatgttt acccaccttg cggttgccga cagcgaggaa gcaaccgaca agacatatac 2041 agacaaccag atcgaaactc tgatgagcct taaaaagatg ctcaacaaac ggcttgttgt 2101 gctggaacag gtgcattttc tcaactctgc aggttcggca tatcactttg atgagcgttc 2161 aagcctggcg cgtgtgggaa ttatgctcta tggcctcagc cccaaccctg aagttaaatt 2221 gcccttcgag cttgagcctg taatggagct taaagcctgc gtatcgcagg tcaaataggt 2281 tgaagcgggg gtcgatgtca gctacggcag gacatatacc accgacaaga ccacaaaaat 2341 cgctgttgta accatcggct atgccgacgg atatccgagg cttttgtcgg gcaaggcgag 2401 cgtgctcatt aaaggcaagc gtgtgcccgt tatcggcagg gtgtgtatgg accagttgat 2461 gatcgatgtg acagatgttg aaaacgtctg cgagggcgac gaggtaacct tgatcggtcg 2521 agacggcgag gacgagataa ctgccgatga gcttgccgct ctttacggca ccatcggata 2581 tgagatagtc tgcggaatct ctccgagagt gcccagggtg tgatgctgcg gaacggtaaa 2641 atggcgcaaa accgccgttt ttgcgcaaaa acaggggaac ttttttcaaa aaaacccttg 2701 cattttcaaa aaagcgtgtt atactattta tagaatattg tattaagaaa ggctggaatt 2761 aaaaactccc gccttttgtg tttagttgga agatttttaa ggaggataat aatggctgac 2821 aattcaactg ttgcaaaggt cagagctctg gccgagcctc tttgcgatga gctgggctta 2881 ttcctgtggg atgtccgatt tgaaaaagag ggcgccacat ggtatttgag agtattcatc 2941 gacaaggacg gcggaatcaa tatggacgac tgcgaagcgc tccatcgccc gcttaacctt 3001 ttgcttgacg agcatgaccc cattccccag aactatattt tcgaggttgg ctcctgcgga 3061 cttgcaagaa gccttacccg ccccgaacac tttgaggtct gcataggcga cgaggtcaga 3121 atccgattta tccgtcccca caacggcgaa aaggaaatta tccgcacgct gacgggatat 3181 aacaaaaact taattgccgt ttcggacggc gagaccgaag aaaccattga gctgagtgag 3241 accgcttttg tcaaattgta tgacgacggc gacctgttcg gcggtttata atataagtca 3301 tttaaattca aactgaatat acagaaagga ttggtcacaa aacatgaaca ccaaggattt 3361 atttgaagcg cttaaaagca ttcagcaaac aagcggaatc ggaggcgagg agcttattga 3421 aaaaattaag cagggcatcc tcaaggccgt aaagagggat tatcccgaca ccgaaaatgt 3481 ctacatcaac attgaccccg aaaagcagaa gtttgaaatg aacctgctca agctggtcgt 3541 tgaggaggtc aatgaccccg caaacgaaat tactcttgac gaagcaaaaa cttatcacaa 3601 gagaatcgct ttgggccaga tgtgtgaaat tccgctttct cccgcaacat tcggcagagt 3661 tgccgcatca agcgcaaagc agtcgattcg cagcgacatt aagcagtttg agcgcgacag 3721 attggttgca cagtatcagg ataaggaaca cgagcttgtt tccgcaaccg ttcaaaaggt 3781 tgaacctgca acaggcaacg cgatcgtaac catcggatcg gacgaaattt atttccccag 3841 aaacgaacag attcccggcg aagagctcaa agccggcgat atcatcaagg tttatgttgt 3901 gggtgttatc aaccccgaca agaagcccag cgttaaggtc agccgtaccc acagagattt 3961 tgtaagacgt cttttcgagc ttgaagttcc cgaaatttat gacggcaccg ttgaggtgaa 4021 ggcgatctcc cgcgaggcag gctcaagaag caagatcgca gttgtttcca acaaccccga 4081 tgttgacgct atcggcgctt gcatcggcac aagacgcgca agaatcaccg ccattgttga 4141 tgaattgggc ggcgaaaaga tcgacattat caactatagc gaggacgatg ccgaattcat 4201 cgcaaaggct ttggctcccg ctgaagtaat taacgttaca cttgccgacg acggcaccag 4261 aagctgcacc gttgttgttc ccaacaacca gctttctctt gcaatcggca acaagggaca 4321 aaacgcaaag cttgcagccc gtttgaccgg ctacaagatc gacattgttc cccttaacaa 4381 ggagcagtaa atgcaaaaga aaaagatacc cgtcagaacc tgtcttggct gcggtgagcc 4441 gaaggagaaa aaatctctca tccgcgtggt gcgttcaccc gagggagaga tatcaatgga 4501 cttaacgggc aagaaatcgg gaagaggcgc atatatctgt cccgatgcaa actgcttgaa 4561 gaaagcgaaa aaagccaaga ggcttgaaaa aagcttcgaa tgtgcgatcc ccgaagaagt 4621 ttatgaaaag cttgaagcag agcttttggg aagggaagag caaaatggct gatataacag 4681 gaagccttac catgtgcaga cgagcgggca agcttgtttt gggtatggat gaggttaaaa 4741 acgcctgccg ctcgaaaaaa gcgatggggg ttattgttgc caaggatttg agcgagcgaa 4801 gcctcggaga aattgcatat acatgtgcaa ccgaaggaat aaagctctat cgcaccgact 4861 gcacgatgga tgacatcggc tatgcgctcg gaaaggtata cggcattatg gctgtgaccg 4921 atgcgggatt tatgaagtcc atggcaaaaa aatcgcagga gctggatgct gagagtatcg 4981 gctactgatt ggaattaagg agatatgcct atgattacta aatataagtt aaacgattta 5041 gctaaagact taaagcttaa cgccaacgat attattgagt gcttggctca tcagtatggc 5101 gcgaagaaaa cggtttcatc cctcacaccc gaggaagtga actacgtttt ggaggtcttc 5161 tcccagaagc accaggttga aaacttcaac gcatacttcg ctgataagac cgccaccaag 5221 aaggctaagg aagaacccaa ggctgaaaag cccaagaagg aagctcccaa ggctgagcct 5281 aagaaggaag aacctaaaaa ggaagctccc aaggctgaag ttaaaaagga acagcccaaa 5341 aaggaggctc ctaagcccga ggttaagaag gaagaaccca cg // LOCUS sequence029 5371 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence029 VERSION sequence029 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5371 /mol_type="genomic DNA" /organism="" /note="sequence029" CDS complement(244..402) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MWPTIIVGAIVAAIFIAVIVKMIKDKKAGKSSCSCGCAGCPMSGS CHNKNNK" /locus_tag="LOCUS_1870" /note="MGA_225" CDS complement(416..2575) /product="ferrous iron transport protein B" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011460242.1" /transl_table=11 /codon_start=1 /translation="MDIKIALAGNPNCGKTTLFNALTGSNQYVGNWPGVTVEHKEGKYK KQDGVIITDLPGIYSLSPYTLEEVVARNYLIGERPDAILNIVDGTNLERNLYLTTQLTE LGIPVVVAINMMDVVRKNGDKINTEALSKKLGCKIVEISALKGTGIEEAAEAAIEAANE HKVFVPMHNFSGAVEHALAHIEEAAIHELPADQQRWYAIKIFERDEKVLSAFKLDEKTV AHIEEDIVAAEAEMDDDAESIITNERYNYIASILKGVYIKKNSSRLSTSDKVDLVLTNR WLAIPIFVLVMFFVYYISIGSIGDWTVGFMNDTLFGGIIVPGVASFLENIGCASWLVSL VADGIVGGIGAVLGFVPQMMILFFLLSILEDVGYMSRVAFILDKVFRKFGLSGKSFIPM LVASGCGVPGIMASRTIDQDRDRKMTIMTTGFIPCSAKTPIIGMIAGALFGGSPLIATA AYFIGIGAVIISGIMLKKSKPFAGNPAPFVMELPQYHAPVMSNILRSTWDRGWGFIKRA GTVILAASVIIWILNSLSFDGGLHFIAEGMESNSILNVIGSAIAVIFKPLGFGGWQAAV ATILGLVAKEEVVGVFGSLSSMANADIAFEAVESADSVKLAIIAQEFFGGSKLAGFSFM IFNLLCAPCFAAMGAIKREMNNWKWTAFAIGYMSVFAYAVSLITYQLGMFIATGLFTFW TAVAFAVLALMLYFIFRKDKNALNH" /locus_tag="LOCUS_1880" /gene="feoB" /note="WP_011460242.1 ferrous iron transport protein B (Desulfitobacterium hafniense) [pid:58.8%, q_cov:98.9%, s_cov:97.9%, Eval:3.6e-240]" /note="MGA_226" CDS complement(2639..2860) /product="FeoA family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011460243.1" /transl_table=11 /codon_start=1 /translation="MKTLKDIKIGKTCRVVKLHGEGAIKRRIMDMGITKGVEIYVRKVA PLGDPIEINLRGYELSLRKADADMIEVE" /locus_tag="LOCUS_1890" /note="WP_011460243.1 FeoA family protein (Desulfitobacterium) [pid:75.3%, q_cov:100.0%, s_cov:100.0%, Eval:4.7e-27]" /note="MGA_227" CDS 3138..3506 /product="metal-dependent transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005811011.1" /transl_table=11 /codon_start=1 /translation="MTLQESGEMYLETIYVLTKEKGAGVRAVDVSEHMGYSKPSVSRAV GLLKQGGYLETDKDGLLILTDIGRAVAEKTYERHSVLTEFFKAIGVDADVASLDACKVE HCISDDTFEAIKNHLSKI" /locus_tag="LOCUS_1900" /note="WP_005811011.1 metal-dependent transcriptional regulator (Desulfitobacterium) [pid:53.4%, q_cov:95.1%, s_cov:91.3%, Eval:3.3e-33]" /note="MGA_228" CDS complement(3550..3861) /product="thioredoxin" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_007329897.1" /transl_table=11 /codon_start=1 /translation="MAVIVINKDNFETEVLKSDKPVVLDFWATWCGPCRMVSPIVDEIA EERDDIKVGKINVDDDGELANQFGVNAIPTIVKIENGEVKATSIGYKEKAALIEALGL" /locus_tag="LOCUS_1910" /gene="trxA" /note="WP_007329897.1 thioredoxin (Rhodopirellula) [pid:53.0%, q_cov:97.1%, s_cov:92.6%, Eval:1.7e-29]" /note="MGA_229" CDS complement(3985..4254) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MQMRSKTAINEPPPAELSPPPSPVAEASAMSIQHHHQPPQEMRNG DIFSNLLGGIGIGTDKLLILLVLFILYKNKADIKLLIALAYLML" /locus_tag="LOCUS_1920" /note="MGA_230" CDS complement(4301..4654) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEDLAGKLTALLQDEESLKQIQELAEMMGLSSPSESPPLPQQVGE IPDIGQIMGLVNLLQEAKTDDENICFLNALRPLLGEERRPRVDKAVKLLRLLNMLPAIK ESGILGGDLFGIF" /locus_tag="LOCUS_1930" /note="MGA_231" CDS complement(4691..4927) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNLSKEQLDALIGTVSQKSGISKEQLQSELQKGTFDSLLSTLPAG EAQKLTAALANPATAGILLNTPQAKELIKKLFG" /locus_tag="LOCUS_1940" /note="MGA_232" ORIGIN 1 cggatttaat cccgacgcaa agggtgaggt atctcacgca ttccgcagga tgcgtgggaa 61 gtgcgccgcg cgcccacggc aaactcagga agcctgcgcc gaatggccct ctgtcagttt 121 tgttgccacc tttcccgaag ggaaaggctt ctccatatgc ctcatttcac gcggcacccg 181 caaaagccct cccgccccga cttgggatca gtgtcggagc gggagggcgt atttacaggt 241 gcgttatttg ttgtttttat tgtggcagga accgctcatc gggcagcctg cgcatccgca 301 ggagcaggag cttttgcctg cctttttgtc tttgatcatt ttaacgatta ccgcaatgaa 361 gatagcggca acgatcgcac caacaataat tgtcggccac atttttcatt cctccttagt 421 gattgagggc atttttgtct tttctgaaga tgaagtatag cataagtgca agcaccgcga 481 atgcaactgc agtccagaat gtgaataaac cggttgcaat gaacataccc agctgatatg 541 tgatcagcga tactgcatat gcgaatacgc tcatatatcc gattgcaaac gctgtccact 601 tccagttgtt catttctctc ttaattgcac ccattgctgc gaagcaggga gcacacaaaa 661 ggttgaagat cataaagctg aagcctgcaa gcttgcttcc gccgaagaat tcctgagcga 721 taattgcgag cttaacagag tctgccgatt caacagcctc aaatgcaatg tcagcatttg 781 ccattgacga aagcgaaccg aatacgccca caacctcttc ctttgcaacg agtccgagta 841 ttgttgcaac cgccgcctgc caaccgccaa agcccaaagg cttaaagatt acagcgattg 901 ccgagccgat aacattgaga atagagttgc tttccatacc ttctgcgatg aagtgaaggc 961 ctccatcaaa ggaaaggctg ttgagtatcc aaatgataac gcttgcagcg aggatcacag 1021 tacctgcgcg cttgatgaag ccccagcctc ggtcccaagt ggagcgcaaa atgttggaca 1081 ttacaggcgc atggtactga ggaagctcca taacaaaggg cgcgggatta cctgcaaaag 1141 gtttggattt cttgagcata atgcccgaga taattactgc accgataccg atgaagtatg 1201 ccgcagttgc aatcaagggg cttccgccaa agagggcacc tgcaatcata ccgatgatag 1261 gtgtttttgc agagcaagga ataaatcctg tggtcataat ggtcattttt ctgtcgcggt 1321 cctggtcgat ggtgcgggat gccataattc cggggacacc gcagcctgaa gctacaagca 1381 tcggaatgaa gctcttgccc gaaagaccga acttgcggaa gaccttatca agaataaatg 1441 caactcttga catatatccc acgtcctcaa gaatcgagag caggaagaaa agaatcatca 1501 tttgaggaac gaagcctaaa accgctccga taccgccgac gataccgtct gcaaccaggc 1561 taacgagcca actcgcgcat ccgatgtttt caaggaagct tgcaacgccg ggaacgataa 1621 ttccgccgaa gagggtgtcg ttcataaatc caactgtcca atcgccgatc gaaccgatgg 1681 aaatataata aacgaagaac attaccagaa cgaaaatggg aattgcaagc cagcggttgg 1741 tcaaaacaag gtcaaccttg tctgatgttg aaagtcttga actgtttttc tttatgtaaa 1801 cgcccttgag aatcgaggca atatagttat atctctcgtt ggtgatgatc gattctgcat 1861 cgtcatccat ctctgcttct gccgcaacga tgtcttcctc gatgtgtgca accgtcttct 1921 catccagctt gaatgccgaa agaacctttt cgtcgcgctc aaatatcttg attgcatacc 1981 atctctgctg atctgcggga agctcgtgaa tagcagcctc ctcaatgtga gctaaagcgt 2041 gttcaaccgc accgctgaag ttgtgcatag gtacaaatac cttatgctcg ttagcagctt 2101 caatcgccgc ttctgcagcc tcctcaatgc ctgtgccttt gagagccgat atctcaacga 2161 tcttacagcc gagcttcttt gaaagtgcct cggtgttgat cttgtcgccg ttctttctga 2221 caacgtccat catgttgatt gcaacaacaa cgggaattcc cagttcggtg agctgagttg 2281 taaggtatag gttgcgttca aggtttgtgc cgtcaacaat attgagaatt gcgtcgggac 2341 gctcaccaat gagatagttt ctcgcaacga cctcttcaag ggtgtagggc gagagggaat 2401 agatgccggg aaggtcggta atgataacgc cgtcctgctt cttatatttg ccttccttat 2461 gttcaactgt tacgcccggc cagttgccga cgtactgatt cgagcctgtg agtgcattga 2521 aaagagtggt cttgccacag ttcgggttgc ccgcaagggc gattttaatg tccattctgt 2581 ttcctccatt agttagcata cactaactgt tgtctatgaa aatcgggcgt cacccgaatt 2641 attcaacctc gatcatatca gcgtcagcct tacgcaatga aagctcatag ccacgcaggt 2701 taatttcaat cgggtcgccc aaaggagcaa cttttctgac gtatatctca acgccctttg 2761 taatgcccat atccataatt ctgcgcttaa ttgcgccttc accgtggagc ttgacgacac 2821 ggcaggtctt gccgatctta atatctttga gagtcttcat actaatcctc cgaaataagt 2881 cgatatgcgt gcaaagcatc gagttagcct cggctaacta aatagaattt tacaactttg 2941 tcttggtttt gtcaatcatt ttgacgaaaa aaggacaggc tttttgtcaa atttgtatgt 3001 ttgctgacgg gttagccaaa gctaactcgc ctttttgtgc aaaacatcca aattgcacgg 3061 aaaaatcttc acttgaaaaa ccacggcctt tgtggtatca ttataatata ttatcggcaa 3121 aggaggctca tacaaaaatg acattgcagg aatcaggcga gatgtatctt gaaaccatat 3181 atgttcttac aaaggaaaag ggcgccggtg tccgcgcagt tgatgtcagc gagcatatgg 3241 gctattccaa accaagcgtc agccgtgcag tcgggctttt aaagcagggc ggatatcttg 3301 aaacagataa agacggtttg ctgattttaa ctgacatcgg cagagccgtc gccgaaaaga 3361 cctatgagcg ccacagcgtt ttaaccgaat tcttcaaagc catcggtgtc gacgccgatg 3421 tggcatcctt agatgcctgc aaggttgagc attgtatttc ggatgacacc ttcgaggcga 3481 tcaaaaatca tttgagcaag atataaaaaa gacccaccgt ttatagcggt gggttttctt 3541 ttgtttaaat caaagaccaa gagcttcaat cagcgcagcc ttttctttat atccgatgct 3601 ggttgccttt acctcgccgt tttcaatctt gacgatggtg ggaattgcgt taacgccgaa 3661 ctgatttgca agctcgccgt catcatcaac gtttatcttg ccgaccttga tgtcgtcgcg 3721 ctcctcggcg atctcgtcca caatagggga taccattctg caggggccgc accatgttgc 3781 ccagaaatcg agaacaacgg gcttgtcgct cttcaaaact tcggtttcaa agttgtcttt 3841 atttattaca ataaccgcca tacttttaac ttcctttcga tttatatatt cttttagtat 3901 ctttttaaaa ttaggaatta ttcctatatt taaattataa catatttcca aaaaatgtca 3961 acccctgccg aaaacggcaa gggtctaaag catcagatat gccaaggcga tcaaaagctt 4021 gatatccgcc ttgtttttat atagtatgaa cagcactaaa agtataagta gcttatctgt 4081 cccgatgccg attcccccga ggagatttga aaatatatcg ccgtttctca tttcctgcgg 4141 tggctgatgg tgatgttgaa tcgacatagc acttgcttca gccacgggag agggcggcgg 4201 gctgagttct gcgggcggcg gctcattgat tgcggttttt gagcgcattt gcatctgccg 4261 aagcctttcc attgcttcaa gttgcatctt tgaaaattcc tcagaatatt ccaaacagat 4321 cccctcccaa aatacccgat tctttaattg caggaagcat atttaacagt cgcaaaagct 4381 taaccgcttt atcgacacgc ggtcgccttt cctctcccaa aagcggccgc agagcattta 4441 aaaagcagat gttttcgtca tctgtctttg cttcctgcaa cagattcacc agccccataa 4501 tttgcccaat gtcgggaatt tctccgacct gttgaggcaa tggcgggctt tcggaaggcg 4561 atgaaagacc catcatttct gccagctctt gaatctgttt aaggctttct tcatcctgaa 4621 gaagagctgt gagcttccct gcaaggtctt ccatatgtaa tatcaccctc cttccgaatc 4681 acatcgacaa tcagccgaac agctttttaa tcagttcttt tgcctgcggc gtattgagca 4741 aaatgcctgc cgttgcggga tttgccagcg ccgccgtaag cttttgggct tcccctgcag 4801 gaagtgttga gagcaggctg tcaaaggtgc ctttttgaag ctcgctttga agctgttcct 4861 ttgaaattcc tgatttttgt gaaactgtgc cgatgagcgc atccagctgt tcttttgaaa 4921 ggttcataac tatgcctccg aatttatcta ttgaaaaaga tttaaaggta tgctaaaatg 4981 tagtagtatt tatagcccaa agggggaaac cgtttgaaga taattgcatt ttccgataca 5041 caccgtaggt ttgagcgggt tgaaaagctt tttgaaaaga cacatcttta tgcggacgcc 5101 tattgctttg cgggcgacgg acttgacgat gtggagaata tgttttatct ttatcccacc 5161 aagcctatcc atcaggttgc gggaaattgc gattggggcg caatggaaaa gttcatcgac 5221 gttttcgagg tcgagggaca taagatcctt ctcacccacg gtcatcttca aaacgcgaag 5281 tatggctccg acggactttt gagagccgcc cgcgacaacg gttgtgacct tgtaatcttc 5341 ggtcataccc atgagaagct ctgcgagtat c // LOCUS sequence030 5369 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence030 VERSION sequence030 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5369 /mol_type="genomic DNA" /organism="" /note="sequence030" misc_feature <1..900 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010965428.1:UDP-N-acetylmuramoyl-L-alanyl-D-glutamate--2 ,6-diaminopimelate ligase" /note="WP_010965428.1 UDP-N-acetylmuramoyl-L-alanyl-D-glutamate--2,6-diaminopimel ate ligase (Clostridium) [pid:46.6%, q_cov:99.0%, s_cov:61.2%, Eval:7.4e-70, partial hit]" /note="MGA_234" /locus_tag="LOCUS_1950" CDS 925..1947 /product="phospho-N-acetylmuramoyl-pentapeptide-transferase " /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003232192.1" /transl_table=11 /codon_start=1 /translation="MPYWINLTVGLLSLIIAAAFGLILIPYLRKLKAGSHILEIGPAWH KSKEGTPLMGGFMFILSVVLSMVAGFFIISAVKQANGIALDPKAGLKLLSAIGFSLGLT AVGFIDDYIKVVKKRNMGFNVKAKTICQALVVALYMIAQHLLGEMTTEVVFPIFGAVDF GFFYYPIMAVAIYFMVNAVNFTDGVDGLCGSVTTVYSVAFAIIFVVLGNWEFSALSMAV AGGCLGFLVWNLHPAKVFMGDTGSMFLGGITVALGFASGLELLIPLVGIIYVCEAMSDV IQIASYKIRKKRVFKMAPIHHHFEMCGWSEYKIVIIFSAVTLVAGFLGILSAVLYSAGK " /locus_tag="LOCUS_1960" /gene="mraY" /EC_number="2.7.8.13" /note="WP_003232192.1 phospho-N-acetylmuramoyl-pentapeptide-transferase (Bacillus) [pid:39.6%, q_cov:92.9%, s_cov:93.8%, Eval:3.4e-61]" /note="MGA_235" CDS 1987..3249 /product="stage V sporulation protein E" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003244810.1" /transl_table=11 /codon_start=1 /translation="MANSAAKKRYNFILSAESPTKENGKKLPVQETVEPQNGKKPKEKE PGLRLYDGPLDTVFFIIIIVLLVCGIVMMFSASYIEGLSKGDGYMYVRTQCFAAVVGVL LMVFISFWDYHILMNSKIVISAFVVLLGLLTYTTFFGDAEYGARRWIYIGNQSIQPSEM MKPVLIVFLAYIMVKKAGNFKSFRKDVFPLIVVMGLVCINMVFQRHISGLLLMGVIGLV VIFVGGMPWKQFMQLIAVIAVAAVVAILLYSMLTGGGLSYILDRIKSMGQADEEINDDT WQTAQSLIAIGSGGWFGLGFGESRQKYLWLPESQNDFIISIIVEELGYLGGLVVVLLFG LFIYRGFHIARKAPDRFGMLIVMGIIFQLGTQAILNIGVACNAFPNTGISLPFFSSGGT ALLIQLAEMGVVLAVSRQSEV" /locus_tag="LOCUS_1970" /gene="spoVE" /note="WP_003244810.1 stage V sporulation protein E (Bacillus) [pid:33.2%, q_cov:86.4%, s_cov:97.3%, Eval:1.1e-46]" /note="MGA_236" CDS 3362..4498 /product="undecaprenyldiphospho-muramoylpentapeptide beta-N-acetylglucosaminyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003232184.1" /transl_table=11 /codon_start=1 /translation="MLKVILAGGGTAGHVNPALAISEIIKESYPDAKFLYVGTPNGIER ELVRKAGLDFAPMEVAGFQRKINMTNLKRNVKAAMYLLKSPKRAKAIINEFKPDLVIGT GGYVSGPIVMQAAKMGIKTCIHEQNAFPGVTTKLLSKKVDKVMLTVEKANDYLDCDKSK CVVTGLPVRSGFAKKKIGKSEARRQLGFDDSVTILSTGGSLGAGIINETVSDLIAWYEQ KGVKVNHIHSFGMNGRQSFLKSLVDKGVNLAERPNYIVKEYIDNMSVCMEAADLIISRC GAGALTEIEAVGCGSVLIPSPIVAENHQYHNGMVLANAGAAILYEQKNMTSQVLIDTVS GLLNEPARLEELSRNAASLYISDTNSRIAEVIAEVLKK" /locus_tag="LOCUS_1980" /gene="murG" /EC_number="2.4.1.227" /note="WP_003232184.1 undecaprenyldiphospho-muramoylpentapeptide beta-N-acetylglucosaminyltransferase (Bacillus) [pid:38.0%, q_cov:99.5%, s_cov:100.0%, Eval:7.0e-66]" /note="MGA_237" ORIGIN 1 caaaagcgcc ttgagggaat caagttcgag ctgggcgtat ttacaaacct cactcaagac 61 cacttagatg tccacggcac gatggaaaac tactatcagg cgaaaaagct cctctttgaa 121 aagagcaagc aggcacttat aaataccgac agcgactggg gcaagcgcct gtttaatgaa 181 ataacctgcc cgaaaaagag cttttcaatt atagataaag ccgattatac tgctgacgga 241 atcaagcttc tgccccattg ctccagctac tggtattcaa acggcgaaaa gacctttaaa 301 gcggctgtga gacttcccgg aatgtacaac gtttccaaca cccttgctgt tttggcatcc 361 ctcgagcttt tgggccagtc gcccaacatc tgtgtgccct tcatctcggc tgttcaaggc 421 gttcgcggca gatgcgaagt tgttgatacc gacagagatt tctccgttgt actcgactat 481 gcccacaccc ccgatgccat tgaaaacatc ctcaaaaacg tcggtgaatg cgctacgggc 541 agagttgtct gcctgttcgg ctgcggcgga aaccgcgacg caaaaaagcg ccccttaatg 601 gcgcaggcag cggcaaaata tgccgacttc ttggttatca cctccgataa tccccgaaac 661 gaagacccga atgcaatcat ctctgaaatc gttgggggac ttcccgaaga ttacaatagc 721 tacgttgcaa ttgaaaaccg ccgtgatgcc atcttctggg caatcaaaaa cgcgaaacca 781 aatgatgtta ttgtcttggc gggcaaggga catgaggact atcaggttct taaagacaat 841 gttaaaattc acttcgacga gcgcgaagtg gtgaaggaag ctctttgtga gcttaaataa 901 acacacaaag gaacggaaat taaaatgcct tattggataa atttaactgt aggacttttg 961 tccttgataa ttgctgcggc tttcggactt attctgattc catatcttcg caagcttaaa 1021 gcaggctcac atattcttga aataggtcct gcgtggcata aatccaaaga gggcacacct 1081 ttaatgggcg gttttatgtt cattttatcg gttgtgcttt caatggttgc aggctttttc 1141 attatttctg ctgtcaagca ggcaaacggc attgccctcg atcccaaggc gggcttaaag 1201 cttttgtcgg caatcggctt ttcgctgggc ttaactgctg tcggctttat tgatgactac 1261 ataaaggtcg ttaaaaagcg caatatgggc tttaacgtca aggcaaagac catctgtcag 1321 gcacttgttg ttgcgctcta tatgattgca cagcaccttt tgggcgagat gacaaccgaa 1381 gttgttttcc cgatcttcgg tgctgttgat ttcggctttt tctattatcc cataatggca 1441 gttgcaatct attttatggt caatgctgtc aacttcaccg acggtgttga cggcctttgc 1501 ggctcggtga caactgtata ttccgtcgca tttgcaatca tctttgttgt tttgggcaac 1561 tgggaattct cggcactttc aatggctgtt gcgggcggat gcttaggctt tttggtctgg 1621 aatttgcacc ccgcaaaggt atttatgggc gataccggtt caatgttttt gggcggtatc 1681 actgtggcac tcggctttgc atcgggactt gagctgctca ttccccttgt tggcataatc 1741 tatgtctgcg aagcaatgag cgatgtcatt cagatcgcgt cctataagat aagaaaaaag 1801 agagtattta aaatggctcc gatccaccac cactttgaaa tgtgcggctg gagcgaatat 1861 aaaattgtaa tcattttcag cgctgtgacc ttggttgcag gcttcttggg aattttgagc 1921 gcagtgctct attccgcagg caaataaacg caaaataaaa acaaacaaaa cgggagggcg 1981 aacgatatgg caaattctgc ggcaaagaaa agatataatt tcatattgag cgccgaatct 2041 cccacaaagg aaaacggcaa aaaactgcct gtgcaggaaa ccgtcgaacc ccaaaatggc 2101 aaaaaaccga aggaaaagga gccgggcttg cgcttatatg acggtccgct tgatacagta 2161 ttcttcatta tcatcattgt gcttttggtc tgcggcattg ttatgatgtt ctcagcatca 2221 tacattgaag gtctttcaaa aggcgacggc tatatgtacg tccgtacaca gtgcttcgcg 2281 gcagttgtcg gcgttttgtt aatggtcttc atctctttct gggattacca cattttgatg 2341 aactcaaaaa tcgtaatttc ggcgtttgtt gttcttttgg gattactaac atatacaacc 2401 ttcttcggtg atgccgaata tggcgcaaga agatggatat atatcggcaa ccagtcgatt 2461 cagccgtccg agatgatgaa gcctgttttg atcgtatttt tggcatacat catggttaaa 2521 aaggcgggta acttcaaatc attccgcaag gatgtattcc cgctgatcgt tgtaatggga 2581 cttgtctgca taaacatggt cttccagcgc cacatttcgg gacttcttct gatgggtgtc 2641 atcggactcg ttgtcatttt cgtcggcgga atgccttgga agcagtttat gcagcttatt 2701 gctgtcattg cagttgcggc agttgttgca attttgctct attcaatgtt aacgggcggc 2761 ggactatcat acattcttga ccgaatcaag agtatgggtc aggcagacga ggaaatcaac 2821 gacgacacat ggcagacggc gcagtcgtta attgcgatcg gctcgggcgg atggtttggc 2881 cttggcttcg gcgaatcaag acagaaatat ctttggcttc ccgaatcgca gaacgacttc 2941 attatttcaa tcatcgtcga agaacttggc tatctcggcg gactcgtcgt tgttttgctc 3001 ttcggtctgt tcatctatcg cggattccat attgcgcgaa aagctcccga tcgctttgga 3061 atgctcattg ttatgggcat aatcttccag ctcggaacgc aggcgatttt gaacatcggc 3121 gttgcctgca atgctttccc gaatacgggt atctcgctcc cgttcttcag ctcgggcgga 3181 acggctttgt tgattcagct tgccgaaatg ggcgtagtgc tggcggtatc ccgtcagagc 3241 gaggtttaaa acgttgtaac ccaatcgtca ccatttttta accgcaattt aattgacccc 3301 gactcatcgg gacgttacaa tattggcata atcttacata taataaggag catcaaaata 3361 tatgcttaaa gttattcttg caggcggcgg caccgcagga cacgtcaatc ccgctttggc 3421 aatctccgaa ataatcaaag aatcctaccc cgacgcgaag tttctatatg tcggcacacc 3481 caacggcatc gagcgtgagc ttgtccgcaa ggcaggactc gacttcgcac ctatggaggt 3541 tgcgggcttc cagagaaaga taaatatgac caaccttaag cgcaatgtca aggcggcgat 3601 gtatcttttg aaatcgccca agcgcgcaaa ggcaataatc aacgagttta agcccgacct 3661 tgtaatcggt acaggcggat atgtcagtgg ccctatagtt atgcaggcgg caaaaatggg 3721 cattaaaacc tgcattcacg aacagaacgc tttcccggga gtcacaacca agctcctttc 3781 aaagaaggtc gacaaggtta tgctcaccgt tgaaaaggca aatgactatc tcgactgcga 3841 taaatcaaag tgcgtcgtaa caggtctgcc tgttcgttcc ggctttgcta aaaagaagat 3901 aggtaagagt gaagcccgcc gtcagcttgg ctttgatgac agtgtcacca ttctttcaac 3961 gggcggaagc ttgggcgcgg gtataatcaa cgaaactgta agcgacctta tcgcctggta 4021 tgagcaaaag ggcgtcaaag tcaaccatat ccactccttc ggtatgaacg gcagacagag 4081 tttccttaaa agtcttgtcg ataagggagt taaccttgca gaaagaccca actacatagt 4141 taaagaatat atcgacaata tgtccgtatg tatggaagcg gcagacctca ttatcagccg 4201 ttgcggtgcg ggcgcactaa cagaaatcga agctgtcggc tgtggctctg tattgattcc 4261 ttctccaatc gttgccgaaa accaccagta ccacaacggt atggtattgg caaacgcagg 4321 tgccgcaatt ttgtatgaac aaaagaatat gacctcgcag gtgcttattg acaccgtcag 4381 cggactttta aacgagcctg cacgcttgga agagctttcc cgcaatgccg catctttata 4441 tatttccgac accaactcaa gaatcgctga ggtaattgcc gaggtgctca aaaagtaacc 4501 aaaaataatg actttcatat tatgctaaca gatagcttaa tgtgggggtc attatatgaa 4561 gagttcaaga cttataattg aaggcgggcg aaggctctcg ggcgagataa aagttacggg 4621 tgcaaaaaac gcctcgcttc cgattcttgc cgcttcgctt ttaacgggcg gcgaaaccgt 4681 tttgtttaac tgcccgtctt tgtcggatgt tttcaccgcc tgccgaattt taactcactt 4741 gggctgtcgg tgcaaacgtg aaaacggcgc attgataatc gactcccgcg atgttttggg 4801 ctatgagatc agcgaggagc tgatgcgaaa aatgcgctcc tcgatcgtat ttctgggggc 4861 ggtattatca aggctcggcc gttgcaggct ttcattcccc ggcggatgcg agctgggcgc 4921 ccgacccatt gatattcacc ttgcctcaat gcggaaaatg ggcgttaaaa tcgaagaatc 4981 ccacggtgtg ctcgattgct ccctcaattc ggggcttaac tcctgcgatg ttgttttgcc 5041 atttcccagc gtcggtgcaa cggaaaacat aatgcttctg gcggctcgct caagtgcgac 5101 cgtcaccata atcaatgccg cgcgcgaacc tgaaatctgc gaccttgaag cttatctcaa 5161 cgcttgcgga gcggatattc acggcgcagg ctcatcgact gtaactgtca agggagtgga 5221 aacgcttcac ccttgcgaat attccgtgat gcccgaccga atcgtagctt ctacatatat 5281 gtccgccgcc gcaatcacct cgggggaagt gatgctgagt gctgtgcggc caaacgatat 5341 gcacgcggtc acagcgctgt ttgaacaga // LOCUS sequence031 5305 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence031 VERSION sequence031 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5305 /mol_type="genomic DNA" /organism="" /note="sequence031" CDS complement(258..1037) /product="Nif3-like dinuclear metal center hexameric protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002852315.1" /transl_table=11 /codon_start=1 /translation="MANLHDIYEYINSVAPFGLQDKFDNSGLIIDSGREEITKVLLALD ATKKVIDEAHNLGCELIITHHPVIFHPLKELDVKYPAPYMFSKGISCISAHTKLYSAEY DISDMMFELLGMTNTGEILSVNRSYEGKPVGYGRFATCECISADDLAKLCKERFNSRAV KYTPGCDRITRVAVCSGAGGSMIYEADVNRFDALVTADVKHDQFLEAELQGKTIIDCGH YETEVIAMPYLYDILSEKFPEVKFFFSAAMSNTIKAI" /locus_tag="LOCUS_1990" /note="WP_002852315.1 Nif3-like dinuclear metal center hexameric protein (Campylobacter) [pid:35.1%, q_cov:86.1%, s_cov:86.7%, Eval:2.6e-25]" /note="MGA_240" CDS complement(1041..1730) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTHSLNTRLLTAAEFVTRGGIACDVGTDHAYLAAYLADNVISEKV IACDIALGPIESAKATVSRMGLEDSITVIQSDGLELIPDEGITDFIICGMGGELILSIL LRADWLKRGVNLVLQPMTRASELREGLYENGFVIKSEKACRDGRFVYSVINAEYRGETR KLTPLQALIGGLDMTKPESLEYASAVCERLSVSSLGKISSNDEATREDGERELDLVHEL MEIINEV" /locus_tag="LOCUS_2000" /note="WP_002263081.1 tRNA (adenine(22)-N(1))-methyltransferase TrmK (Streptococcus mutans) [pid:41.7%, q_cov:67.2%, s_cov:67.2%, Eval:1.9e-21, partial hit]" /note="MGA_241" CDS complement(1749..1946) /product="DUF1858 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964076.1" /transl_table=11 /codon_start=1 /translation="MKITKDSIIGDVLALDSGCGELFLEIGMHCLGCPSATGETIAQAC EIHGADADELVAKLNAYFEN" /locus_tag="LOCUS_2010" /note="WP_010964076.1 DUF1858 domain-containing protein (Clostridium) [pid:50.0%, q_cov:92.3%, s_cov:93.8%, Eval:2.1e-11]" /note="MGA_242" CDS complement(2074..2340) /product="zinc-ribbon domain containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011391912.1" /transl_table=11 /codon_start=1 /translation="MYEDKTLVCRNCGNEFVFTAGEQEFYAEKGFENEPKMCKDCRKKK KEEGKQYFTAVCASCGKEAKVPFKPHDDRPVYCSECFAKQRGE" /locus_tag="LOCUS_2020" /note="WP_011391912.1 zinc-ribbon domain containing protein (Moorella thermoacetica) [pid:45.5%, q_cov:97.7%, s_cov:93.4%, Eval:1.3e-21]" /note="MGA_243" CDS complement(2422..2982) /product="RNA polymerase sporulation sigma factor SigH" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966429.1" /transl_table=11 /codon_start=1 /translation="MATSRYESYTDDELAVLAKSDKDAFDALLNRYLDSLHYAAGSYAV GRKGYIDADDYRSEGVLGLMNAVKHFDPNGDASFATFARVCSSNRMINAYKKSKKVMNF ETNFDGKAVDSVADRSGDISLRELGSAVADVVDNELSKLEANVFLSYLSGMTYKEIAAC LDISEKSVDNALGRVRRKLRDRI" /locus_tag="LOCUS_2030" /gene="sigH" /note="WP_010966429.1 RNA polymerase sporulation sigma factor SigH (Clostridium acetobutylicum) [pid:32.8%, q_cov:95.2%, s_cov:91.0%, Eval:1.4e-17]" /note="MGA_244" CDS complement(3161..4228) /product="cell division protein FtsZ" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003386373.1" /transl_table=11 /codon_start=1 /translation="MGFIMENDGMDLAKIKVVGVGGGGGNALNCIVSTGIQNVEYIAIN TDSQALKNSKATIKIQIGQKLTHGLGAGGKPEVGEGAAQESKEEIQDALKGADMIFITA GMGGGTGTGAAPVVAEIAKDMGILTVAVVTKPFTFEGPRKARAAENGIDRLLKNVDSLV VIPNQKLLTGRENLTMRQSFALADDILKTAVLSVTELILRHGEINVDFADVQSIMKEAG YAHMAIGHGEGKDKVADAVQQVISSPLLETSIKGARRLLLNVVMSEDIGTTDMADLTEQ ITKAAADDVELIFGADFNPDLSDTIDIIVIASDFDTYAAPIEEEEEAPAEEENSETKKG DPFYDNIWKFINNDK" /locus_tag="LOCUS_2040" /gene="ftsZ" /note="WP_003386373.1 cell division protein FtsZ (Clostridium) [pid:52.1%, q_cov:87.3%, s_cov:84.3%, Eval:8.3e-82]" /note="MGA_245" CDS complement(4381..5241) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKDVVKTNPNKNAPKRRRRRRNLSLYYLLMFLFVAAVLFILSRTV LFNIKQYDVSGNMRYSTDQILTAGNLKVGKNMYNLDLDKTEQAIKKTLIYVEDVTLKRD LPDTLHVIVTEAVEFACCEYEGNRYCVISRGGRYLETEQPYKREELMMVTGLDLKGVAL GEDMDSHDENKLEIIFDLFDAIDKTCPDMITYIDITDRTNIKMGYADRIDIDFGSSLDY EYKLRYITAIIEENLDPEAAGKIIYHSSAAGASFISAADLELQAQQNAAAVTENTAETS TSDPQ" /locus_tag="LOCUS_2050" /note="MGA_246" ORIGIN 1 agcatacaga acatcggcgg aacctttggg ttttcaagct cgcgggatgt taagtgcact 61 ctggcggtgc ctgccgcggc gctgaaaagc accttttggt tgccgtcgtg aagtgtgcgg 121 aaagatatga cgaccgagcc cttggtgggt tggtgtattt tatcaatgcg tgagccaagg 181 agcgtttttt caagctctga ttttacaagg ctcagatata tgccgtcaag tgccaagggt 241 ggttgcctcc tgattagtta gattgcttta attgtgttgg acattgccgc cgagaagaag 301 aacttaacct cggggaattt ctcgcttaat atatcatata gatagggcat tgcgatgact 361 tcggtttcgt aatgtccgca gtcgatgatt gtcttgcctt gaagctccgc ctctaaaaac 421 tggtcgtgct tcacgtctgc ggtgacgagg gcatcgaagc ggttgacatc agcttcatat 481 atcatgcttc cgcctgcacc cgagcagacc gcgactcttg taatacggtc gcaaccgggg 541 gtatacttca cagcgcggga attaaacctt tctttgcaga gtttagccaa atcgtcagcc 601 gagatgcact cgcaggttgc aaacctgcca tagccaacag gcttgccttc atatgagcgg 661 ttgacactta aaatctcgcc tgtgttggtc atacccaaaa gctcgaacat catatcggag 721 atgtcgtact ctgccgagta gagtttggtg tgggcggata tgcaggatat gccctttgag 781 aacatatagg gtgcggggta cttgacatca agctccttta aagggtggaa aattacagga 841 tgatgggtaa taatcagctc gcagccgagg ttatgagcct cgtcgatgac ctttttggtg 901 gcatcgagcg ccagcaagac ctttgtaatc tcttccctgc ccgagtcaat aatcagaccc 961 gagttgtcaa acttatcctg taagccaaag ggcgcaacgg agttgatata ttcataaatg 1021 tcgtgcaaat ttgccatttt ttacacctca ttaattattt ccataagctc gtggaccaaa 1081 tcaagctcac gctcgccgtc ctctcgggtg gcttcgtcgt tggatgaaat cttgcctaaa 1141 gatgacaccg acaaacgctc gcatacagca gatgcatact caagcgattc gggctttgtc 1201 atatcaagcc cgccgataag agcctgcaaa ggtgttagtt tgcgcgtttc gccgcgatat 1261 tcggcattga tgaccgagta gacgaacctg ccgtcacggc aggctttttc cgatttgatt 1321 acaaatccgt tttcatacag cccctcacgc aattcggacg cacgggtcat cggctgaagc 1381 acgaggttta ctcccctttt cagccaatcg gctctgagca aaatgcttaa aatcagctcg 1441 ccgcccattc cgcagatgat aaaatcggtt atgccctcat cgggaataag ttccagcccg 1501 tccgattgga tgacggtgat actatcttca agtcccatac gggaaacggt tgcttttgcg 1561 ctttcaatgg ggcccaaggc gatatcgcaa gcgatgacct tttcggatat gacattgtcg 1621 gcaagatatg ccgcgaggta tgcgtggtcg gtgcccacat cgcaggcgat tccgccgcgt 1681 gtgacaaatt cagcggcggt taaaaggcgg gtgttaagtg aatgggtcat tattataatc 1741 tccgaaaatc agttttcaaa gtatgcattg agctttgcaa caagctcgtc ggcatcggca 1801 ccgtgaattt cgcaagcctg agcgattgtt tcgcctgttg cagaggggca gccaaggcaa 1861 tgcataccga tttcgaggaa aagctctccg caaccggaat cgagtgccaa aacatcgccg 1921 atgatggaat cctttgtgat cttcattttt cattctcctt taaatatata ttgttaagtt 1981 tattatacct cattttttgc atcattgcaa cacccgggaa aataaacgaa aaagcgcaga 2041 cccgaaacga gcctgcgccg aagaaattat taattattcg cctctctgct ttgcgaagca 2101 ttcgctgcaa tatacagggc ggtcatcgtg gggcttgaaa ggaacctttg cttccttacc 2161 gcaagatgca catacagctg tgaaatactg cttgccttct tctttcttct tctttctgca 2221 gtccttgcac atcttgggct cgttttcgaa gcccttttca gcatagaact cctgctcacc 2281 ggctgtgaaa acgaattcgt ttccgcagtt acggcatact aatgttttgt cttcgtacat 2341 aaatttccct cgcttaaaga attttgccaa gaccatgact aatcatggca attatctata 2401 aaaaccgtcg tgcggttttt atcagatcct gtcgcgcagt ttcctgcgca ccctgccaag 2461 tgcgttatcc accgatttct cggagatatc gaggcaagcg gcaatctcct tataggtcat 2521 gcctgaaaga tagcttaaaa atacgtttgc ttcgagtttt gaaagctcat tatcgaccac 2581 atcggcaacg gccgagccaa gctcacgcag ggaaatatct cccgagcggt cagcaaccga 2641 atcgacagcc ttgccatcga aattggtttc aaaattcatt acctttttgg actttttata 2701 tgcgtttatc attcggtttg aagaacaaac tcttgcaaat gtcgcaaagc ttgcatcccc 2761 gttggggtca aagtgcttga cagcattcat aagtcccaaa acgccttccg agcgatagtc 2821 atccgcatcg atatatccct tacgcccgac ggcataagaa ccggcggcat aatgcaaaga 2881 atcaagataa cggtttaaca gcgcgtcaaa ggcatcttta tcagacttag ccaaaactgc 2941 aagctcgtca tctgtataag attcatagcg gcttgttgcc aagatatacc acctcatatt 3001 caatatcacc ttagattata ttatctatcg aaaattttgt caagagttga ttgaattttt 3061 gctcgatttt cgtcatttct cacaaaatgg aaacacatta tttaggaaaa taaaaggcac 3121 agacgctcaa aaaagcatct gtgccgttag ttttatacaa ttacttgtcg ttgttgatga 3181 acttccagat gttgtcatag aaggggtcgc ccttcttggt ttcggagttt tcttcctctg 3241 cgggagcttc ctcctcttcc tcgatgggag cagcatatgt atcaaaatcg gaagcgataa 3301 cgatgatgtc aatagtgtcg gaaagatcgg ggttgaagtc cgcaccgaag atgagttcaa 3361 catcgtcagc agcagccttg gtgatctgtt cggtaaggtc agccatatcg gtggtgccga 3421 tatcttcgga cataacaaca ttaagaagca atcttcttgc acccttgata gaggtttcga 3481 gcaacgggct ggagattacc tgctgaacag catcggcgac cttgtcctta ccctcgccgt 3541 ggccgatagc catatgagca tagccggctt ccttcatgat cgactgaacg tcggcaaagt 3601 cgacgttgat ctcgccgtgg cgcaaaatga gctcggtaac gctcaaaact gcggtcttga 3661 gaatatcatc agccaaagca aaggactggc gcatggtgag gttctctctg ccggtcaaga 3721 gcttctggtt ggggataaca accaaagagt caacattttt caaaagtctg tcgattccgt 3781 tttcagcagc tcttgccttt ctggggcctt caaaggtgaa gggcttggtg acaacagcaa 3841 ctgtgaggat acccatatcc ttagcgatct cagcaacaac gggagcggca cctgttccgg 3901 ttcctccgcc catacctgcg gtgatgaaga tcatatcagc gcccttgaga gcatcctgga 3961 tctcttcctt cgattcctga gcggcgcctt cgccaacctc aggctttccg cctgcaccaa 4021 gaccgtgggt caatttctga ccgatctgga tcttgatggt tgcctttgag ttcttcaaag 4081 cctgcgaatc tgtatttatt gcgatatatt caacattctg aatgcctgtc gaaacaatgc 4141 agttgagggc gtttcctccg ccgcctccga ctccgactac tttgatcttg gcaaggtcca 4201 tgccgtcatt ttccattata aatcccatac ccgtacatcc tccaatattc tatatataat 4261 catagtaaga gcagaataaa tctaaatata gtattatact atcatattta tagcttcttg 4321 gcaataggtt tgcaaaaata tttttgcaca aggatttgac caatttttgt atgatttttc 4381 ttattgcggg tcggaagtgc ttgtttcggc agtgttttct gttacggcgg cggcattctg 4441 ctgagcttgc aattccaaat cggcagccga gatgaaggat gcacctgcgg cagagctatg 4501 atagatgatc tttcctgcgg cttcggggtc gaggttctct tcaattatag cggtgatata 4561 tcgaagctta tactcatagt caagggaaga accgaagtcg atgtcgattc tgtcggcata 4621 tcccatttta atatttgttc ggtcggtaat gtcgatatat gtgatcatat cggggcaggt 4681 cttgtcgatg gcatcaaaga ggtcgaagat gatctcaagc ttattttcat cgtgagaatc 4741 catatcctcg cccaaggcta cgcccttaag gtcaaggcct gttaccatca taagctcctc 4801 gcgcttatac ggctgttcgg tttcaagata tcttccgccg cggcttatca cgcagtagcg 4861 gttgccttca tattcacagc aggcaaattc aaccgcctcg gtgacgataa cgtgcagggt 4921 gtcgggcaaa tcgcgcttta aggtaacatc ctcaacataa ataagggtct ttttaattgc 4981 ctgctcggtc ttgtcaaggt cgaggttata catatttttg ccgactttaa ggttgcctgc 5041 agtcaaaatc tggtcggtgg aatatctcat atttcccgaa acgtcatact gcttgatgtt 5101 gaaaagcacg gtacgtgaga gaatgaacaa aacagccgcc acaaaaagga acatcaaaag 5161 ataataaagc gagagatttc tgcggcggcg acggcgcttc ggcgcgtttt tatttggatt 5221 tgtttttaca acgtccttca aaaatatctt cctttcttat cttctgataa tttttgctcc 5281 caatttggaa agctcgtttt caacc // LOCUS sequence032 5298 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence032 VERSION sequence032 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5298 /mol_type="genomic DNA" /organism="" /note="sequence032" CDS complement(548..1744) /product="glycosyltransferase family 4 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011203512.1" /transl_table=11 /codon_start=1 /translation="MKILQVNNVYAQQSTGKITKEIFDGLLKAGHQPFAAYGRGEDYVG EGIIRICPDWYGKLNSFLSRITGLAHGGCFLSTSRLINLIKKEKPDVVHLQCINGHFVN IYRLISWLKNNRIKTVLSLHAEFMYTANCGYAYECDQWQKSCKCCPDKYRATKSWFFDG TGRSWQKMKKAFEGFEKDCIICPVSPWTEERAKRSDILKDFKFKTVYNGVNTAEVFNRS DRDMCEKNTVLNVTSYFSADKSHIKGGYYIIELAKRMPDVNFIVAGNADEVSDLPKNIT LPGSVNDQKELSKLYCKAGLTLMVSRRETFSMPCAESLCCGTPVVGFKAGAPEQISLDD YSEFVEHGDIDALEKTVRKWLERTDLDRMEISKQATETYSVETMVKTFSDIYEEILWN" /locus_tag="LOCUS_2060" /note="WP_011203512.1 glycosyltransferase family 4 protein (Bacteroides fragilis) [pid:28.8%, q_cov:88.2%, s_cov:87.4%, Eval:2.4e-35]" /note="MGA_248" CDS complement(1762..3042) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKVLIISHNPISTKSNMGKTFLSLFSEFDRSELCQFYIYPSFPDV RRCSSFYRVTDKEIVRSLFSFKQIGGEVESKNINENADFYENPADRALYRNVKNKSALR RIARDTAWKLSRGYEKSLYGWLEKEKPDSIFLSPGPGEFIYDIALDISKKLNIPIVTYI CDEYYFLDTPKGLLDKLRFGKFKKKFEKLMANSACLAVICDELKEIYTQRFGVKAETLM TGASRGISEGAKIVDNPTEIRYFGNIRCNRFNSLCDVGLALDDINSHTGTDYKLKIFTA EKDSEILSIFDGIKSIELCGFVSGEDFEREFGASQLLLHVEAFDDASIDRVKHSVSTKI ADSLASGIPLLAYGPESISSMKHLIRHNCALTATSKEELKLMLETAFSDVERKRICAEN AIETAKKYHDSSKTGLALKDIFEKIHN" /locus_tag="LOCUS_2070" /note="MGA_249" CDS complement(3043..3864) /product="phosphorylcholine transferase LicD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000811992.1" /transl_table=11 /codon_start=1 /translation="MVKLNKDDLKALTLEVLCEIRDICRENGIAYSLTGGTLIGAVRHG GFIPWDDDIDIMMPRPDYDRFIELVRSGGKCFDLYSYESCGDDYWYPFAKACRKNTKIV EKSIVDSNITLGVYVDIFPIDGAGNGFFGAKLRCKLFKILHGLKLTKNWTGYRRSKIRS WYYEPLRFACYLIGKLFSKHFLNKMLDKFLRAKPYDKCAYAGRMSGDYGSREIMKKELF DTKTTVVFEGEEFDAVADYDSFLRSLYGDYTVLPPEHKRVTHHDFEAYWVD" /locus_tag="LOCUS_2080" /note="WP_000811992.1 phosphorylcholine transferase LicD (Streptococcus pneumoniae) [pid:32.5%, q_cov:98.9%, s_cov:98.5%, Eval:4.1e-32]" /note="MGA_250" CDS complement(3904..4794) /product="glycosyltransferase family 2 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000375711.1" /transl_table=11 /codon_start=1 /translation="MSELVSVIIATYRREAELTSALKSLVGQTYKNFEIIVVDDNADAT WNLKVKNAVEEFCGSNPSMRVNYIANGSNQGSARTRNIGIDGASGEYITFLDDDDIYLP SKIERQLRFMKENLLDYCITDLYLYNENDKLVDKRVRSYISDTSPESLLREHLKHHITG TDTLMFKRDYLMKIGKFPLIDMGDEFYLMMQAIDNRGKFGYLEGCDVKAYIHSENGGMS SGMGKITGENELYEFKKKYFNRLKAQDIRYVKARHYAVLAFAYLRSKKYGRFLANGCLA MLVSPINCLKILMAR" /locus_tag="LOCUS_2090" /note="WP_000375711.1 glycosyltransferase family 2 protein (Streptococcus pneumoniae) [pid:28.6%, q_cov:87.2%, s_cov:79.5%, Eval:3.6e-24]" /note="MGA_251" misc_feature complement(4787..>5298) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002902061.1:sugar transferase" /note="WP_002902061.1 sugar transferase (Streptococcus sanguinis) [pid:60.9%, q_cov:94.7%, s_cov:78.1%, Eval:9.4e-52]" /note="MGA_252" /locus_tag="LOCUS_2100" ORIGIN 1 agcttccagc cccacttctc gcgggagaaa agacggtaaa gctcgagcat ataaagacaa 61 acaaggaaca gtcccgtcag gttggggttt gagaatcgga aggtcaaata tgccgaaacg 121 cgattgtcga tcatatgcat ttgggaattc caaatgaaaa atgcaactat cagcaaaatt 181 gtcaaacagt cgacaagtcg gttgataaac acgaccatat cttttttcac tttgatttta 241 tagcaggtct gcaaaatcag catcgacatt gaaaacatga ttactttttt caaataatca 301 aaatcaatat ccgtgtttgt aatgcttgca tttatcaaaa cgcttataaa cgccagcgct 361 atcgctgtga gcgctgcaaa atcaagccct gtcacctttt gacgcacagt tcttatccac 421 agcgcaacgg tcagcggaaa ggtgaacaaa aacagcgtac tggttatctg aatatccaaa 481 acctcacaga caacgatgcc tgcaacaacc agatacagcg ctttgagcag tattctatct 541 aacagtttta attccataga atttcctcgt atatatctga aaaagttttt accattgttt 601 caaccgaata ggtttcggtt gcttgctttg atatctccat tcggtcgaga tcggttcttt 661 cgagccattt tcttacggtt ttttccaaag catcaatatc accgtgctca acaaactcgc 721 tgtaatcatc aagagatatc tgctcgggtg ctcccgcctt gaatcccaca acgggagtgc 781 cgcagcaaag gctttcggcg cagggcattg aaaaggtttc ccttctgctg accataagag 841 tcaagcctgc tttgcaatat agctttgaaa gctctttttg gtcattcacc gagcccggca 901 gggtgatgtt tttcggcagg tcggaaactt cgtccgcatt tcccgcaacg atgaagttga 961 catcgggcat acgttttgca agctcgatta tgtaatatcc gcccttgatg tggcttttgt 1021 ccgcgctgaa ataggatgtc acattcaaaa cggtgttttt ctcgcacata tctctgtcac 1081 tgcggttgaa cacctcggcg gtattgacgc cgttatagac cgttttgaac ttaaaatcct 1141 tgagaatgtc cgaacgtttt gcgcgctctt ccgtccaggg agatacaggg cagatgatgc 1201 aatccttttc aaagccctca aaggcttttt tcatcttttg ccaagacctt cccgtgccgt 1261 caaagaacca gcttttggtg gctcggtatt tatcggggca acacttacag ctcttttgcc 1321 attggtcgca ttcgtatgca tatccgcagt tggcggtata cataaactca gcgtgaagcg 1381 acaaaacggt tttaatgcgg ttgtttttta gccatgaaat cagtcgatag atgttcacaa 1441 agtgtccgtt gatgcactgc agatgcacga catcgggctt ctcttttttt atgaggttta 1501 tgagccttga tgtggataaa aagcatccgc cgtgggcaag acctgtaatg cgggacagga 1561 agctgttgag cttgccgtac caatcggggc aaatgcggat tattccctcg ccgacgtaat 1621 cttcgccgcg tccgtatgcc gcaaaaggct ggtggcccgc ctttaaaagc ccgtcaaaga 1681 tctctttggt gatctttccg gtgctttgct gagcatatac attgttgacc tgcagtatct 1741 tcataaaccg acttctttca cttagttatg tatcttctca aatatatctt taagcgcaag 1801 accggtcttg ctgctgtcgt gatatttttt tgccgtttca atggcattct cagcgcagat 1861 tcgctttctc tcaacatcgg aaaatgccgt ttcaagcatt aatttaagct cttctttcga 1921 tgtcgcggtc aatgcacagt tgtggcggat aaggtgcttc atcgaagaaa tgctttcggg 1981 gccgtatgcc aaaagcggaa ttccgcttgc aaggctgtcg gcgatcttgg ttgaaaccga 2041 gtgcttgacg cggtcgatgc tggcatcgtc aaaggcttca acgtgaagca aaagctgtga 2101 cgcgccaaac tctctttcaa agtcctcacc gctgacaaat ccgcagagct cgattgattt 2161 tataccgtcg aaaatgctca agatctcgct atccttctcg gcggtaaata tcttcagctt 2221 ataatcggtt cccgtatggg agttgatatc atcaagcgcc agaccgacat cgcaaagaga 2281 gttaaatctg ttgcatctga tgttgccgaa atatcttatc tcggtggggt tgtcgacaat 2341 tttcgcgcct tcggaaattc ccctgctcgc gcccgtcata agcgtttcgg ctttaactcc 2401 gaagcgctgg gtatatatct cctttagctc gtcgcagatt accgcaaggc aagctgaatt 2461 tgccataagc ttttcaaact tctttttaaa ctttccaaat cggagcttat cgagcaagcc 2521 tttgggggtg tcaaggaaat aatattcatc gcaaatatat gtaacaatcg gaatattcag 2581 ctttttcgaa atatccaaag ctatatcata gataaattcg ccgggaccgg gagagaggaa 2641 aatgctgtcc ggtttttcct tttcaagcca gccgtaaagg gatttttcat atcctcgtga 2701 gagcttccag gcagtgtcgc gggcgattct tcgcagtgcc gacttgtttt tgacatttcg 2761 atataatgct ctgtccgcgg gattttcata gaaatcagca ttttcgttga tatttttgct 2821 ttcaacctct ccgccgatct gcttaaagct gaacagcgat ctgacgatct ccttgtcggt 2881 cacgcgataa aaggacgagc atctgcggac atcgggaaac gatggataaa tataaaactg 2941 gcaaagctcc gaacggtcaa attccgagaa gagggacaaa aaggtcttgc ccatattgct 3001 ctttgtcgat atcggattgt ggcttattat aagtaccttc atttaatcca cccaatatgc 3061 ttcaaaatcg tgatgtgtca cccgcttgtg ttcggggggc aaaacggtgt aatcaccgta 3121 tagtgagcgc aaaaagctgt cataatcggc gacggcatca aactcctcac cctcgaaaac 3181 aacggtcgtt tttgtgtcga acaactcttt tttcattatc tcgcgggagc cgtaatcgcc 3241 cgacatacgc cctgcatagg cacacttgtc atatggcttt gcgcgaagga atttatcaag 3301 cattttgttc aaaaaatgct tgctgaaaag cttgccgata agatagcaag caaagcgcaa 3361 aggctcataa taccagcttc ggatcttgga tcttctatag cctgtccagt ttttggtgag 3421 cttcagaccg tgaagtattt tgaaaagctt gcagcgaagc ttcgcaccga aaaagccgtt 3481 gcccgcgccg tcaatcggga aaatgtcaac atatacaccc aaagtgatat tgctgtcaac 3541 aattgatttt tcaacaattt ttgtgttttt gcggcaggct ttcgcaaagg gataccagta 3601 gtcatccccg caggattcat aggaatataa gtcgaagcat tttccgcccg atctgaccag 3661 ctcgatgaag cggtcatagt cgggacgcgg catcataatg tcaatgtcgt catcccaagg 3721 gataaagccc ccgtgacgca cggcaccgat aagtgtcccg cctgtcaggc tgtatgctat 3781 gccgttctca cggcagatgt cgcgaatctc gcaaagcacc tcgagggtga gagctttgag 3841 gtcatcttta ttcagtttaa ccatatggat ccaccctccc cgcttgcagt gttgatatat 3901 ggcttaccgc gccataagta ttttcagaca gtttatcgga gaaaccagca tcgcaaggca 3961 tccgttggct aaaaaccgtc cgtatttttt cgagcgcaga tatgcaaacg ccaaaacggc 4021 ataatgcctt gctttgacat atcttatgtc ctgcgccttg agcctgttga aatacttttt 4081 cttgaattcg tacagctcat tttcgccggt tattttgccc attccgctgg acatgccgcc 4141 gttttcgctg tgaatatatg ctttgacatc acagccttcg agatatccga atttgcctct 4201 gttatcaatt gcctgcatca tcagataaaa ctcatcgccc atatcgataa gcgggaattt 4261 tccgatcttc atcaaataat cgcgtttgaa cattaacgtg tcagtgcctg taatgtggtg 4321 ctttaaatgc tctctgagca acgattcggg tgaagtgtcc gaaatgtagc ttctgactct 4381 tttgtcaacc aatttatcat tttcgttata aagataaagg tcggtgatgc aataatcgag 4441 caggttttct ttcataaacc taagctggcg ttcgattttt gacggcaaat aaatatcgtc 4501 atcgtcaaga aacgttatat attcaccgct cgccccatca attccgatgt ttctggttct 4561 tgcggagcct tggtttgagc cgtttgcaat ataattcaca cgcatcgaag gattgctccc 4621 gcaaaactcc tcaacagcat ttttaacctt caaattccaa gttgcatccg cattgtcatc 4681 cacaacaata atctcgaaat tcttatacgt ctgcccgact aacgatttca gagcggaagt 4741 caattcagct tctcttcggt atgtggcaat tattacgctt accagttcac tcattattgc 4801 ttacctcttg cttggcttcc tcattctgca tactccccgt tctgccttca acaacgccgt 4861 ccgatttcaa aacggacatt acggttccga taatgcattt tgcgtccatt gcaaagcctt 4921 ttcccgaatt caaggcttcg gtatattcgc cgtcgagctt tgcttttacg gggatttcaa 4981 gctcatctct gccgtttatc tgcgcccagc ctgtaagacc cggacggatg tcgtttgcgc 5041 cgtatttatc ccgctcggca atcaggtcat actgattcca aagggcgggg cgggggccgc 5101 aaatgctcat ctgtcccacg aaaatgttga aaagctgggg caattcgtca accgacgagc 5161 ggcgaatgaa cttctgccat ttgctcaaca tatctgccgc gttgaactga tgtgtcggaa 5221 catccttggg gacggttgtg ggcatacttc tgaacttcaa aattttaaag gtctttttat 5281 gtaatccgat cctttcct // LOCUS sequence033 5226 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence033 VERSION sequence033 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5226 /mol_type="genomic DNA" /organism="" /note="sequence033" CDS 132..872 /product="PHP domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012869446.1" /transl_table=11 /codon_start=1 /translation="MNRYYYDLHIHSCLSPCAEDDMTPANIAGMGALCGLNIMALTDHN TTGNLEAFFAACKKHGIVPVGGMELTTAEEIHIICLFETLENALAFGDEVKKHLMPIKN RPDIFGNQLYMDDEDNILGEEPTLLLTASDLDLDSAVKLARSFGGAVYPAHVDRDSNGI IAILGDIPPDEGFTACEFNDSKNAETYPERYPIINGLSVLSCSDAHRLWEISEAENFLD LDDEPYSSAKVRQELIKFLKGKAD" /locus_tag="LOCUS_2110" /note="WP_012869446.1 PHP domain-containing protein (Thermanaerovibrio acidaminovorans) [pid:38.2%, q_cov:85.0%, s_cov:80.7%, Eval:4.2e-30]" /note="MGA_254" CDS 875..1435 /product="ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012869297.1" /transl_table=11 /codon_start=1 /translation="MKELSLNILDITQNSVTAKADEIEISLAEDDKGILTLKIIDNGCG MKPETVKSVRDPFCTSRKTRKVGLGIPFLKLAANQAGGDIEIISTHIDDDPVNHGTTVS ATFDTHHIDFTPVGDMVETMITLISGNPDIDFRFSDVSPKRQVYLDTRELKAVLGEDIC LGEFEVLEWIKGYLNEQYSCIEQ" /locus_tag="LOCUS_2120" /note="WP_012869297.1 ATP-binding protein (Thermanaerovibrio acidaminovorans) [pid:37.1%, q_cov:93.5%, s_cov:91.4%, Eval:7.0e-25]" /note="MGA_255" CDS 1504..1875 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004082448.1" /transl_table=11 /codon_start=1 /translation="MKSLAELAAIREKMKNKVSIRENSDNTTRIVVGMATCGIAAGARP VLAAFVEGVNEAGLSETVTVTQTGCIGVCQYEPVVEIYEAGKEKVTYVKMTAEKAKEVV EKHIKNGQVIDAYTIGANV" /locus_tag="LOCUS_2130" /note="WP_004082448.1 hypothetical protein (Thermotoga) [pid:41.7%, q_cov:93.5%, s_cov:90.5%, Eval:6.5e-21]" /note="MGA_256" CDS 1896..3716 /product="NADH-quinone oxidoreductase subunit NuoF" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_066666688.1" /transl_table=11 /codon_start=1 /translation="MIRSHVLICGGTGCTSSKSAEIAVSLQEEIVRQGLAEEVQVVKTG CFGLCALGPIMIVYPEGTFYHGVTLDDVNEIVSEHLLKGRPVSRLVYHETAEDTEKVAT SLSDTAFYSNQHRIALRNCGVINPENIEEYIANDGYMALGKVLTEMTPEEVIDTVLASG LRGRGGAGFPTGQKWKLARTIVPNADQKYVCCNADEGDPGAFMDRSILEGDPHALIEAM AIAGYAIGANQGYVYVRAEYPIAVSRLQIAIDQAHEYGLLGENIFGTGFNFDIGIRLGA GAFVCGEETALMTSIEGNRGEPRPRPPFPAEKGLFQKPTVLNNVETYANIPQIINNGAE WFTQMGTEKSKGTKVFALGGKIKNTGLVEVPMGTPLRTIIEDIGGGIPNGKKFKAAQTG GPSGGCIPAEHLDIPIDYDNLLAIGSMMGSGGLIVMDEDNCMVDIAKFFLEFTADESCG KCTPCRVGTKRLLELLTKITDGKGTLEDLDKMEQLCYYIKANSLCGLGQSAPNPVLSTL RYFKDEYLAHIVDKTCPAGVCKNLLKYEIDKNKCIGCGLCARQCPAGAISKTDYIAPGK KLPALAIDPEKCVKCGACVGACKFKAISKK" /locus_tag="LOCUS_2140" /gene="nuoF" /note="WP_066666688.1 NADH-quinone oxidoreductase subunit NuoF (Desulfotomaculum copahuensis) [pid:64.0%, q_cov:99.5%, s_cov:99.2%, Eval:2.4e-229]" /note="MGA_257" ORIGIN 1 gtttcacccg acgaaggcgt tcttgaaaag gcccgtgaat gcgaaattaa cattctttca 61 accgatatga ccgcttttga agcggcaggc aagctttatt caatgatctg attttttcgg 121 aaggaggcaa aatgaacaga tattattacg atctgcatat tcattcctgc ctttctccct 181 gtgccgagga tgatatgacc cctgcgaaca tcgcaggtat gggcgccctt tgcgggctta 241 atatcatggc gctgacagat cacaacacca cgggaaatct cgaagctttt tttgcggcat 301 gcaaaaagca cggaatcgtt cccgtcggcg gaatggagct gacaactgcc gaggaaatac 361 atataatctg cctgtttgaa actcttgaaa acgccctcgc ctttggcgat gaggttaaaa 421 agcatcttat gcccattaaa aaccggccgg acatattcgg caatcagctg tatatggacg 481 atgaggacaa cattttgggc gaagagccaa cccttttgct gacggcaagc gatctggatc 541 ttgacagtgc cgtaaagctg gcgcgcagct tcggcggtgc tgtatatccc gcccacgtgg 601 atagagattc aaacggaata atcgcaattt taggagatat tccccccgac gagggattta 661 ccgcctgcga gtttaacgac tctaaaaacg cggaaacata ccccgagcgg tacccgataa 721 tcaatgggct gtcggtgctt tcctgcagcg atgctcacag gctttgggag ataagcgaag 781 cggaaaattt cctcgacctt gacgacgagc cttacagctc tgccaaggta aggcaggagc 841 tgatcaaatt cctcaaagga aaggcggatt aaaagtgaaa gagctttcct taaacatttt 901 agacatcacc caaaactcgg ttacggcaaa agccgacgag attgaaataa gccttgctga 961 ggacgataag ggcattttga ccttaaagat aatcgacaat ggctgcggaa tgaagccgga 1021 aacagtaaaa tcagtccgcg acccgttctg cacatcccgt aagacccgaa aagtcggact 1081 cggaatcccc tttttaaagc ttgcggcaaa ccaggcgggc ggagatattg aaattatctc 1141 cacacatatt gacgatgatc ccgtcaacca cggcaccacc gtcagtgcaa cctttgacac 1201 tcaccacatt gacttcactc ccgtgggaga tatggttgaa acaatgataa cgcttatcag 1261 cggaaatccc gacattgatt ttcggttttc ggatgtttcg ccgaagcggc aagtatatct 1321 tgatacccgc gagcttaaag ctgttttggg tgaggatata tgcctcggag aattcgaggt 1381 gctcgagtgg ataaaaggat atcttaacga acaatattca tgtattgaac agtaactcac 1441 tgtttatgga tatataattg attcgctaaa aaataaaatt acaaatttgg aggtgcattc 1501 tcaatgaaaa gcttagctga actcgctgct atcagagaga aaatgaagaa caaggtttcc 1561 atccgtgaaa attctgacaa caccacaaga atcgttgtcg gtatggcaac ctgcggtatc 1621 gctgcaggcg ctcgccctgt tttggctgca ttcgttgaag gcgttaacga agcaggactt 1681 tcggaaaccg taaccgttac ccagaccggc tgcatcggcg tatgccagta tgagcctgtt 1741 gttgaaattt atgaagcagg caaggaaaag gtaacatatg ttaagatgac cgctgaaaag 1801 gcaaaggaag ttgttgaaaa gcacatcaag aacggccagg tcattgacgc ttacacaatc 1861 ggtgcaaacg tataataaat aaggaggaat aacaaatgat acgctcacat gttcttatat 1921 gcggcggtac cggctgtacc tcctctaaga gtgctgaaat tgcggtttct ttgcaggaag 1981 agatcgtaag acagggactc gctgaagaag tacaggttgt caagaccggt tgcttcggtc 2041 tttgtgcatt aggtccgatc atgatcgtat atcccgaggg aaccttctat cacggtgtta 2101 cccttgatga tgtcaacgag atcgtttccg agcatttgct caagggccgt cccgtttcaa 2161 gacttgttta ccacgaaacc gctgaggata ccgaaaaggt tgcaacatcc cttagcgaca 2221 ccgctttcta ttctaatcag cacagaatcg ctctcagaaa ctgcggtgta atcaaccctg 2281 aaaacatcga agaatatatc gctaatgacg gttacatggc tttgggtaag gttttgaccg 2341 aaatgactcc cgaagaagta attgacaccg ttttggcttc cggtcttcgc ggacgcggcg 2401 gcgcaggctt ccccaccgga cagaagtgga agctcgctcg caccatcgtt cccaatgccg 2461 accagaagta tgtatgctgc aacgccgacg aaggtgaccc gggtgcattt atggaccgtt 2521 ccatcctcga aggcgacccc cacgctctca ttgaagctat ggctatcgca ggttacgcta 2581 tcggcgcaaa ccagggctat gtatatgtaa gagctgaata ccccatcgct gtaagcagac 2641 tccagatcgc tatcgaccag gctcatgaat acggcctctt gggcgaaaac atcttcggaa 2701 ccggtttcaa cttcgacatc ggaatcagac tcggtgcagg tgcattcgtt tgcggtgaag 2761 aaaccgctct tatgacctcc atcgaaggca acagaggcga gcctcgtccc cgtcctccgt 2821 tccctgctga aaagggtctc ttccagaagc ctaccgtact taacaacgta gaaacctacg 2881 ctaacattcc ccagatcatc aacaacggtg ctgaatggtt cacccagatg ggtactgaaa 2941 agtccaaggg taccaaggta ttcgcactgg gcggcaagat caagaacacc ggtctcgttg 3001 aagttcccat gggtactccc cttcgcacca tcatcgaaga tatcggcggc ggtatcccca 3061 acggcaagaa gttcaaggct gcacagacag gtggaccttc cggcggatgc atccctgctg 3121 agcatctcga catcccgatc gactatgata accttctcgc tatcggctct atgatgggct 3181 ccggcggttt gatcgttatg gacgaagaca actgtatggt tgacatcgct aagttcttcc 3241 tcgaatttac tgctgatgaa tcctgcggta agtgcacacc ctgccgtgtc ggtacaaaga 3301 gacttcttga gctcttgacc aagatcactg acggcaaggg cactcttgaa gacctcgaca 3361 agatggaaca gctttgctac tatatcaagg ctaactccct ctgcggtttg ggtcagtctg 3421 ctcctaaccc cgttctttca accttgcgtt acttcaagga cgaatatctt gctcatatcg 3481 ttgacaagac ctgtcctgca ggcgtatgta agaaccttct caagtatgag atcgataaga 3541 acaagtgcat cggctgcggt ttgtgcgcaa gacagtgtcc tgcaggcgca atcagcaaga 3601 ccgactacat tgctcccggc aagaagcttc ccgctttggc tatcgaccct gaaaagtgcg 3661 tcaagtgcgg tgcttgcgta ggtgcatgta agttcaaggc aatttccaag aagtaattaa 3721 aggaggttta agactatgga tatgcttaac attaaggtaa acggtttacc tatcgaagcg 3781 cccaagggct ctaccgtcct cgaagcttca agaattgccg gcgtcgagat ccccactctt 3841 tgcttcctca aggacattaa cgagatcggc gcatgccgta tctgcgttgc agaggttgct 3901 gaaatgagag gtcccgcttt gggtcccaag agaatcgtcg cttcatgtgt ataccccatc 3961 accaacggta tggaaattta caccaacacc cccaaggtta tcgaatcaag aaagcagacc 4021 ttggagctca ttctttccac ccatgacaga aagtgcctta gctgcgtaag aagcggcaac 4081 tgtgagcttc agaagctctg ccgtgacctc ggcgttgagg acgaaggcaa gtatgacggc 4141 gacaagcctc attacgatat tgactactct gccgctcata tgatcagaga taacaacaag 4201 tgcattttgt gccgtcgttg caccgcagtc tgcgaaaaga cccagggtat cggcgttatc 4261 ggcgcaaacg aaagaggctt caactctcac atctcttctg catttgaact cggcttgggc 4321 gacaccagct gtgtatcctg cggtcagtgt atcgcagttt gccccaccgg tgctttggct 4381 gaaaaggaca acaccactga tgtatttgct gcacttgcag atcccaccaa gcacgttgtt 4441 gttcagaccg ctcctgctgt aagagctgct ttgggcgaaa tgttcggcct tgagatcggt 4501 accgacgttg agggcaagat gattgctgct ctcagacgtt tgggcttcga caaggtattt 4561 gataccaact tcaccgctga cctcaccatt atggaagagg ctcacgaatt cctcgacaga 4621 gttaagaacg gcggcacctt gccccttatc acctcttgct ctcccggatg ggtcaagtat 4681 tgcgagcact acttccccga gctcaccgaa aacctctcca gctgtaagtc tcctcagcag 4741 atgttcggtg ctttgaccaa gacctactat gctgaaaaga tgggcattga tcctaaggac 4801 atcgtttccg tatctatcat gccttgtacc gctaagaagt tcgagcttgg cagagatgat 4861 gagtctgcag caggcgttcc cgatgttgac tttgctctta ccacccgcga gctcggttat 4921 atgatcgacc gcgcaggtat caagttcaac tcgttgcccg atgaagaata cgatgagcct 4981 atgggaatcc ataccggcgc aggcgttatc ttcggcgcaa ccggcggtgt aatggaagca 5041 gcactcagaa ctgctgttga aacactcacc ggtgaagaat tgcccaatgt tgactttgtt 5101 gacgttcgcg gcaccgcagg catcaaggaa aaggcttacg aagttgcagg tatgaccgtt 5161 aaggttgcag ttgcttccgg tcttgcaaat gctaaggagc ttttgaacaa ggttaagtcg 5221 ggtgaa // LOCUS sequence034 5216 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence034 VERSION sequence034 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5216 /mol_type="genomic DNA" /organism="" /note="sequence034" CDS complement(775..1554) /product="sugar phosphate isomerase/epimerase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003723840.1" /transl_table=11 /codon_start=1 /translation="MRFGICAGSTDKETLGYIKSLGYDYIEGNFGNVQGMDESALREYI SVTRDLDIAVESYCIFLKGDFRVVGPNTNHGDICEYAKIGFEKAARLGGKTVVFGSGGA RRYPEGFPRDKARDQFAECLRMCGDIASQYDISIVIEPLNNTETNLVNTVAEGVDICKY TAHKSVWLLADFYHIFRSGETLDALENNGGLLRHVHLARANNDRGQPTEADKETCLVWA DALKKCGYDGRMSLESAHIPDFKTAAKDAIKAFEWFK" /locus_tag="LOCUS_2150" /note="WP_003723840.1 sugar phosphate isomerase/epimerase (Listeria monocytogenes) [pid:27.7%, q_cov:87.3%, s_cov:85.2%, Eval:1.9e-07]" /note="MGA_260" CDS complement(1570..3858) /product="glycoside hydrolase family 95 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_076055503.1" /transl_table=11 /codon_start=1 /translation="MIDRKIWTTHPASTSDDPHSGFFGDGWNNATPMGNGSLGAMVYGD PIHDTIQLNEETIWGGDDKLERMNPKAKGSWRKVRELLSEGRIKEAEELTKSDLFSIRA DPRWYDTAGFVWFDYKHTDYSAYRRMLELDSAVCYVNYRADGHSYEREYLVSAPDKVIA IHHNCPDGRFINLCADFTKRDGNYESIELCENGILIYAKEPENGCRYCILAATDSDGCV IYNEKGFDVYDASYLTVYITIRSTYHADDITEWCNRVIENVLESNYQSVKHRHIQDYRY WFTRCYLEIDGENRSHIPTDERIVQSGKEQDNSLIGLYFDFARYLLISCSRPGTLPANL QGIWNKDRYPAWGSKYTININAQMNYWPAEVMGLSELHMPLIEHLKTMLPRGQKMAKEM YGLDGFVAHHNTDIFGDCAPVDYWMPATIWPMGAAWICTHIKTHYDYTGDKAFLKEYLP ILKESCLFFTQYLFEHNGKLITGPSVSPENMYIHTSGESGCMCNGPAMDSQILNDLFSD TVYIAKLLGEEDELTDKVSEMLEKLPKPSIGKHGNIMEWIEDYDETEIGHRHISHLFGL YPSAQFTYEATPELMTAARATLERRLAHGGGHTGWSRAWIINMWARLRDGEKAGENVNA LLCRSTYPNMFDKHPPFQIDGNFGGGAGIAEMLLQSQNGIIVLLPALPKAWPSGRFTGF KARGGVSVDLEWSDGMVQKAVLHNEQSRAFSVQVPEGCVLKYGNKTLSGVGTVAFAEGE SGDIVIERE" /locus_tag="LOCUS_2160" /note="WP_076055503.1 glycoside hydrolase family 95 protein (Xanthomonas campestris) [pid:38.0%, q_cov:93.8%, s_cov:90.6%, Eval:4.4e-135]" /note="MGA_261" CDS complement(3976..5082) /product="aldo/keto reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009891610.1" /transl_table=11 /codon_start=1 /translation="MKKLGFGLMRLPLADPKDHSNIDIEKVKEMVDVFMSKGFTHFDTA YVYHGGKSEVAFREAVVKRYPRESFTVTDKLPLFNRPDRAGMEKIFAEMLERCGVEYFD YVWLHAMNKDLYKHAQEVDAFGYLSELKAQGKIVNIGFSFHDSPETLDLMLTEHPEVDA IQLQINYVDWEGNWVQAKRCYEIACKHNVPVIVMEPIKGGSLAQLPKKAEKLFKDYNPD ASAASWAIRYAASLDNVVNVLSGMSNMDHMNDNVSYMEDFKPLTEEEYKVIDEVSKIVK FAIPCTACRYCTDGCPMKIDIPEIFKVYNDFKKGGKERWEGIKRYKEEITVNGGKASDC IGCGQCTEHCPQNLDIPKLLSDVTLDLD" /locus_tag="LOCUS_2170" /note="WP_009891610.1 aldo/keto reductase (Clostridioides difficile) [pid:55.2%, q_cov:98.4%, s_cov:97.6%, Eval:1.3e-117]" /note="MGA_262" ORIGIN 1 atatcaagtc cttgcgcttg gcatagaaat tgcggtcgat gagaaaatat tcctgctcgg 61 gtccgcaggt ggcggtaacc gtctttgcct cggtgccgaa aagtgtgagg atgcgcttga 121 ccgagcgatt gagcgcctcc attgatcgga gcaagggagt ttttgtgtca agtgcctcgc 181 cgctgtatga gcaaaaagcg gtgggaatgt aaagtgtgtc attcttgatg aaagcatatg 241 aagtggggtc ccatgcggta tagcctctgg cttcaaaggt cgctctgagt cctcccgagg 301 ggaaacttga agcatccgat tcgcctttaa taagctcctt gcccttgaat tcaagaatcg 361 gtgcaccgcc cacagagcca caaaggaagc tgtcatgctt ttcggcggtg atgcctgtta 421 atggctggaa ccaatgggta taatgtgtcg cacccttttc ggtcgcccat tcacgcatag 481 ctttagccac ggcatttgcg atgttaatat ccaacggctt gcccgaagca atagtctgct 541 tgagggcaga ataagtttcc tcggggagca ttttttgcat cacgctgtcg ttaaatacct 601 cgctgccgaa aacctgtgaa attacatttg gcatggataa ccctccgtaa cgtcaaatag 661 atatgttaag tatattatac tttatgtgcg ttgtcaaacg gaatatctcc caaaaaaata 721 atgccgcaaa aaggattatt tgtcctaatt tgcggcattg ttgtttaatt tatatcattt 781 gaaccattca aacgccttga tggcatcctt ggctgcggtt ttgaaatcgg ggatgtgcgc 841 cgattcaagg ctcattcttc cgtcatatcc gcattttttc aaagcatctg cccaaacaag 901 gcaggtttcc ttatccgcct cggtgggctg accgcggtcg ttgttggcgc gtgcaagatg 961 aacgtgcctg agcaatccgc cgttattttc aagcgcatca agggtctcgc cgcttcggaa 1021 gatatgataa aaatcggcaa gcagccaaac gctcttgtgc gccgtatatt tgcagatatc 1081 aacaccctcg gcaaccgtgt tgacaagatt cgtttccgtg ttattaagtg gttcgatgac 1141 tattgatata tcatattgcg aagcaatgtc gccgcacata cgcaagcact cggcaaactg 1201 gtcgcgggct ttgtcgcgcg ggaacccttc gggatatctt cttgcgccgc cgcttccgaa 1261 aacaacggtc tttccgccga ggcgcgccgc cttttcaaag ccgatttttg catattcgca 1321 aatatctccg tggttggtgt tcgggccgac aacgcggaaa tcgcctttta agaagatgca 1381 gtatgattcc acagcgatgt caagatcgcg ggtaacgctg atatactcac ggagcgcaga 1441 ctcatccatc ccttgaacat tgccgaaatt cccctcaatg taatcatatc cgagggattt 1501 gatatatccc aatgtttcct tgtcggtcga acctgcacat attccgaatc tcatatgaat 1561 acctctcttt tattctcttt caatcacgat atcgccgctt tcgccctcgg caaatgcaac 1621 tgtgccaacg cccgaaagtg tcttattgcc atatttaagc acacatcctt cggggacctg 1681 aacgctgaag gctcttgact gctcgttatg caaaactgcc ttttgcacca tgccgtcaga 1741 ccattcgagg tcgacgctta caccgcctct tgccttaaag cctgtaaatc tgcccgaagg 1801 ccaagctttt ggaagcgcgg gaagcaaaac aataattccg ttttggctct gcaaaagcat 1861 ttccgcaatg cctgcgccgc cgccgaagtt tccgtcgatc tggaaaggcg ggtgtttgtc 1921 aaacatattg ggatatgttg agcggcaaag aagtgcattg acattttcgc ctgccttttc 1981 gccgtcgcgc aagcgtgccc acatattgat tatccatgca cgggaccagc cggtgtgtcc 2041 gccgccgtga gcaagtcggc gctcaagggt ggctcttgct gcggtcataa gctcgggtgt 2101 cgcttcataa gtaaactgtg cggaaggata taaaccgaac agatgcgaaa tgtggcggtg 2161 gccaatttcc gtttcatcgt aatcctctat ccactccata atattgccgt gcttgccgat 2221 agacggcttt ggaagctttt caagcatctc gctcacctta tcggtcagct catcctcttc 2281 gcccaaaagc tttgcaatat ataccgtatc gctgaacagg tcattgagta tctgcgaatc 2341 cattgcaggg ccgttgcaca tacatcccga ttcaccagac gtgtgaatat acatattttc 2401 aggcgaaacg gaaggtcccg taatcagctt gccgttatgc tcaaaaagat actgggtgaa 2461 gaagaggcag gattccttca aaatgggaag atattctttc aaaaacgcct tatcgcctgt 2521 gtagtcatag tgggtcttga tatgtgtgca gatccaagca gcgcccatag gccagatcgt 2581 tgcaggcatc caatagtcaa caggagcaca atcgccgaag atatcggtgt tgtggtgtgc 2641 aacgaatccg tcaagaccat acatttcttt tgccattttc tgtcctctgg ggagcatcgt 2701 tttcaaatgc tcgatcaaag gcatatgaag ttcggaaagg cccataacct ctgcgggcca 2761 atagttcatt tgagcattaa tattgatcgt atacttgctt ccccacgcgg gatagcgatc 2821 cttattccag atgccctgca ggtttgcggg caatgttccg ggacgcgagc aggaaataag 2881 caagtatctt gcaaagtcga agtatagacc aatgaggctg ttgtcctgct ccttgcccga 2941 ttgaacgatt cgctcgtcgg tgggaatgtg gcttctgttt tcgccgtcaa tttcaagata 3001 gcatcttgtg aaccaatatc tgtaatcctg aatgtggcgg tgcttgaccg actgatagtt 3061 ggattcgagc acgttttcaa tgacgcggtt gcaccactcg gtgatgtcat cagcgtgata 3121 ggttgagcga atggtgatgt aaacggtcaa atagcttgca tcgtaaacat cgaagccctt 3181 ttcgttatat ataacacagc cgtccgaatc ggttgcggcg agaatgcaat atctgcaacc 3241 gttttcaggc tccttagcat atatcagaat gccgttttcg caaagctcaa tagattcgta 3301 attgccgtcg cgcttggtga aatcagcgca gaggttgatg aatctgccgt cggggcagtt 3361 gtggtgaatt gcaattacct tgtcgggcgc gctgacaagg tattcgcgct cgtagctgtg 3421 tccgtcggcg cggtagttaa catagcagac tgcgctgtcc agctcaagca tacgtctgta 3481 ggctgaatag tcggtatgct tataatcaaa ccagacaaat cctgcggtat cataccagcg 3541 ggggtcggca cggattgaaa acagatcgct ctttgtgagt tcctccgcct ctttaattct 3601 tccttcggat aaaagctcgc gaaccttccg ccaagagccc tttgccttgg ggttcattcg 3661 ttcaagcttg tcgtcgccgc cccaaatagt ctcctcgtta agctgaattg tatcgtgaat 3721 cgggtcaccg tataccattg caccaagcga gccgttgccc attggtgtgg cattattcca 3781 accgtcaccg aaaaagcccg aatggggatc atcggatgtt gaagcgggat gtgttgtcca 3841 aatcttgcga tctatcataa gtacctccga atttgataat ttcatcaagt tgattatata 3901 aattttccga gaaagattca acccaaaaag aaaaaagcgg cgccaaaaat gtgcgccgct 3961 ttttgtgcaa tataattaat ccaaatcgag ggtaacatcg ctcagaagct tgggaatgtc 4021 aagattctga gggcaatgct cggtacactg accgcatccg atacaatcag atgccttgcc 4081 gccgtttacg gtgatctctt ctttatatct cttgatgcct tcccagcgtt ccttgccgcc 4141 cttcttgaaa tcgttatata ccttgaagat ctcgggaatg tcgatcttca tcgggcaacc 4201 gtcggtgcag taacggcagg cggtacaggg aattgcaaac ttgacaattt tgctgacctc 4261 gtcaatgacc ttatattctt cttcggtgag gggcttaaag tcttccatat aggatacatt 4321 gtcgttcata tggtccatat tggacatacc gctcaaaaca ttgacaacat tgtcaaggct 4381 tgcggcataa cgaattgccc aggaagctgc ggatgcatcg gggttataat ccttaaagag 4441 cttttctgcc tttttgggaa gctgagccaa gcttccgccc ttgatgggtt ccataactat 4501 aacgggaaca ttgtgtttgc aggcgatctc ataacatctc tttgcctgga cccagttgcc 4561 ttcccagtca acatagttga tctgaagctg aatagcatcc acctcgggat gctcggtgag 4621 catcaggtca agggtttcgg ggctgtcgtg gaagctgaaa ccgatgttta caattttgcc 4681 ctgggcttta agctcgctca aatagccgaa agcatcaact tcctgcgcgt gcttatatag 4741 atctttgttc atagcgtgga gccagacgta atcgaaatat tcaacgccgc aacgttcaag 4801 catttcggcg aaaattttct ccattcccgc tctgtcggga cggttgaaca aaggaagctt 4861 gtcggtaacg gtgaagcttt ctctggggta tctttttacg accgcttctc tgaatgcaac 4921 ttcgctcttt ccgccgtgat aaacataggc agtatcaaag tgggtgaaac cctttgacat 4981 aaagacatcg accatctctt taaccttttc aatgtcgata ttcgaatgat ccttagggtc 5041 tgcaagaggc aatctcatca gaccgaagcc gagtttcttc atagtagtcc tccaagtagt 5101 ttcaaatatt attgtaattt aattatataa taagtatttg aaatgtcaag gcggttgagg 5161 ggctgtaaaa gtaaccaaaa attgcactta ttctttgtaa atttcggcag gctgtg // LOCUS sequence035 5208 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence035 VERSION sequence035 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5208 /mol_type="genomic DNA" /organism="" /note="sequence035" misc_feature <1..2915 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011816923.1:glucoamylase family protein" /note="WP_011816923.1 glucoamylase family protein (Yersinia enterocolitica) [pid:25.0%, q_cov:39.6%, s_cov:14.6%, Eval:4.9e-25, partial hit]" /note="MGA_263" /locus_tag="LOCUS_2180" CDS complement(3059..4417) /product="D-alanyl-D-alanine carboxypeptidase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004454794.1" /transl_table=11 /codon_start=1 /translation="MRKLTFIITLIFAIVTLTANVGAVSFNPDFEVYSEAALLINLDTG EVIYEKNADKQLVPASLTKIMTAVLLIEKYEDNIAELSTTYVSGGAACFDELYMTGCSN ADIRLGEKVSYKDLLYALMLRSACEAANIIAYNVAGSLEAFAEMMNIKAEELGCEDTHF TNSHGLFWENHYTTARDMAKIVEYALSLPLFEEISCSNEYTMEATKYHTDPRKISHTNY MMSRINGGDYYYEYVKGIKTGTLDQAGRCLASLAYKDGYSYMLVTMGAPQQDEAGNNVF YNFIDHKNIYEWAFDNFEYTTLISGTEEVAEVKVEYGDGTDYVIVKPAEEFSRIWNTRI TSSSIHKVISLDYDVVAPVKAGDKLGTMELQYGGETLAVVDLVATKDVARDEQAAMMTV AKSFIGSDAFYDAIKYAAIFFLAYTVLIIILKIIVARQNKKNSRMYTPTKRRR" /locus_tag="LOCUS_2190" /note="WP_004454794.1 D-alanyl-D-alanine carboxypeptidase family protein (Clostridioides difficile) [pid:26.8%, q_cov:98.9%, s_cov:97.7%, Eval:8.3e-40]" /note="MGA_264" ORIGIN 1 gggatgagat cgcacatccc gaggacgacg agcgtttctg cggccgtggg ttgataaatg 61 tgaaggcact tgcaagctgt cgcggtgata taccatacga caaaacgctt ttctgcaatc 121 ggcttttggc aggggttctg ggtgaacgaa gggtgcccgt taaattcaaa agcatcgaac 181 gcgagcattc gggcgacagg ttggctgaat atgccgaaca ggttcgcgaa acagcgcaaa 241 gcctgtggca tatcctctcc cgaaaaatga agatatatca aaaagttgag gtgcttggca 301 atctggcata ttttttgaca cccgtaatca tcaccgcgct gttgccgctg agccttgcga 361 tgtatccccc tgccgcgggc ggagcgattt tagcggcact tgcgatgtat cttttgggtt 421 catgggcgcg aaaggggcgc ggagtgctgt gggaaatgct ccttgtgccg acatatgccg 481 cggtaacgat atttgccctc ataagagaag cctatcgcgt ggtgtttatg cgaaatacgt 541 taagcgtcgt gccgtttaag tatgggcggt ttgtcatcat cgcagagata atatcccttt 601 gcgcgcttcg ctcgccctct ggcgcggtga agctgattgc tttgatattc gcactgatgc 661 cgattaagct tttggcagaa atgatgccga aaaaagagcc tgatatgctt agctatcggc 721 gcaaaaaggc gctgaatgag caagcggaaa aggtttggaa gttttttgag gaatatgtca 781 ccgaagctga caacaacctt ccgcccgaga gcgtgcagtt ttcccccgac ggcatttccc 841 acgttgcttc ccctgcggta atcggggtat atctggtttc gtgcctggcg gcatatgaca 901 aaaagctgat cgacctttat gcttttacca cgcgcattga gcgcacgctt gaaaccgtct 961 caaaacttga aaccgccaac ggcaatttat atgacaaata tgacacacgc acgctcactc 1021 ccctttcgcg cacagtcagc gatagcgaga tcgggctatg gttgatctgc cttatctgcc 1081 tgaaagaagg aactgaagag cttcgcggaa catttgctcg gttggatgaa tgcgtgaacc 1141 aaattgagga gatcatcagc aaagctgacc tgtcgcaggt tgaaaaccgc tattactttt 1201 catcgggaag gcttgcatcg tttttggcgg tagcattaag gcaacgggac aagagccatt 1261 ggcaggagct ttttcgccca attcggcttc acggcttcaa acagggaatc gcctcgcaac 1321 agggcggaat cgacgagttt tttgtttcgg agctgttcat caagagcccc aaaggctcag 1381 caagcgagca aagccttgat ttttgcatat attgccacaa gcggttggca aaagagaaaa 1441 atatgcccta tggccttgcg cacagcggtt gcgccgagcg ggacgaaagt atgtgctatt 1501 tgacccgaca tcacggcaca aagctatgca ctgctgaaga aaccgctgag ggttacgttg 1561 tttcgcccta ttcgatatat ctttgcgcgc aaagggaccc gagcggagca tttgaagctc 1621 ttgataagct caaagattta ggaacagtcg gtcgatacgg attttatgaa gcatatgact 1681 tcgaccttaa tgaagttgtt aaatgctata attccttgca tttgggactt gagatgattg 1741 caataagcaa tctcaccgac ggcggaataa tgcaaaagcg taccatgcaa agcacgacag 1801 ttcaaggggc atacgaattg ttaaacgaag cgatgccgaa ggcggataaa agcgccgtta 1861 cggcaccaac agccccggaa aacaagtgtg aaagatacac tgatatttcc ctttccgagc 1921 caagggtcag gttttgccat tcaaatggct acgctctcat tatgaccgat tcggggaatt 1981 gcttcggcgt ttataaaggc gcgtttgttt atgaatcggg cgacgggatg aagattaaaa 2041 tcggtgagaa tgaatcgcta ccctatcttt gcgaatttgc gggaagtgaa tcaagatgct 2101 attgggataa cggcgggctt tcaagttgca taaaagcgtt tttgcacggc ggtttaccct 2161 gcgaaatgag aagcatctgc cttgagaaca actcggatga ggaaatatca acaagcgttc 2221 aaatatcctt tacgtcgggc agtataggcg gggtgtcgat gcgggcggat aatatcattt 2281 tgcggacggg gaaaatgtat atacaggcgg gatttttgga aaatatgggc tgcaaaataa 2341 tgcccgaaag aacgggcttt aaggtgaata taccgattgc tcttccgacg aggggaaaat 2401 ggcaggcgag catatatatt ctttgcgcgg atagtttaga tgggctgaag caaagcgcaa 2461 aaaggctcat tgccgagcag atcaagcccg ccctcgcgcc cgataaaagc ggcgaaacaa 2521 gaatggcaga aatcattctg cgggatattt ttacatcatc tgtttcaaac ccgtcagaaa 2581 gcgagaaatt gcaaaggcgg tttggatttg aaaaatcact tccgctggtt gcggtcatgc 2641 ttaataataa aaacgacagc caaaagctgt cgctgtattt gggggcattc aaggcattgt 2701 gcgaatcgga gctggaaatt aaccttgcgt ttatctatcg ggatgatgag gacagagcac 2761 actatcgggc gcttattgac gagctgaagc cgcgcggtct tgaagagtat atatattcac 2821 agattatgcc gattgatttg agcgattcgg acgacggaac acttgaagaa attcactcgg 2881 tttccgacca cattgcaaag gacagcattc tgtgaacaaa taaaaagaga aggcccatat 2941 gcgttgtgcc cttagggcgc aaacggattt atatcatatc gcatttgaac atcagcgaaa 3001 aatatatcgc aataaaaata ggacaaagag ctgataaagc tcttcgtcct ctcatttttt 3061 atcttcttct cttagtggga gtatacatac gcgagttctt tttgttctga cgtgcaacaa 3121 taattttaag gatgattatc agtacagtat acgcaagaaa aaatattgcc gcatacttaa 3181 ttgcatcata gaatgcatcg cttccgatga agctcttcgc aactgtcatc attgccgctt 3241 gctcatccct tgcaacatcc ttggtcgcaa caagatcaac taccgccaat gtctctccgc 3301 catattgaag ctccattgtt cccagcttat cacctgcttt aacgggtgca acaacgtcat 3361 aatcaaggga gatgaccttg tggatcgagc tgcttgtaat tcttgtgttc caaattcttg 3421 aaaactcctc ggcgggcttg acgattacat aatcggtgcc atcgccatac tcgaccttga 3481 cctcggcaac ctcttcggtg ccgctgataa gggtcgtata ctcgaaattg tcaaatgccc 3541 attcatagat gttcttgtgg tcgatgaagt tatagaatac attatttccc gcttcatcct 3601 gctggggtgc gcccatggtt acaagcatat agctgtagcc gtccttatat gccaaggatg 3661 ccaagcatct tcccgcctgg tcaagggtac ctgttttaat gcccttgacg tattcgtaat 3721 aatagtcacc gccgttgatg cgggacatca tatagttggt gtggcttatc tttctcggat 3781 ctgtatgata cttggttgct tccatagtgt attcatttga gcaggagatt tcctcaaaca 3841 aaggcaagct caaagcatat tcaacgatct tcgccatatc gcgtgcggtg gtatagtggt 3901 tttcccaaaa aaggccgtga gaattggtga agtgggtgtc ttcgcatcca agctcctccg 3961 ccttgatgtt catcatttcg gcaaaggcct caaggcttcc cgccacatta tatgcaatta 4021 tatttgccgc ttcgcaggca gaacggagca tcaaagcata aagcaggtct ttatatgata 4081 ccttttcgcc cagtcggata tcggcatttg aacagcctgt catatataac tcatcgaagc 4141 aagcggctcc gcccgaaaca tatgtagttg acagctcggc gatattgtcc tcatattttt 4201 caatgagtag caccgcagtc ataattttgg tcagcgatgc ggggacaagc tgtttgtcgg 4261 cgttcttttc atatatgacc tcacctgtat cgaggttgat taaaagtgcc gcctcggaat 4321 atacctcgaa gtcggggtta aagctgaccg cgccgacatt ggcggtaagg gtcactattg 4381 caaatatcaa agttattatg aatgtaagct ttcgcatggg atttcctctc aatcaaaggg 4441 atttatctga attatacagc cttatacgcc tgatctcaac caagtttggc ttgaagtttt 4501 taagcaaccg acggttgaag gcaaacaaag ctgacaaaaa tctgctatgg aatcagtata 4561 gcagattttt tgtcggttgc aaaggggtaa agggttaata ttttgttaca aattgattag 4621 atgggtgaag cagaataggg gagaccctgc gtggtcgccc ctacggtgca cccacataga 4681 ggggccccct gcttttttgc ctagccccaa ttcggttcct gcaaaaacac cccatgccat 4741 aaggcatagg gtgtttttag tcattatgcg ttttccgact tgaagtattt ttccagcggt 4801 ttatagatca aaacagctac agcaaccgtg atgaccgttt cggccgccat ataccaaccg 4861 ttataggcaa gcgagtaaac gatcggggtc ataccgtatt cattggacca caatacatcc 4921 catatccacg caccggttac aacgtggcaa agatatctca ttaaaaatgt tgcacagatg 4981 cccacaacaa cggcgcgtct tgttttgccg aagaatttct cggaaaggga gcttaagccg 5041 atgaccatat atgccactac atagtcgagc aaaataattc cgatcgccat aatagcgctg 5101 gtggcatatg aaacattgtc aagtcccaaa acgatctgta aaaggctata tacagttgag 5161 cttaaaaagc cccatttcca gccgtaacgg tggctgatga gaattaac // LOCUS sequence036 5171 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence036 VERSION sequence036 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5171 /mol_type="genomic DNA" /organism="" /note="sequence036" CDS 1829..2674 /product="DegV family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948024.1" /transl_table=11 /codon_start=1 /translation="MSKIKITCDSTCDLTKELYEKYDISVMPLAVNLGDDLYRDGVDID GPMIFDYVAKTGILPKTSAVSIAEYTDFFKPWVDDGYEVIHINLSSGLSSCHQNACLAA EELGNIYVIDSLNLSSGSGHLAIAGAELAAEGFEAKEIAEKLNEMKTRLDVSFIIQELD YLHKGGRCSGVAAFGANLLKLRPCIEVVDGGMIVGKKYRGSTEKTIKEYIDGRLAGRED LQLNRIFLTHSHAPQEIVDKMLEYIKELQPFAEVIETVAGSTITSHCGKACLGVLFFKK " /locus_tag="LOCUS_2200" /note="WP_011948024.1 DegV family protein (Clostridium botulinum) [pid:36.6%, q_cov:99.6%, s_cov:99.3%, Eval:3.0e-41]" /note="MGA_267" CDS 3190..3417 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MVTLGTFFAFLGKMGLLMLGVFIIALLTPKLAAWIDKKRAESPSP YGDEPSPARVDDETSPDVSADDVKLGDKNS" /locus_tag="LOCUS_2210" /note="MGA_268" CDS 3452..4894 /product="proline--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004450718.1" /transl_table=11 /codon_start=1 /translation="MADNKKMVSSITSMDEDFAQWYTDICKKAELVEYTSVKGCMVIRP YGYAIWENMQKILDAKFKELGHENVCMPMFIPESLLNKEKDHVEGFAPEVAWVTHGGSE RLEERLCVRPTSETLFCEHYANIVHSYRDLPKLYNQWVSVVRWEKTTRPFLRSREFLWQ EGHTIHATAEEAIVETEQMLNVYADFCEQALAMPVVKGKKTESDKFAGAVATYAIEALM HDGKALQAGTSHYFGDGFAKAFDITFTDKNNTVQNPHQTSWGVTTRLIGAIIMTHGDNN GLVLPPPVAPIQVVIVPVAQHKEGVLEKANELYETLKAAGIRVKLDDSDNSPGWKYSEY EMRGVPVRIELGPRDIEENHCVAVSRHNREKTFLSLDGIADAIKAKLEDVRRGMYEKAL ANQNEKTYACTSIDEIKEMLEKNGDGFVKAMWCGEEACEDEVKALTGVGSRCIPFEQEE LSDKCVCCGKPAKHMVVWGKAY" /locus_tag="LOCUS_2220" /gene="proS" /EC_number="6.1.1.15" /note="WP_004450718.1 proline--tRNA ligase (Clostridium botulinum) [pid:66.0%, q_cov:100.0%, s_cov:100.0%, Eval:5.0e-192]" /note="MGA_269" ORIGIN 1 atccgactct atgcaagaac ggaatatgac gagatcgaca accgcttcag atatgaattc 61 ttccccgatg ctctcgattc caacggttca aagataacat catataacaa gctttcgctt 121 cgcacctgtg caaatgacgc gggatatctc tatatgcgtg atgatatgat aagcgatctt 181 gctcacgcaa cgggcgtcga tgcaaaatat tcccgtccgt gcgctgtatt cctcaacggt 241 gaatattatt gcttcgcttg ggtacagcag accttctcgg aagactggct tgagcataca 301 tatgcaattg agcaggccga atgggatatc ctcaagggct gtgaatatat gatctgggag 361 gacgccgaca acgatattgt tcaggcaact gccgattggc acgagatgta ttcttatgct 421 tataaggatt taaccgacga tgctgtctat gccgagcttt gcgagatgat cgacattgac 481 aacttcttaa cctattacgc tttgaactca tatcttggca acggcgactg gccgaacaac 541 aactggaagg tatatagata caaatcgggc accgcctatg agggacagta tccctgcgac 601 ggaaagtggc gctttatgct ctatgacacc gacttctgtc tgggtcttta cggcaacgat 661 gcttttagcc gccacgttgc aaacctcttt aaagaggaac atttcggtct gatgcccaac 721 gactgggtaa ttgatgttca cgatgacggt gagaagtatc agcgctccga tctgctgatc 781 tccctttgca ggcgtgaaga tgtcagagag cgcttccttt gcatattgag cgatatgatc 841 aactggcact attcggaaga tcgcgtttct gatcatcttg atttgtataa cgcactgcga 901 ctccacgaga tcattgaagc ttcaaacgtt ggcaaggcaa acatctggag catcaacagc 961 gagcttaaca atgtcagaga atatatgccc acccgcgcat atgccgtaag aagtcagatc 1021 aaggacgttt tccctgatta taccgaggta tattatgtat actgctcgcc cacagacggc 1081 gcgaccataa ccgtcaacac cgcaaatatc actcctgacg aggaatatat cttcggaggc 1141 tggtatttca agggtacaga ggtaatgctc acctgcgagc ttgcttatgg ctatgaattt 1201 gattattggg agatcaacgg cgaaaagatc tatgatatga ccactccttt gtccgatgag 1261 atatacggcg acaaggcaag catcgagctt tatgttcaca acaccgcaag cgagcttatc 1321 ctctccgagg tatgctataa gggctcaaca agcgactata tcgtcattaa gaaccccacc 1381 gaggaggata tcgttctcaa gaactatatg ctcagcgacg gaagctcata tttcaccgtt 1441 cctaccacga caattaaagc aggcggcgaa ttgaagattc tttgcaagaa ctattccaag 1501 gctgacgcca tcggcaaaat cgaatgcggt ttcaacctca aggaatttga aacggtatat 1561 ctttacaacg gttcgggcga ggtcatctgc gaaatgtatc tgcccgacgg ctcggacaac 1621 accgttcgca agttcaatga gctaacaagc acatattatg aagaaaccaa tgaaacaaaa 1681 acccgtattc ttgaagcaga acttccgcaa agaggcggtt ggggaggctg gggctggtaa 1741 aaagccttta caaaccgttt aaaagatgtt aaaatggttg agcactcaac aaattttgtt 1801 agaaaatcca tttttaggag tagtttatat gtctaaaatt aaaatcacct gcgactctac 1861 ctgcgactta acaaaggaac tttacgaaaa gtatgatatt tccgtaatgc ctttggcggt 1921 aaatttgggc gatgaccttt accgtgacgg tgtagatatt gacggcccca tgatctttga 1981 ctatgtcgca aagaccggca ttttgcccaa gacctcggca gtatccattg cggaatatac 2041 cgacttcttc aagccttggg tagacgatgg gtatgaagtg atccatatca acctttcctc 2101 gggactttcc tcttgccatc agaacgcttg tctggcggct gaagagcttg gaaacattta 2161 tgttattgac agcttgaatc tttcctccgg ctcgggacac cttgcaattg caggcgctga 2221 gcttgcggcc gaagggtttg aagctaagga aattgcagaa aagctcaacg aaatgaagac 2281 aagactcgat gtcagcttca tcattcagga gcttgactat ttgcacaagg gcggcagatg 2341 ctcgggcgtt gcggcattcg gcgcaaacct tttgaagctc agaccttgca ttgaagttgt 2401 tgacggcgga atgatcgtcg gcaagaaata tcgcggttcc accgaaaaga ccatcaagga 2461 atatattgac ggcagacttg cgggaagaga ggatcttcag ctcaacagaa tcttcctgac 2521 acacagccac gctccccagg agatcgtaga taagatgctt gaatatatta aggagcttca 2581 gcccttcgcg gaagtgatcg aaaccgttgc cggctcgaca attaccagcc attgcggaaa 2641 agcttgcctg ggcgtgctgt tctttaaaaa gtgatgatca aacaaaatcc cttgctcgaa 2701 tgagcagggg attttttgat atgagcggag cgccgtctgc gggtgcgttc cgtaggaaca 2761 gtaccgcagg tggcgcgtag cgggggcggc cctgtgtggt cgcccgttaa tgtcccgcag 2821 ggacaattcg tgtcacgcaa gtgactattc atgacagctt gcttgtttat tcaattactt 2881 gcaggggcag gcctgtgtgc ctgcccgttt ttatcgaggg aaaaccgcag gaatccttta 2941 catatatgac aaagaatgaa ttgcaactgc gttgcatgaa tagacgaggt gtgtcataaa 3001 attgtttgct ttgcaaacat gaattgcctt cagcattata aagggcgggc ctgtgtgccc 3061 gccttgtttg tcgcgggcga ccacataggg tcacccctat atgcttacaa cattttccct 3121 tcaccccttg caatcccaat ttatctgtga tattatgaaa tgtaacgaaa ttgcggaagg 3181 gagagatttt tggtgacatt gggcacattt tttgcctttt tgggcaaaat gggtcttctg 3241 atgcttggcg tatttataat cgcgctgctc actcccaagc ttgcggcttg gatagataaa 3301 aaacgcgcag aaagcccctc tccttacggc gatgagccga gtcccgcaag ggtggatgat 3361 gaaacttcac ccgacgtcag cgccgatgac gtaaaattag gcgataagaa cagttagatc 3421 aattacataa atataaaatg gagagataat tatggctgat aacaaaaaaa tggtttcctc 3481 tatcacctca atggatgagg actttgccca gtggtatacc gacatctgca aaaaggcaga 3541 gctggttgaa tatacctccg tcaagggctg tatggtaatc cgcccctatg gctatgctat 3601 ctgggaaaat atgcagaaga ttttggatgc caagttcaag gagctcggac acgaaaacgt 3661 atgtatgccg atgttcattc ccgagagctt gcttaacaag gaaaaggacc acgttgaggg 3721 ctttgctccc gaggtcgcct gggtaaccca cggcggaagc gaacgccttg aagagcgtct 3781 ttgcgttcgc cccacatctg agaccctttt ctgcgagcat tatgcaaata ttgttcattc 3841 ctaccgcgac ctgcccaagc tttataacca gtgggtaagc gttgtaagat gggaaaagac 3901 cacaagaccc ttcctcagat cccgcgaatt cctctggcag gaaggccaca ccattcacgc 3961 aactgccgaa gaagcaattg ttgaaaccga gcagatgctt aatgtatatg ccgacttctg 4021 cgagcaggca cttgcaatgc ccgttgttaa gggcaagaag accgagtcgg ataagtttgc 4081 aggcgcagtt gcaacttatg caattgaagc actcatgcac gacggtaagg ctttgcaggc 4141 cggcacatcc cactatttcg gtgacggctt cgcaaaggca tttgacatca cctttaccga 4201 caagaacaac accgttcaga accctcacca gacatcctgg ggagttacca cccgtcttat 4261 cggcgcgatc atcatgaccc acggcgacaa caacggcctt gttttgcccc cgccggttgc 4321 acctatccag gttgttatcg ttcctgttgc tcagcataag gaaggcgtgc ttgaaaaggc 4381 taacgagctt tatgaaaccc tcaaggccgc aggaatcaga gttaagctgg acgattctga 4441 caattctccc ggctggaaat attcggaata tgagatgcgc ggcgtgcccg taagaatcga 4501 gctcggcccc cgcgatatcg aagaaaacca ctgtgtagca gtatcccgcc acaaccgcga 4561 aaagaccttc ctttccttgg acggtattgc agatgcaatt aaggctaagc ttgaggatgt 4621 aagacgcgga atgtatgaaa aggcgttggc aaaccagaac gaaaagactt acgcttgcac 4681 atccatcgac gagatcaagg aaatgcttga aaagaacggc gacggctttg ttaaggcaat 4741 gtggtgcggc gaagaggctt gtgaggacga agttaaggca cttacaggcg tcggctcaag 4801 atgcattcca tttgaacagg aagaactcag cgacaaatgt gtatgctgcg gaaagcccgc 4861 caagcatatg gtcgtttggg gaaaagctta ttaaaaatca agctcctatc cgaaaggatg 4921 ggagcttttg ctttataggg gcgaccctat gtggtcgccc gcggggcagg cacacaggcc 4981 tgcccctttt taatgaataa tgaatgatga ataatgaatg atgaataatg aatgatgaat 5041 aatgaataat attgttaaaa aagcacctct tcggggtgtt tttttaaatg gtgctttctc 5101 cccgcgctcc gcgccacctg cggcactgtt ccttcggaac gcgcccgcag acggcgctcc 5161 gctgcgtagc g // LOCUS sequence037 5049 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence037 VERSION sequence037 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5049 /mol_type="genomic DNA" /organism="" /note="sequence037" misc_feature <1..1183 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010890705.1:spore germination protein" /note="WP_010890705.1 spore germination protein (Clostridium) [pid:39.2%, q_cov:94.7%, s_cov:69.8%, Eval:2.8e-81, partial hit]" /note="MGA_270" /locus_tag="LOCUS_2230" CDS 1173..2219 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKTKSRISPWQVFVLLMLGRIMYSMLYQARNFTSGTPMMLGQLLA TLIEAIIAIPLLVFLSYGEPLAESISSKSAVQAIIKGGFAIYFTALFSMMLADFAAFMH NQFSVVGSPITVIIILALASAYCASLGLEGIARAAGIVFWCVIILVVSMALLSEGEPNW LYLQPMTKGDIATMLDYMNESRGSSWWLPMLASISGSLKKDSWRAGIWYLVGKLVFVEL LIFAVTVILWRFVNVPGYPILALGAYAKTDFVQRFDAVNMFVWTLNCVIVGGSYLYSSS GVGKKKRKICIWLFALAAVALAAIEYHLEVPLQSGLAVAFRGWGTLILGAMLPLIAIIM IKRRRKCA" /locus_tag="LOCUS_2240" /note="MGA_271" CDS 2210..2653 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRLASVLLAIMLALTGCSYVSEVEQRIMVYALGVDREEDGNVSVS YQVFDPSGDKGSSPVGADEKNIKIIEAKGKSLFECEKKVELMTGKEIFVGDTELIVLGD SIKNEDIEKLMSYFRNSKDIYLGTDMIFSSGKAIEVIDVSKSK" /locus_tag="LOCUS_2250" /note="MGA_272" CDS complement(2581..2781) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIGITIEFDPLISLVTSITREEYALDDDTAAESISPKLWGSTPYL LLLTSMTSIALPDEKIISVPR" /locus_tag="LOCUS_2260" /note="MGA_273" CDS 2765..3295 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MVIPIMTVEKDEEGQPYPKGVMTNMLLVDGRGVDTLNEDDAKGAR LLRGNAKMLSLNIPEGEYESAAVVKIKKTKRSIEIGQNGYPVVTVRIEGEISITENPSD TDREVLRLAAQKELVWFCDLAYLKAAKNAADIFEIGLMLQKYQPRYYEKMRQDFENMLE NTEFQVFITLQTR" /locus_tag="LOCUS_2270" /note="MGA_274" CDS 3394..3750 /product="Asp23/Gls24 family envelope stress response protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003431114.1" /transl_table=11 /codon_start=1 /translation="MVKIDNHLGTIEITSAYLTTLIGHTVTSCFGVVRMNPAGARQGVK TNLLKTESIDNGVKVRFAKDTNKLVIDLHISVTYGINVSAITDSIINKVRYVVEKETGI EVKKINVFIDGMES" /locus_tag="LOCUS_2280" /note="WP_003431114.1 Asp23/Gls24 family envelope stress response protein (Clostridioides difficile) [pid:31.6%, q_cov:96.6%, s_cov:94.8%, Eval:5.4e-12]" /note="MGA_275" ORIGIN 1 agagggagtt cagcttcttt gcggcggctt tgcgttaatt ttggtgcatg gcgtcagccg 61 cggcgtttcc gttgcggcac agggctattc aattcgcgcc gtttctccgc ccgactccga 121 atcggacgtt atgggcaccc gcgaagcttt gagcgacaac atccgaacaa gcatctcctt 181 aattagacgg agagttaaaa gcccgcgcct gcggtttgaa tttgtgcggg caggaaagct 241 ctcggacatt gagctttgct tagtatatat cgacggcaag accccaaaga agctgaaaaa 301 cgaggtgaaa tcacggcttg aaaaaatcaa gctggagctg attttgacca gcggaaacat 361 aattcccttc atctctgaaa acggcgggtc ctttttctcg ggagcatcga caacagagcg 421 ccccgatgtt ctggcggcaa aggtgaatga ggggcgaatc gcggtgctta ttgacggaat 481 tccctatgcg gtggtgtatc catcgctatt catcgagaat ttccagacgg tggatgacta 541 ctctcaaaaa ccgtattatg tggcatatat gcgagtaatc cgctatttgg cgtttatcat 601 ttcagcactt ctgcccgggg catatgttgc cgcggcgacc catcatccgg aggtattatc 661 aaggctgtta ctaattaacc tcatcgccag cgaggagctg acgccgtatc ccttgatcgt 721 tgagatgctt atcgtgatcg tgatgtttga aattctgcgg gaggcgggtc tgcggcttcc 781 caaagtcatc ggtggggcgg tgtcaattgt cgggggactt gtaatcggcg atgccgctgt 841 cacaagcggg ttgattcccg caccgctgtt aattatcatc ggcataaccg caacttgttc 901 ctttgcgctt ccctcgcttg gacagcagat ggcggtaata agattgataa atgttgtttt 961 gggcgggctg acagggcttt tcggcattgc agttttttcg gcgatagtgt ttgtcaatgc 1021 ctgcgtcacc gatgccttcg gaattccgta cacagcaccc ataacgccgt tcacaaaaag 1081 cgcaatgagg gatgttttgg tgagaatggg atttttaaag atgcaacaaa accatccgac 1141 ggttgaagag cttaacggct cgggagggga aaatgaaaac taaatcccga ataagcccgt 1201 ggcaggtgtt tgtgctttta atgctgggca gaataatgta ttcgatgctg tatcaggcgc 1261 ggaattttac ctcgggaaca ccgatgatgc tcggtcagct tttggcaaca ctcatcgaag 1321 cgataattgc aattcctctg ctggtgtttt tgtcatatgg cgagcctttg gcggagagca 1381 taagctcaaa gtctgccgtt caggcaataa ttaaaggcgg atttgcaata tatttcaccg 1441 ctttgttttc aatgatgctt gcagactttg ccgcttttat gcataaccag ttttccgtgg 1501 tcggctcacc cataacggtg ataataattc tggcgctcgc ttcggcatat tgcgcttcgc 1561 ttggacttga gggcatagct cgtgcggcgg gaatcgtttt ctggtgtgtt ataattttag 1621 ttgtgtcgat ggccctgctc agcgagggcg aaccaaattg gctatatctt cagccgatga 1681 ccaaaggaga tattgcaacg atgcttgatt atatgaatga gagccgaggt tcaagctggt 1741 ggcttccgat gttggcatca atttcaggca gcctcaaaaa ggattcctgg agggcgggaa 1801 tttggtatct tgtcggcaag ctggtgtttg ttgagctttt gatatttgcg gtgacggtaa 1861 ttttgtggcg gtttgtgaac gttccgggat atcccattct cgcgttgggg gcatacgcaa 1921 aaaccgactt tgttcagcgc ttcgacgcgg ttaatatgtt tgtgtggact ctcaactgtg 1981 tgatcgtcgg cggatcatat ctgtattcat catcaggcgt cggcaagaaa aagcgaaaga 2041 tctgcatatg gctgtttgcc ttggcggcgg tggcacttgc ggcaattgaa tatcaccttg 2101 aagttccgct tcaaagcggt cttgctgttg cattcagagg atggggaacg ctgatcctcg 2161 gggcgatgct gcccctgatt gcaataataa tgattaaaag gagaagaaaa tgcgcttagc 2221 ttcggttttg cttgcaatta tgcttgccct gacaggctgt tcatatgttt cggaggtcga 2281 acagcgaata atggtctatg ccctcggggt cgaccgagaa gaggatggca acgtcagcgt 2341 gtcatatcag gtttttgacc cctcggggga taaaggttca tcgcctgttg gcgcagatga 2401 aaaaaacatc aaaattattg aagcaaaggg taaaagcctc tttgaatgcg aaaagaaggt 2461 tgagcttatg acaggcaagg agatcttcgt cggagatacc gagctgatag ttcttggcga 2521 cagcattaaa aatgaggaca ttgaaaagtt gatgtcatat tttcgcaact caaaggatat 2581 ttatctcggc accgatatga ttttctcgtc gggcaaagcg atagaggtca tagatgtcag 2641 caaaagcaaa taaggtgtgg acccccagag cttggggctg atgctctcgg cggcggtgtc 2701 gtcgtcaagg gcatattcct cgcgggtgat tgaagttacc aacgaaatga gcggatcaaa 2761 ctcgatggta attccgatca tgaccgttga aaaggacgaa gagggccagc cttatcccaa 2821 gggtgtgatg accaatatgc ttcttgttga cggcagggga gttgacaccc tcaatgagga 2881 cgatgccaag ggcgcgcggc ttttgcgggg caatgcaaaa atgctgtcgc tgaatattcc 2941 cgagggcgaa tatgaaagcg cggcggtggt gaaaattaaa aagaccaaac ggagtattga 3001 aatcgggcag aatgggtatc ccgtggtgac ggtgagaatt gaaggggaga tatcaataac 3061 ggaaaaccca tcggataccg accgcgaggt tttgcggctg gcggcgcaga aggaattggt 3121 gtggttttgc gatttagcat acctcaaagc cgccaaaaat gccgcagata tctttgaaat 3181 cgggttgatg cttcaaaaat atcaaccgag atactatgaa aaaatgcgtc aagattttga 3241 aaatatgctc gaaaacacag aatttcaggt atttatcaca cttcaaacac gttagatgga 3301 attattttgc ttgcatttta atgaggaata tgatatgata cattagataa cgtatgatta 3361 caaattaaat ctcgacctga aaggggaatg agcatggtaa aaattgataa ccacctcggc 3421 accattgaaa taacctctgc ttatttgaca acgcttatcg gccatacggt cacaagctgt 3481 ttcggcgttg taagaatgaa ccctgccggc gcaagacagg gcgttaagac aaatcttttg 3541 aaaaccgaat caattgacaa cggcgtcaag gtaagattcg caaaggacac aaacaagctt 3601 gtaattgacc ttcacatttc cgtcacctat ggaatcaatg tttccgcaat caccgacagc 3661 atcatcaaca aagttagata tgttgttgaa aaggaaacag gcattgaagt taagaagatc 3721 aacgttttca tcgacggaat ggaatcataa ttggaggatt aaattgacat gatcagcggt 3781 aatattctgc gcgacgcatt catcagcggc gcaaatgtaa tatcaaacaa gaaaaagagc 3841 attgacgagc tcaatgtttt tcctgtaccc gacggagata ccggcacaaa tatgtccatg 3901 actctttcaa acgcaaagaa agagcttgtt cttatggacg atgacgtaac agttgcacag 3961 gtttcaaaga caatggcatc tgctttgctc agaggcgcaa gaggaaactc gggcgttatt 4021 acaagccttt tgttcaaggg atttgacaag gctttgaagg acaagaagac cgcaaccaca 4081 gctgacattg cttcggcact tgaagttggt gttgagcgtg catataaagc agttatgaag 4141 cccactgagg gtaccatttt gactgttgca agactcgcca gcgttaaggc aagagagatc 4201 tgcgacgagg ttacagatgt tgcagtattc tgggatatgg tctgcgaaga ggctgaaaga 4261 gttttggata ccactcccga ccttttgccc actttgaaga aggcaggcgt tgttgacgca 4321 ggcggcaagg gcctttgcga aatgtggcgc gcgatgggca aggtatttaa gggcgaaggc 4381 attgttgccg atgaagctgc cgcagttaag ggctcggaac ctgtaacaat tgaaacattt 4441 gcatctgtag ttggtgaatt cgacgatgag atcaccttta catactgcac cgagtacatc 4501 gttaagaagc acgagaacgc tgaggattcc ctcaagctca gagcttacct tgaaacgatc 4561 ggcgactgcg ttgtggttgt tgaggatgat gagatcatta aggttcatgt tcatacaaat 4621 aaccccggct tggcaattga aaaggctctt gaatttggtt caatgacatt gcccaaggtt 4681 gaaaatatga gatatcagca cgaggccaag cagaaggaat ctaaggttac agtttcctct 4741 gccgataagg catatgtgag cgttgctccc gaaaagcagt tcggatttgt tgcagttgcc 4801 gcaggcgacg gcgttgaaga actcttcaag gatgcaggtg ctgattgtat cgtcaagggc 4861 ggacagacaa tgaacccctc gactcaggat attttggctg ctgtacagtc ctgccccgct 4921 gagatcgttt tcgttttgcc caacaacaag aatatcatca tggctgccga gcaggtcaat 4981 gctctgaccc ccaagaatgt ggtggtcatc cccagcaaga ccgttcctca gggcattacc 5041 gccatgctg // LOCUS sequence038 5034 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence038 VERSION sequence038 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5034 /mol_type="genomic DNA" /organism="" /note="sequence038" CDS 53..580 /product="30S ribosomal protein S5" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393920.1" /transl_table=11 /codon_start=1 /translation="MARFDAPKTQEQSEFKEKVVAINRVSKTVKGGRIMKFAALVVVGD GNGTVGFGIGKSGEVPDAIRKGIEDARKNLIKVSLKGTTIPREIVGKYGAGEVLMRPAA KGTGVIAGGPVRQVLDAVGIKDIRTKSLRSNNPYNVVRATFNGLENLKSAEEVAAKRGK TVKEIFAEGGAK" /locus_tag="LOCUS_2290" /gene="rpsE" /note="WP_011393920.1 30S ribosomal protein S5 (Moorella thermoacetica) [pid:66.1%, q_cov:96.0%, s_cov:98.8%, Eval:1.3e-54]" /note="MGA_277" CDS 580..759 /product="50S ribosomal protein L30" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357637.1" /transl_table=11 /codon_start=1 /translation="MATIKIELVKSLNGRLKDQIATAHALGLRKIGDVTVQPDNACTKG KINKIVHLIKVTEA" /locus_tag="LOCUS_2300" /gene="rpmD" /note="WP_003357637.1 50S ribosomal protein L30 (Clostridium) [pid:54.2%, q_cov:100.0%, s_cov:100.0%, Eval:6.9e-10]" /note="MGA_278" CDS 779..1219 /product="50S ribosomal protein L15" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357513.1" /transl_table=11 /codon_start=1 /translation="MKLHDLAPVEGSNKGSKRVGRGHGSGWGKTAGKGHKGQNARSGGG VRPGFEGGQTRLARRIPKRGFNNIFATNYTAINVSSLEKFVDGTVVDTELLMAAGIVKD PADGIKVLGNGELTKKLTVKAAAFSASAKEKIEKAGGEAQVV" /locus_tag="LOCUS_2310" /gene="rplO" /note="WP_003357513.1 50S ribosomal protein L15 (Clostridium) [pid:61.0%, q_cov:100.0%, s_cov:100.0%, Eval:2.0e-45]" /note="MGA_279" CDS 1220..2515 /product="preprotein translocase subunit SecY" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005810127.1" /transl_table=11 /codon_start=1 /translation="MFNTLRNAWKVADIRKKLFYTLFIIVLYRLGGYIPVPFLDATVIG EMISGSNNIFSYLNVLSGGTFSKATLLCLSISPYINAQIIIQLLTYAIPALERLAKEGE EGRKKISNITKWSTLAIALVQSYAYYITLRNEGALVYTTGFEKWLSMFVIIACFTAGAM LIIWLGGKIDQHGIGNGISMLLFAGIVADLPKSFGSTFATLIDTGSVGYILLIPVIVII FVLIIGFVVFMDNAERRLPIQYAKRVVGRKMYGGQSTYLPIKVAMAGVLPIIFAISFLS IPSTIVMFTGEPEAGTFWHGFLTLFSYTHPVYAILYLILIIAFSYFYISMQYNPVEIAN NLRQNNGGIPGLRPGKPTSDYIQRVVNKLTLVGAIFLGIIALLPIVFAQITGIGNLALG GTSILIVVNVALETVRQIESQMMMRHHKGFLE" /locus_tag="LOCUS_2320" /gene="secY" /note="WP_005810127.1 preprotein translocase subunit SecY (Desulfitobacterium hafniense) [pid:43.9%, q_cov:99.5%, s_cov:99.3%, Eval:1.1e-102]" /note="MGA_280" CDS 2591..3223 /product="adenylate kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005649108.1" /transl_table=11 /codon_start=1 /translation="MNLILLGAPGAGKGTQAEVICNAKGIPAISTGNILREAVKNGTPM GLEAKTFMDSGALVPDEVVIGILKDRIAQDDCKNGFILDGFPRTVPQAQALDRMGVTID KVIEIYVPDETIAARLSGRRVCEKCGNSYHVEFKPTKVEGICDACGGNVVIRKDDEPAT VLDRLSVYHEKTAPLKDFYSAQGKLTTVIGQEELAETSRLTLEAVEA" /locus_tag="LOCUS_2330" /gene="adk" /EC_number="2.7.4.3" /note="WP_005649108.1 adenylate kinase (Haemophilus) [pid:59.9%, q_cov:89.0%, s_cov:87.4%, Eval:1.0e-60]" /note="MGA_281" CDS 3230..3982 /product="type I methionyl aminopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003421130.1" /transl_table=11 /codon_start=1 /translation="MIIIKTSNELTKMRKAGLITGGALVAAEKAIRPGMSTLELDKVIK NYIISHGAKPSFLGYGGFPASACISVNDTVIHGIPTAGEKLKEGDIVSVDVVAYIDGYH GDSAKTFAVGEISREAKALMASTEESLYVAINMAKPGVRIGDISAAIQEYNEKRGYSVV REFVGHGVGANLHEDPEVPNFGRAGHGPRLMPGMVIAIEPMINAGRPHVKILNDGWTVK TNDKSLSAHFEHTIAITSSGAIILTQPE" /locus_tag="LOCUS_2340" /gene="map" /EC_number="3.4.11.18" /note="WP_003421130.1 type I methionyl aminopeptidase (Clostridioides) [pid:59.0%, q_cov:99.2%, s_cov:99.6%, Eval:3.1e-76]" /note="MGA_282" CDS 3995..4273 /product="RNA-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966390.1" /transl_table=11 /codon_start=1 /translation="MNIVKGSVVKSLAGRDQGRYYVAVATEDRLVYIADGRERKLEKPK AKNPRHISPTCMVVSLEGMTNKKLKKLLDELITQGSPEAGCDRTRNI" /locus_tag="LOCUS_2350" /note="WP_010966390.1 RNA-binding protein (Clostridium) [pid:39.0%, q_cov:79.3%, s_cov:89.1%, Eval:9.3e-07]" /note="MGA_283" CDS 4287..4505 /product="translation initiation factor IF-1" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357316.1" /transl_table=11 /codon_start=1 /translation="MSKEDVIELEGTVLEALPNAMFQVELANGHKILAHVSGKLRMNYI RIVPGDKVTVEMSPYDLTKGRITWRSK" /locus_tag="LOCUS_2360" /gene="infA" /note="WP_003357316.1 translation initiation factor IF-1 (Clostridium) [pid:80.6%, q_cov:100.0%, s_cov:100.0%, Eval:3.5e-30]" /note="MGA_284" ORIGIN 1 gccgaaggcg cccgtgaggg cggcctcaag ttctaaggag gaggagaaga ctttggctag 61 atttgacgca cccaagactc aggaacagtc tgagttcaaa gaaaaggttg tcgccattaa 121 ccgtgtatct aagacagtta agggcggccg tattatgaag tttgctgcac tcgttgtagt 181 aggcgacggc aacggcactg tcggattcgg tatcggtaag tccggcgaag ttccggacgc 241 tatcagaaag ggtatcgaag acgcaagaaa gaaccttatc aaagtttcac ttaagggaac 301 aactatccct cgcgaaatcg tcggtaagta cggcgcaggc gaagtcctca tgagacccgc 361 tgcaaagggt accggtgtta tcgccggcgg tcctgtacgt caggtactcg acgctgtcgg 421 catcaaggat atcagaacga agtcccttcg ttccaacaat ccttacaatg tagttagagc 481 tacattcaac ggacttgaaa atcttaagag cgctgaagaa gttgctgcta agagaggcaa 541 gaccgtaaag gagatctttg cagaaggagg agctaagtaa tggcaacaat taagattgaa 601 ttggtcaaga gcctcaacgg cagacttaag gaccagattg ctactgcaca cgctctcggt 661 cttcgcaaga tcggcgacgt taccgttcag ccggataacg cttgcacaaa gggtaaaatc 721 aacaagatcg tacacctgat caaagttacc gaagcataag acaaggaggt gcgaataaat 781 gaaattgcat gatttggcac ctgttgaagg ctccaacaag ggctccaaga gagtcggccg 841 cggacacggt tcaggctggg gcaaaactgc aggtaaagga cacaaaggtc agaatgctcg 901 ttcaggcggt ggcgtaagac ccggctttga aggcggacag accagactcg caagaagaat 961 ccctaagaga ggattcaaca acatcttcgc aaccaattat acagcaatca acgtttcttc 1021 ccttgaaaag ttcgttgacg gaacagtagt cgacaccgaa cttcttatgg cagcaggcat 1081 cgtaaaggat cccgctgacg gtatcaaggt tttgggcaac ggcgaactca ccaaaaagct 1141 tactgttaag gcagctgctt tctctgcttc cgctaaggaa aagattgaga aggcaggcgg 1201 agaggcacag gtggtctaaa tgtttaatac attgagaaac gcctggaaag ttgccgatat 1261 tagaaagaaa ctgttttata cactgtttat aattgttctt tacagattgg gcggatacat 1321 tcccgtcccc ttcctggatg caaccgtcat cggcgagatg atctcgggaa gtaacaacat 1381 tttcagctat ctgaacgttc tctcgggtgg tacattctct aaggcaacct tgctttgctt 1441 gtccatctcc ccctacatta acgctcagat catcattcag cttctgacct acgctattcc 1501 tgcactcgaa agacttgcta aggaaggcga agaaggcaga aagaagatca gcaacatcac 1561 caagtggagt acacttgcaa ttgcacttgt tcagtcctat gcatactaca tcaccctcag 1621 aaacgaaggc gctttggtat acaccaccgg atttgaaaag tggctctcga tgttcgttat 1681 catcgcttgc ttcacagcag gcgctatgct cataatctgg ctcggcggca agatcgacca 1741 gcacggtatc ggaaacggta tctcaatgct cctctttgcc ggtatcgtag cagacttgcc 1801 caagtccttc ggttccactt ttgcgacact gatcgacacc ggctctgttg gatacattct 1861 tctcatcccc gtaatcgtca tcatctttgt tttgatcatc ggcttcgttg tcttcatgga 1921 taacgctgag agaagacttc ccatccagta cgctaagaga gttgtcggca gaaagatgta 1981 cggcggccag tccacctacc ttcccatcaa ggtagcaatg gcaggcgttt tgcccatcat 2041 cttcgcaatt agctttttgt cgattccttc caccattgta atgttcaccg gcgaacccga 2101 agcaggaaca ttctggcacg gattcctcac attgttcagc tacactcacc ctgtatacgc 2161 aattctctat ctcattctca tcattgcatt cagctacttc tacatttcaa tgcagtacaa 2221 ccctgttgag attgcaaaca atctgcgtca gaacaacggc ggtatccccg gacttcgtcc 2281 cggtaagccc acttccgact acattcagag agttgttaac aagctcaccc ttgttggcgc 2341 aatcttcttg ggcataatcg ctttgcttcc tatcgtgttt gcacagatta ccggtatcgg 2401 caacttggca ctcggcggaa cttcgatcct catcgttgta aacgttgcac ttgaaactgt 2461 acgtcagatt gaatctcaga tgatgatgcg tcatcataag ggcttccttg aataatatat 2521 tcattgaggc gtgttatgtt cggcggcaag cctttggggc ttccgtcgga ccctgaaaag 2581 gagcttgaat atgaacctga ttttgttagg cgctcccggt gccggaaaag gcacacaggc 2641 agaggtaatt tgcaacgcca agggcattcc tgcaatctca accggcaaca ttttgcgtga 2701 agccgttaag aacggaactc ccatgggact tgaagcaaag acctttatgg attcgggcgc 2761 attagttccc gacgaagtcg ttatcggcat tctcaaggac agaatcgctc aggacgactg 2821 caaaaacgga tttattctcg acggtttccc cagaactgta ccccaggcgc aggctttgga 2881 cagaatgggt gtcaccatcg acaaggttat cgagatctat gttcccgatg aaaccatcgc 2941 cgcaagactc tctggaagaa gagtctgcga aaagtgcggc aactcctatc atgtggaatt 3001 caagcccaca aaggtagagg gcatctgcga tgcctgcggc ggcaacgttg tgatccgcaa 3061 ggacgacgag cccgcaacag tcctcgatag actcagcgtt tatcacgaga agactgctcc 3121 tttaaaggac ttctactccg ctcagggtaa gcttacaacc gtaatcggac aggaagagct 3181 cgctgaaacc agccgcttga cccttgaagc agttgaggcg taagcttaaa tgataattat 3241 taaaacttcc aacgaactca cgaagatgcg caaagcggga cttattacag gcggtgcatt 3301 agtcgctgcc gaaaaagcga tacgccccgg aatgagcact ctggagctgg ataaggtgat 3361 aaaaaactac atcatctctc acggcgccaa gccctcgttc ttaggatatg gcggtttccc 3421 cgcttccgcg tgtatctccg ttaacgacac cgttatccac ggtatcccca ccgcaggcga 3481 aaagctcaag gagggtgaca tcgtgtcggt agatgtcgtc gcatatatcg acggttatca 3541 cggcgactcg gcaaagacat ttgccgtcgg cgagataagc cgggaagcga aagctttaat 3601 ggcttcaacc gaagaaagcc tatatgttgc catcaatatg gctaaaccgg gcgtgcggat 3661 cggagatatt tccgcggcaa ttcaggagta taacgaaaaa agaggttact cggtagtcag 3721 ggaatttgtc ggtcacggtg tcggcgcaaa ccttcacgaa gaccccgagg ttcccaactt 3781 cggccgagca ggccacggtc cgcgcttaat gccgggcatg gtaattgcaa ttgagccgat 3841 gataaatgcg ggcagaccgc atgttaagat ccttaacgac ggctggaccg ttaaaactaa 3901 cgacaaatct ctttccgctc actttgagca cacaatagca attacgtcct cgggtgcgat 3961 aattctcacc caacccgaat aaggaggggc gtttgtgaat attgtcaaag gctccgtggt 4021 caaatcattg gcagggcgag atcaaggccg ctattacgtt gcagtggcga ccgaagaccg 4081 cttggtatat attgctgacg ggcgtgagcg caagcttgag aagcccaaag cgaaaaaccc 4141 aagacacatt tcaccgacct gcatggtggt cagcctcgaa ggcatgacga acaaaaagct 4201 gaaaaagctt cttgatgagc ttataaccca aggctcgccg gaagccggct gcgaccggac 4261 gagaaacatt tgaaaagagg gattaaatgt ccaaggaaga tgtaatcgaa ctcgaaggta 4321 ccgttttgga agctttgccg aacgcaatgt tccaggttga gctcgcaaac ggacacaaga 4381 ttctcgccca tgtatccgga aaactcagaa tgaactacat tcgtattgtt cccggagata 4441 aggtgacagt tgaaatgtcg ccatatgatc tgacaaaggg cagaatcacc tggagatcca 4501 agtgatctgt cgattaaacc aaccaacgaa agcataagct ttaaagtatt aggaggtatt 4561 tcaatgaaag taagaccttc agttaaaccg atgtgcgaaa agtgcaaggt aatcaagcgc 4621 aagggcaagg taatggtcat ttgcgagaac cccaagcaca agcagcgtca gggttaaatc 4681 acttaatgga ggtgcagcta atttatggct cgtatagcaa gtattgacct tcccagagat 4741 aaaagaattg aggttgctct cacttatatc tacggtatcg gtcagcccac agcaactctc 4801 atctgcaagg aaacaggcgt tgaccctgac atcagagtta aggacctttc tgaagaagat 4861 gaagcaaaat tgcgtgaata tatcgacaag aacctcattg ttgaaggtga caagagaaga 4921 gaagttcaac tcaacattaa gagacttgtt gaagtaggtt gctaccgcgg tcttcgtcac 4981 cgcagaggac ttcctgtaag aggtcagaga accaagacca acgcaagaac ccgc // LOCUS sequence039 5018 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence039 VERSION sequence039 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5018 /mol_type="genomic DNA" /organism="" /note="sequence039" CDS complement(36..1403) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTNAKTTKRALLSSIVALLICFTMLLGTTFAWFTDSVSSTNNIIK SGTLDVEMTYSSDNATWADASTGTIFNYQLWEPGYSEMKYVKIENKGDLAFKYQLNIIP NILNAKEVYGVDLADVIDVYFGLIDENHTVPTSFADVKNTLTRVGTLSSLMLETDGAAH GILLPEGSTPLLPEVEEVGSVTACIVLHMQETAGNEYQNLSVGEGFSVQLLATQYTYEE DSFDNQYDAEADYDTNQAIPVAKVEYADEYMGENPTTPIVWNNSWGMVRSGTGDVDGDG KTGENDPDEYDIAFDAAYVFTAPVDADTAEKSPYKYYIADFAVSFDKDVTSDMQIGIAG NYGAWNWIGFMANNDLLSTLEGNKIAAGDVYNLLEVYSGGALSINYYELCNSVKEFKCS AWGGEAAKGVTLTVELRLYETYSAEECYEKFGYSSTNEKTGNYYVIGTYNYTFTGE" /locus_tag="LOCUS_2370" /note="MGA_286" CDS 1701..1937 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKIICKVEYDTEKSELIAKFTNGSFGDPAGYEESLYKTADGKYF IYCYGGSESIYPEETIKRLAQAKVDLWLAEHNG" /locus_tag="LOCUS_2380" /note="MGA_287" CDS complement(2060..2911) /product="DegV family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003438997.1" /transl_table=11 /codon_start=1 /translation="MSVKIIIDSTTDITPEILEQVAVVSMTIRFGETEYTDGIDISKQK FYELLVESDILPATSQPTPDAFMRAYENATADGSDVVVITVSSKLSGTYQSATIAAMDY SDKVRVVDSKSVAIGAGILTVMAVKLANEGKGADEIATILEQEREKICIVALLDTLEYL KKGGRISAAVAFAGGVLSIKPVVCLKDGAVEMLGKARGSRQGNNLLMTEIEKAGGIDYS KPVMLGYTGLSDVLLQKYIEDSRAVWEGKVEPLNYALVGSTVGTHVGPGAIAAAFFKSN AR" /locus_tag="LOCUS_2390" /note="WP_003438997.1 DegV family protein (Clostridioides difficile) [pid:35.0%, q_cov:98.6%, s_cov:98.9%, Eval:7.1e-43]" /note="MGA_288" CDS complement(2936..3391) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MVSRFEQFSAVIAVINRYIQNIERDEMIKVGYKGAYAIYLVTIAR YPEGITAAQLGEYCVKDKAAVSRIVSEMEDRGLIKRAGKGENLYRAKLILTPKGEELAE FVKQKARTAVNEVSGKMSDEDRNVMYKALDIISKNLEIISKDGIPEK" /locus_tag="LOCUS_2400" /note="MGA_289" CDS complement(3537..4373) /product="DUF3737 family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008764890.1" /transl_table=11 /codon_start=1 /translation="MNIIKNQTFDEERTLYGSRDLEVICCSFDGPADGESAFKECKNIK TTDCFFNLRYPFWHVDGLEISGCEMTELCRAALWYSSDISIGGTKMHGIKALRECKNVK IEGCDIISPEFGWSVDGLTVKDTDAVSEYFMMRSSNLHFDDVRFKGKYSFQYVTDAVFE NCNFDTKDAFWHAKNITVKNSTIKGEYLAWYCENVTFENCKIIGTQPLCYCKGLRLINC EMLDADLCFEKSEVEATLNAPVISIKNPKCGKVYVPAVGELIYDDTEAKGEVIITE" /locus_tag="LOCUS_2410" /note="WP_008764890.1 DUF3737 family protein (Bacteroides) [pid:37.4%, q_cov:96.0%, s_cov:93.0%, Eval:1.1e-48]" /note="MGA_290" misc_feature complement(4456..>5018) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010878142.1:ABC transporter ATP-binding protein" /note="WP_010878142.1 ABC transporter ATP-binding protein (Archaeoglobus fulgidus) [pid:42.5%, q_cov:98.9%, s_cov:78.7%, Eval:5.7e-35]" /note="MGA_291" /locus_tag="LOCUS_2420" ORIGIN 1 gcaggttggg ggacgaaggt tagtttttga gttgattatt cacctgtgaa ggtgtagttg 61 taagtgccga ttacatagta gttgccagtc ttttcattgg ttgaactata accaaacttc 121 tcgtagcact cttcagcgga gtaagtttca tacagacgaa gttcaactgt aagggttacg 181 cccttagcag cttctccacc ccaagcagag cacttgaatt ccttaacaga attgcagagt 241 tcataataat taatggagag agcgccacct gagtagacct cgagcaagtt atatacatct 301 ccggctgcaa tcttattgcc ttccaaagtt gaaagcaagt cattgtttgc catgaatcca 361 atccagttcc aagctccgta gtttcctgca ataccgattt gcatatcgga tgttacatcc 421 ttgtcaaagc ttacggcaaa gtcagcgatg tagtacttgt aaggagactt ttcggcagta 481 tcagcatcaa caggcgcggt gaatacatac gctgcgtcaa acgctatatc gtattcatcg 541 ggatcatttt caccagtctt gccgtcaccg tctacgtcac cagtgccact gcgaaccatg 601 ccccatgagt tgttccatac gatgggagtt gtaggattct cgcccatgta ctcatccgca 661 tattcaacct tagcaacggg tattgcctga ttggtgtcgt agtctgcctc agcatcatac 721 tggttgtcga agctatcttc ctcatatgta tactgggttg caagaagctg aacgctgaag 781 ccttcgccaa cggaaagatt ctgatattca tttcctgcag tttcctgcat atgcaatacg 841 atgcaagcag ttacggagcc aacttcttca acttcgggca acaaaggagt agaaccctcg 901 ggaagcaaaa tgccgtgagc tgcaccgtcg gtttcaagca tgaggcttga aagtgtgcca 961 accctagtaa gggtgttctt gacatctgca aagctggtgg gaacagtgtg attctcgtcg 1021 ataagaccga agtatacatc aataacatca gcgaggtcaa cgccgtaaac ttccttggca 1081 ttaagaatgt tggggataat gttaagttga tacttgaatg ctaggtcgcc tttgttttca 1141 attttaacat acttcatctc ggagtaacca ggctcccaaa gctgatagtt aaagattgtg 1201 cctgtggaag cgtcagccca tgtagcatta tcagagctgt aggtcatctc gacatctaat 1261 gtgcccgact tgataatgtt gttggtgctt gaaacagagt cggtgaacca agcaaatgtg 1321 gtgcccaaaa gcattgtgaa gcaaataagc aatgcaacaa tgcttgaaag caatgcgcgc 1381 ttggtggttt ttgcgtttgt cattatgttt ctcctccagt ttaatattgt gaaatgcaac 1441 gttttgtttc aaaatgtcca ttccaataaa tgaactctcc ccataatatg cattatcaca 1501 ttatgaccac attatatcac caatgtgtta agaatgcaac acttttggct tctttttttt 1561 tttttttgag gtttttccgc gctttttggg tatttcaagc aattttaaga aacctattgc 1621 aaaaataagc aaaagcgtgt ataatatctt tcgacccgag tctatcttgg gaatacaata 1681 ttaataaagg aatttgaaat atgaagaaga tcatttgcaa ggttgaatac gataccgaaa 1741 agtcggagct tattgcaaag ttcacaaacg gctccttcgg cgatcctgcg ggatatgaag 1801 aaagccttta taagactgca gacggcaagt atttcatcta ttgctacggc ggatctgagt 1861 ctatctatcc cgaggagacc atcaagcgtc ttgctcaggc aaaggttgat ttgtggctcg 1921 ctgagcacaa cggataattg tttgctcaaa attaaaacgg cagagggaat cgacctctgc 1981 cgtttttgca tattgaaaaa ataaaccggc cgaataggag gaatatcttc ctttcgaccg 2041 gttttcctat taacataatt tatctcgcgt tactcttaaa aaatgccgca gctattgcgc 2101 ccggtccaac gtgtgttccg acggtgcttc cgacaagagc gtagttgagc ggctcgacct 2161 tgccttccca aacagccctg ctgtcctcaa tatatttctg caataaaaca tccgacagcc 2221 ctgtatatcc cagcattaca ggctttgaat aatcaattcc gcccgccttt tcaatttcag 2281 tcataagcag gttgttgccc tggcgggaac cgcgcgcctt gcccagcatt tcaaccgctc 2341 cgtctttaag gcaaaccaca ggcttgatcg acaaaactcc gcctgcaaat gccacagccg 2401 cagaaattct tccgcctttt ttcaaatatt caagtgtatc caaaagtgca acaatgcaga 2461 ttttttcgcg ctcttgctca agaattgttg caatctcgtc tgcacctttg ccctcgttcg 2521 caagcttaac tgccatcacg gtcaagattc cggcaccgat tgcaaccgac ttgctgtcaa 2581 cgaccctgac cttgtcggaa taatccattg cggcaatggt cgcactctga tatgtacccg 2641 aaagcttcga ggaaacggtg ataacaacaa cgtcgcttcc gtcggctgtt gcgttctcat 2701 atgcccgcat aaatgcgtcg ggtgtgggct ggctggttgc gggcaaaatg tccgattcca 2761 ccagcaattc ataaaacttc tgtttgctta tgtcgatgcc gtcggtatat tcggtctcgc 2821 cgaagcgtat agtcattgac actacagcca cctgctcaag aatttcgggg gtaatatccg 2881 tcgttgagtc aatgatgatc ttaacgctca taacaatctc cttttaatat gtatattatt 2941 tttcggggat tccgtccttg ctgataattt caaggttctt tgaaattata tccagcgctt 3001 tatacatcac gtttctgtcc tcatcggaca tttttccgct gacttcattt acagcggtgc 3061 gagccttttg tttaacaaat tctgccaatt cctcaccctt gggtgtcaaa atcagctttg 3121 cgcggtaaag attttcgccc ttgcctgcgc gcttaatgag tccgcggtct tccatctctg 3181 aaacaatgcg cgaaactgca gctttgtcct taacgcaata ttcgcccaac tgtgcggcgg 3241 taatgccctc aggatatctc gctattgtca caagatatat ggcatatgca cctttatatc 3301 cgactttgat catctcgtcg cgctcgatgt tctgaatata tcggttgatt actgctataa 3361 ctgctgaaaa ttgttcaaat ctggaaacca cggtgaccct ccttttcaat gttgacaagt 3421 caacgtcttg gagtatagca tacgaaagtt gatttgtcaa catcttttga caatatcaat 3481 aattcaagca tcaataaaaa accgtccaaa cgagaattcg tccgaacggt tttcttttat 3541 tctgtaatta ttacctcacc ctttgcctca gtatcatcat atatcagctc gcccacagcg 3601 ggaacataaa cttttccgca ctttggattt ttaatgctga tgacaggggc attaagcgtt 3661 gcctcgacct ccgacttttc aaagcaaagg tcagcatcca acatctcgca gttgatgagt 3721 ctaaggccct tgcaatagca aagaggctgt gtgccgatta ttttgcagtt ttcaaaggtc 3781 acgttttcac aataccaagc gaggtattcg cccttgatgg tagagttctt aacggttatg 3841 ttctttgcat gccagaaggc atccttggtg tcaaagttgc agttttcaaa cacagcatcg 3901 gttacatatt ggaaggaata ctttcccttg aaacgaacat cgtcaaaatg cagattcgac 3961 gagcgcatca taaaatattc gctgacagca tcggtgtcct taacggtcag cccatccacc 4021 gaccagccga attcgggaga gatgatgtcg catccctcaa ttttaacatt tttgcattcg 4081 cgcaacgcct taattccgtg catctttgtg ccgccgatgg aaatgtcgct tgaataccaa 4141 agtgccgcgc ggcaaagctc ggtcatctcg caacccgaaa tctccagccc gtcaacatgc 4201 cagaagggat agcgcaggtt aaaaaagcaa tccgttgtct taatattctt gcattcttta 4261 aaggcgctct cgccgtcggc ggggccgtca aaggaacagc atataacctc gaggtcgcga 4321 cttccgtata atgtgcgctc ctcgtcaaat gtctgattct tgattatgtt cattttgaaa 4381 atcctttgcc caaaattgtc attgtcctaa taataacaca aaggggcgca gaaaacaagc 4441 acccctttca tatttttata tttcaattat tcgctcgcag agcttattcg cttcatcctt 4501 tgaatgagtg attaaaataa acgttttacc ctcggttagt tttgcaactg tttcggtgac 4561 cttttcgagc gtgccctcgt cgattccctt gaaaggctca tcgaagatat atatgtccgc 4621 attcgttgcc aatgcgcggg caatgcaaac tcgtcttctt tcgccacccg aaagctcatt 4681 cgcgggctta tatatcagct cacgttccag ccctgcattt tcaagcaggc cgataacatc 4741 atcctccgac gggggatttt tcaataccac gctgacattt ccaaccgctg aaagcgattc 4801 aatcagtctg tcctcctgga ataccattcc gaatgtggca tcttttgaaa ctttaaccgc 4861 accggaatcg ggttttatca gccctaaaat gaggttgatg agtgtggtct ttccggcacc 4921 cgagcgcccc ataattgcca cacgttcgcc gtctttaata tcaaggctga atccactcaa 4981 aacctgctga ttgctatagc ttttgctgac attttcaa // LOCUS sequence040 4944 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence040 VERSION sequence040 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4944 /mol_type="genomic DNA" /organism="" /note="sequence040" CDS complement(1243..1575) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNILEHLIETVLPYIIAILEIMGILVVAWTGVRAFWEYIQNTFMK KNNPLQNHFANGLATALEFKMAAEILKTVLVREMSELLVLGAVIGLRALLSLLIHFEMK HSEKEK" /locus_tag="LOCUS_2430" /note="MGA_293" CDS complement(1688..3127) /product="sodium/glutamate symporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011015371.1" /transl_table=11 /codon_start=1 /translation="MDYTSSWDFTLANYGAVWAFMVQIGILLLFLMIGNILRRVVPLFR KCLIPSALLGGVLMLIINIICKQFDFMLVDKRMMQIITYHCLAFGFAAMSLKTEKSTHK TNKAQVVEFGALQGGAYMLQAFVGMGLTLLLFYLTKDGENVISYICGLILPLAFGQGPG NALSWDINFTNTPAAMFAGNGSFGLSLASIGFVVASVFGVLYININKKRGNLNIRSTST TGEVVDQTNPDGNEIPDNESVDKFSLQVGFVALAYAISFGFMCLLGVLSDFTKSIAWGF NFLWASLAAMLIRFVVKQLRKRNVMHREYINNYQMDRVSGFSFDIMIVAGVSAIEINDI KNYILPIILLSIIGSIITYVYIRLVSKECFKGFEHEFFLMSFGTLTGTASNGMILMKEI DPGLKTPTSSLYILSNFPAMVMIAPLLLCLNFASKSVTNAIIAFAIFFILWLIYTTFLF RRKIFKKHYENKPIEVWKEEN" /locus_tag="LOCUS_2440" /note="WP_011015371.1 sodium/glutamate symporter (Corynebacterium glutamicum) [pid:22.2%, q_cov:86.4%, s_cov:90.4%, Eval:8.2e-17]" /note="MGA_294" CDS complement(3362..4408) /product="SpoIVB peptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986434.1" /transl_table=11 /codon_start=1 /translation="MPIISCGINVSCEAKPRQEDSNQVVLKLFGVIPIKDASVEKSDAP LLIPGGSPVGIKLLTDGVVVVKMTEVSEGICPCKEAGLKIGDCITEANGTDVTSSAQLA DIIMNSRGKSIDLTIERNGKELDVTLNAVYSETDGTYKAGLWIRDSSAGVGTLTFINPK TGAFGALGHPISDFDTGKLMPLGSGEIVDATVTGYERGLEGLPGELYGTFVSGLAMGTI TKNCERGIYGNVNYTKTHTAAIPIAFKSEVETGKASILTTIEGSKPREYEIEIEKITLS TAAGTKNMVIKITDPELLKTTGGIVQGMSGSPILQNGKLVGAVTHVFVSDPTRGYGIFI ENMLEEAE" /locus_tag="LOCUS_2450" /gene="spoIVB" /EC_number="3.4.21.116" /note="WP_011986434.1 SpoIVB peptidase (Clostridium botulinum) [pid:42.4%, q_cov:97.7%, s_cov:85.5%, Eval:9.3e-78]" /note="MGA_295" ORIGIN 1 aagttttcaa ttacggtatc ggtgccgata gcattaaatt ccggatagag attgattcct 61 tcggcgcctg tcaaatcagc ataaggcata tattctccga cgaacaggcc ttcgtttgcc 121 tgaagccaag gatagaagtt gtccaaaaca tcttcgccgt atgtcgcctt gagcactagg 181 gttacatgct cggtcggagc ttggtctgaa ataggggcga tctctctgaa gcaataagcc 241 ttttcaaatt cggttatcca cttgctgtaa tcgccgtata catcgtcaag ataccacata 301 aagcggaaac cgatggcata gttgttgttg cttgcatatt caaagttatt ttcaaaccaa 361 tattcaatcg gctgttcata tagctttgaa taatcgctga cctccaagtt gaagaggcta 421 taatctgccc tgttgaaata taccgacgcc tcgggatgag tttttgccaa ttccttaagg 481 ctaagatatg tagaatattc agcaaagcct tcgtttaaaa gcgtattata aaaccactcg 541 gtctgacgcc acatcagcat atgagagcct tcgtgaataa gcgtatattc tttgttgggt 601 atcagatttg agggccccat aacgatgtga ccccatgttg aagcatatgc cgagcctgcc 661 tcgttggtcg gaagcccctg atagaatccc atattgatat aaagattttc tctggtgaaa 721 tcgctgtgaa tctttccgtc cggatataac atttcgcaat atccgttgcc gtcaaagctg 781 agtcccgaaa ccttttcaag cgtgtcggca agaagctcgg cagagtttgt catcgtttcg 841 gaaacatata tatttgcctt tacgtcgaac ataaatgttc ccgtatcgac agagatatcc 901 gattcggtga catagtcatc agcatcaaag tcataatatc ccggaccttc aaggggataa 961 ttctcgttgc cgaaaagact gtgatataaa agataaatcg catcgttctt atcaacaggt 1021 ccgtcacagt taaagtcgct gaatccgctt acaggatata gatcatcccc gaagagcacg 1081 ctgtatagca gataaatggc atcgtttttg tcggttgcac cgtcgccgtt aatatcagcg 1141 gatatcacag gctctgcgga tggtgcagca taaaccgata ctgttaatag agataaaatg 1201 aacgaagcgc aaacaaaaat ttgcaacagc tttttcattt tattatttct ccttttccga 1261 atgcttcatt tcaaagtgta taagcaagct caaaagtgcg cgcagaccga tgactgcgcc 1321 caaaaccaac agctcgctca tctctctgac gagaacagtt ttaagtatct ccgccgccat 1381 tttaaattca agggcggtag caagtccgtt tgcaaagtga ttctgcaaag ggttgttttt 1441 cttcatgaac gtgttctgaa tatattccca aaaagcgcga acgcctgtcc atgcaaccac 1501 cagaattccc atgatctcca gaattgcgat gatatatggc aaaacagtct caattaaatg 1561 ctccaaaata ttcataacca agcctcctat tgttgatgga actattataa cacaatatgt 1621 aaaaaaagaa aagacctatt taaatcagcc gacccccaaa aaagagtcgg ctgtttcagt 1681 ttgatattta gttttcctct ttccagactt ctatgggctt attttcataa tgctttttga 1741 agatctttct gcggaagagg aatgttgtat aaatcagcca gagtatgaag aatatcgcaa 1801 atgcgatgat agcatttgtg accgattttg acgcaaagtt taaacacaga agcagaggtg 1861 caatcattac cattgcaggg aagtttgaaa gaatataaag gctggatgtg ggagtcttga 1921 gcccggggtc gatctccttc ataaggatca taccgttaga tgcggtgcct gtcaaggtgc 1981 cgaagctcat gaggaagaac tcgtgctcaa atcccttgaa gcattccttt gaaaccaggc 2041 ggatgtaaac atatgtgatg attgagccga tgatgctcag aagaatgata ggcaaaatat 2101 agttcttaat gtcgttgatc tcgattgccg atacgcctgc aacgatcata atgtcgaagg 2161 agaagccgga gactctgtcc atctgatagt tgttaatata ttcgcggtgc ataacatttc 2221 gcttgcgaag ctgtttaaca acaaagcgga tgagcattgc cgccagcgaa gcccaaagaa 2281 agttgaagcc ccaggcgatg ctttttgtaa aatcggaaag aacgcccaat aagcacataa 2341 atccgaagga gattgcatat gccaaagcga caaatccaac ctggagcgag aatttatcta 2401 ccgattcgtt gtcagggatc tcgttgccgt cggggttggt ctggtcaacg acctcgcctg 2461 tggtgcttgt ggagcgaatg ttaagattgc cacgcttttt gttgatgtta atatatagca 2521 caccaaagac ggatgcaaca acaaagccga tggatgccag cgaaaggccg aagcttccgt 2581 ttcctgcaaa cattgccgca ggggtgttgg tgaagttaat atcccagctc agcgcgtttc 2641 cgggaccttg tccgaatgcc aaggggagaa tgagtccgca tatatatgaa atgacattct 2701 cgccgtcctt ggtgaggtag aacaaaagaa gggtcagacc catgccgaca aatgcctgga 2761 gcatatatgc gccgccctgc aatgcaccga attcaacgac ctgtgctttg ttggtcttgt 2821 gggtgctctt ttcggtttta aggctcattg ccgcaaagcc gaaagccaga cagtgatatg 2881 taataatctg catcattcgt ttgtcgacca gcataaagtc aaactgcttg caaatgatgt 2941 taataataag cattaaaact ccgcccaaaa gtgcagatgg tatgaggcat tttctgaaca 3001 gaggcacaac ccggcgcaaa atatttccga tcatcaaaaa caaaagcaag attccgattt 3061 gaaccataaa cgcccaaacg gcgccatagt tggcaagggt aaagtcccaa ctcgaggtat 3121 aatccatata agtatccatc tccaatctga agcacttcaa aaaaattata actcaaaaat 3181 tcagtcaatt caataaacgg tgaaacataa tatcagcaaa tgtgtcagta atgggtatgg 3241 ataaaggccc cctctgatga gggggctggc accgcaggtg actgggggag agatggttca 3301 cggtctgccc tcccgtcaaa aatcaaagat ttttgccact ttcctttgca ccaaggaggc 3361 tttattccgc ctcctccagc atattctcaa tgaaaattcc atatccccgc gttgggtcgc 3421 tgacaaaaac gtgggtgacc gcgcctacca gcttgccgtt ttgcagaatg ggtgagccgc 3481 tcattccctg aacgattccg cccgttgttt ttaataactc ggggtcggta attttgatca 3541 ccatattttt tgtgcctgcc gccgttgaaa gggtgatctt ttcaatttcg atctcatatt 3601 cgcgcggctt gcttccttca atggtggtca aaatgctcgc ctttcccgtt tcgacctcgc 3661 ttttaaatgc aatcggaatt gccgcggtgt gggtctttgt ataattcaca ttgccgtaaa 3721 tccctctttc gcagtttttg gttattgtcc ccatcgccag acccgaaaca aaggtgccgt 3781 atagctcacc gggaagcccc tccagccccc gttcataccc cgtgacagtg gcatcgacga 3841 tttcacccga acccagcggc atcagtttgc ctgtgtcaaa atcggatatt gggtggccga 3901 gtgcgccgaa tgctcccgtt ttcggattta tgaatgtaag cgtgccaaca cctgccgagc 3961 tgtcccgaat ccaaagccct gctttataag ttccgtccgt ttccgaatat accgcgttga 4021 gagttacatc cagctctttg ccgtttcgct caattgttaa gtcaatactt ttgccccgcg 4081 agttcataat aatatccgca agctgtgccg aggatgtgac atctgtgccg ttggcttcgg 4141 tgatgcaatc tccgatttta agccccgctt ctttgcaagg gcatatgccc tcgctcactt 4201 ctgtcatttt aaccaccacc actccgtcgg tcaaaagctt gattccaaca ggtgacccgc 4261 cgggaattaa aagcggagca tcgctttttt caaccgatgc atctttaatt ggtatgaccc 4321 caaagagctt gagcaccact tggtttgagt cctcttgccg gggttttgct tcgcaggaaa 4381 catttatccc gcaggagatg atgggcatat catcccccga aacgtaataa ctggccggca 4441 acgtggcatc cagatacccc accagcgaca ttgccgcaat cagcacagcg cccaaaaggc 4501 atgctgtgcg tttaaaaaat ctttccatta tatttaaaag aacctttctt gttagttgcg 4561 attatatttt tcgcaagcag gtcttaaata atcaaagcat tattttcatt ggtcaaatta 4621 agggttgaat gtttccactc ttgtgtgcta taatgattac aatgaaataa aataacctat 4681 gtataacttc ctgcgaggac aaaacaatga aatttgaaaa atataaaaaa accgcatcgg 4741 atgagctttc gggcaagaaa gaacacaaaa tatatctttt tgccaagctt ttaatgacct 4801 tgattttcct ttggtcggga tttttctggt cgggcgttac ggttttgaat ttttacataa 4861 atatgacctt tgattcccac cttgcgacac tgttcctcat cggctcgatc ctgcttttgg 4921 tgtcgctgat cctttgttgg tgca // LOCUS sequence041 4911 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence041 VERSION sequence041 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4911 /mol_type="genomic DNA" /organism="" /note="sequence041" CDS 559..1197 /product="RNA polymerase sporulation sigma factor SigE" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000976948.1" /transl_table=11 /codon_start=1 /translation="MNIFTKLLQKLLKLFSKENRIDYINGSDTLPPPLKPNEELEVFDK LKTDPKYAKEKLITHNLRLVVYISKKFESTGIGIEDPISIGTIGLIKAVNTFNPEKNIK LATYASRCIENEILMYLRKTAQQRNEVSIDEPLNIDWDGNELLLSDVLGTDGEEVVQRL EYETEKQLLVEAVNALKGREKLIMQLRFGLLDGKEMTQKEVADVVGISQ" /locus_tag="LOCUS_2460" /gene="sigE" /note="WP_000976948.1 RNA polymerase sporulation sigma factor SigE (Bacillus) [pid:63.9%, q_cov:95.3%, s_cov:84.5%, Eval:7.0e-65]" /note="MGA_298" CDS 1388..2119 /product="LytTR family DNA-binding domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964889.1" /transl_table=11 /codon_start=1 /translation="MIRIGICDDNVNMLENLKNITFNAFSSHNVDFDIYTYTNGQALLN AHAVEKFDILFLDIDMPGLNGFDISRNLRDDYVNCFIIFVTSHGELVYDSMNFQPFNFI RKNCAIPLEESIANVTAKLVKHMKQNEKLLLKFDNGENIDIYVKDIIYIENDKHYLKYY TTKSETPLRIRGLISELEAKLIDCDFVRVHRSYIVNLRYVSRIDRTGFEVYLKENSRRL PLSKNLKKDVFDRYVQYMRNR" /locus_tag="LOCUS_2470" /note="WP_010964889.1 LytTR family DNA-binding domain-containing protein (Clostridium) [pid:29.8%, q_cov:99.2%, s_cov:98.7%, Eval:1.1e-27]" /note="MGA_299" CDS 2149..3486 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNVLWLLFELIVNVYQGFVMSYFMYSYLGDKKRVKFFKSKGVLFA FIFAAAITTMNFITYFEHVYALIYGVILFVYALLYLKGTLMRKLFASILAIVILLISTA FIGAASTIIFKTDLYLIMTEISVERFVALVSTQLMILYIVTIALKMLKTDNYNRRELSA SEWIIIAIVLAISIVLVALLFLMTMTQGTDRMYSILSLMGVIVINILVCYLVIGLGKKN EIVRENEALKLSQEYNQQYVNSATAEYDTIRKLQHDFKNNYYTVHTLIKEGNAQAALDH IEGNLELLESFAVFVKSENPIVNAVVNAKFSEAKTFGIDCSCICGTDFKHIDNLDLCRL LSNLLENAVTACKQSRSEHPSIVLSLLSDESTYSIDLKNTIDISVLESNPQLLTTKKNR NDHGYGINIIKEIASKYDGYCDFYEESGMFCCRIILNSTKNKADCE" /locus_tag="LOCUS_2480" /note="WP_009895625.1 ATP-binding protein (Clostridioides difficile) [pid:24.4%, q_cov:51.2%, s_cov:81.7%, Eval:1.0e-10, partial hit]" /note="MGA_300" ORIGIN 1 aagatgcttg tatacggtgc cgtatttata agccttaaca tactgctgtg cggtgctgtt 61 ggactgtttt gtgaactgtt caatatggaa tcgacttttg tatttaacgg cacgatttat 121 ctggatattc cattgatcat gctcatattg accaccgcgg ggatatatat cattctagct 181 gtattttcaa ggcttacagc ctttaaatat gataagcata attcatacaa ttttgagttt 241 tcatataaag acacaaccta taatctccct gcaatcgcag atactggtaa tactgcaaaa 301 gatgtattca gcggtaagcc tgtaattgtg tgtaatggta tttcacttta catatctgaa 361 aatgattata tcagaccaat tccgtattca accgtatccg gggagggggt attatatgct 421 ttcaagccgg aatatgtgct tatatcagat gaaaccggtc gaaaaaaagt tgttgatgcc 481 ttggttgctt cagcagacac aaaaggggac agccgcgcaa ttttcaatcc caagctatta 541 acatgaggtg acaaaattat gaatatattt accaaacttt tgcagaagct gctcaagctg 601 ttttcaaaag aaaacagaat tgattatatt aacggctcgg atactcttcc gccaccatta 661 aagcctaacg aagagctgga agtatttgat aagctaaaaa ctgacccaaa atatgcaaag 721 gaaaagctaa taactcataa tttacggctt gttgtttata tatcaaaaaa gtttgaatca 781 acaggaatcg gcattgaaga tcctatctca atcggtacaa taggtttaat taaggctgta 841 aacaccttta acccggaaaa gaatataaaa cttgcaacat atgcttcccg ttgcattgaa 901 aatgagatat taatgtattt gcgaaaaaca gcacagcaac gaaacgaggt ttcaattgat 961 gaaccgctca atatcgactg ggacggcaat gagcttttgc tatccgatgt tttgggcacc 1021 gacggagaag aggtcgtaca aagattggaa tatgaaactg agaaacaatt acttgttgaa 1081 gctgttaacg cacttaaagg aagagaaaag cttataatgc agcttcgttt cggactgctt 1141 gacggcaagg aaatgactca aaaagaggta gcagatgtgg ttggaatatc acaataatat 1201 atttcacgtc tttaaaaact tattatgaaa caattaatgc gttatcttga atcaatctgt 1261 tgattcataa tactcaatat ggttacactt ttaggcagag ataaagctct gcctatttta 1321 tatctaaaaa gttgcttttc ttttgatatt gttgtataat caatcaaaaa gagtacggag 1381 gaaaaacatg atacgaatcg gaatatgcga tgacaacgtg aatatgcttg aaaatttgaa 1441 gaatatcaca tttaacgctt tttcttctca caatgttgat tttgatatat acacttacac 1501 taacggtcaa gccctgctta atgcgcacgc ggttgaaaag ttcgatattc tgtttttgga 1561 tattgatatg cccggtctca acggctttga tatttcccga aacctgcggg atgactatgt 1621 caactgtttt atcatatttg taacctctca tggtgagctt gtatacgata gtatgaattt 1681 ccaacccttc aactttattc gtaaaaactg cgcaattccc cttgaagaga gcatcgcaaa 1741 cgtgaccgcc aagctcgtca agcatatgaa gcaaaacgag aagcttcttt tgaaattcga 1801 caacggcgag aatatcgaca tttatgtcaa agatatcatc tacattgaaa acgacaagca 1861 ttatttgaag tactacacca ccaaaagcga aacgcccttg cgtattcgcg gactgatttc 1921 tgaattagaa gcaaagctca ttgactgcga ctttgttcga gttcatagaa gctatatcgt 1981 aaatctgcga tatgtttcaa gaattgacag aacaggcttt gaggtatatc tcaaggaaaa 2041 ctcaaggcgc cttcctttga gcaaaaactt aaagaaggat gttttcgaca gatacgtaca 2101 gtatatgagg aatagataat aaaacgttat agttatgagg aaaagacaat gaatgtatta 2161 tggctactgt ttgaactgat tgttaatgtt tatcaaggct ttgttatgtc atactttatg 2221 tactcatacc ttggagataa gaaaagggtg aaattcttta aaagcaaggg cgttttgttt 2281 gcttttatat tcgccgcagc aatcacaaca atgaatttca tcacttactt tgagcacgta 2341 tatgcgctca tatatggcgt tatacttttt gtgtatgcat tactgtatct caaaggcacg 2401 ctgatgcgaa aactgtttgc gtcaattctg gcgattgtaa tactcttaat atcaactgct 2461 tttatcggcg ccgcatcaac gataatcttc aaaactgact tatatctgat tatgaccgaa 2521 ataagtgttg aacgttttgt tgcattggtt tcgacccagt taatgattct gtatattgta 2581 accattgcgc tgaaaatgct taaaacggat aattacaacc gccgcgagct ttcagcctcc 2641 gaatggataa taattgcaat cgtattggca ataagcattg ttctggtcgc tttgctattc 2701 ctgatgacca tgacacaggg taccgaccgt atgtattcga ttctttcgct tatgggcgta 2761 attgtgatta acattttggt atgctacttg gtcatcggcc tcggcaaaaa gaacgaaatc 2821 gtccgcgaaa acgaagcctt aaaactctcg caggaataca accaacaata cgtaaacagc 2881 gccactgcgg agtatgacac catccgaaag cttcagcacg attttaaaaa caactactat 2941 accgttcata ctttaatcaa agaggggaat gcccaagcgg cacttgacca catcgaaggc 3001 aacttagaat tattggaatc cttcgccgtc tttgtaaaat cggaaaaccc gatcgtcaat 3061 gctgttgtca acgcgaagtt ctccgaagca aagacattcg gtatcgactg ctcctgcatc 3121 tgcggcaccg attttaagca catcgacaac ctcgacctct gccgacttct ttcaaatctg 3181 cttgaaaacg ccgtcactgc ctgcaagcaa tcgcgaagtg agcacccttc aattgtgctg 3241 tcgctcttga gcgatgaaag cacctattcg atcgacctga aaaacacgat tgatatatcc 3301 gtcctcgaat caaacccgca attacttaca acaaagaaaa acagaaacga ccacggctac 3361 ggcatcaata tcatcaaaga gatcgcatca aaatatgacg gctactgcga cttctatgaa 3421 gaaagcggaa tgttctgctg cagaataata cttaatagta ccaaaaataa agctgactgt 3481 gaatgattca cagtcagctt taactgtttt tccgctaaaa aatgtcacct cgtgccagaa 3541 aatgtcacgt cgtgccaaac ctgttgatta ttttaaaaaa tatgataaaa tgattttgga 3601 cagcttaatg ttgttcttaa aagatggcct cttgctgatt taatcaagta ctctttctac 3661 attacaaaca gtcatagcta tactgcctgc ttgaggccat cgttttacat atcagcaatt 3721 ttatgattgt ttatatacaa ttttaaaaaa ctttgaacag gggattacca aatgaaacga 3781 atattatcat ttatgcttac ggttgcaatg gctttatctg tgatttcatt tgcattaacc 3841 gaagaattat tcgcagtcgc ggatgattgc gatgttaatt tggagagttt acaaagtgaa 3901 cagataacac acacagatgg tgaatgctac agttttagct ccagctatgc aaatccgctg 3961 ttcagcagta gcgatcaagt cacatataca tctgagtcaa ttacatatac cccgcctgtt 4021 ttctttgctt ctcaaacaat tatgaccgag caggaagcaa aggaatatat tcttgaacag 4081 attaaagcga gaaacacaac atttaccgtt gtgcacagaa cacagagata ttatgacggt 4141 tattcaatag atctcgctct tgaggcaatg aaacacaccg gtgtgccaaa tgagggcgac 4201 tatctgatga agcagtttaa gaatatatcc tgtcaaggta actatagtta tgtcggcggt 4261 ggatttaatt tgtccgtcac atacactatc acttatttta caacagcgca gcaagaagca 4321 ttagtcgatg aggcagtaaa tgaactgctt tcctattttg acttcagttc ttcatcagat 4381 tatgagaaaa tatacacaat atataggtgg atatgcgaca atgttgaata tgattatttc 4441 ggccaggatc tgctgaagca ttctgcatat tctgcaataa ttgacggcaa ggcagtatgc 4501 caaggatatg ctgttttgtt ctatcgcctt atgttggaat tgggaataga ctgcagagta 4561 atttcaggtg tcagcggcga tgaacgccat gcatggaata tcgttaagct gggaggcgtg 4621 tattacaatg ttgatgcaac gtgggacgca agttcagctt attatgattt cttcttgaaa 4681 acagatgctg atttttcgga tcacacaaga gacgaaatgt ttactacagc tgaattttac 4741 agcagatacc ccatggcaac aagtaactat gttaagcctg attgggtaat agtaaatggc 4801 gttgttcttg aatataacgc tcaagatacc gatataatta ttccgaatgg cgttgttgca 4861 atcggtgact atgttttcta tggcaagaac ataaccagcg ttgtaatccc c // LOCUS sequence042 4874 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence042 VERSION sequence042 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4874 /mol_type="genomic DNA" /organism="" /note="sequence042" CDS 159..680 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNVIKYNRPLAFCVLVIVVALSLVVGCVRTLSSFENKVENLYES TKAMADINDLYGYASKIQAGAKAAGFDTAKLDEALEALAKNASDPTALGDTVSVIFSES SILYSDISYSGKVADMNSLTAYMAEIESTMMRLQNNTKYNKAALDYNRAIRSFPASIFA LGRNNAAVFG" /locus_tag="LOCUS_2490" /note="MGA_303" CDS 699..1595 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLTVILSLIVLVFSLTTCCYAHEYGFPDELDTYVYDEAGVLSE GTKEHIINSSYDLSQQSGGEIIVACVNTTGLYDIADYAYEMFNTWKIGGKDKNNGVLLL LSIDEQDYWCLQGEGLERTLSSGKIKLILNEYLEPDFASGNYDAGVLATYNALLGELEA AYGISVDGEFPEEYAEQLEQYEQYKENDGTGFIIMLVVIVFIIIFVSNLAGQTKRGFHG HHPTVVIAPDPTRTIIRTMRHMNHHHGHHRPPTGMGSFRGPTSHGGFGGGFSGGSRGGF GGRSGGGISRGGGAGRR" /locus_tag="LOCUS_2500" /note="WP_004080600.1 YgcG family protein (Thermotoga) [pid:31.9%, q_cov:63.1%, s_cov:73.9%, Eval:3.1e-20, partial hit]" /note="MGA_304" CDS 1917..2564 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPNCANNKEAKSSSHHTCGHVKGDNTHPKTREERRESPYKGTKTE QNLREAFAGESQARNKYTYFAEVAKAQGFEEIAEIFLKTAKNEQEHAKIWLEALKEIGD TEENLETAAGGENAEWTDMYERMAREAEEEGFDEMAIKFRCVGAIEKMHEERYRRLLKD VKNQEVFEKSSVKIWECRNCGHIVVGLAAPKTCPVCRHPQGFFEVIGDGDEK" /locus_tag="LOCUS_2510" /note="WP_015943945.1 ferritin family protein (Desulfitobacterium hafniense) [pid:52.0%, q_cov:95.8%, s_cov:57.4%, Eval:1.2e-59, partial hit]" /note="MGA_305" CDS complement(2697..2897) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGKIRLNENEEIVKLVKEGLKERGGYCPCVREISPDTKCMCKQFR EQIADPDFEGYCHCMLYYKEK" /locus_tag="LOCUS_2520" /note="MGA_306" CDS complement(2902..3540) /product="pyroglutamyl-peptidase I" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002287081.1" /transl_table=11 /codon_start=1 /translation="MKILITAFDPFGEETTNAAMQALELAETDACEMVRLVVPTSFERS VDVVCKAVCEHKPDAVIMLGQAAERAVVTVERVSINVDDASIADNDDYKPKDKPIVENG PAAYFSTLPIKEIVSDMKLRGIPAQVSNSAGTFVCNHLMYGVLHFLNIVFPKTPAGFIH FPITPSQAAKFSRSIASMSSEISAKAVTSAVETTVKYIEYGNITPNEEV" /locus_tag="LOCUS_2530" /gene="pcp" /EC_number="3.4.19.3" /note="WP_002287081.1 pyroglutamyl-peptidase I (Enterococcus) [pid:44.3%, q_cov:93.9%, s_cov:93.9%, Eval:2.0e-43]" /note="MGA_307" ORIGIN 1 gagaccctta cccacaccaa ccaggaactt atcaatactc tcgacgaagt caagcagatt 61 cagacagaag gccgcgaaaa gcgcagagct gcagaagccg agcttggcag aattgaaaac 121 gaaattaaga acaagcttct tgaggtatcg cagagctgat gaaaaacgta ataaaataca 181 accgaccttt ggctttttgt gtacttgtta ttgtcgttgc actctcgctt gttgtcggat 241 gcgtcagaac gctttcgagt tttgaaaaca aggttgaaaa cctgtatgaa tccaccaagg 301 cgatggcaga cattaacgac ctttacggct acgcttcaaa aattcaggcg ggcgcaaagg 361 ccgcagggtt tgacaccgca aagcttgatg aggcacttga agcgctcgcc aagaatgcat 421 ccgaccccac agccttgggc gataccgtaa gtgtcatctt ctccgaatca agcatacttt 481 acagcgacat ctcctattcg ggcaaggtgg ctgatatgaa ctcgctgacg gcatatatgg 541 ctgagatcga gtcgacgatg atgcgtttgc aaaataacac aaaatataac aaggcggcac 601 ttgattataa ccgcgcgata agatccttcc ccgcatcaat ttttgctttg ggaagaaaca 661 atgccgcggt attcggttaa aggaaaactg ataaataaat gaaaaaacta actgtaattt 721 tatcgctgat agtcttggtc ttttcgctga ccacctgttg ctatgctcac gaatacggct 781 tccccgacga gctggatact tatgtatatg acgaggcggg ggttttgagc gagggaacaa 841 aggagcatat cataaactca agctatgatc tgagtcagca gtcgggcggc gagataatcg 901 ttgcttgtgt caacacaaca gggctttatg acattgccga ctatgcctat gaaatgttca 961 acacttggaa aatcggcgga aaggacaaaa acaacggtgt cttgctcctt ctttccatcg 1021 acgagcagga ttattggtgc ttgcagggtg aagggcttga aagaaccctt tcctccggca 1081 aaataaagct gattttgaat gaatatctcg agccggattt tgcatcgggt aactatgatg 1141 caggcgtttt ggcaacttat aatgcacttt tgggcgagct tgaagcggct tacggcataa 1201 gcgttgacgg agaatttccc gaagaatatg ccgaacaact tgagcagtac gagcaatata 1261 aagaaaacga cggcacagga tttatcataa tgcttgttgt aatcgtgttt atcatcatat 1321 tcgtttcaaa cttggccggt cagacaaaaa gagggttcca cgggcatcat ccgacagttg 1381 tcattgcacc cgaccccaca agaacaatca tccgcacaat gcggcatatg aatcaccatc 1441 atggccatca ccgtccgccg acaggcatgg gcagtttcag aggcccgacc tctcacggag 1501 gcttcggcgg aggtttctcg ggaggctctc gcggcggctt tggcggtcgc tctggcggag 1561 gaatatcacg cggaggcggc gcaggcagaa gataataccg acaataaatc tcctcggagc 1621 atatgcttcg gggagatttt gtttgcgcgc tgaggcggca gcccaacagg ccgaggcctg 1681 ttgggctgcc gcaggcgcga agaacccgtt tcgcccgtag ggcgaaacgg gttggctgcc 1741 gccgaatagc ggaggggcgt ccgacggatg gcgttgcgtg agcaactgta tccgacgggt 1801 gccccggagc gggcgaattt acagtgtacg cttgagcaca aaactttgat ttaatattgg 1861 cgtatatttc cctttttgaa gcaaacacta cttaaaaatc atcgggagga aaaaccatgc 1921 ctaactgtgc aaataacaaa gaagcaaaaa gctcatcaca ccacacctgc ggacatgtca 1981 agggcgacaa cacccacccc aagacccgcg aagaacgccg cgaaagtccc tataagggca 2041 caaagaccga acagaattta agagaagcat ttgcagggga atcccaggca agaaacaaat 2101 acacatattt tgccgaggtt gccaaggcgc aagggtttga ggaaattgca gagatcttcc 2161 ttaaaaccgc caaaaatgag caggagcacg caaagatctg gcttgaagcg ctcaaagaaa 2221 tcggcgacac cgaggaaaac cttgaaacag cggcaggcgg tgaaaatgcc gaatggacag 2281 atatgtatga acggatggcc cgcgaagccg aagaagaggg cttcgacgaa atggcgatca 2341 agttccgttg cgtcggcgca atcgaaaaga tgcatgagga acgctatcgc agactgctaa 2401 aagatgtcaa aaatcaggaa gtctttgaaa agagctctgt gaagatctgg gaatgccgaa 2461 actgcggaca tattgttgtc ggtttggcgg cgcccaaaac ctgccccgtt tgccgtcatc 2521 ctcaaggatt ctttgaggtc atcggcgacg gcgatgaaaa ataaatgggt ggtaacccca 2581 acttcgctcg ccaccgttcc gccacagcct cgctacgctc ggcgcaggca aaacgacggc 2641 tcgctcagtc ataataaaac aaaacggcaa gcaatagcgc ctgccgtttt ctctttttat 2701 ttttctttat agtagagcat gcagtggcaa tatccctcaa aatcaggatc tgcaatttgc 2761 tcgcggaact gcttgcacat acacttggtg tcgggagaga tctcgcgaac gcaagggcaa 2821 tatccgccgc gttcctttaa gccttccttt accaatttga caatttcttc attttcgtta 2881 agtcttatct ttcccatatt gttaaacctc ctcgtttggg gtaatattgc cgtattcaat 2941 atatttcaca gttgtttcaa ccgcagatgt aacagcttta gccgaaattt cggatgacat 3001 acttgcaatt gacctggaaa attttgccgc ctgcgatggc gtgatcggaa aatggataaa 3061 tcccgcaggt gttttaggaa acacgatgtt caaaaaatgc aacacgccat acataaggtg 3121 attgcacaca aatgtgcctg cagaattgga aacttgagca gggattcctc gcaatttcat 3181 atccgatact atttctttta tcggcaatgt cgaaaaatat gccgcggggc cgttttcgac 3241 gataggtttg tccttgggtt tatagtcatc gttgtcggca atggatgcat cgtcaacatt 3301 tattgaaact cgctcaacag ttacaaccgc tctttccgcc gcttgaccga gcattatgac 3361 agcgtcgggc ttatgctcgc agaccgcttt gcaaacgaca tctaccgaac gttcaaacga 3421 tgtcggaaca acaagcctaa ccatctcgca agcatctgtt tcggcaagct caagtgcctg 3481 cattgcggca ttggtggttt cttctccgaa agggtcaaag gcagttataa ggatcttcat 3541 tattctcacc tcaagtcaat tatatgcttg tgtcaagtta ggaacaaatt tagccatcgg 3601 ctccctctga cgagggaact gtcagcaaag ctgactgagg gagagaaaac tacccctccg 3661 gcaacacttc gttttgccac ctcccctgac aagtggcggc tcccgctttt aacttgtgga 3721 agtcatttcc acaagttgaa ttttccgcat aacaacaagc attttcttta atttaatata 3781 acatttttta ttggtttttt caagttatat atacaaaaag agttatcccg acattgtgag 3841 ataactctat ttttgatggt atgacaaaaa tcataccgac atattgaaaa tcataccaaa 3901 gaaaatatgg ttagaaactt tgtttttaag cagtaaaact gccgaaagta tgacggttat 3961 tcctgacttg cctttttaaa gtctttacag tgtgatgata acttgcttga aaacacctct 4021 atttcattca agaattgcga cagttctgta taagatttac ttttataatc aatatcagaa 4081 aaatggtgtt tatagcatct aatcaaattt tcacacgctc tcttagttgc atcaatcatt 4141 tcaataagtg ttttttcttt tgctatgcaa tcttcttgca aagtcgtagc gccaaatgta 4201 tgataaaaac ttttatgcat atctttgtac agaactaaat ctgcatacat ttttgatttt 4261 tctgcgtttt ttatatcctg ttcattgcta cgctttagat tcacttgctc tgaatagtaa 4321 actgcaaggt tataatttgc ataactacgg tatgaatcgt ttcttgagaa atctaaaatt 4381 ctttcactaa ctttaagaat ctctgcatta actatctctt tttgagcatc tgtctcgatt 4441 ttatcgtgca tagtacgaag aaattttaat gcaacaaata agagtttatc atttgttgga 4501 tgatgtaaca actgtttttc tatttcgccc cattttgtat gcaaaaatgg atatgaggta 4561 ttttcttttt gaattatact ctcgatttct tctataaaat cattgacctg ttccggagaa 4621 ataccacaca aatcatctaa tgagacatta aaaattcttg tcaatgaaca cagaattgca 4681 atatctgggg ctgcaatacc attttcccac ttgctaatta cttgattaga aacgcataaa 4741 atatctgcca atttttcttg tgtccagtta aatgcaagtc ggtattttct tatattagca 4801 cctaaaattt catttaccat tatgaacact cctttctttg attttattat ataacaatca 4861 aggagttcaa tcta // LOCUS sequence043 4866 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence043 VERSION sequence043 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4866 /mol_type="genomic DNA" /organism="" /note="sequence043" CDS complement(397..1764) /product="2-isopropylmalate synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393738.1" /transl_table=11 /codon_start=1 /translation="MKKIIISDSTLKTASKGLSFREKTAVAKALDAMGVDTVELYTPAK SKEDAVVISTVCSAVKNGTIAIPCSMNNDDIDYAIECIKNNGIIQFEVPVSTVCMEYTY HMKSPKMLEAVKKALSYAAEKGAKTEVVCMDASRAEEGFIAEVAKTAKDCGAAALTLQD DAGIFLPEELAACVETVKSVADIAVYVAPSNEMGMALACAAAAIKAGADGVKTSVAEGL ALDGVAQFMKLKGDAMGIGAKLDLTKCAHAVADLRARVFDGAKAAPLVPKEDAENISLS ADAGLPEVGEAVVALGYELSADDMGKVYEEFLRFAKRRIVISAKELEAIIASSAMQAPS TYHVESYISTSGNIAPSMCNITLIKEGEKLAGVASGDGPIDAAFKAIEQIIGHHYELDD FKITAVTEGKEAVGSAIVRLRDDGKLYSGNGISTDIIGAGIRAYINALNKIVYGEN" /locus_tag="LOCUS_2540" /EC_number="2.3.3.13" /note="WP_011393738.1 2-isopropylmalate synthase (Moorella thermoacetica) [pid:27.8%, q_cov:99.1%, s_cov:96.3%, Eval:7.3e-44]" /note="MGA_309" CDS 2573..3793 /product="tryptophan synthase subunit beta" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005482634.1" /transl_table=11 /codon_start=1 /translation="MNFNNVDFDTYFKHYPDENGYFGKYGGVYVSPELKQAMAEITEAY QTICKSRKFINELRRIRKEFQGRPTPISHLERLSNKIGTGVQLYVKREDLNHTGAHKLN HCMGEALLAKYMGKKKVIAETGAGQHGVALATAAAYFGLECDIYMGSVDIKKQAPNVAR MKILGANVVEVTHGLATLKEAVDAAFDAYCREYKDAIYCIGSVLGPHPFPMMVRDFQSV VGIEAREQFIEMTGELPDAVVACVGGGSNAMGMFSGFLNDPVDIYGVEPLGRGPKLGDH AASLTYGEEGVMHGFNSIMLKDENGDPAPVYSVASGLDYPSSGPEHAFLHELGRVKYDV INDEETIDAFFELARMEGIIPAIESSHAVAYAIKLAKKMGKGSVLICLSGRGDKDMDYV IENYGIR" /locus_tag="LOCUS_2550" /gene="trpB" /EC_number="4.2.1.20" /note="WP_005482634.1 tryptophan synthase subunit beta (Vibrio) [pid:65.8%, q_cov:98.0%, s_cov:97.8%, Eval:2.0e-151]" /note="MGA_310" CDS complement(3904..4248) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTTNNHEVIFAIVNSGYAEDVMDVAREHGARGGTIINGRGVARED EAAFFGISIHADKELLMMVVEKDSRDEILHALYKQMGMQKKAQGIVFSLPVSDVAGLAQ RIEAPQTTEN" /locus_tag="LOCUS_2560" /note="WP_002666310.1 P-II family nitrogen regulator (Treponema) [pid:37.2%, q_cov:82.5%, s_cov:43.7%, Eval:2.6e-14, partial hit]" /note="frameshifted, insertion/deletion at around 4270" /note="MGA_311" CDS complement(4253..4621) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MANTINDTAIKKLKVIITVVDRSKAEFYLDVLSQFEVNFQMATGG KGTATSELVEMFGLNLNKAVLMSVVREDMVNPIMECLEDKFKTIRNGKGIAFAVPLSGV IGVNMYQFLSNNKQSRED" /locus_tag="LOCUS_2570" /note="MGA_312" ORIGIN 1 tcaagattgt gacatcgtcc ttttctgcct ctttaacagc gggagccata atctttttca 61 attcatatgg gtcaatttcg ttctttgctg taacgatcac gtttttgata cccgcatcgt 121 gcgcagcatc aatatattca accagctttt cgccgtcggc accggcttct gtcatatcgc 181 agggataggt caaggcactt acagtgaggt gtcggttgat gagtttgcgc ttggcatcag 241 cccgctttgc accgaaaagg ccgtcggcgt gagctttttt aacttcatcc aaatcgtaaa 301 gctcaacagc atcaaagcca tagtcgagcg cagtctgcgc cagctccaaa aatgtatctg 361 ttttaacgtg ttttgttgaa aatgaaagct tcataattag ttctctccgt agacgatctt 421 gttgagcgcg ttgatatatg cgcggatacc tgcgccgatg atgtcggttg aaattccgtt 481 gcccgaatag agcttgccat cgtcgcgaag tcttacaatt gccgagccga cagcctcctt 541 gccctcggta acagcggtga tcttaaagtc atccagctca taatggtggc cgattatctg 601 ctcgatcgcc ttgaatgccg catcaatagg gccgtcgccc gaggcaacac ctgccagctt 661 ctcgccttcc ttaataaggg tgatgttaca catcgaggga gcgatgtttc cgctggtgga 721 gatatatgat tcaacgtgat aagttgaagg tgcctgcatc gcacttgatg cgattatcgc 781 ttcaagctcc tttgcgctga taacgattct tctctttgca aagcgcaaaa attcctcata 841 taccttgccc atatcgtcag cagaaagctc atatcccaaa gcaacaacag cctcgccgac 901 ttcgggaagt cctgcatctg cgctgagcga aatattttcc gcatcttcct taggcactaa 961 gggagcggcc tttgcgccgt cgaaaactct tgctctcaaa tcggcaacag cgtgggcaca 1021 cttggtcaaa tcgagcttgg caccgatgcc catagcatcg cctttgagct tcataaactg 1081 tgcaacgccg tccaaagcca agccttcggc aacagaagtc ttaacgccgt cagcacccgc 1141 tttaattgcg gcagcggcac aagccaaagc cattcccatt tcgtttgaag gagcaacata 1201 tactgcgata tcggcaacag atttgaccgt ttccacacac gctgccaact cctcgggcag 1261 gaaaatgcct gcgtcgtcct gcaaggttag agccgctgcg ccgcaatcct ttgcggtctt 1321 ggcaacttct gcaataaagc cttcttcggc tctggaagca tccatacaaa cgacttctgt 1381 ctttgcgccc ttctcggcgg catatgaaag agccttttta acagcctcaa gcatcttggg 1441 cgacttcata tgataggtat attccataca aacggttgaa acgggaacct caaactgaat 1501 tatgccgttg tttttgatgc attcaatagc atagtcgata tcatcattat tcatagagca 1561 cggaatggcg atggtgccat ttttcacagc cgagcagacg gtcgaaatta caacagcatc 1621 ctccttgctc ttggcgggag tataaagctc aacggtgtca acacccatgg cgtcaagcgc 1681 ctttgcaacg gcggtctttt cgcggaagga aagccccttt gaagcggttt tcaacgtcga 1741 gtcggaaatg atgatctttt tcatggtgtt ttgtcctcct gtgggaaaaa tatatttgcg 1801 tctgagtcaa taaagaaacc cgcagaccca ataatctggt tctgcgggat gattaacatt 1861 aaaattaacc acggtaccac ccgtattgcc ggcatacttt gccgaccgct cattaaggca 1921 cactcgcctt caggctcaga caagccctga ccgttaacgg tgtccaccgt aagcccttac 1981 tgcaattttc acggcttccg ctcagatagg agagagcttg ggattttctt tcctgcctcg 2041 caccatccgg cagttctctt taaatacttg gcccaaacca attatcttca cagcgtttga 2101 aacgataata tcacaaatca agaaatttgt caacactttt acttgacaaa tctgtaatgc 2161 agtgatatat taaagtaaac cagtgaaaaa gagaagtaag cattgttttt catctcaaga 2221 gagccgacac tttggtgcga gtcggcggtg atgctttgct gaatggactt ttgagggcaa 2281 tcggaaagaa aaccgtgcgg tttttaagta tgtgcgacgg agcggtactc cgttaacaaa 2341 tcctgcttat tgattgataa gcgcagagcg ggcgaaaagt aatttcgcca aggttgggtg 2401 gcaccgcagg aatgttttcc tgtcccggca gttgagtttt aaaactgcgg ggctttttta 2461 ttttataagc ctcggaaagg atatgaataa aatgttactt acaaagcgat ggcgacccat 2521 aaaccaagcc caataacatc acattaataa tatatatttg gaggaaaaga ttatgaattt 2581 caacaacgtt gattttgaca cctatttcaa gcactatccc gatgagaacg gctatttcgg 2641 caagtacggc ggagtttatg tatcccccga gctgaagcag gcgatggcag aaattacaga 2701 ggcatatcag acaatttgta aatctcgcaa gtttataaat gaactcagac gcatccgcaa 2761 ggaattccag ggcagaccca cccccatttc tcaccttgag cgcctttcaa acaagatcgg 2821 cacgggtgtt cagctttatg ttaagcgtga agaccttaac cacacaggtg ctcacaagct 2881 caaccactgt atgggtgaag ctttgctggc aaaatatatg ggcaagaaaa aggtcattgc 2941 cgaaacgggc gcaggccagc acggcgtagc cttggctacc gctgcggcat atttcggact 3001 tgagtgcgac atttatatgg gctcggtgga tattaagaag caggctccca acgttgcaag 3061 aatgaagatc ttgggcgcaa atgttgttga agtcacccac ggtcttgcaa ccctcaagga 3121 agcggttgac gccgcatttg atgcatactg ccgcgaatat aaagacgcaa tttattgcat 3181 cggctccgtt ttgggccctc atcccttccc gatgatggtc agagatttcc agagcgttgt 3241 cggaattgaa gcaagagagc agtttatcga gatgaccggc gagttgcccg atgctgttgt 3301 cgcttgtgtc ggcggcggct caaacgcaat gggaatgttt agcggcttcc tcaacgaccc 3361 tgttgatatt tacggcgttg agcctttggg cagaggcccg aagcttggcg accacgccgc 3421 aagcctcaca tatggcgaag aaggcgttat gcacggcttt aacagcatta tgctcaagga 3481 cgaaaacggc gaccccgcac ctgtatattc agttgcatcg ggacttgact atccctcttc 3541 gggacccgag cacgcattct tgcacgagct tggcagagtt aagtatgatg ttattaacga 3601 cgaggaaaca attgacgcat tctttgagct tgcacgaatg gaaggcatca ttcctgcaat 3661 cgaaagctcc cacgctgtgg catatgccat taagctggca aagaagatgg gcaagggctc 3721 agttttaatt tgtctttcgg gcagaggcga caaggatatg gattacgtca ttgaaaatta 3781 cggaatcaga taagcataca gaatcaaagc agtcttgcaa atgtgcagga ctgctttttt 3841 gtgccgcaac gaaaagctcc ccttcctttt tcgggaagag gagcatattg tttgtgaaaa 3901 actttagttt tctgtcgtct ggggagcttc aatgcgctgt gccaagccgg caacatcgga 3961 aacagggagc gagaaaacga ttccctgcgc ctttttctgc attcccatct gcttatagag 4021 cgcgtggagg atctcatcgc ggctgtcctt ttcaacgacc atcatcaaaa gctctttatc 4081 tgcatggata gagatgccga agaatgcggc ttcatcctca cgtgcaacac ctctgccgtt 4141 gattatcgtg ccgccgcggg caccgtgctc acgtgcaacg tccattacat cctcggcata 4201 tccggaattg acaatggcga aaattacttc atggttatta gttgtcatta tttcaatcct 4261 ccctgctttg cttgttattg ctcaggaact gatacatatt tacaccgatc actcccgaaa 4321 ggggcacagc aaaggcgatt cccttgccgt ttcgaattgt tttgaattta tcctcaaggc 4381 attccattat tgggtttacc atatcctcac ggacaacgct cataagcact gccttattga 4441 gatttaaacc gaacatttca accagctcgc tggttgcggt gcccttgccg cctgttgcca 4501 tctggaagtt gacctcaaac tggctcaaca catccagata aaactccgcc ttggagcggt 4561 caacaacggt gatgataacc ttcagctttt taatagctgt atcgtttatt gtatttgcca 4621 tattatcgcc actcctttaa ataaagttga tgatctgctc atcatcagat gcaagaattc 4681 gctgcattgc gcgtctttcc ttgatcttgt tggatacgat cgctctgaag ccgagaagct 4741 gaatggtgat aagcggtgcc attgcaacca tcgcaacaac gccgaagccg tcgcgaagta 4801 ccgcgctttc gccctgcaac gatacgcaca caccgacagc gaagggcaaa atgaaacccg 4861 atgtca // LOCUS sequence044 4773 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence044 VERSION sequence044 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4773 /mol_type="genomic DNA" /organism="" /note="sequence044" CDS complement(529..1773) /product="homoserine dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_196768329.1" /transl_table=11 /codon_start=1 /translation="MEPIKIAVMGFGVVGSGTVELIYKNKELLEARCARSLDVKYILDL RDFPDSPYADKLTKNFEDILNDDEISVVCELMGGKTFAYDYTKRLLEKGKSVVTSNKEL VAYHGAELLAIAKEKGCHYLFEASVGGGIPIIRPLHQCLAANRIEKIAGILNGTTNFIL SKMIFDQISFADALSMAQELGYAEKDPTADIDGHDPCRKLCILGSLAFGKHIYPEYIHR SGIRDLTLDDVEYAENAGYAIKLIGMIEDTGEGLVATVCPRLVPVNNPLSTVNDVFNGI MVTGDALGDALFYGKGAGKFPTASAVVADVLDAIKNEGREMISLNWVDSQSGDFIKHYK SASVREYVRIHCENADMLKEFITGLFGYVDFIPRKYRADNELAFITPLMVESQIDQRLE KIREKAVIKKKIRLL" /locus_tag="LOCUS_2580" /note="WP_196768329.1 homoserine dehydrogenase (Moorella thermoacetica) [pid:42.1%, q_cov:98.1%, s_cov:97.0%, Eval:5.1e-81]" /note="MGA_315" CDS complement(1789..2253) /product="ACT domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005811150.1" /transl_table=11 /codon_start=1 /translation="MSKNSFVIVSADVLPEVILKVLEAKKLIAQGVCRTSTEACKRADV SRSAYYKYKDSVHLYSERLSGRVVTYYFTLYDRAGVLSGVLAELHKLNANVLTINQNIP IDSAATVTITVRFDDPDIDPQAICDAIKKVDGVVKAKIITGGSEAGKMEQ" /locus_tag="LOCUS_2590" /note="WP_005811150.1 ACT domain-containing protein (Desulfitobacterium) [pid:44.9%, q_cov:89.6%, s_cov:92.0%, Eval:7.1e-26]" /note="MGA_316" CDS complement(2388..3218) /product="metallophosphoesterase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000037684.1" /transl_table=11 /codon_start=1 /translation="MKLKRPLKFAIAAAVLLACFAGYCVAQREWLTKSYYTLSSPKVSA AFDGFKICHLSDLHNHEFGRDNARLLNVIAKENPDIIAITGDLIDSRHTDIEVSLEFVS KCVEIAPTYYVCGNHEDRFTPEEQAYIYSSLEEMGATLLEGESVGIFRESESIYIGGFF NKYENEDGDYDIFDRKDKLNVLLYHRPTCFDLFKATGADLVLSGHAHGGQFRIPFVGGL LAPDEGFFPKYSEGMHDIDGTKLIVSRGLGNSLMPIRLNNPPEVIFVTLKNSTI" /locus_tag="LOCUS_2600" /note="WP_000037684.1 metallophosphoesterase (Bacillus cereus) [pid:38.8%, q_cov:97.8%, s_cov:98.6%, Eval:4.6e-47]" /note="MGA_317" CDS 3364..3993 /product="uracil phosphoribosyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966163.1" /transl_table=11 /codon_start=1 /translation="MANITIFEHPLIKHKISLLRDKSTGTKDFRVLIEEIATLMGYEAL RDLPLENVEVETPICKASVPMVAGKKLAIVPILRAGLGMVNGILALVPSAKVGHIGMYR DEVTHIPHEYYCKLPDSLEERTIIVLDPMLATGGSAVDSISLIKQRGGKNIKFMSIIAA PEGLKALSEAHPDVEIYCGNLDEKLNENCYIVPGLGDAGDRIFGTK" /locus_tag="LOCUS_2610" /gene="upp" /EC_number="2.4.2.9" /note="WP_010966163.1 uracil phosphoribosyltransferase (Clostridium) [pid:65.6%, q_cov:100.0%, s_cov:100.0%, Eval:8.2e-79]" /note="MGA_318" ORIGIN 1 gtcatcgagt atgatttgga taactgcggc aattcaactg tttctgaaag cagttaacct 61 cgccgaaagc tatgaggctg ataccactcc gtttttgata ccgacacttt atgttgcgat 121 cgctatagca ctcggcacag caattttctt tatcatcaaa aagaatatca cgttctttaa 181 tctgatagtg tggcctctta ttgtaggcat aatgattggt gtattgttcc tcctgatact 241 tagcgccctc aattactccc ttgatctttc cacacccgag gaatattcag gaaccgtcat 301 cagcaccgat tttgatattg gaataaggcg aagcccgaca acttacgaaa taaccgtgtt 361 gtccggcgat gatgagatcg acttgggcgt cacaaaggct caatattacg aatactatgt 421 cggtcagaat gtgacgatat accgttatga aggagcgctc ggcgcaccgt attacataat 481 tgaatagaac gacaaatccc gtcgagcata agcacgacgg gatatttttt acaacaacct 541 gattttcttc ttgataaccg ctttttctct tatcttttcc aagcgctggt ctatctgcga 601 ttcaaccatt aagggcgtaa tgaacgccag ctcgttgtct gcgcggtatt ttctcggaat 661 gaagtccaca tatccgaaca agcctgtgat gaattcctta agcatgtctg cgttttcgca 721 gtggatcctc acatattcgc gaacacttgc cgatttgtaa tgcttaataa agtcgccact 781 ctgtgaatcg acccagttaa gggagatcat ttccctgccc tcgttcttaa tggcatcaag 841 cacatcggca acaacagcag aagctgtcgg gaatttgcct gcgcccttgc cataaaacag 901 cgcatctccc aaagcgtcgc ccgttaccat aatgccgttg aaaacatcgt tgacggttga 961 aagaggattg ttgacaggca caagtcttgg gcagactgtt gcaaccaagc cctcgcccgt 1021 atcttcgatc attccgatga gcttgatggc atagcctgca ttttcggcat attccacgtc 1081 gtcaagggtc agatctctta tgcccgaacg gtggatatat tcgggataga tatgcttgcc 1141 gaatgcaagc gaacccaaaa tgcacaattt tctgcagggg tcgtgtccgt cgatatcggc 1201 agttgggtct ttttcggcat atcccaattc ctgcgccatt gaaagagcat cggcaaagga 1261 tatctggtcg aaaatcatct tggaaagaat gaagtttgtg gtgccgttca aaatgcccgc 1321 aatcttctca attcggtttg cggcaagaca ctgatgcaaa ggtcttatga tcgggattcc 1381 gccgccgacg gaagcttcaa acaaatagtg acatcccttt tctttggcga tcgccaaaag 1441 ctccgcgccg tgatatgcaa ccaattcctt gttggatgtt acaacgcttt tgcccttttc 1501 aagcaagcgc ttggtatagt cataagcaaa ggtctttccg cccataagct cgcagactac 1561 gctgatctca tcatcattta aaatatcttc aaaatttttg gtcagcttgt cggcataagg 1621 gctgtcggga aaatctctga ggtcaagaat atactttaca tcaagcgatc tggcgcatct 1681 tgcttccaaa agctccttat ttttatatat gagttcaacg gttcctgagc cgacaacgcc 1741 aaagcccatt accgcaattt ttatcggttc catattgcta agttctcctt attgctccat 1801 tttgcccgct tccgagccgc ctgtaattat ctttgcttta acaactccgt caaccttctt 1861 aatggcatcg catatcgcct gagggtcaat atcggggtca tcaaaccgca cggttatcgt 1921 caccgtcgcc gccgagtcga tggggatatt ctggttgatt gttaaaacgt ttgcattcaa 1981 cttatgaagc tccgccaaaa ctccgctcaa aactcccgcg cggtcataaa gggtgaaata 2041 atatgttaca acgcgcccgg aaagcctttc cgaatatagg tgaacgctgt ccttatattt 2101 gtaatatgcg cttcttgaaa cgtccgcacg cttgcatgcc tcggtagagg ttcggcaaac 2161 gccttgcgcg ataagctttt tcgcttcgag cactttaagt attacttcgg gcaacacatc 2221 tgccgaaaca ataacaaaac tgttctttga cacgcaattt tctcccttca cgagtgtttg 2281 tcacaaatac aactgtattc gttgcaaata caattataca atgattggca aatattgtca 2341 acaagcggat aaacaaaaag cgcccaacaa aggagcgctt tatttgttta aattgtcgaa 2401 ttctttagag tgacaaaaat cacttcaggg ggattattga ggcgaatagg catcagcgag 2461 ttgccaagac ctctcgaaac aatcagcttt gtgccgtcaa tatcgtgcat accctccgaa 2521 tatttcggga agaagccctc gtcgggtgcc aaaagaccgc cgacaaatgg aattctgaac 2581 tgtccgccgt gggcatggcc tgacaaaaca aggtcggcgc ctgttgcctt gaacaggtca 2641 aagcaggtgg ggcggtgata gagcaacaca ttcagcttgt ccttgcggtc gaatatatcg 2701 tagtcgccat cttcgttttc atatttgttg aagaagccgc cgatgtaaat gctttcactt 2761 tcgcggaaaa tgccgacaga ttcgccctcc aagagggtgg cgcccatttc ctccagcgaa 2821 gaatagatat atgcctgttc ctcgggagtg aagcggtctt cgtggtttcc gcagacgtaa 2881 tatgtgggag cgatttcaac gcacttggaa acaaactcca gcgaaacctc aatgtcggta 2941 tgcctcgagt cgataaggtc gcctgtaata gcgatgatgt cggggttttc ctttgcaata 3001 acatttaaaa ggcgggcgtt gtccctgccg aattcgtggt tatgcaggtc gctgaggtga 3061 cagatcttaa agccgtcaaa tgcggcactg accttggggg atgagagggt ataatatgat 3121 tttgtcagcc attcccgctg tgcaacgcaa taaccggcaa agcaggcaag gagcactgcg 3181 gcggcgatgg caaattttaa gggtcgttta agtttcattc ggtcttctcc gtaaaaatat 3241 aataatcact atggtaatca tagcacaaac gaaggaattt ttcaacttga atatttatct 3301 attgcaattt ttgtcgatgg gtggtagaat ataaacaata atgtaacata aaggagagat 3361 accatggcta atatcacaat tttcgagcac ccgctcatta agcacaagat ttccctttta 3421 agagataaga gcaccggcac caaggacttc agagttttga ttgaagagat tgcaaccctt 3481 atgggttacg aagctttgcg cgacctgccc cttgaaaatg tcgaggttga gacccccatc 3541 tgcaaggcaa gcgtacctat ggttgcaggc aagaagttgg caatcgttcc catccttcgt 3601 gcaggcttgg gtatggtaaa cgggattttg gctcttgttc cttccgcaaa ggttggacac 3661 atcggtatgt accgcgacga agtcacccac attccccacg aatactactg caagcttccc 3721 gacagcttgg aggaaagaac tatcatcgtt ttggacccca tgcttgcaac aggcggctcg 3781 gctgttgact ctatttccct tattaagcag cgcggcggca agaacattaa gtttatgtcc 3841 atcattgcag cccccgaggg acttaaggca ctcagcgaag ctcatcccga cgttgagatc 3901 tattgcggaa accttgacga aaagctcaac gaaaactgct acatcgttcc cggtctgggc 3961 gacgcaggcg acagaatctt cggcacaaag taatatttaa aatgcaaaac agcttcctta 4021 aaaagggggc tgtttttgtt tggcaacgag gcgcagttta gcaaagggga aaaccacaag 4081 acgacaagag agaacggagt aaggagaagt cggcgcgtcg ttctcccttt tcttcttaag 4141 gttttcccct ttgtatcccc tttccttatc ttctttttcc tcttcccgag cctactggct 4201 tcgatatcct atgcgcttac aaagctaata attgtaacag aggagcgact ggtagagagc 4261 aatcttttca tagatggtag tgcaatacgt tgagagatta aatcttgcga caagatgtgt 4321 aaagataaat tagcaaaata ggtagcgcat gggattcaag tgtgagtgct aaacgtttgc 4381 gcgttgcaat gttaaaaggt acaagccttc ggcttgtgct atgcccaccc cctcccccct 4441 cccacgggga gggggcttaa caaaccattc accaaaagct cttgcatttt taacaaagct 4501 atgctatact gcatataatg ctgaaaaaag ctatgaacga agagagtagc gcaaacaagc 4561 ttctttaaag agagcggtga gggtggaaat ccgcaggagg ccttgcgtga agtgcattcg 4621 ggagccgggc ggaggaaatt ttaaaaagta ttccgtcacg tttgccgcgt taaggcgatt 4681 aaagttacaa atcggagtgg aaccgcagcg aaatttttgc cgcctcccgt ggaagttatt 4741 tcccgtgggc gcggtttttt tatttttttt gaa // LOCUS sequence045 4737 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence045 VERSION sequence045 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4737 /mol_type="genomic DNA" /organism="" /note="sequence045" CDS complement(175..504) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKTAIIGSRSLEISDLEEYLPDGTTEIISGGAKGIDSCAEELAAR LGLAITVIRPNYAKFGRCAPLKRNDEIISLADIVVAIWDGKSKGTKYVIERCQKLGKTA IVHIK" /locus_tag="LOCUS_2620" /note="MGA_319" CDS 609..821 /product="helix-turn-helix transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_026184197.1" /transl_table=11 /codon_start=1 /translation="MYRRIRDLREDKDLTQAQIAKMLGMSQTGYSKYETGENDIPTVIL IKLARFYNTSVDYLLGEIDTKERYK" /locus_tag="LOCUS_2630" /note="WP_026184197.1 helix-turn-helix transcriptional regulator (Desulfitobacterium) [pid:67.2%, q_cov:87.1%, s_cov:87.1%, Eval:3.3e-17]" /note="MGA_320" CDS 979..1164 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRNKNNKHLGIEVDPELHYKLHYISKYEGRSAHGQILYLIRKCIK EFEQENGLIEVPESKE" /locus_tag="LOCUS_2640" /note="MGA_321" tRNA complement(1590..1664) /product="tRNA-Arg" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0050" /note="Aragorn_5" CDS complement(1823..3676) /product="methionine--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966273.1" /transl_table=11 /codon_start=1 /translation="MQDYDVFFLTGTDEHGQKIEQQAIEEGITPKQHVDIIAGQIKDIC DLLNISYNRFIRTTDEDHEKCVQKIFTKLYEQGDIYKSEYEGWYCTPCESFFTETQLVD GKCPDCGREVNRTKEEAYFLKLSKYQKQLEQFLEENPDFIQPESRKKEMVNNFIKPGLQ DLCVSRSTFKWGIPVEFDPKHVTYVWLDALSNYISGLGYDIDNPSEMYKHYWQNCTHII GKDILRFHSIYWIIELMALGLTLPKKIFAHPWMLFGTDKMSKSRGNVIYADDMVGHFGV DATRYYLLSEMPFAADGSISYETVIDRYNTDLANTLGNLVNRTVAMVNKYFGGVVDGPS DKTETDLDLEATALKAVANIASHIDAFKMADAVDDVMTLARRANKYIDETTPWALAKDE ATLPRLKTVMYELIEAIRFIGILVEPFMPETSKKILEQINTDVCGFETLCAFGGYVAGT KVNAPVPLFARIDSEKLLAELNAQMEAVKKAAEEEARKAEEVAAYKVDPIAEEVTIDDF FNIDLRACKVLECEKVPKSKKLLKLQLNDGIGTRQVVSGIAAWYAPEDLIGKTVAVVAN LKPAKLCGIESQGMICATDMPDGSAKVVFLSDDVPAGARLR" /locus_tag="LOCUS_2650" /gene="metG" /EC_number="6.1.1.10" /note="WP_010966273.1 methionine--tRNA ligase (Clostridium) [pid:55.0%, q_cov:100.0%, s_cov:93.9%, Eval:5.1e-195]" /note="MGA_322" CDS complement(4023..4235) /product="DUF378 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011037754.1" /transl_table=11 /codon_start=1 /translation="MRFLDRLCLAILIIGGINWGLVGIFSFDLVAYLFGGMASLMSRVV YVLVAISAVWTVSLFFRDSMLVEES" /locus_tag="LOCUS_2660" /note="WP_011037754.1 DUF378 domain-containing protein (Xanthomonas campestris) [pid:53.1%, q_cov:91.4%, s_cov:81.0%, Eval:2.0e-14]" /note="MGA_323" ORIGIN 1 atggtaaaac ctccgtaatt tcaatgattt tgaaatagaa aaagaacgat gttaagtctt 61 tcgactcgac atgttctttt cgtagttgtt ttccaaccct gtcagacaga tgctgtaaaa 121 ttgtaattta tttagaatta cagttttacg agcacccacc taagggtggc ttttttattt 181 gatatgaacg attgccgttt tgccgagctt ttgacacctc tcgattacat acttcgtgcc 241 ttttgacttg ccatcccata ttgccacgac aatatccgca agtgagatga tttcgtcgtt 301 gcgtttgagt ggcgcacatc tgccgaactt ggcgtaattc ggtcgaatca cagttatcgc 361 aagcccaagc cgagccgcaa gttcttctgc gcaggaatca atcccctttg ccccgccgct 421 gatgatttcg gttgtgccgt caggcagata ttcttccaaa tccgatattt caaggcttcg 481 cgagccgatt attgctgttt tcatattccc actcctcatg gatattttaa cctgttttag 541 gttaaaatgc aatactctaa aacaggttgg ctataattat aattacaact atgtagagga 601 gtgagggtat gtatcgccga atccgtgatt tgcgagagga caaggattta acgcaggcac 661 agattgccaa gatgctcggt atgtcgcaga caggatattc gaaatacgaa acgggcgaaa 721 acgatattcc taccgttatc ctcattaagc tggcgagatt ttataacaca agcgttgatt 781 atctcttagg agaaatcgac acgaaagaaa gatataaata actttcgggc gaccaaacag 841 ggtcgccttt ttgattatat ttgaatgcct gcgtaataag ttctcattat ttagtatact 901 taaaataagt atactgtcaa ctgccgcgct caaattaatc ttaaaatata cttaaattaa 961 gatcggcgag gcgatgttat gagaaacaaa aacaataaac acttgggaat cgaagttgac 1021 cccgaattgc attataagct acattacatt tcgaaatatg aaggtcgttc tgcacatgga 1081 caaattctgt atttaattcg caagtgcatc aaggaatttg agcaagagaa tggtctcatt 1141 gaggttccgg aaagcaaaga ataacgcaaa taaaaaagac ccacaagggg ccttttttgt 1201 tttggtccac ccggcgagaa tcgaactcac atttccatgg tcggagcgtg gcgttctatc 1261 cattatactt cataattata gtcataatta tgactattgt caataatgtg attgcacttt 1321 atgctaataa tagcgtaaag gtggtgagac tgttgattag ttatcgtccg ttttgggaaa 1381 cattaaagaa acgcaacgtt tcgacgtata cattgataac aaaacataat atcagcagtg 1441 caaccattga cagaataaaa gagggtaagg gtataaccac aaccaagatt gatgactttt 1501 gcaagatttt agattgcagt gtttcggata tcatcgaata tataaaggaa taacaaaagg 1561 cgaccacata gggtcgcctt tttttgtttt ggtccacccg gcgagaatcg aactcacatt 1621 tccacggtcg gagcgtggcg ttctatccat tatactacgg gtaggtgtct gtcattcttc 1681 aaaatgtggg agtttgcgta gcaaactcgt atcgaccgac acaagcgttc agggtgcgag 1741 ccgtttttga cggtcgatta tccattaatc tatggacagg cacgggcggg cacacaggcc 1801 cgcccctatt ttcgaacatt ttttatctga gtcttgcacc tgcaggaaca tcatccgaaa 1861 ggaagactac ctttgccgat ccgtcgggca tatctgtcgc acagatcata ccctgagatt 1921 caattccgca gagctttgcg ggcttgaggt ttgcaacaac cgcaacggtc ttgccgataa 1981 gatcctcggg agcataccaa gcggcaattc ccgaaacgac ctggcgtgtg ccgatgccat 2041 cgttaagctg aagcttcaaa agctttttcg acttcggcac cttctcgcat tcaagcacct 2101 tgcaagcgcg aagatcgata ttgaagaaat catcaatcgt aacttcttct gcaatcggat 2161 caaccttata tgctgcaact tcctcggcct ttcttgcttc ctcttcggca gccttcttaa 2221 ccgcttccat ctgtgcgtta agctcagcca aaagcttctc cgagtcgatt cttgcgaaca 2281 gcggaacggg cgcattaacc ttggtgcccg caacatatcc accgaatgca caaagggttt 2341 caaaaccgca aacgtcggta ttgatctgct ccaagatctt ctttgaggtt tcgggcatga 2401 aaggctcaac cagaatgccg atgaaacgaa ttgcttcaat cagctcatac ataactgtct 2461 tgagtcgggg cagagtggcc tcgtccttag ccaatgccca gggagttgtt tcgtcaatgt 2521 atttgttcgc acggcgtgca agggtcataa catcgtcaac agcgtccgcc atcttgaagg 2581 cgtcgatatg agaagcaata ttagccaccg ccttaagcgc agttgcttca agatcgaggt 2641 cagtttctgt cttgtcagag gggccgtcaa ccacaccgcc gaaatatttg ttgaccattg 2701 caacagttct gttgacaagg ttgcccaagg tgtttgcaag gtcggtatta tagcggtcga 2761 tgactgtttc atagctgatt gagccgtcag cagcaaaggg catttcgctc aagaggtagt 2821 atcttgttgc atcaacgccg aagtgaccga ccatatcgtc agcatagata acatttccgc 2881 gtgatttact catcttgtca gttccaaaga gcatccaggg gtgagcaaag atctttttag 2941 gcaatgtaag tcccagagcc atcagctcga ttatccaata aattgagtgg aatctcaaaa 3001 tatccttgcc gatgatgtgg gtgcagttct gccagtagtg cttatacatc tcgctggggt 3061 tgtcaatgtc ataaccgagg ccggagatat agtttgaaag agcatccagc caaacatagg 3121 ttacgtgctt ggggtcaaac tcaacgggaa taccccactt gaaggttgaa cggctgacac 3181 aaaggtcctg cagacccggc ttaatgaagt tgttgaccat ttccttcttg cgggattcag 3241 gctgaatgaa gtcggggttt tcttcaagga actgctcaag ctgtttctga tactttgaaa 3301 gcttcaaaaa gtatgcttct tccttggttc tgttaacttc tcgtccgcag tcggggcatt 3361 tgccgtcgac aagctgagtt tctgtaaaga agctctcaca gggggtgcaa taccaaccct 3421 catattccga tttatagatg tcgccctgct catagagctt ggtgaatatc ttctgaacgc 3481 acttttcgtg atcctcgtcg gtggtgcgga taaagcggtt atatgagata ttcaaaaggt 3541 cgcagatgtc cttgatctga cctgcaataa tgtcaacatg ctgcttgggg gtgatgccct 3601 cttcaatcgc ctgctgttca atcttctgtc cgtgttcatc ggtacccgtg aggaaaaata 3661 catcgtaatc ctgcattcgg cggaacctcg cgatggcatc agcgcaaact acatcgtaag 3721 tattgccgat atggggcttt ttagatgtat atgcgatcgc cgtagtaata agttatggct 3781 ttttacacat acagattcct ccttaataat aaaaatttcc ctcacaaact cgtgaggcaa 3841 tacactttta ttataccctt ttggcagggt ttgtcaaggg cgaccggcct cgccgtaaag 3901 aataatgaat agtgaatgat gaataatgaa taattgcagt atcgccttcg gctgagaatt 3961 tcaaggcacg aaagtataaa ggcgggcact caggcccgcc cctcatacga gatatgtccc 4021 tatcagcttt cttcaaccag catcgaatct ctgaagaaca gcgataccgt ccagaccgcg 4081 ctgatggcaa ccaacacata caccactctt gacataagcg atgccatgcc tccgaacaga 4141 tatgcaacca ggtcaaagct gaaaatgccc accaagcccc agttgatacc gccgatgatc 4201 aaaattgcca gacaaagtct atcgagaaat ctcataaatt aaacactcct ttacttcttt 4261 taagttattc tttcccaagt ttaataattt tatgcgaaaa cagtttacaa aagttttcct 4321 tcaaggtata atcaaattgc aacgattctg tttgaaagga agattttaaa atatgaagtt 4381 cggatatttc gacgaccaaa accgtgaata tgtcattact cagcctaaga ccccctaccc 4441 ctggataaac taccttggca cagaagggtt cttctccctt atttccaaca ccgcaggcgg 4501 ctactgcttc tataaggatg cacgccttcg ccgcatcacc cgctatcgct ataacaacgt 4561 gccgatagat atgggcggaa gatacttcta tattaacgac ggcgaatcgg tctggagccc 4621 ctcttggagc cctgtcaagg ctgatttgga ttcatacacc tgccgtcacg gtatgggcta 4681 taccgtaatt aagggcgcaa agaacggcat cgaggctgaa actaccttct tcgttcc // LOCUS sequence046 4735 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence046 VERSION sequence046 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4735 /mol_type="genomic DNA" /organism="" /note="sequence046" CDS complement(991..1560) /product="CDP-diacylglycerol--glycerol-3-phosphate 3-phosphatidyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009889106.1" /transl_table=11 /codon_start=1 /translation="MNLANKLTILRVVLIPLFVLFLLWQFTSFNVLIALVIFTVAAITD ALDGNYARKHNLVTNFGKFLDPLADKALVMAALVAFVGLGWAGSVPVMIILFREFMVSA LRMVASSANGKVIAAGAWGKLKTAFTMVAIIAIMFFRGIMALGVPIPENILSVGSAILI WIATILTVVSGVQYLWAYRDVIDTNK" /locus_tag="LOCUS_2670" /gene="pgsA" /EC_number="2.7.8.5" /note="WP_009889106.1 CDP-diacylglycerol--glycerol-3-phosphate 3-phosphatidyltransferase (Clostridioides difficile) [pid:48.4%, q_cov:100.0%, s_cov:100.0%, Eval:1.7e-34]" /note="MGA_326" CDS complement(1562..2893) /product="30S ribosomal protein S12 methylthiotransferase RimO" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861176.1" /transl_table=11 /codon_start=1 /translation="MAIRVGMVSLGCPKNQVDAEHMVYNLREEGYELTADAGLADVVVI NTCGFIESAKQEAIETILEFCTLKEEGRIKAVIVTGCLAERYREEISKEMPEVDAVIGI GSNELLGTVIKKVLDGEGRINTFGDKYSLIIGGKRLISTETFAYVKIAEGCDNCCTYCA IPSIRGRFRSRKMESVLDEVKWLASVGYKEIILIAQDTTRYGEDIYGKPMLASLMREVA KIDGIKWIRTLYAYPERITDELIDVIAEEPKCVKYLDIPIQHCDGEVLRRMNRRGDEKT LRELIAKLRERIPGIILRTTLIAGFPGETDEQFERLCEFVKDTKFDRLGCFAYSAEEGT PAADFPDQIDEEVKQRRADIIMETQMLINDEVCQKMVGKTLEVVTEGFDRWGECYFGRS VGEVPEIDGKIFFSSPVPRALGEYVSVHIDDVMDYDLVGSVVED" /locus_tag="LOCUS_2680" /gene="rimO" /EC_number="2.8.4.4" /note="WP_011861176.1 30S ribosomal protein S12 methylthiotransferase RimO (Clostridioides difficile) [pid:48.2%, q_cov:99.1%, s_cov:98.9%, Eval:7.4e-118]" /note="MGA_327" CDS complement(2896..3513) /product="recombination regulator RecX" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003894108.1" /transl_table=11 /codon_start=1 /translation="MARQISEISQFKGKTLRIDFSEGEPIFVHADIVADYHLSKGLEMP DGAIDDVVHANDARRAKERAFYLLDERDYSYVEMFKKLERNYDEDICYDVCNRLAELGL IDDRRYAKKAAEYYCVTKKCGYYRAREEMRKRGLSGELIDEALAEYEDDTPERLAELIC RKYARYLTDEKGITKVKSALVRLGYTYAEINSAIEEFLQEED" /locus_tag="LOCUS_2690" /gene="recX" /note="WP_003894108.1 recombination regulator RecX (Mycolicibacterium smegmatis) [pid:27.5%, q_cov:81.0%, s_cov:92.0%, Eval:8.1e-07]" /note="MGA_328" CDS complement(3514..4686) /product="recombinase RecA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005812939.1" /transl_table=11 /codon_start=1 /translation="MAMKKPAEKKAAPVSTQSKEEKRKALETAIAQLEKTYGAGAVMRL GQTSTLNVEAIPTGSMTLDMALGIGGVPRGRIVEIYGPESSGKTTVALSIAAQAQKLGG EVAFIDVEHALDPIYAEKLGVDINSMLVSQPDSGEQALEIAEALVRSGAIDCIVLDSVA AMVTKAEIDGEMGDTHVGQLARLMSQAMRKLTSVISKSNCVAIFINQVREKIGVIYGNP ETTPGGRALKFYSSVRIEVRKGEAIKNGSEIVGNRTRCKVVKNKVAPPFKEAEFDMLYG KGVSRIGEVVDIATELDIIHKAGAWFSYEGNKIGQGRENTKEFLLTHPDLMAEVEEKIL AAKNEVVMTSEKDKKAAVLSAASAAAAKVSSNDVIVDAEDDFEEFTPAEK" /locus_tag="LOCUS_2700" /gene="recA" /note="WP_005812939.1 recombinase RecA (Desulfitobacterium hafniense) [pid:66.9%, q_cov:82.6%, s_cov:93.4%, Eval:2.0e-127]" /note="MGA_329" ORIGIN 1 aagctgttta agagaccaat caatgctgcc cttgccgcta ttatcaaact tgttgtggtt 61 ggggtctgtt cccattgcca gattgtaagg cgaataggag tgggtggaaa gaaggagtct 121 gtcctcaaca gtgtcggtgg ggatgatgaa ttcgtctatt gatgcagttg aaggcgagcc 181 cgcatatgag gacatcatta aaaatctgtc ggtatttctg ccgcccgatt cgcgaacgac 241 atttacaaag atctgattat atttgttgag aatttcaact gcccttgcgc atctggtgtt 301 gttaatgtca atagaccatt cccaatcggt gccggaaaga cggggctcgt tcatgcattc 361 aaaaatcaga tgctggtcat agtccttaaa atactcggcg acctgtgtcc agattgcggt 421 gataaacttt tcgccctgtt cctcgtcgtt gttcttggtg ggatagtaaa aatcgttatc 481 gtggtgagaa ttgatgatta catacatatc gttgtccata gcatagtcaa cgatatcctg 541 cacacggcgg atccattcgg gatcaatgtt gaattcttcg tcggtgtgtt ttccccagga 601 aacgggaact ctgatggtgt tgaagccaag ctccttaacc ttgtttatca tttcgggggt 661 ggtggtgggc tgtccccaag cgttctctcc gtcgggcgcg tccattgtgt tgcccaggtt 721 ccatcctatg cccatttttt caacaagctc gcttgaggag atcgaggtgt agctgatttc 781 aagatcgtta tgcttgccgg gctctttaga ggcaggcgca ccgcaggcgg tgaataagcc 841 gacaaccata ataagtgcaa gtgccaatga taaaagtcgt ttcatataat cagattcctt 901 tcaagcaaaa gctcatttat ttcaaattaa aacgcaaagt gcgctgaatc aattataatt 961 caacgcacag tttctgtcaa tatatgggtt tcatttatta gtatcaataa cgtcgcgata 1021 tgcccaaaga tactgaacac ccgaaacaac tgtaagaatt gttgcaatcc aaataagtat 1081 cgcagaaccg acggatagga tattttccgg aatcggaaca cccaatgcca ttattccgcg 1141 gaagaacatt attgcaatta ttgcaaccat cgtgaaagcg gttttaagct tgccccaagc 1201 acctgcggca ataaccttgc cgtttgcaga agatgccacc attcgcaaag ccgaaaccat 1261 aaactctctg aacaaaatta tcattacagg caccgaacct gcccagccaa gcccgacaaa 1321 tgcgaccagc gccgccatca caagagcttt gtcggcaaga gggtccaaaa attttccaaa 1381 gttggtgacc aaattgtgct ttcttgcata gttgccgtcc agagcatcgg tgatggctgc 1441 aacagtaaag atcacaagtg cgatcaaaac attaaaactt gtaaactgcc acaaaaggaa 1501 cagcacgaac agaggtatta gcaccactct taaaatggtg agtttatttg ctaagttcat 1561 cttaatcctc cacaacactg ccgacaaggt cgtaatccat aacatcgtcg atatgaacac 1621 ttacatattc gcccaaagca cggggaacgg gagacgagaa gaaaattttg ccgtcaattt 1681 ccggcacttc tcccacactt cttccgaagt agcattcgcc ccagcggtca aacccctcgg 1741 ttacgacctc taaggtcttg ccgaccatct tttggcagac ttcatcgtta atgagcatct 1801 gagtttccat aataatgtca gcacgtcttt gcttgacctc ctcatctatc tggtcgggga 1861 agtcagccgc gggagttccc tcctccgcgg aatatgcaaa gcatccgaga cggtcaaact 1921 ttgtgtcctt aacaaactcg cacaagcgtt caaactgttc atcggtttcg ccggggaagc 1981 ctgcaataag ggtggttcgc aaaatgattc cggggatgcg ttcacggagc ttagcgataa 2041 gttcacggag agttttttca tctccccggc ggttcattcg gcgcaagacc tctccgtcgc 2101 aatgctgaat cggaatatcc aaatatttaa cgcacttggg ttcttccgca ataacgtcga 2161 taagttcatc tgtaatacgc tcgggataag cataaagtgt tcggatccac ttgatgccgt 2221 caattttcgc aacctcgcgc ataagcgatg caagcatcgg cttgccgtaa atatcctcgc 2281 cgtagcgggt ggtgtcctgc gcaataagga taatctcctt atatcccacg cttgcaagcc 2341 acttgacttc atccagcacg ctttccattt ttcttgagcg gaaacgaccg cgaattgaag 2401 gaatggcaca gtatgtacag cagttgtcgc aaccttcggc aattttaaca tatgcaaagg 2461 tttcagtgga tataaggcgt ttgccgccga ttataagcga atacttgtcg ccgaaggtat 2521 tgattctgcc ctctccgtca agcacctttt taattacggt gcccaaaagc tcgttagagc 2581 cgatgccgat tacggcatca acctcgggca tctcctttga aatctcctcg cgatagcgct 2641 cagccaagca acccgtgacg attaccgctt taattctgcc ctcctcttta agggtgcaaa 2701 attcgagtat cgtttcaatc gcttcctgct ttgccgattc aatgaaaccg caggtgttga 2761 ttacaacaac atctgccaat cccgcatcgg cggtaagctc atagccctcc tcgcggagat 2821 tatataccat atgctcggca tccacttgat ttttcgggca gcccagcgaa accattccaa 2881 cacgaatagc cataactaat cttcctcttg caaaaattct tcaatcgcgg agtttatctc 2941 cgcatatgta tatcccaatc tgactaaagc tgacttgacc ttggtaatac ccttttcatc 3001 ggtgagatac cttgcatatt tcctgcagat aagctcagcc aatcgctcag gggtatcgtc 3061 ttcatattcc gccaaggctt cgtcaataag ctcgcccgac aatccgcgct ttcgcatttc 3121 ttcgcgtgcg cgatagtagc cgcacttttt tgtaacgcag taatattccg ccgctttttt 3181 ggcgtagcgt ctgtcatcaa tcagtccaag ctcagctaaa cggttgcaga catcatagca 3241 gatgtcctca tcatagttgc gctcaagctt cttgaacatc tcaacatacg agtagtcgcg 3301 ttcatccaaa agatagaatg cacgttcctt ggcgcgcctt gcatcgttgg cgtgaacaac 3361 atcatctatc gcgccatcgg gcatttcaag accttttgaa aggtgatagt ccgcaacaat 3421 gtcagcgtga acaaatatcg gctcgccctc ggaaaaatct atccgcaagg tcttgccctt 3481 aaattgggaa atttcgctga tttgtcttgc catttacttt tcagcggggg tgaattcttc 3541 aaaatcgtcc tcggcatcaa cgatgacgtc gtttgaagat acctttgccg cggcggcact 3601 tgcagcactc aaaactgctg ccttcttgtc cttttcggag gtcattacaa cttcattctt 3661 tgccgccaaa atcttttcct caacctctgc catcaaatcg ggatgagtaa ggaggaattc 3721 cttggtgttt tctctgccct ggccgatctt gttgccctca tagctgaacc atgcgcccgc 3781 cttgtggatg atatccagct cggttgcgat atccacaact tcgccgattc tcgaaacgcc 3841 cttgccataa agcatatcaa actcagcttc cttgaaagga ggagcaacct tattcttaac 3901 gaccttacat cttgtgcggt tgccgacgat ctccgagccg ttcttaattg cttcgccctt 3961 tctgacttca attctgacgg aggaatagaa cttaagggca cgtccgccgg gggtggtttc 4021 ggggttaccg tagataacgc cgatcttctc acgaacctgg ttgatgaaga ttgcaacgca 4081 gttggacttt gaaattacgc ttgtaagctt tctcatcgcc tgggacataa gtcttgcaag 4141 ctgaccgaca tgggtatcgc ccatttcgcc gtcgatctca gcctttgtta ccattgcggc 4201 aacagagtcc aaaacgatac agtcaattgc gcccgagcgc accaaagcct cggcaatttc 4261 aagggcctgt tcgcccgagt cgggctgtga aacgagcatc gagttgatat caacgccgag 4321 cttttcggca tagatggggt ccaaagcgtg ctcaacgtcg atgaatgcaa cttcgccgcc 4381 cagcttctgt gcctgcgccg cgattgaaag agcaacggtg gtcttgccgg agctttcggg 4441 tccatagatc tcgacgattc ttcctctcgg aacgccgccg atacccaaag ccatatcaag 4501 agtcatcgag cctgtgggaa tagcctcaac gttgagggtc gaggtctggc ccaagcgcat 4561 tacagcacct gcgccatagg tcttttcaag ctgagcaatg gcggtttcaa gcgcctttct 4621 cttttcttct ttagactgtg tgctgacggg agccgccttt ttttcagcag gttttttcat 4681 tgccataaca atttcctccg attttcgtca aattttcgct gttcgcttaa atgta // LOCUS sequence047 4560 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence047 VERSION sequence047 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4560 /mol_type="genomic DNA" /organism="" /note="sequence047" CDS complement(162..2120) /product="DNA topoisomerase (ATP-hydrolyzing) subunit B" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000435982.1" /transl_table=11 /codon_start=1 /translation="MDINEINNSVTAVDKDNNYDASEIQVLEGLEAVRKRPGMYIGSTG PKGLHHLVYEIVTNSIDEALAGYCTRIDVELLKGNIVRVTDNGRGIPTGIHPKEGISAA TVVYTVLHAGGKFGGGGYKVAGGLHGVGASVVNALSEWLEITIYDGKNIHFQHFDRGGY EEQLKIVGETDKTGTVVTFKADPLIFEQSTEYDYQTLLDMLREQAFLNAGIRIVFTDRR GELDEEVDLCFNGGIREFVTFEREKRGHDPLSDGVVYLGGTKDDYTCEIAFQYNDSYND LVYSFANNVRTPDGGTHETGFKKALRKVINDYGKKFNLLKDGTVLSEDDVREGIIAIVS VKLTNCEFEGQTKGRLGNPEVRPFVEALVNEKLMNFLEENPDVARTIFDKALQAQKARE AAKRARDLTRRKTALESASLPGKLADCSERDPEFTEIFIVEGDSAGGSAKEGRDRRYQA ILALWGKMLNVEKARIDKVYGNDKLTPVVTALGTSIGEDFDITKLRYGKVIIMADADVD GCHIRTLLLTFFFRFMRPLIEQGHVYIAQPPLFKVQKGKQVRYAFSDEERDVYIKELYG DNGAKSDVQRYKGLGEMDPIQLWETTMDPETRTIIKITLEDAEKADETFSILMGDKVQP RKEFIEKNAQFASNLDF" /locus_tag="LOCUS_2710" /gene="gyrB" /EC_number="5.6.2.2" /note="WP_000435982.1 DNA topoisomerase (ATP-hydrolyzing) subunit B (Bacillus cereus) [pid:57.2%, q_cov:97.7%, s_cov:98.9%, Eval:3.5e-210]" /note="MGA_331" CDS complement(2159..2428) /product="DUF370 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003359336.1" /transl_table=11 /codon_start=1 /translation="MFLHLGNDHMVYAKNIIAIFDIENASTSKDTREFLASAGKAKRVI TCSYELPKSFVVTLDNDFTELIYISAISPETLKKRLNNITQGKF" /locus_tag="LOCUS_2720" /note="WP_003359336.1 DUF370 domain-containing protein (Clostridium) [pid:45.0%, q_cov:89.9%, s_cov:90.8%, Eval:9.6e-09]" /note="MGA_332" CDS complement(2433..3545) /product="DNA replication/repair protein RecF" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003429303.1" /transl_table=11 /codon_start=1 /translation="MIIKNIKADGYKNLKAVDIQPDPKINVLYGDNAQGKTNLVEALWI LTGAKSFRGTKERDMVGFESEKAEVTVDFQDAVRDQKIELVLTKNSRERRILLNGLKQK SFSGLFGQLKCVVFTPEDLELSKGSPEIRRDFLDLCISQIRPSYSATVAKYENILLQRN TLLKNIFSGISQEDELDVWDVQLARLGAYISVLRYAYAQKLWQFAGGVYNDLCAGKEKL IIKYSSSIYDELDGRTDYAGEMAREYLEKLNESRRDDIRFGFTQRGIHRDDVYVYIDGL LAKDFGSQGQNRSAALSMKLGQAYILHEETRDMPVMLLDDVLSELDSKRREFILSKLKD MQVFITCCEPVKKLSGRYFEVSGGNIRKVR" /locus_tag="LOCUS_2730" /gene="recF" /note="WP_003429303.1 DNA replication/repair protein RecF (Clostridioides difficile) [pid:37.6%, q_cov:94.3%, s_cov:91.9%, Eval:1.6e-59]" /note="MGA_333" CDS complement(3542..3760) /product="S4 domain-containing protein YaaA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963332.1" /transl_table=11 /codon_start=1 /translation="MRFEEISIRDEFIKLDSLLKFAGFAETGGMAKDLIQMGKVKVNGE VCTMRGKKIRSGDKVTFDELDEGIIIK" /locus_tag="LOCUS_2740" /gene="yaaA" /note="WP_010963332.1 S4 domain-containing protein YaaA (Clostridium) [pid:58.3%, q_cov:83.3%, s_cov:88.2%, Eval:1.8e-10]" /note="MGA_334" misc_feature complement(3959..>4560) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010963331.1:DNA polymerase III subunit beta" /note="WP_010963331.1 DNA polymerase III subunit beta (Clostridium) [pid:37.2%, q_cov:98.5%, s_cov:53.0%, Eval:2.8e-33, partial hit]" /note="MGA_335" /locus_tag="LOCUS_2750" ORIGIN 1 gctcaacaaa gagcgccaaa ggaatgagga agaccgctgc acggatatat accgactttt 61 gcttataggt cttgtaatat aactcccagc cctcaagcca ttcgttttta tcaatgccgt 121 atttaacttt caacataaat atacctcggg tgttaaaaaa atcagaagtc aaggttggat 181 gcaaactggg cattcttctc gatgaattcc tttctgggct gaaccttgtc gcccatcaaa 241 attgagaagg tttcgtctgc cttttcggca tcctcaagtg tgatcttgat tattgttctg 301 gtttcggggt ccatggttgt ttcccaaagc tgaatggggt ccatttcacc caaaccttta 361 tatcgctgaa catccgactt tgcgccgtta tcgccgtaaa gctccttgat gtatacatct 421 cgctcttcat ccgagaatgc atagcgcacc tgcttgccct tttgaacctt gaaaagcggg 481 ggctgtgcaa tatatacatg tccctgttca attaaaggtc tcataaatct gaagaagaag 541 gtcaaaagaa gggtacggat atggcagccg tcgacgtcgg catcggccat gatgatgacc 601 ttgccatagc gaagcttagt aatatcaaaa tcctcgccga tagaggtgcc caaagctgtt 661 acaacagggg tcagcttgtc gtttccgtat accttgtcga ttcttgcctt ttcaacgttt 721 agcatcttgc cccaaagagc caaaattgcc tgataacgtc tgtctctgcc ttccttggcg 781 gagccgcccg cagagtcacc ctcgacgatg aaaatttcgg taaattcggg gtcacgttcg 841 gaacagtcag ccaatttacc cggcaaagat gccgattcaa gggcggtttt tcttctggtc 901 aaatctcttg cgcgctttgc ggcttctctt gctttttgag cctgcagcgc tttatcgaag 961 atggttcttg caacgtcggg gttttcctca aggaagttca tcagcttttc gttgaccagc 1021 gcttcaacaa agggtctgac ctcgggatta cccaaacgtc ccttggtctg gccttcaaat 1081 tcgcagttgg tgagctttac cgatacgatc gcaattatac cctcgcgcac atcatcttcc 1141 gacaaaactg tgccatcctt caaaaggttg aacttcttgc cgtaatcgtt aataaccttg 1201 cgcaaagctt ttttgaagcc tgtttcgtgg gtaccgccgt cgggggtgcg cacgttgttt 1261 gcaaaggaat aaaccaaatc gttatatgaa tcgttatatt ggaatgcaat ttcgcaggta 1321 taatcgtcct tagttccgcc gagatataca acgccatcgc tcaaggggtc gtgaccgcgc 1381 ttttcgcgct cgaaggttac aaactctctg ataccgccgt tgaagcaaag atcaacctct 1441 tcgtccaact cccctcttct gtcggtaaat acgattctga tgcctgcgtt gaggaaagcc 1501 tgctcgcgga gcatatccaa aagtgtctgg tagtcatatt cagttgactg ctcaaagata 1561 agcgggtcag ccttgaaggt tacaacagta cctgtcttat cagtctcgcc gacaattttg 1621 agctgttctt catatccgcc tctgtcaaag tgctggaaat ggatattttt gccgtcatag 1681 atggtaattt caagccattc ggacaaagcg ttaacaacag atgcaccaac accgtgaagt 1741 cctcccgcaa ctttatatcc gccgccgccg aatttaccgc ctgcgtgcaa aacggtatat 1801 acaacagttg ccgcagagat accttccttg gggtgaatac ccgtggggat tcctcggccg 1861 ttgtcggtta cccttacgat attgcctttc aaaagctcaa catcaattcg ggtgcaatat 1921 cccgccaagg cttcgtcgat cgagttagtg acgatctcat ataccaagtg gtgaagtccc 1981 ttggggcctg tcgaaccgat gtacataccc gggcgttttc ttaccgcctc aagaccttca 2041 agcacctgta tttccgatgc atcatagttg ttgtctttat caactgcagt aactgagttg 2101 ttgatctcgt taatatccaa aatctgtgtc ctccaaacta cttttagtat atctaaagtt 2161 aaaatttacc ttgtgtaata ttattcagcc tctttttcaa ggtttcgggg ctgattgcgc 2221 ttatatatat cagctcggtg aagtcgttat ccaatgtcac cacaaagctt ttcggcagct 2281 catatgaaca ggtgatgacc cttttcgctt taccggcaga cgccaaaaac tctctcgtat 2341 ctttcgatgt ggatgcgttt tcaatatcaa atatggcaat gatgtttttt gcatatacca 2401 tatggtcgtt tcccaaatgc aaaaacatac gcttacctaa cctttctgat gttgccgccc 2461 gacacttcaa aatatcttcc cgagagcttt ttgacaggct cgcaacaggt gataaatacc 2521 tgcatatcct ttagttttga aagaatgaat tccctacgct ttgaatcgag ctccgaaaga 2581 acatcatcca aaagcattac gggcatatcc cgagtttctt cgtgcaaaat atatgcctga 2641 ccaagcttca tcgacaatgc cgccgagcgg ttttgtcctt gagaaccgaa gtcctttgcc 2701 aaaagcccgt cgatatatac atatacatca tcgcgatgga ttccccgctg agtaaaaccg 2761 aagcggatgt catcgcggcg ggattcgtta agtttttcca aatattccct cgccatttcg 2821 cctgcatagt cggtcctgcc gtccagctcg tcataaatgc ttgaagaata cttaattatc 2881 agcttttcct tgcccgcgca aagatcatta tatactccgc cggcaaattg ccagagtttt 2941 tgagcgtaag catatctcaa aacgctgata tatgcaccca aacgcgccaa ctgaacatcc 3001 caaacatcca gctcatcctc ttggctgatt cccgagaaga tgtttttaag cagggtgttt 3061 cgctgaagca aaatgttttc atactttgca accgttgccg aatatgatgg cctgatctgc 3121 gaaatgcaaa ggtccaaaaa gtcgcgccga atttcggggc tgccttttga aagttccaag 3181 tcttcggggg taaataccac gcatttaagc tggccgaaca gtcccgaaaa gcttttttgc 3241 tttaagccgt tcaaaagtat ccgtcgctca cgggaatttt tggttaaaac aagctcgatc 3301 ttctggtcgc ggacggcatc ttgaaaatcc accgtgacct cggctttttc actctcaaac 3361 ccgaccatat cacgctcttt ggtgccacga aagctcttgg cacctgttaa tatccacaaa 3421 gcttcaacca aatttgtctt gccctgggcg ttatcgccat aaagcacatt tattttcggg 3481 tcgggctgaa tatcgacagc tttcaggttt ttataaccgt cggctttaat gtttttaatt 3541 atcattttat aataatgcct tcgtcaagct cgtcaaaagt caccttatcg cccgagcgga 3601 tcttctttcc gcgcatggtg cagacctcgc cgttaacttt gacttttccc atttgaatca 3661 gatcctttgc cataccgccg gtttcagcaa aacctgcaaa tttcagcaaa gaatcaagct 3721 tgatgaattc atctctgatt gatatttcct caaatctcat tgtaaaaaaa tcctttatct 3781 ttcaactttt aaactaagtt ttcaacaatt tagcgtgcta atgacgaaaa ttgatgatag 3841 ttaatatcag gtgagaagcg agacgtggct gtcacggcga tgcgccaacg gtgaattgcc 3901 ggcgacctgc cgtggcgagc ggtcaaaccc cacaaacgtt ggaaattatg gcggtcgctt 3961 actcctgctt aagtcttacc ggcaggacaa gataagtata ttcctcactc ttcataggaa 4021 ctatcttcat aggcagattt ccgccgttca tcaaaagctt gatcttctca tcgccgatga 4081 cctttaaagg atcaagcaaa tacttacagt tgaagccgat ctcaatcatc gggccggaaa 4141 tatcgcaagc gatttcatcg aatatcttgc cgattgatgt ctgacagctg attctgagca 4201 tacccttatc gaacaagcat cttacagggc tcttgattcg ctcatttata agaagcgatg 4261 cacgctccaa acagtcaata agctcacgtc tgggaatgat aacttctgtc accgactttt 4321 gaggaatcga acccttatag ttgtggaact cgccctccaa aagtcttgag aaaacggtgt 4381 aaccgttaaa gtcgaataca atatgcttct ttgaaacgat gatatcgcag ctaagctcgt 4441 cctcatcctt taaaagcttt gaaacctcgc ttaaggtctt tgcgggaatt acaaactttt 4501 tcgattcatc gtttttaatt gcttctgttc gaacagccaa tctgtaaccg tcaattgcaa // LOCUS sequence048 4506 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence048 VERSION sequence048 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4506 /mol_type="genomic DNA" /organism="" /note="sequence048" CDS complement(551..1105) /product="ribosome recycling factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965096.1" /transl_table=11 /codon_start=1 /translation="MKNVLNNSKEKMEKTLNVLASQFAAIRAGRANPAVLNPIQVDYYG TPTPIAQMAAVSVQDARILVIQPWDKTTLKSIEKAIQASDLGINPSNDGSVIRLVFPQL TEERRKELSKDIKKLGEESKVAVRSIRRDALDKVKTMKKNNEVTEDDVKNFEKDIQKLT DKYIENVDSAVAVKDKEIMSI" /locus_tag="LOCUS_2760" /gene="frr" /note="WP_010965096.1 ribosome recycling factor (Clostridium) [pid:56.0%, q_cov:100.0%, s_cov:99.5%, Eval:2.1e-58]" /note="MGA_337" CDS complement(1133..1375) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLKATMVDGVYDKDPHKYPDAVKYETLDLDDVIVKHLAVMDSTSA AMCKDNNIPIIVFNLARPDNIYDAVMGEKVGTLVK" /locus_tag="LOCUS_2770" /note="WP_011124676.1 UMP kinase (Prochlorococcus) [pid:57.0%, q_cov:98.8%, s_cov:33.3%, Eval:3.4e-22, partial hit]" /note="internal stop codon at [1448:1450](-)" /note="MGA_338" CDS complement(1448..1837) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKPAYKRVLLKLSGEALAGDKKTGLNYDVIADIGKSIKKCYDAGV QIGIVVGGGNFWRGRSSGAMDRTRADHIGMLATAMNALAVADVLESLGMEVRVQTAISM QQVAEPYIRNRAVRHLEKGRVVIFG" /locus_tag="LOCUS_2780" /note="WP_003430597.1 UMP kinase (Clostridioides) [pid:66.4%, q_cov:99.2%, s_cov:54.7%, Eval:4.6e-43, partial hit]" /note="internal stop codon at [1448:1450](-)" /note="MGA_339" CDS complement(1971..2954) /product="NAD(P)H-dependent glycerol-3-phosphate dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011016741.1" /transl_table=11 /codon_start=1 /translation="MLKIAILGSGGFGLALAAACDRLGHDVTVWSAFKDEIDSILRTGE LRAKLPGIQIPKTVHLTTDISCVSNKDIVLVGIPSKFVRSVCESCAEYINKDTIIVSTA KGLEDGSFKRMSEVISEVMPDNKVVVLTGPSHAEELGKGIPTAVSVACEDEDASIFIQK AFSDNVFRLYVNDDVIGCEVGGAVKNVIALCCGVSDGLGLGDNTKAAIMTRGLNEITRL GVAMGGKADTFFGLAGVGDLIVTCTSIHSRNYRAGVLIGQGMNPEEAVRKIGTVEGYAC ANATLELSEKFGIDMPITREINRILFEGRAPKDALDTLMMRPRGKE" /locus_tag="LOCUS_2790" /EC_number="1.1.1.94" /note="WP_011016741.1 NAD(P)H-dependent glycerol-3-phosphate dehydrogenase (Fusobacterium nucleatum) [pid:44.1%, q_cov:100.0%, s_cov:98.8%, Eval:1.1e-80]" /note="MGA_340" CDS complement(2970..3620) /product="glycerol-3-phosphate 1-O-acyltransferase PlsY" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583521.1" /transl_table=11 /codon_start=1 /translation="MIIVLIISYLIGSLNSAIIATFVVSGKDIRDYGSKNAGLTNVYRC FGKTAAGLTLLIDICKGFLVVLLARLLFISGWFSYQDYDVVTVCGLAAVFAILGHVFPI FYKFHGGKGILIAGVCMLAIDPVVFLCEFVLFVLLVAITRYISVGSIACCFGYPLFTLI WQSVSNAYFGGVYECILVHTLIALASGILCFWRHMPNVKRLMSHTESKFSFKK" /locus_tag="LOCUS_2800" /gene="plsY" /EC_number="2.3.1.15" /note="WP_012583521.1 glycerol-3-phosphate 1-O-acyltransferase PlsY (Dictyoglomus turgidum) [pid:37.4%, q_cov:99.1%, s_cov:96.5%, Eval:5.4e-28]" /note="MGA_341" misc_feature complement(3653..>4506) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011460200.1:ribosome biogenesis GTPase Der" /note="WP_011460200.1 ribosome biogenesis GTPase Der (Desulfitobacterium hafniense) [pid:55.0%, q_cov:98.9%, s_cov:63.3%, Eval:1.5e-88, partial hit]" /note="MGA_342" /locus_tag="LOCUS_2810" ORIGIN 1 ggctaagctc gcatatgcgt tttgcggcat ttgttatctc atcgcgtccg ccatagttga 61 ttgcaatgca tacacacaaa ccgtttctat cacttgatgc tttctcatat cgtgccattt 121 tctcttgtaa ggaatcgtca agtctggtgc ggtcaccaat gaaacatatg cggaagttat 181 tatccgaatt ggcttcaagc tcatcgagat actgcccgaa aaggcgcata agctcgctga 241 cctcttcttc cggacgcttc cagttttccg ttgaaaacgc atagaaggtc gcatattcaa 301 cacccagagc atccagctct ttaataagct ttttgagagt ctgggagcct tcgcggtggc 361 cggctgtgcg ctttaagccg cgcttttgcg cccaacgtcc gtttccgtcc attataaaag 421 caatatggcg aggaataatc agctcgccct ctgatttttt cttaaacaca aagttgcacc 481 ttcatataaa gatgagctct tccaataaca gatgtccata atcggataga gctcatcaat 541 cagtttaatg ttagatggac atgatctcct tgtccttgac agctacagca gaatcaacgt 601 tctcaatata cttgtcggtg agcttctgaa tgtccttttc aaagttctta acgtcgtcct 661 cggtgacttc gttgttcttc ttcattgtct tgaccttgtc aagagcatca cgcctgatgg 721 atcttacagc aaccttggat tcttcgccga gcttcttgat gtccttggaa agttccttac 781 ggcgttcctc ggtgagctga gggaatacaa gtctgattac tgaaccgtcg ttagaggggt 841 taatgcccaa gtcagatgcc tgaatagcct tttcgatgga cttgagggtt gtcttatccc 901 aaggctgaat gacgaggatt cttgcatcct gtacggaaac tgcagccatc tgagcaatgg 961 gtgtgggagt tccgtaatag tcaacctgaa tggggttaag aactgcaggg ttagctctgc 1021 cggctctgat agcggcaaac tgagaagcca aaacgttcag ggtcttttcc attttttcct 1081 tggagttgtt aagtacgttt ttcataatat ctattccttt caaattcttg atttatttta 1141 caagtgtgcc gaccttttcg cccattacag catcatagat attgtcgggg cgcgcaaggt 1201 tgaatacgat aatcgggatg ttattatcct tgcacattgc ggcagaggtg ctgtccataa 1261 ctgcaaggtg cttaacaata acgtcgtcca gatcaagggt ctcatacttg acagcatcgg 1321 gatatttgtg aggatccttg tcatatacac cgtcaaccat agttgccttg agcattacgt 1381 cagcttcaat ttcagcagct cttaaagatg aagcggtgtc ggttgagaag aacggattac 1441 ctgttcctca tccgaagatt acgaccctgc ccttttcaag gtgacgaaca gcacggttgc 1501 gaatatacgg ttcagcaacc tgctgcattg aaattgccgt ctgaactctt acctccatac 1561 ctaaagattc aagcacatca gcaacagcca aagcgttcat tgcggtagcg agcataccga 1621 tgtggtcagc tctggttctg tccatagctc cgcttgagcg gcctctccaa aagtttccgc 1681 ctccaacgac aataccgatc tgaactccgg catcgtagca ctttttgatg ctcttgccga 1741 tatcggcgat aacatcgtag ttaaggcctg tttttttgtc accggcgaga gcttcgccgc 1801 tgagcttaag cagaactctc ttataagcag gtttcatatg acatcctcca ataacattat 1861 tcatatttat tctatattat aataccttaa aaagcaaaaa aagtaaatac acttactgaa 1921 tttttcacat aaaaattcct cgaataatac aattatccga ggaatatatc ttattctttt 1981 ccgcgagggc gcatcataag cgtatctaaa gcatccttcg gtgctcttcc ctcaaacaaa 2041 atcctgttaa tttcgcgggt tatgggcata tcaatgccga acttttcgga aagctcaagg 2101 gttgcgtttg cacaagcgta gccttcaacc gtacctatct ttctgactgc ttcttcgggg 2161 ttcatgccct gtccgatcaa aacacctgca cggtagttgc gcgagtgaat gctggtgcag 2221 gtaacgatta aatcgccaac accggcaaga ccaaagaagg tatcagcttt gccacccatt 2281 gcaacaccca agcgagtgat ctcgtttaag cctcttgtca taattgcggc tttggtgttg 2341 tcgcctaagc ctaagccgtc gcttacgcca cagcaaagcg caattacatt tttaactgcg 2401 ccgccgactt cgcaaccaat gacatcgtcg ttgacataca gacggaacac gttgtcggaa 2461 aaagccttct ggatgaatat tgaagcatct tcgtcctcgc aagcaacgga aaccgcagtc 2521 ggtattccct ttccgagctc ttcagcgtgt gaaggaccgg taagcacaac aactttattg 2581 tcgggcataa cctcagagat aacttcgctc attctcttga aacttccatc ctcaagtccc 2641 ttggcggtac tgacaatgat agtgtctttg ttaatatatt cagcacagga ttcgcaaacc 2701 gaacgaacaa actttgaagg aattccaacc aaaacaatat ccttattgct tacgcaggaa 2761 atatccgttg tcagatggac agtctttgga atctgaattc ccggaagctt ggctcttaac 2821 tcgcctgtgc gaagaataga gtcaatctca tctttaaagg cgctccagac agttacgtcg 2881 tgtcccaatc tgtcacaagc ggcagcaaga gcaagtccaa atccgcccga gccaagaatt 2941 gcaattttta acacactgca ttttcctttc tatttcttaa aagaaaactt tgattccgta 3001 tggctcataa gccttttaac gttaggcata tggcgccaga agcaaagaat tcccgaagca 3061 agcgcaataa gcgtatgaac taaaatgcac tcatatactc cgccgaagta tgcgtttgaa 3121 acactctgcc aaataagcgt aaacaaaggg tacccgaaac agcaggcgat tgatccgacg 3181 gagatatatc ttgttattgc aacaagcaaa acgaacaaga caaattcgca caggaataca 3241 acagggtcaa ttgcaagcat acatacacct gcaattaaaa tgccctttcc gccgtgaaat 3301 ttatagaata tcgggaaaac gtggcccaat attgcaaata ccgctgccaa accgcaaacg 3361 gtcacaacat cataatcctg gtatgaaaac cagccgctga tgaacaataa tcttgcaagc 3421 aaaacgacca aaaagccctt acaaatatca atcagcagag tcaaacctgc ggcagttttg 3481 ccaaaacagc ggtaaacgtt ggtgagtccc gcattcttgc ttccatagtc acgaatatcc 3541 ttacccgaaa caacaaatgt tgcaattatc gccgagttaa gacttccgat caaatatgaa 3601 attattagga caattatcaa cgcgagataa aacgtaaata tgcatccttt cgttattttg 3661 tgtcttgatt atctctttct cttacaacaa acctcacagg tgtgccgtca agtccgccga 3721 aaacttcacg aatctgattt tcaagatatc tcttatatga gaagtggaac agatccattg 3781 agtttacaaa ggttacaaat gtgggcggat tggttgtagg ctgagtcata tagtagatct 3841 tcaagcgtct gcccttatcc gacgggggct gaacacggtt aacagcatat gccagaatat 3901 cgttaagctt acctgttgaa atacgcatag agttattagc gtatacaagg tttacaagct 3961 cgaaaatctt atccaaacgc tgacctgtct ttgcggaaac aaagatgaag ggaacataat 4021 ccatgaaacc gagattttcc ttcaaatcct tggtaaaatc gttcatggtg ttgttatcct 4081 tctcgattgc atcccacttg ttgacacaaa cgatacagcc cttgccctgc tcgtgggcat 4141 atcccgcaac cttggagtcc tggtcggtga aaccaacaga agcatcaatt acgattattg 4201 caacatccgc tctgtcaaca gccatatatg agcgaagaac gctgtaatgc tcaatgctct 4261 ccaaaatctt ggattttctt ctgattccgg cagtgtcgat gaaaacatag cttccgtgct 4321 cgttttcaat gactgtgtcg gtggcatctc gggtagtgcc cgcaatatcg gaaacgatta 4381 cgcgctcttc ccctgcgata gcattgatga ttgaagattt tccgacatta ggcttgccga 4441 tgatcgcaac cttaatgtga tcggcttcct cttcgtgttc aacatcttca ggaaggctct 4501 tgacaa // LOCUS sequence049 4490 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence049 VERSION sequence049 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4490 /mol_type="genomic DNA" /organism="" /note="sequence049" CDS 132..1487 /product="tRNA uridine-5-carboxymethylaminomethyl(34) synthesis GTPase MnmE" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966994.1" /transl_table=11 /codon_start=1 /translation="MSTICALSTPNAVGGIAVIRISGSRAIEIADGIFVPFGSTPVREM AGHTCAYGKIVDGDKTVDDVLLTVFRAPKSYTGEDTVEISCHGGVYVSKKIIRLLLSLG CKPANAGEFTKRAFLNGKLSLTQAEGVADIISAQGEASLQSANLMREGKLYKTARGVCD RLINILGSLAAWTDYPDEDIPETDNVSLGRTLSECESVLNKLLRDYDTGRILRDGIDTA IVGKPNVGKSTLMNMLLGYERSIVTDIAGTTRDVVEESVRLGEVVLRLSDTAGIRNSSD TVESIGVGLAKKKLDEARLVLAVFDGSRMLDDEDRELLSLIENRRHIVIINKSDLEQKL DLEYNNYKNILTVSAKEGIGLDSLKEKIYDMFKLDTLGDSAQIFANERQKLCCEQAYEA VLQAKTALLSGETLDAVTICVDRAASALLELTGEKTTEAVVDDVFSRFCVGK" /locus_tag="LOCUS_2820" /gene="mnmE" /EC_number="3.6.-.-" /note="WP_010966994.1 tRNA uridine-5-carboxymethylaminomethyl(34) synthesis GTPase MnmE (Clostridium) [pid:39.6%, q_cov:99.6%, s_cov:98.9%, Eval:3.4e-94]" /note="MGA_344" CDS 1695..3602 /product="tRNA uridine-5-carboxymethylaminomethyl(34) synthesis enzyme MnmG" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048454.1" /transl_table=11 /codon_start=1 /translation="MSKTNFLGQFDIAVIGAGHAGVEAALASARLGFKTALFTITLDAI ANMPCNPSIGGTAKGHLVREIDALGGEMAKAADATFLQSRVLNLGKGPAVHSLRVQSDR TKYHTYMKKVCEAQENLEIKQAEIVDILLDDNGAVCGVVTKLGTKYECRAAIISTGTYL NGVIHVGEVSYESGPDATLPAKGLSERLENLGISLRRFKTGTPARVHKRSIDFSKLERQ DGDEKILPMSYETKGDLANTVSCYISYTNENTHKVILDNLHRSPLYSGRIEGVGPRYCP SIEDKIVRFSDKPRHQLFIEPMGLDTDEYYLQGMSSSLPEEVQLEFLRTIEGLENVEIM RNAYAIEYDCCDSLELLPTLEFKKISGLYGAGQFNGTSGYEEAAAQGLIAGINAAMKLS GKEQIVLDRATSYIGTLIDDLVTKGVMDPYRMMTSRSEYRLLLREDNADERLTEIGHRV GLISDERYEATLEKYRLVGEEVERLEHANIGPSAELNKYLEDCGTEGITNGSTLAKLIR RPQVTYDGLAFIDINRPVLPDDVKEQAELRIKYDGYIKIQLEQVEQMRKLEAKLLPDDA DYASIHGLRLEAREKLAKIKPRSVGQASRISGVNPADVSVLLIWLEQQKRRENFEHTSD " /locus_tag="LOCUS_2830" /gene="mnmG" /note="WP_012048454.1 tRNA uridine-5-carboxymethylaminomethyl(34) synthesis enzyme MnmG (Clostridium botulinum) [pid:58.8%, q_cov:98.0%, s_cov:99.2%, Eval:3.7e-209]" /note="MGA_345" CDS 3583..4290 /product="16S rRNA (guanine(527)-N(7))-methyltransferase RsmG" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966992.1" /transl_table=11 /codon_start=1 /translation="MNILPIDETRNLFGNIALSDENYARFSRYADLLVEWNEKINLTAI TDPQGITEKHFLDSILPYEWVNLPENASVIDVGTGAGFPGIPLKIMRDDIRLTLLDSLN KRINFLNTVCGELNITADCIHGRAEDMGTTQLREKFDIATARAVARLSVLCEYCLPLVK VGGTFVALKGSSGVDELKDAENAIKKLGGEPVCAREYNLPCGDGRTLVIIKKVAPTPKG YPRTKGKMNKNPL" /locus_tag="LOCUS_2840" /gene="rsmG" /EC_number="2.1.1.170" /note="WP_010966992.1 16S rRNA (guanine(527)-N(7))-methyltransferase RsmG (Clostridium) [pid:50.9%, q_cov:93.6%, s_cov:93.3%, Eval:1.7e-54]" /note="MGA_346" ORIGIN 1 atcatcactg tctttgggta ggcaaaatga ttgacatttg tgagggcgga cgtgtagtcg 61 gaactgctga aattacaaag atttttaatc ctgttttgga aaaataggat tattcgaaag 121 gtcgtgaaag aatgtcaacg atatgtgcat tatcaactcc gaacgcggtg ggcggaatcg 181 ctgttatccg cataagcggg tcacgtgcaa ttgaaattgc cgatggcatt tttgtgccct 241 ttggttcaac acccgtccga gaaatggcgg gacatacctg tgcatacggc aagatcgtcg 301 atggcgataa gaccgttgac gacgttttgc tgactgtttt tcgcgcccca aaaagctata 361 cgggcgagga caccgttgaa atatcctgcc acggcggagt ttatgtttca aagaaaatta 421 tccgcttgtt gttatctttg ggctgcaaac ctgcaaatgc aggcgaattt accaagcgcg 481 catttttaaa cggcaagctg agtttgacac aggcagaggg cgttgcggac attatttccg 541 ctcagggcga ggcttctctt caatcggcaa atttgatgcg tgagggcaag ctatataaaa 601 ccgcgagggg agtttgcgac cgacttatta acattttagg ctcactggct gcatggacag 661 actatcccga tgaggatatt cccgaaacgg ataatgtttc tctgggacgg acactttccg 721 agtgtgagag tgtgctgaat aagcttcttc gtgactatga cacaggcaga attttgcgcg 781 atggaattga caccgcaatc gtcggcaagc cgaatgtggg caagtcgacg cttatgaata 841 tgctcctcgg atatgagcga tcaatcgtca ccgacattgc gggcactacc cgagatgtgg 901 ttgaggaatc ggtaagattg ggcgaggttg ttttgcggct gagcgatacc gcaggtatca 961 gaaattcttc tgatacggtt gaatccatcg gcgttggtct ggcaaagaaa aagctcgacg 1021 aagcccgatt ggttttggca gtattcgatg gcagccgtat gctggacgat gaggacaggg 1081 agcttctttc gctgatcgaa aaccgcaggc atattgtcat cataaacaag tcggatctgg 1141 aacaaaagtt agacttagag tataataatt ataagaatat actgacagta tctgcaaaag 1201 agggcatcgg gcttgacagc ctgaaggaaa aaatatacga tatgtttaag ctggatactc 1261 ttggcgactc ggcacagatt tttgccaatg agcgtcagaa gctctgctgc gaacaggcat 1321 atgaagctgt tttgcaagca aagaccgctt tgctgtcggg cgaaacattg gatgctgtga 1381 cgatatgtgt tgacagggcg gcgtctgctt tgcttgagtt gacaggcgaa aagaccaccg 1441 aggctgtggt ggatgatgtg ttcagccgat tttgtgttgg aaaataaaca gggtgcgttg 1501 atgcgaaaac ccgcaggggg cgcgaagcgc ccccatcccc gtcaaggctc acgccttgac 1561 ggggcgacaa ttgccatctt gcaaagatgg cgattgtcag cgggttttcg cgcaccaagc 1621 gccgctttta agcaaactaa tagtataaac attactaaat tttacaaatt gtaatcaaaa 1681 atggagtaaa aactatgtcc aagaccaatt ttttaggaca atttgatatc gcagtaatcg 1741 gtgcgggaca cgcaggtgtt gaagcggcgc tggcgtcagc acgcctcggt ttcaaaactg 1801 cgctcttcac catcaccctt gatgccattg caaatatgcc ctgcaaccct tcgatcggcg 1861 gcacggcaaa gggacacctt gtccgcgaaa ttgatgccct gggcggagag atggcaaaag 1921 cggcggatgc aaccttcctg caatcccgtg ttctcaattt gggcaaaggc cctgcggtgc 1981 attctttgcg tgtgcagtcg gacagaacaa aatatcatac ctatatgaaa aaagtctgtg 2041 aagcgcagga aaaccttgaa attaaacagg ctgaaattgt tgatattttg ctggatgata 2101 acggtgctgt ctgcggagtt gtcaccaagc tgggcacaaa gtatgagtgt cgcgctgcaa 2161 tcatttcaac cggaacttac ctcaacggtg ttattcacgt gggcgaggtt tcatatgaaa 2221 gcgggccgga tgcaactctt cccgcaaagg gactcagcga gcgacttgaa aatttgggta 2281 tctcgttgcg ccgattcaag accggcactc ccgcaagagt tcacaaaaga agcatcgact 2341 tttcaaaact tgaacgacag gacggcgacg aaaagatcct tccgatgagt tatgaaacca 2401 agggagattt ggctaacacc gtcagctgtt atatctcata taccaacgaa aatacccaca 2461 aggtcatcct tgataatttg catcgctcgc ccttatattc gggtaggatc gagggtgtgg 2521 ggccgagata ctgtccgtct attgaggaca aaatcgtgcg cttttccgat aagccccgcc 2581 accaattatt cattgaacct atgggtcttg atactgatga atactactta cagggtatgt 2641 catcaagttt gcctgaagag gttcagcttg aatttttgcg gactattgag ggcttggaaa 2701 atgttgaaat aatgcgaaac gcatatgcaa ttgaatatga ctgctgcgac tcccttgagc 2761 ttttgcctac ccttgagttc aagaagattt cgggacttta cggcgcgggt cagtttaacg 2821 gcacctcggg atatgaagaa gccgccgcgc agggattaat tgcaggtatc aacgcggcaa 2881 tgaaactttc gggcaaagaa cagatagttc tggacagagc aacttcatat atcggaactc 2941 ttatcgacga ccttgtgaca aagggagtta tggaccctta ccgaatgatg acatcgcgaa 3001 gcgaatatcg cttgctattg cgtgaggaca atgccgatga gcgtttgacc gagatcggac 3061 acagggtcgg acttataagc gatgagagat atgaagcgac ccttgaaaag taccgccttg 3121 tcggtgaaga ggttgaacga cttgagcacg caaacatcgg tccgtctgcg gaactgaata 3181 aatatttgga agactgcggc accgaaggca tcaccaacgg ctcgacactt gcaaagctca 3241 tccgccgtcc gcaggtgaca tatgatgggc tcgcgtttat cgacataaat cgacctgttt 3301 tgccggatga tgttaaagaa caggcagaac tgcgaattaa atatgacgga tacattaaaa 3361 ttcagctgga acaggtggag cagatgcgta agctcgaagc aaagcttctg ccagatgatg 3421 ccgactatgc atctattcac ggattgagat tggaagcccg cgaaaagctt gcaaaaatca 3481 agccgagaag tgtcggacag gcatcccgaa tttcgggtgt taaccctgcc gatgtatctg 3541 ttttgctgat ttggcttgaa cagcaaaaga ggagggaaaa ttttgaacat acttccgatt 3601 gatgaaacaa gaaacctctt tggaaatatc gcgctgagcg acgaaaacta tgctcgcttt 3661 tcccgttatg ccgatttgct ggtggaatgg aacgaaaaaa tcaaccttac agccataact 3721 gatccccaag gcataaccga aaagcacttt ttggacagca ttttgcccta tgaatgggtg 3781 aatctgccgg aaaatgcatc ggtcatcgac gttggaacag gcgcaggctt cccgggaatc 3841 cctctgaaga taatgagaga tgacattcgc ttgacacttt tggatagcct taacaagcga 3901 atcaactttt tgaacaccgt ttgcggtgaa cttaatatca ccgccgattg cattcacggc 3961 agagcggagg atatgggtac gactcagctt cgggagaagt ttgacattgc aactgcaaga 4021 gccgttgcgc gcttaagcgt tttgtgcgaa tattgcctgc ctttggttaa ggtcggaggg 4081 acgtttgtgg cactcaaggg ttcatcgggc gttgacgagc ttaaagatgc cgaaaatgcg 4141 atcaaaaaac ttggtggaga gccggtatgt gcaagggaat ataatcttcc ttgcggtgac 4201 ggcagaacct tagtcatcat taaaaaggtt gcacccaccc ccaagggcta ccccagaacc 4261 aagggaaaga tgaacaaaaa tcccctctaa ttttccttaa aacagcatat taacctatcg 4321 gatactgcct gattttggcg gtatccgttt tattttgcaa caaacattaa agaaatgtcg 4381 gaaaattata atagaatcga catccgtttg atgataccat caatataaag gatgtgattt 4441 aaacatggca gttaaaacaa gaatttttgc acccaagcga gaaaaggtcg // LOCUS sequence050 4478 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence050 VERSION sequence050 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4478 /mol_type="genomic DNA" /organism="" /note="sequence050" misc_feature <1..1109 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_004454972.1:pitrilysin family protein" /note="WP_004454972.1 pitrilysin family protein (Clostridioides difficile) [pid:28.6%, q_cov:96.5%, s_cov:84.8%, Eval:1.7e-40]" /note="MGA_347" /locus_tag="LOCUS_2850" CDS 1099..2376 /product="pitrilysin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861628.1" /transl_table=11 /codon_start=1 /translation="MATEKRRICDPKTVDSYVHIRHASGLDIFVMEMPGFTGSYAAFGT HYGSVHTDFISPSGEKARDPMGIAHFLEHKLFENEECDAYELYAETGANANAYTSFDKT VYLFECTDNFNDSLKILLESVTSPYFTDRSVEKEQGIIAQEILMCEDNPFRRVYFNLLK AAYHTHPVREEIAGTVDSISHIDKDTLYRAHEAFYDLSNMILCCSGNCNIDSIIAVADE VLKPAKNTAPKLVNCDEPSGVYQKRITEKMAVGLPMFAIGYKADPDEGVDLCRKEYISA FLLDMIFGQTSRFYKENTENGLINSRFETETNSGDGFLINIISGESKDPDRVLELMNLE IGRIKREGLDQGEFDALKKTAYGSAIRGFNNVAACSSVMLESHMRGYDAYEPSRIIASI TLDEVLSSIDDLLDTERTCISVITGE" /locus_tag="LOCUS_2860" /note="WP_011861628.1 pitrilysin family protein (Clostridioides difficile) [pid:38.7%, q_cov:93.9%, s_cov:94.9%, Eval:7.6e-72]" /note="MGA_348" CDS 2412..3605 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTLAMTADFVKEMLASEGGVLYFPNCDWLFPNGLKIDNVMVTIGN LDIYWYGFLIALGMLLAMIYGYRKLEKWGLEPDRFTDTALVGLIGGIIGARVYYVVFSI DKYMSVDGTLNLASVFAIRDGGLAIYGGIIGALIFGCTMAKIRKVRLAPLLDLVGLGLL IGQTLGRWGNFFNQEAFGAKTTLPWGMTSKSILEYLYYNVYYPDAVSVITNRALDMVAH PCFLYESLWCLLGFILLHIYSKHRKFDGEIFIMYIGWYGLGRFWIEGLRTDSLYIPGTE FRVSQVLAGTCVLFAIALYLIFRANVKKNADYKLYVDTDESKELLEMYYAKQKKSKNKT VNADDACETILDPSVMDDTPEEDALAEDAVDEPAEESVEESVEETAEEATEEEPENE" /locus_tag="LOCUS_2870" /note="WP_012257228.1 prolipoprotein diacylglyceryl transferase (Chloroflexus aurantiacus) [pid:38.2%, q_cov:67.8%, s_cov:95.0%, Eval:3.1e-43, partial hit]" /note="MGA_349" CDS 3598..4449 /product="bifunctional methylenetetrahydrofolate dehydrogenase/methenyltetrahydrofolate cyclohydrolase FolD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393025.1" /transl_table=11 /codon_start=1 /translation="MSNILNGKEISANVRERLKLETAELFEKTGKRPGLAVIIVGDDPA SRIYVNNKKKACAEIGFASWEYALPAETTEAELLELIEKLNGDDEVHGILCQLPLPKHL DEKTVINAIDPKKDVDAFHPVNVGKIMIGDYDFLPCTPAGCMELIHSAEISVSGKKCVV VGRSNIVGKPMSMLLLHENGTVTTCHSRTKDLKAECLAADILVVATGKAKMITGDMVKE GAVVIDVGMDRDENGKLCGDVDFDSVAPKALYITPVPGGVGPMTIAMLMSNTLTAFKLT LK" /locus_tag="LOCUS_2880" /gene="folD" /EC_number="1.5.1.5; 3.5.4.9" /note="WP_011393025.1 bifunctional methylenetetrahydrofolate dehydrogenase/methenyltetrahydrofolate cyclohydrolase FolD (Moorella thermoacetica) [pid:60.5%, q_cov:97.5%, s_cov:98.2%, Eval:7.8e-90]" /note="MGA_350" ORIGIN 1 acgattccaa cgacaagctt tcccgccgac tcaacgagct ctacggtgct tcgctttcgg 61 gcgtatgttt gcaatgctct gatatgcttg agcttctgtt ctcggtcgat tttatcttag 121 ataaatacgc ttatgacggc gaatcggttg cattcgactg tgcatctctt ctcggcttca 181 gcctgtttga tcccttggct tcaaacggcg agtttgaccc gacagaattt gaaatccgcc 241 gccgcgacct gctggatgcc atagattccg aaatcaacga caaagcatcc tatgcgctta 301 cccgctcctt tgaaacggta taccgcggtg agacccgtgc caagcgccac tatggcacac 361 gtgaggccgt tgccgccctt actcctaagc agacttatga agtatatctt cggatgctta 421 aagaagcatc tgtccatatc accgtttgtg caggtgagga tattccctcg gtcaacaaat 481 accttgagga tgtttttagc gcccgcgagc gcggcgaagt ttcgcttcct tcgtattatt 541 catacagccc ctgcaaatcc gaacccgaat ttgtcagtga atatatggat atcaagcaag 601 cgaatctcgt aatggctttc aaaaccgata tacacgatta ctatatcaac cgtgttttaa 661 gtgctttgta cggcgaatcg cccatttcaa agctttttat gaacgtgcgc gagcgtttaa 721 gcctttgcta ttattgccag agtgtctatt ccgccaccaa ggcaaccatg ctcgttttaa 781 gcgcggtaga taacattaat gttcaaaaga ctgccgacga agtcacccgc cagctttcgc 841 ttatcgcctc gggcgagttc tcggacgatg acctcgcttt aaccaagcta tatcttgttt 901 ctttgattcg tgcaaaatat gaccgcaagg gcgcactcgc cgaatggttc tttgctgaag 961 agctttcggg aagcaacctt acaatcgagc aagcaattga taaaataaac tcggtcacac 1021 gcgaggatat tgtttccgcc gcgaagtcat attctcttga caccctgttt gttctttcaa 1081 acggagagga gataggaaat ggcaactgaa aaacgacgca tttgcgaccc caaaacagtg 1141 gatagctacg tgcatatccg acacgcctcg ggacttgata ttttcgttat ggagatgccc 1201 ggtttcaccg ggtcatacgc cgccttcggc acccattacg gctctgttca caccgatttt 1261 atctccccaa gcggcgaaaa agcccgcgac cccatgggca ttgcccactt tttggagcac 1321 aagctcttcg aaaacgagga atgcgatgca tatgagctat atgccgaaac aggcgccaac 1381 gcaaatgcct atacctcgtt cgataaaacc gtctacctct ttgaatgtac cgacaacttc 1441 aacgattcgc tgaaaatttt gcttgaaagt gtcacaagcc catatttcac cgaccgatcg 1501 gttgaaaagg agcagggaat cattgcacaa gagattttga tgtgtgagga taatcctttc 1561 cgccgagtat atttcaacct tttaaaggcg gcataccaca ctcaccccgt ccgcgaggag 1621 attgcaggca cagtcgattc gatatcacat atcgataagg acaccctata tcgcgcacac 1681 gaagcgtttt acgatctttc aaatatgatt ctttgttgct cgggcaactg caacattgac 1741 agcatcatcg ccgttgccga cgaggtatta aaacccgcaa agaacaccgc ccccaagctt 1801 gttaattgcg acgaaccaag tggagtatat cagaagcgca taaccgaaaa aatggctgtg 1861 ggtttgccga tgttcgccat cggctataaa gctgaccccg acgaaggcgt tgacctttgc 1921 cgaaaggaat atatcagcgc atttttgctg gatatgatat tcggccagac ctcgcggttt 1981 tataaagaga acaccgagaa cggtcttatc aattcccgat ttgaaacaga aaccaactcg 2041 ggcgacggct ttttaatcaa catcataagc ggcgaatcaa aagaccccga cagggtgctt 2101 gagcttatga atcttgaaat cgggcgcatc aagcgcgagg ggcttgacca aggcgagttt 2161 gatgcattga aaaagaccgc ctatggctcg gcaattcgcg gttttaacaa cgttgccgcc 2221 tgctcatcgg taatgcttga atctcatatg cggggctatg atgcatatga accctcgcga 2281 ataatcgctt caatcaccct tgatgaggta ctctcatcaa ttgatgacct gcttgacacc 2341 gagcgcacgt gtatctcggt aataacaggc gaataaacaa cagttaattc aaccgaaagg 2401 atgacaaaat tatgacatta gcaatgaccg ctgatttcgt aaaggaaatg ctcgcatccg 2461 agggcggagt gctctacttc cccaactgcg attggctttt ccccaacgga cttaaaatcg 2521 acaatgtaat ggtgaccatc ggaaacctcg atatctattg gtacggtttc ttaattgccc 2581 tcggtatgct tcttgcaatg atttacggct accgtaagct tgaaaagtgg ggacttgagc 2641 ccgaccgctt caccgataca gcccttgttg gcttgatcgg cggtattatt ggcgcccgtg 2701 tgtactatgt cgtattcagt atcgacaagt atatgtctgt tgacggcacc cttaaccttg 2761 catctgtatt tgcgatccgc gacggcggcc ttgcaatata tggcggtatc atcggcgcac 2821 tgatctttgg ttgcacaatg gcgaaaatca gaaaagttcg cctcgcccct cttctcgacc 2881 tcgttggctt gggtctattg atcggtcaga ccttgggacg ttggggcaac ttcttcaacc 2941 aggaagcttt cggcgcaaag accactcttc cttggggtat gacctcgaaa tcgatccttg 3001 agtatcttta ctataatgtt tactatcccg atgcagtttc tgtcatcacc aacagagcgc 3061 tggatatggt tgcgcatccc tgcttcttgt atgaatccct ctggtgcctt ttgggcttca 3121 ttttgttgca catctattca aagcaccgca agtttgacgg tgagatattc attatgtaca 3181 ttggatggta cggtttaggc agattctgga tcgaaggcct cagaaccgac tccctctaca 3241 ttcccggcac cgaattcaga gtatctcagg ttttggcagg cacctgcgtg ctgtttgcta 3301 tcgcactcta tttaatcttc cgtgcaaacg tcaagaagaa tgccgactat aagctttacg 3361 ttgacaccga cgagtcgaag gagcttctgg agatgtacta cgcaaagcag aagaagtcga 3421 agaataagac tgtaaatgct gatgatgctt gcgaaaccat tttggaccct tccgttatgg 3481 atgacacgcc cgaagaagac gctctcgcag aagatgcagt agatgaacct gcagaagaat 3541 cggttgagga atctgtagaa gaaactgccg aagaagcaac cgaggaggaa cccgaaaatg 3601 agtaatatcc tcaacggaaa agagatttca gcaaatgtcc gcgagcgttt aaagcttgaa 3661 accgccgagc tttttgaaaa aacaggcaag cgccccggac ttgctgtaat tatcgttggt 3721 gatgaccctg catcccgtat ttatgtaaac aacaaaaaga aagcctgcgc cgagatcggc 3781 tttgcttctt gggaatatgc gcttcctgcc gaaaccaccg aagctgagct tctcgaattg 3841 atagagaaat tgaatggcga tgacgaagtt cacggcattt tgtgccagct tcctctgccc 3901 aagcatcttg atgaaaagac tgtcatcaat gctattgacc ccaaaaagga tgtggatgct 3961 ttccaccctg tcaatgtcgg caagatcatg ataggggatt atgacttcct gccttgcacc 4021 cccgcaggct gtatggagct tatccactca gcagaaatca gcgtttcagg taaaaagtgc 4081 gtcgttgtcg gcagatcaaa tatcgtcggc aagccgatgt caatgcttct cttgcacgaa 4141 aacggcaccg tcaccacctg ccattcccgc actaaggact tgaaggctga gtgcttagcg 4201 gctgatatcc tcgttgttgc aacaggcaag gcgaagatga tcacaggcga tatggttaaa 4261 gaaggcgccg ttgtaataga tgtcggtatg gacagagatg aaaacggcaa gctttgcggc 4321 gatgtcgact ttgactccgt tgcacccaag gcattatata tcacccctgt tcccggcggt 4381 gttggtccaa tgaccatcgc aatgctgatg tccaatacac ttacagcgtt taagcttaca 4441 ttgaaatgat caaaacccct gacagagaac tgtcaggg // LOCUS sequence051 4478 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence051 VERSION sequence051 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4478 /mol_type="genomic DNA" /organism="" /note="sequence051" CDS complement(1251..3851) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKKLTSILALVLSLVMVLSTFAACGTPNNDNSDVQNPGVENPVE GDVVPATFKQAEYNNTTTTMPSNWNEFTYADNNDTQIMSYIGSSFFSYDYKFENDEKYN ADGSINKDGIVPGAYTTNYDAATKLEDVTATVDAKWGYTDEQKAEGGYAWKITLRDDLK WDDGTPIVAADFVYSMQQLLDPDFMNFRANTYYDTLMVKNSKIYFFQNEEGTYETVASK GYATNQAAIDAGETIYFNAWAMYGAEGYPDENGNLCPEWLAYNDTTVYTGEYNGEPDPV SGADLYAAYSTTYSEVGAGYGYDATIYVENANRDVAWDSVGIYSIDEENAIVICLDKAY SFLTEDGDLSVWAPYYMSGLPLVKKDLYESCKIAPADGATLWTSNYNSSLETTASWGPY KLSEFEAGSHYKLVKNENWHGWNMEEYKNQYNITAINCRKVEEFATKWMGFLNGTYDDA SLQTENVGEYLDSKYVYFTSTSTGTFGMQLYSNLEVLKESENNNGILAIQEFRHALNLG LNRSDIVEKIWPGSAVPCFGLLNVAYYYDIENSPELEDGGQYRNTALAKEGILRAYGYT EGADGKWSSGDLTGLDLDEAYETLTGYNPTVAKEKMAEAIAILTADPEKYGYDSSKNIT LVYGSSVDNDKQRFRADYLQGVIDGLTEGTALADKIDVVFDASAGAQWAEAFRTGATQI GFGYGFSGNAFNPFDIVGAFVNPDDDLNYHMYWDTSAIDLTLTMPEGDYEGAGETITMS VQNWYFCLNGLAASENQAKTYNWGAGYAPTEARLMILSALEELTIKESRSVMLIADGGG SFLGAKFSYFSEDEHTFMGFGGLRYIEVNYTDAEWAEFVAANNNDLSAEYKKSE" /locus_tag="LOCUS_2890" /note="MGA_352" ORIGIN 1 agaatcctga cagcaacata aagaaatcgt agtcctggaa tgtaatagag tttagataaa 61 gtccgcccac gccattgata ccgaacatct tctcgatgat aagggagccg gaaagaaccg 121 agatgaactc actgaggatc gaggggaaga tgactaccat tgagttgcgc attgcgtggc 181 ggtagatagc ctgttttttg gtaagacctt tggttcttgc caaaagcata aattcaccgg 241 tcaaaacttc tgaaagctca gcacgggtga aacgcgcata acctgcgatt gagccaagac 301 aaagggcaaa tactgcaggg agcattgaat ggaatacagg ccaggtgaaa tattcgtcgc 361 tcgttgacat ggtgagcggg aaccagccga gcttgaagca aaatacatac tgaagcataa 421 gcgcaagtac gattgacgga acggatatca ataggataat tatgatattg atgacctggt 481 cctgccactt gtttttcttg agcgcggcca aaatacctaa gccaagaccg atcggtacac 541 cgataaggct ggaatagata ttgattaaaa ttgtcggtgg gagatgatta acgaatactt 601 tccaaatgtt catattgagg tattcgccgt aggtggtaac aataccgaaa tcggcttttg 661 tcaggattct cttaatatag gttccgtact gaatgagtat cgggactctg tcgtaggtcc 721 agacgccgtt ttcaccttct ttaatgtttg tgatccagcc tcttccctcg agagttttca 781 taacgatttc ggggtcctgt ccaggaagag cgttagtcgg aatcggcaaa agcttgataa 841 gcacaaaaca cattgtaaag atgatgagga atgtgaatag catcaagcca agacgctttg 901 tcacatactt gaacatatac ataggcgttc ctcctctgct ttcttgattt tcttcataag 961 atgtaaggcc atagaaatct atcgttcgtt tggccttaat caaaaagcct gtgcaatcat 1021 aaatgaactg atattctaat ttaacctttg attttcgatt ttagttgctg ttacatagac 1081 cgatagagcc tattttacag agataaagca aaaattatta tgttcaacaa gtaatattgg 1141 tatactgtat taatctcaaa atgagcaaat cagcggtggg cgttatttgc ccaccgccgt 1201 ttgttagaaa caattaatac ttaaactaat cagttagttt atagatataa ttactcagac 1261 ttcttgtatt cagcagagag gtcgttgttg ttagctgcaa cgaattcagc ccattcagcg 1321 tcggtgtagt taacttcgat gtatctcaag ccgccgaagc ccatgaaggt gtgctcgtct 1381 tcagagaagt aagagaactt agcgccgagg aaggatccgc cgccgtcagc gatgagcatt 1441 acggaacgag attccttgat ggtgagctct tcaagagcag agaggatcat aagtcttgct 1501 tcagtaggag cgtagcctgc accccagttg taggtcttag cctggttttc agaagctgca 1561 agaccgttga ggcagaagta ccagttctga acgctcatag tgatggtttc gccagcacct 1621 tcataatcgc cttcgggcat tgtgagggtg aggtcgatag cggaagtatc ccagtacata 1681 tggtagttga gatcgtcatc ggggttaacg aatgcgccaa cgatatcgaa ggggttaaat 1741 gcgttaccgg agaagccgta accgaagccg atctgagttg caccggttct gaatgcttca 1801 gcccactgtg cgccggcaga tgcgtcgaat actacgtcga tcttgtcagc aagagcagtg 1861 ccctcggtaa gaccgtcgat aacgccctgg aggtagtcag cacggaatct ctgcttgtcg 1921 ttatctacag aagaaccgta aacgagggtg atgttcttgg aagaatcata accgtacttt 1981 tcaggatcag cagtaaggat tgcgatagct tctgccatct tttccttagc aactgtgggg 2041 ttgtaaccgg taagggtttc gtaagcttca tcaaggtcaa gacctgtcaa gtcgccgctg 2101 gaccacttgc cgtcagcgcc ttcggtgtag ccgtaagcgc ggaggatgcc ttccttagca 2161 agagcggtgt tgcggtactg accgccgtcc tcaagctcag gagagttttc gatatcatag 2221 tagtaagcta cgttaagaag accgaagcaa ggaacagcag aacccggcca gatcttttca 2281 acgatgtcac ttctgttcaa accgaggtta agagcatgtc tgaattcctg gattgcgagg 2341 ataccgttgt tgttttcgct ttccttaaga acttcaaggt tgctgtaaag ctgcataccg 2401 aatgtaccgg tagaggtaga agtgaagtaa acgtacttgg agtcgaggta ttcgccaacg 2461 ttctcagtct ggagagaagc atcgtcgtaa gtaccgttca agaagcccat ccacttggta 2521 gcgaactctt caaccttacg gcagttgatt gcagtaatgt tgtactggtt cttgtattct 2581 tccatattcc agccgtgcca gttttcgttc tttacgagct tgtagtgaga accagcttcg 2641 aactcagaga gcttgtaggg accccagcta gcagtggttt cgagggaaga gttgtagtta 2701 gaggtccaga gggttgcacc gtcagcggga gcaatcttgc aggactcata gagatccttc 2761 ttaacgaggg gaagtccgga catgtagtaa ggagcccaaa cagagaggtc accgtcttct 2821 gtgaggaagg agtaagcctt gtcgaggcag ataacgatag cattttcttc gtcgatagag 2881 tagataccaa cggaatccca agctacgtcg cggttagcgt tttcaacgta gatggttgca 2941 tcgtagccgt agccagcgcc tacttcagag taggtggtgg agtaagcagc gtagaggtca 3001 gcaccggaaa cggggtcggg ctcaccattg tactcaccag tgtaaacggt ggtgtcgttg 3061 taagcaagcc attcagggca gaggttgccg ttttcatcgg gatagccttc agcgccgtac 3121 atagcccaag cattgaagta gatggtttcg cctgcatcaa tagctgcctg gttggtagcg 3181 tagcccttgc tagcaacagt ctcataggta ccttcttcat tctggaagaa gtagatcttg 3241 gagttcttaa ccatgagagt gtcatagtag gtgttagcac ggaagttcat gaagtcaggg 3301 tcgagcaact gctgcatgga gtatacgaag tcagcagcaa cgataggtgt gccatcgtcc 3361 cacttgaggt cgtcacgaag agtgatcttc caagcatagc cgccttctgc cttctgctcg 3421 tcggtgtagc cccacttagc atcaacagta gcagttacgt cttcgagctt ggtagctgcg 3481 tcgtagttgg tggtgtaagc accgggaacg ataccgtcct tgttgataga gccgtcagca 3541 ttgtacttct cgtcgttctc gaacttgtag tcgtaagaga agaaggaaga gccgatgtag 3601 ctcatgatct gggtgtcgtt gttgtcagca taggtgaatt cgttccagtt gctgggcatt 3661 gtggtggtgg tgttgttgta ttcagcctgc ttgaaggttg cgggaactac atcgccttca 3721 acgggattct caacgccagg attctgaaca tcggaattat cgttgttggg ggttccgcaa 3781 gcagcgaagg ttgaaagaac cataaccaag ctcaatacca gcgcgaggat ggatgtgagt 3841 ttcttgttca taagatagcc tccatattat tttttgtgta acgtatcatt tatatgagca 3901 acgcttctct ttgccgttcc cggcatttta agcgtccgga ttcaggaccg tcaaatagaa 3961 acaatcctca acatagatga taagtgaaca tagacattgt actacataaa tagtggcttg 4021 tcaatatttt ttgcaaaaaa tgcaattatg caggcacttt ggcatcattt tgttaaattc 4081 aaacaagttc tttaataaag gtgagaaata catagataaa aggtccaaag gctttaagca 4141 cacaaatgca taaatatgat tttatgaaaa tttatgcaat ttttcactct ttcatatttc 4201 aattacagcg ctttaaaaca tcaaaaattg gtatacctta ttatatgggt tgccataatt 4261 tacatttgca tagggctggc aaatatggta tgatgtaggt gtcctcgagg acaaaatcta 4321 atcaggaggt acactacaag atgtgcaatt tgttcaacaa cattttcaac tgcggcggtt 4381 ccaactcgga ctgcggtatc tggcaggtcc tctgtcagat cttcggcttc ggctgctaat 4441 ttaatttaca taacagaatt gacataatat atagataa // LOCUS sequence052 4468 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence052 VERSION sequence052 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4468 /mol_type="genomic DNA" /organism="" /note="sequence052" misc_feature <1..644 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010966555.1:ABC transporter ATP-binding protein" /note="WP_010966555.1 ABC transporter ATP-binding protein (Clostridium) [pid:63.2%, q_cov:99.5%, s_cov:30.0%, Eval:1.5e-75, partial hit]" /note="MGA_353" /locus_tag="LOCUS_2900" CDS complement(849..1817) /product="glycosyl hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583002.1" /transl_table=11 /codon_start=1 /translation="MSDKLYIPVNPNALPCVKNVMKYLSDITYEKIITGQHTQTMAMEE LHKIEEVTGKQPALLGFELLGYSPNINYLDTDDECMTEVVENFGTLKRAWEWAAQKGLI TFTWHWFSPLGGRSKSFFSRNTDFDASKAVIDGTPENIALLSDMDYMAGLLRPFCDTGI PILWRPLHEAEGNWFWWGAKGGEIAGKLWRIMYDRFTNIHHLNNLIWVWNSPVPEMYPG DDVVDIISRDMYPPAHVHTSQSEKYYDLLKVTNQPKLVLIGEIGTLPSAEAIASEKIGW CTYMTWSKVFCMTEAFTSYDELRKMYSSPYAVTKDDLPELY" /locus_tag="LOCUS_2910" /note="WP_012583002.1 glycosyl hydrolase (Dictyoglomus turgidum) [pid:40.1%, q_cov:97.2%, s_cov:75.3%, Eval:1.5e-66]" /note="MGA_354" CDS complement(1844..3109) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MHHRRMYANDNGDVAVKPITNITPDQLFEINVVRSGRERASEIAK KCDFVLYCVGNHPVQVAKECYDRKTIALNIQSGMALHLLGENKNTVMAMISSYPYSINE ENAALPAIIYTSHAGMYLGTAVAKTLCGENNPAARTPQTWYKSEHELPGIETYDIEASG TTYMYFKGEPLYPFGYGLSYSSFEYSDLDIMPDGDDYKATLTVKNTSERDGDEVVQIYY TALNSAVSRPIKKLCGFERVNIKAGESVKVEAKIWHRMLEIYNVRNGENVLESGDYKFM AGASSADIRLDKTIHIEADSLGTRPAEFLAETFDRYKDTVIKYSKTWGHYIIGKGWGCN VSYDGLSLSGKKTLTVWASSIHGKGRIYINLGNANVNVDVAPSNAYDDFKPYTVEIPEI SDVLSMNISYSENVAILKFLAE" /locus_tag="LOCUS_2920" /note="WP_012582726.1 glycoside hydrolase family 3 protein (Dictyoglomus turgidum) [pid:40.8%, q_cov:67.0%, s_cov:31.0%, Eval:2.2e-55, partial hit]" /note="internal stop codon at [3128:3130](-)" /note="MGA_355" misc_feature complement(3128..>4468) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012582726.1:glycoside hydrolase family 3 protein" /note="WP_012582726.1 glycoside hydrolase family 3 protein (Dictyoglomus turgidum) [pid:42.5%, q_cov:100.0%, s_cov:48.9%, Eval:1.7e-93, partial hit]" /note="internal stop codon at [3128:3130](-)" /note="MGA_356" /locus_tag="LOCUS_2930" ORIGIN 1 aaccgggaaa gacaatcgcg atcgtcggcc cgacaggtgc gggaaaaaca acgatcatca 61 atctgttgat gaggttttat gatgttaact cgggcaagac cgctgttgac ggcaccgatg 121 ccagagagat tacaagagaa tccctcagaa aagcatatac tatggtcttg caggacactt 181 ggttgttcag aggaacgatt tatgataaca tcgcatatgg cagagagggc gcgactctcg 241 acgaggtaaa agcggcggca gaagcggcaa gaatcgactc gtatattgag agcctgcccg 301 atggatatga cacagttttg acggacgacg gaatcaatat atccaagggg cagcgccagc 361 ttattaccat tgcaagagcg atgatttcaa actcgcagat gctgattttg gacgaagcga 421 catcgaacgt tgactcacgc acggagatca agattcaaga agcgatggcc gagctgatga 481 agggcagaac ctgctttatc atcgcccaca gactttccac cattcagaat tccgacaaca 541 ttttggtgat tcaggacgga aagatctccg agtcgggcac acacgatgag ttgcttgaga 601 agggcggatt ttacagcacg ctttataatt cgcagtttgc ttaaaaagcg gagcgccgtc 661 tgcgaagcgc gctcggaacg agctgtgcga gcaggtggcg cggagcgcaa aaatcttgct 721 tcgctcgcag gattttgcaa aaaaccactt cgtggctttt tggcggacga aacacagcaa 781 gatggtatca cctatataaa aaatcaaaga aaagctcccc gatcaaatcg gggagctttg 841 tttattggtt aatatagctc gggaaggtcg tcctttgtaa cagcatatgg gctcgaatac 901 atttttctga gttcatcata tgaagtgaac gcttcagtca tgcaaaagac ctttgaccag 961 gtcatatatg tacaccagcc gatcttttcg cttgctatcg cctcagccga gggcaaggtt 1021 cctatttcac cgataaggac cagctttggc tgattggtaa ctttaagcag atcgtaatac 1081 ttctcgcttt gcgaagtgtg gacatgagca ggcggataca tatcacgcga gattatatca 1141 acaacgtcat ctccgggata catttcggga accggagaat tccaaaccca gatgaggtta 1201 ttaagatgat gaatatttgt aaatctgtca tacatgattc gccaaagttt tccagcaatt 1261 tcgccgccct ttgcgcccca ccagaaccag ttaccctcag cctcgtgtaa aggtctccaa 1321 agaatcggaa tccctgtatc gcagaagggt cgcaaaagcc ccgccatata gtccatatcg 1381 gacaagaggg cgatgttttc gggcgtgccg tcaattacag ccttagaagc atcgaaatcg 1441 gtattgcggg agaaaaacga cttacttctg cctcccaaag gcgagaacca atgccatgta 1501 aaggtaataa gacccttttg ggctgcccat tcccaagcgc gcttgagagt tccgaagttt 1561 tccacaacct ctgtcataca ttcatcgtcg gtgtcgaggt agttgatatt tggagaatag 1621 cccaaaagct caaatccgag aagcgcaggt tgcttgcctg taacttcctc gatcttgtga 1681 agctcctcca tcgccatggt ctgagtgtgc tgaccggtaa tgatcttttc atatgttatg 1741 tcggaaagat atttcatgac atttttaacg caaggcaatg cgttgggatt taccgggata 1801 taaagcttat cactcataag atacgctcct ttgatttagg ttattattca gccaagaact 1861 tgagaattgc aacattctcc gaatatgaga tattcatact taatacatcg ctgatttcgg 1921 gaatctcgac ggtataaggc ttgaaatcgt catatgcgtt tgaaggagcg acatcaacat 1981 tcacattagc atttccaagg ttgatataaa ttcttccttt gccatggata gaggatgccc 2041 aaacggtgag ggtctttttg ccggaaaggc ttaagccgtc atagctcaca ttgcagcccc 2101 aacccttgcc gatgatataa tgtccccaag tctttgaata cttgatgaca gtatccttat 2161 atctgtcaaa ggtttctgcc aagaattccg cgggacgtgt gcccaaggaa tcggcttcaa 2221 tatggatggt cttatccaga cggatgtcgg cacttgaagc acctgccatg aacttataat 2281 cgccgctttc aaggacattt tcgccgttgc ggacattata gatctcaagc attctgtgcc 2341 agatctttgc ttcaacctta acactttcgc ctgccttaat gttcactctt tcaaaaccgc 2401 agagcttttt gatcgggcgg gaaacagctg aattgagagc ggtgtaatag atttgaacaa 2461 cttcgtcgcc gtcgcgctcg gaggtattct tgacagttaa ggttgcctta tagtcatcgc 2521 cgtcgggcat aatatcaagg tcggaatatt caaagctcga atatgaaaga ccataaccga 2581 agggataaag aggctcgccc ttgaagtaca tataagtggt gcccgaggct tcaatatcgt 2641 aggtttcaat gccgggaagc tcatgctccg acttgtacca agtctgagga gttcttgcgg 2701 cggggttgtt ttctccacag agggtcttgg caactgcagt acccagatac attcccgcat 2761 gggaagtata gataattgcg ggaagagcgg cgttttcctc attgattgaa taaggatagc 2821 tggagatcat tgccattacg gtgtttttgt tttcacctaa gagatgcaaa gccatacccg 2881 actgaatatt aagggcaata gtcttgcggt catagcattc ctttgcaacc tgaacagggt 2941 gattaccaac acaatagaga acgaagtcgc attttttcgc aatttcgctt gcgcgctcgc 3001 ggccacttct gacaacattg atttcaaaga gctggtcggg agtgatgttt gtaataggct 3061 taacagcgac atcgccgtta tcgtttgcat acatacgtct gtggtgcaag aattcctcga 3121 tgagatacta gtcgccaact tttttgagat tgagggtttc gcgggtaaac caatcgtaga 3181 tgcgacggtt atgtaagcgc aaacggttat cgtcagccag ctttaaatat ctcttatgct 3241 tgacgctgaa gaggttgatc cagttttcgc cccaatcctg aagctcgaaa atttcgtcct 3301 cgccaacggt atcggcggtt gcacagagca agccgtcttc attaacgctc agatacttgc 3361 cgttagcggc tttaaggctg acgtggtccc aaaggctgtc gtgaattatc tcgctgtctg 3421 taaactgctc acgcattccg cgaaggacgg agatttcatc agaccaaaca cctgtatacc 3481 agtccaaaag gttttcatct gccatcgcac ccacaactgc aatcttttta ggtgcagttt 3541 taaggggcag aattccattg tttttaagca agatgatctg ctcgagagtt gcgcggagat 3601 ttttcttttt gtgttcatcg caatcgacaa cgcttgtatc aatgctgtca aaatcacact 3661 catcaaactg tcccaaagca aagcgcgaga agagggtgtt tgcgagggtt tcgtcgatat 3721 cggcttcggt gaggtgtccc tcatcaaggg cgatgtatgc ggccgccttg acaagaacgc 3781 cgttgtcggt catgctgtcc gagcccgcct tgagagagag tgccagcgat tcgctatgag 3841 taggaacaaa gcggtgagct gtgacggtct gggagaagtc tccgccgtca gtgacggtat 3901 accaaagccc ccatttatcc tttaagacgg tttttaaatc gggattgagc accgcaggac 3961 aaccgttgat gtcgttatat gcggtcataa ggctacgggc gccgccttta acaacggaat 4021 tttcaaatgc ggcgtagtag taatcatact tcaggcgcaa gggcataaat gcatcgcaat 4081 tagcacgggt cttctcattg ttgtttgcgc aaaaatgctt aagcgaggga atggtcatga 4141 aaaatctgcc gttatcccct gccataccct cggtataagc agcggaaagc tcacctgcaa 4201 ggcagacatc ttcgccgtag gcttcttcat ttctgcccca gcgagggtcg cgttccatat 4261 caacggttgg gccccaaagt gcaaggccgc caagcttttc gatattataa taagctcttg 4321 cctcaacacc ggcaattttg ccgagattat gcataagatc tctgtcaaag gtcgatgcca 4381 gacctgttgg ctgagggaat acagtcgata ctcgatcggc gcttctgcca acaaagccac 4441 gtgctacttc ggtgccaatg tggtattc // LOCUS sequence053 4455 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence053 VERSION sequence053 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4455 /mol_type="genomic DNA" /organism="" /note="sequence053" CDS complement(389..1057) /product="RNA polymerase sporulation sigma factor SigF" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965603.1" /transl_table=11 /codon_start=1 /translation="MYLLNEAYAETSATAEENLGLVRLCAGRFKGKGIEYEELYSAGCI GLLKAVKSFDSTRGVRFSTYAVPVILGEIKRLFRDGGMIKVSRGLKERSLQIARARERF ERENLREPTVEELADLTGLEPLDIAEAISVMQPTVSLTSGEDGETELDIPVPPPDDKII NSLALKQVLDKLDESDRALIQLRFFCGLTQQAVAAKLGCTQVQVSRREKKLLERLRSEL " /locus_tag="LOCUS_2940" /gene="sigF" /note="WP_010965603.1 RNA polymerase sporulation sigma factor SigF (Clostridium) [pid:39.7%, q_cov:86.5%, s_cov:79.0%, Eval:4.0e-34]" /note="MGA_358" CDS complement(1067..1507) /product="anti-sigma F factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003230452.1" /transl_table=11 /codon_start=1 /translation="MARKTVNEMKIKFPSLSENERLARSAISGFVALKNPQIDELSDIK TAVSEAVTNSIVHGYRNTLGEIEMTAKIFDDNTVYIRIKDKGVGIEDIKQAMTPLFTTL AQEERSGLGFSVMESFCDSVRVSSKKGAGTTVVLTKRLRTKL" /locus_tag="LOCUS_2950" /gene="spoIIAB" /note="WP_003230452.1 anti-sigma F factor (Bacillus) [pid:48.2%, q_cov:93.2%, s_cov:93.2%, Eval:7.4e-32]" /note="MGA_359" CDS complement(1522..1830) /product="anti-sigma F factor antagonist" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357811.1" /transl_table=11 /codon_start=1 /translation="MAVYIETKTKDELLARLSGEIDHHSSLWLRMDIDTAICENKPKTL QLDFSDVSFMDSSGVGLVMGRYKLMKEIGGSVELCNLPDSIERVMLLAGMNRICKIK" /locus_tag="LOCUS_2960" /gene="spoIIAA" /note="WP_003357811.1 anti-sigma F factor antagonist (Clostridium) [pid:42.6%, q_cov:92.2%, s_cov:84.7%, Eval:1.2e-14]" /note="MGA_360" CDS 2052..3092 /product="heat-inducible transcriptional repressor HrcA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964592.1" /transl_table=11 /codon_start=1 /translation="MDDRKLRILAAVVDEYITTGEPVGSKAISRYINASSATIRNEMAE LEKQGYLEQPHTSAGRVPTYNGYRLYVDRLMTTSPLSDEEKRLLDDMLPNDVYSEEVLV QSASNALATLTSCATFISSENPKFSVISKVEIIPTGKRMYVLLMITSNGKIKNRTCRLE LDLTNEQLQYFSNYVKQNLEGVPVEVLSDEMLEKLETAMGTYLLTLSPLIKGLFDMSKE MTQRDVSVSGGKNLLKRTDVDQNEIIAFLDNSAELQRLIDDSFSGIHVMFSEEQNDFVI GNSSLISSNFRKNGKVAGHLGVIGPMRIDYRKVIPYIEYFTQKISEMLSNDDEYDTEEE GSIYDE" /locus_tag="LOCUS_2970" /gene="hrcA" /note="WP_010964592.1 heat-inducible transcriptional repressor HrcA (Clostridium) [pid:33.3%, q_cov:95.1%, s_cov:97.7%, Eval:2.2e-47]" /note="MGA_361" CDS 3082..3480 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MMNEEKMTAEELEKNQDVGTAEEANEPTPEELLIKENEELKTKLS EAKDKHLRLMAEYDNFRKRTAQEKLSIYPDATAKAVEAFLPLADNFERALAAETADEKY KAGVQMIYNQLCETFKKLNVEVIDRVGE" /locus_tag="LOCUS_2980" /note="WP_012048003.1 nucleotide exchange factor GrpE (Clostridium) [pid:36.2%, q_cov:93.9%, s_cov:60.7%, Eval:3.7e-16, partial hit]" /note="internal stop codon at [3478:3480](+)" /note="MGA_362" CDS 3697..3861 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSKIIGIDLGTTNSCVAVMEGGEAVVITNSEGARTTPSVVGVSKN GERLVGQVA" /locus_tag="LOCUS_2990" /note="WP_005816476.1 molecular chaperone DnaK (Desulfitobacterium) [pid:87.0%, q_cov:100.0%, s_cov:8.8%, Eval:7.2e-20, partial hit]" /note="internal stop codon at [3859:3861](+)" /note="MGA_363" ORIGIN 1 aaagcgctgc tttaagtgat ggctcggtat gcgttctttt cagattcttt accgggactg 61 ccatagtagt agtaccctcc ttttcatatt ggtgaactac attacttgca cattatacct 121 caaatattac aaaaagtcaa tgattatgac aaaaaatgtt taaaagtttt aaagaaacat 181 ttttgaaaaa acctcgcaaa tagactaaat tcaacgtatt gtcgctttta aaagctcttt 241 gtttaggcgg ttttagaaag atttaagaaa atgaaacgcg aaagataaat cgctgatata 301 aaatttttat aaaaccatcc agtgtattat ttatcattgt aaagcgcaaa atcaaaaaag 361 tcagttgtgg gaactttttg gacactaatc aaagctcgct tcgaaggcgt tcaagaagct 421 ttttttcgcg ccttgaaacc tgcacctgtg tgcatcccag cttggctgcc acagcttgtt 481 gagtcagacc gcaaaagaat ctcagctgta taagtgcgcg atcactctcg tccagcttgt 541 ccagcacctg cttcaacgcc aacgaattga ttattttatc gtcgggcggg ggaacgggaa 601 tatcaagctc ggtttcgccg tcctcgcccg atgtcagact caccgtcggt tgcatcacgc 661 ttatcgcctc tgcaatgtcc aacggctcca atccggttaa gtcagccaac tcctcaaccg 721 tcggctcacg caggttttcc cgctcaaacc gttccctcgc ccgcgcaatc tgaagcgagc 781 gttctttaag cccgcgagaa accttaatca ttccgccgtc gcggaaaagc cgtttaattt 841 cgcccaatat tacaggcacc gcataggtcg aaaacctaac acctcgggtg ctgtcaaagc 901 ttttgaccgc cttgagcaac ccgatacacc ctgccgaata aagctcctca tattcaattc 961 ctttgccctt aaatctgccc gcgcaaaggc gcaccaaacc gaggttctcc tcggcagttg 1021 cgcttgtttc ggcatatgct tcatttaaaa gatacatttt tcacctttac agtttagttc 1081 ggagcctctt tgttaaaact actgttgtgc ctgcgccctt tttgcttgaa accctaacgc 1141 tgtcgcagaa gctctccatt accgagaatc ccaaccctga gcgctcttcc tgcgccaaag 1201 tggtgaaaag gggagtcatt gcctgcttaa tgtcctcaat gcccacgccc ttgtccttga 1261 ttcttatgta aacggtgttg tcgtcaaaaa tcttcgccgt catctcaatc tcgcccaagg 1321 tgtttcgata tccgtggacg attgagtttg tcaccgcctc gctgacagcg gttttaatat 1381 cgctcagctc atctatctgc ggatttttca gtgcaacaaa tccgcttatt gccgaacgcg 1441 ccaacctttc gttttccgaa agtgaaggga acttaatttt catttcgttg actgtctttc 1501 ttgccatatt tctcacatcc tttacttaat tttgcaaatt ctgttcattc ccgccaaaag 1561 catgacccgc tcaatgctgt cgggaagatt acaaagctca acgcttccgc cgatctcctt 1621 catcagctta tatctcccca ttaccagacc cacgcccgag ctgtccataa agctgacatc 1681 ggaaaaatcg agctgcaaag ttttcggctt gttttcgcag atcgccgtgt caatgtccat 1741 tctcagccaa agggacgaat ggtggtcaat ttctcccgag agccttgcca aaagctcatc 1801 ctttgtcttt gtttcaatat atactgccat agttgcctcc ttcatatata aatgtgaaaa 1861 cgcttctttt tggatgatac acccccatat gcgggaagtt tgtcaaagtg tgaagcttga 1921 aaagattttt gaaaagtgtg tgaaatctat tgacattagg aaaaatcggg gtataataaa 1981 attagcactc ggggatatag agtgctaaca ctctaagaca tcaactgcta aaaccgattg 2041 gagggtattg tgtggacgac cgaaaactga ggattcttgc cgccgttgtc gatgaatata 2101 taaccacagg tgagcctgtc ggttcaaagg caatcagccg atatatcaac gcatccagtg 2161 ccaccatccg caacgaaatg gcggagcttg aaaagcaagg ctatctcgaa cagccccaca 2221 cctctgcagg acgtgtacct acatataacg gctaccgcct atatgtcgac cgtctgatga 2281 ccacctctcc cttgtcggat gaagaaaagc gcctgctcga tgatatgctc cccaacgatg 2341 tatattcgga agaagtgctg gttcaatccg catcaaatgc gcttgcaaca ttgaccagct 2401 gtgcaacatt catatcaagc gaaaacccga aattctcggt catctcaaag gtcgagataa 2461 ttccgaccgg caagcggatg tatgttttgc tgatgataac ctcaaacggc aagattaaaa 2521 accgcacctg ccgacttgag cttgatttga ccaacgaaca gctccagtat ttttccaact 2581 atgtcaagca gaatcttgag ggtgtgccgg ttgaagtttt aagcgatgaa atgcttgaaa 2641 agcttgaaac cgcaatggga acatatcttt tgaccctctc gccgctaatt aaaggcctgt 2701 tcgatatgtc caaagaaatg actcagcgtg atgtttccgt ttcgggaggc aaaaacctct 2761 tgaagcgcac cgacgttgac cagaacgaga taattgcatt tttggacaac agcgccgagc 2821 ttcagcgact gattgatgac agcttctcgg gcatacacgt aatgttctcg gaggagcaga 2881 atgactttgt aatcggaaac tcaagtctta taagctcgaa cttccgcaaa aacggcaagg 2941 ttgcgggaca tttgggagta atcggcccga tgcgaatcga ctaccgaaag gtaatcccat 3001 atatcgaata ttttacacag aaaatttccg aaatgctttc aaacgatgat gaatatgata 3061 ccgaggagga aggaagcata tatgatgaat gaagaaaaga tgacagccga ggagcttgaa 3121 aagaatcagg atgtcggcac cgccgaagag gcaaatgagc caacacccga agagcttctc 3181 attaaagaaa acgaagaact caaaaccaag cttagcgaag cgaaggataa gcaccttcgt 3241 ctgatggcgg aatatgataa cttccgcaag cgcaccgcgc aagaaaagct ttcaatatat 3301 cccgatgcga cagcaaaggc agttgaagca tttttgcccc ttgcagataa ttttgaaaga 3361 gctttggcgg cagaaaccgc cgatgaaaaa tataaagcag gcgtccagat gatctataat 3421 cagctttgcg aaaccttcaa aaagctgaat gtcgaagtga tcgaccgcgt cggtgaataa 3481 tttgatcctc gccttgaaaa tgcagtcagc cagataaccg acgaaaacct cggcgaaaac 3541 gtggtcgcgc aggtatatca aaagggctac aagatgggcg ataaggtgat cagacccgca 3601 atggtcattg ttgcaaactg ttaaaaccgg tgcaagccga ttaaataaac acaaacaaat 3661 acatttttat atttaatttt aaaggagaaa tgaactatgt ctaaaattat aggtatcgac 3721 cttggtacaa ccaattcctg cgttgccgtt atggaaggcg gcgaggcagt agtaatcacc 3781 aacagcgaag gcgcaagaac aaccccttcc gttgtcggtg tttccaagaa cggcgagcgt 3841 cttgtcggtc aggttgcata gcgccaggct gttgttaact atgacaacac cgtaagctcc 3901 atcaagcgcc atatgggctc tgactataag gcaaatatgg gtggcaaggc atatacaccc 3961 caggagatct ccgcaatgat cctgctcaag ctcaagaccg atgctgaagc atacctcggc 4021 gaaaaggtaa ccgaagctgt aatcaccgtt cctgcatact tcactgacgc tcagcgccag 4081 gcaaccaagg acgcaggcca gattgcaggt cttaacgtaa gaagaatcat caacgagcct 4141 accgctgctg cactttccta tggcattgac aaggaagaag agcagaagat catggtttat 4201 gacctcggcg gcggtacctt cgacgtttcc atcatcgaga tgggcgacgg cgtaaccgaa 4261 gttttggcaa ccgcaggtaa taaccgtctt ggcggtgacg acttcgacca gagaattatc 4321 gaccttttgg ttgctgaatt caagaagagc gaaggaattg acctttcaaa cgataaaatg 4381 gcaatgcagc gcctcaagga agctgctgaa aaggcaaaga tcgagctttc aagcgttccc 4441 tcttcaaaca tcaac // LOCUS sequence054 4420 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence054 VERSION sequence054 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4420 /mol_type="genomic DNA" /organism="" /note="sequence054" CDS 654..1946 /product="flippase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000939580.1" /transl_table=11 /codon_start=1 /translation="MNLIKILKNRTVKNAGWIVGGRLANKILAFVVGVFTARYLGPDNF GLINYAAAYTAFFASLCNLGINSIIIKDFSDNPDEEGEALGTTLVLRAISSFLSALMIV GIVSIVDKNEPLTILVTTLSSIGLLFQIFDAFSQWFQYRLKSKYYAVATVIAYIAVSVY KIILLIAGKSVAWFALATSVDYIVIAILLLLAYKKNNGPKLSFSMRKAKQLLAASSGFI VSGLMISIYAYTDKFMLKQMLDEAAAGYYSLAFSLSTFWEFILVAVMDSMYPSIIDSYN VDRERFDRKNRQLYAMVIYISLTASILICIFGRLIVQILYGAEYLPTVQPLRIVVWYTT FSYLGAARNAWVVSENKQKYLKYLYAAAAIINVVLNLVLIPLWGASGAALASLVTQIST TVILPAFIPALRPNARLMVEALMLKNVFKKE" /locus_tag="LOCUS_3000" /note="WP_000939580.1 flippase (Leptospira interrogans) [pid:24.5%, q_cov:96.7%, s_cov:93.5%, Eval:3.2e-41]" /note="MGA_366" ORIGIN 1 tgcatattgc aatggcttct tttttgggat atttcatcct cgaaagccag tcaagaaaca 61 gtcttttggc gtttgttgca tttacagcga tatgcgcttg gctgattttc aagagccgca 121 gacagctcag aataactaag ttcggcgcaa cggtattttc aattgcgcct gcattgtttg 181 tgatgttcta tatggtcatg gtaaaccttc cttgggtaca gctgattctt gacttccttg 241 taggtgaagg caaggcgctg acatcaagac acgacgtttg ggaaacggca cttacggctc 301 tgtattcatc tccgctcatc ggcgcttaca gccaaatttc aaacggtgaa ggtgcctcgc 361 agatgcacaa ctcccatctt gacattgccg catcttacgg cattattgtt ttcctgctgg 421 tttgctatct tttgtggaga tatttatatc agaagggcag atattacaat cacaagagca 481 actatgttta tatcctcgga tttgtctgtg ccatactcct cggcatcggt gaggcggcgc 541 tgttctccgg cggattggga atttatgttt tcatcggaac attcctgatg ctggcgaatt 601 atgaaaaaca agaaagcatc ggttgactaa tgagataact ttggagttat agaatgaatt 661 tgataaaaat tctgaaaaac agaaccgtta aaaacgcagg ttggatagtc ggaggacgtc 721 ttgcaaacaa gattttggca tttgtcgtcg gagttttcac tgcaagatat ttgggacccg 781 acaacttcgg ccttatcaac tatgccgcgg catataccgc attttttgca tctctttgca 841 acttgggcat aaattcaata atcatcaaag atttttccga taatccggac gaagagggcg 901 aggctctggg aacgaccctt gttctgcggg cgatttcaag ctttttgtca gctttaatga 961 tagttggcat tgtttcgatt gttgacaaaa acgagccgct gactattttg gtaacgacgc 1021 tgagcagtat cgggcttttg ttccagattt tcgatgcctt cagccagtgg ttccaatata 1081 ggctgaagtc taagtattac gcagttgcga cggttatcgc atatatcgcc gtttcggtct 1141 ataaaataat tttgctgata gcaggcaaaa gcgttgcctg gtttgccctt gcaacctcgg 1201 tcgattatat tgttattgca atacttttgc tgttggcata taagaaaaac aacggaccaa 1261 agctgtcgtt ttcaatgcgt aaggcaaaac agcttcttgc ggcaagctcc ggttttattg 1321 tttcggggct gatgatttcg atttatgctt atacggacaa gtttatgctc aagcagatgt 1381 tggatgaagc tgcggcggga tattattccc tggcgttctc gttgagcaca ttttgggagt 1441 tcattctggt cgccgttatg gattcgatgt atccgtcgat aattgattca tataacgttg 1501 atagggaacg gttcgaccgc aaaaaccgac agctgtatgc tatggtcata tacatatcct 1561 taactgcgtc gatactcata tgtattttcg gcaggctgat cgttcagatt ctttacggcg 1621 cggaatattt gccgaccgta cagcccttga ggatagttgt ttggtatacg accttctcat 1681 atttgggcgc cgcccgaaat gcctgggtgg tcagcgaaaa caagcagaaa tatctcaagt 1741 atctgtacgc agccgccgca attatcaacg ttgttttaaa ccttgtgctc ataccccttt 1801 ggggagcatc gggcgcggcg ttggcatcgc tcgtaactca gatttcaact accgttattt 1861 tgcctgcatt tatccccgca ctcaggccga acgcccgcct tatggtcgag gctctgatgc 1921 tgaaaaatgt gttcaaaaag gaatgatttt ccaatttacc cgtcttgaaa attcaaggcg 1981 ggttttgctt ttttctgcgt actttttaag gtttgtgcaa tatgttgcaa ttcagattac 2041 ctgaattatc taatcgtgca aaaaagtaaa atatgtacag aaactattgc aaaaattggt 2101 ttggcatgat attatataat cgtataatag gcgagatagc caaaaaacac agatatgatc 2161 gggataataa aacgattata tcgcattgtg tcgcaaattt cggcattttg cctttgacaa 2221 tgagtatcat gacataagca ttgtaacgag aattatgaaa gtaggaggag taaaatgaat 2281 acgaacagat tctctaaaat tttgtcgctg tttttggctg tatgcttagc attcagcatg 2341 atggctcccg ccgttgtttc ggccaccgaa accgagggca cgggaaccgt tattgaaggc 2401 ggcgaaaccc ccacaattga aggcaacgag ggtggtgaga tctccggagg agaagatatt 2461 tctgccggta ccgaagaggt catcatgccc attattgacg agccctatat tgcagactat 2521 gcaaccttcc ttgcaaacct caagttgctc gaaggttatg ctgaaagctt catatcggta 2581 aataccggat ataccgaccc tgttttgctg gttatcaact acatccgtac aggtgtagct 2641 aagtataccg aggacgaatg ggttactctt gcaggtgagg agatcaccgc atttaccgac 2701 tatgttgccg ctcaggatgc tttgaccggc aatactgtaa gagcgctccg aaatgttgaa 2761 aacttcgtca ctcccgacgg cgagtgggtt gaattcaatc atatgttcgg tacaatgaac 2821 attttgtacc ttgcgcagag catctttaaa ggctcgggcg accttggcgg ttgggcaggc 2881 gatatttgtg atcttgtcaa catccttgtt gttaaggggc tcacaggtaa ctcgatcgac 2941 gagctggttg cgaccatttc cgcaaaccac ctcttcgttg aaagtgatat cgaaggtgtc 3001 agctccttcg gcaagcttga ctactacggc gacatcgacg ctatgtactt tgtcaccaag 3061 ctcaagtcag aaggcggaaa gcttagccag tggatggaaa gctactttac tcccacgctc 3121 accgagagcg acagagccgc attcttcctc aataccagat tcaacggcaa gcttacaaag 3181 gcgacagtcc gtgcggctat ttacaacaca tattctgccg acacgatgat cagaatcctt 3241 gaaagtaagc gaggaatcaa caagaacaac gacatcgacg gtgacgacat tcccgactgt 3301 aaccatgccg acatcagaat cgcagcttgc tatgcttttg ctgattatgt gtttgcgctt 3361 gctgacggac gccttgttga agctcccgaa gaaccggaag gcttcactgt tacctggctg 3421 aactatgacg gcactgtttt ggagcttgac gagaatgttc aagcgggcga aatgccttca 3481 tatgacggcg caactcccga aaaggcaccc gttgataagt atgtatatat ctttgacggt 3541 tggactcctg agatttctgc agttacaaac cacgttatct atactgcggt ttataccgaa 3601 tcaattcttt ccaaccctta ctataccgtt accgccagcg aatcttcaac actcgctccg 3661 ggtatcttac agaccattga aaccgcaaga actgccgaca ataagcagat agtatattat 3721 cttgcaactg ttgacgtcaa ccgtagcgac gttagtattc acgctaacta taacaacaac 3781 gatccctcat tgggttgggg tatgcagaag gtcactgacc agatcgctgc ggcagttaaa 3841 agacataccg atcccacatc gcccctttac gttgaaaact ataaccccat cgtgggcgtg 3901 aatgccgact tcttcaatat gacaaacggt gctccctccg gcgcgctagt catggaagga 3961 atcacatatg cagaagcgcg ctccgaaaac ttctttgcaa ttcttgatga cggaactgca 4021 atgatcggtt ctccctccga ttgggcgggc attaaggaca gagtcaagga agccgttggc 4081 ggaagcatct ggctggttaa gaacggcgag atcgtcgttg ctcccagcgc cgactactat 4141 accagcagag catcaagaac ctgtatcggt attacagccg aaggcaaggt agttcttatg 4201 gtacttgacg gacgtcagga accccgttct gcaggcggca gcagccagga aattgcacag 4261 ataatgtttg aagcaggctg tgttgatgct atcaacctgg acggcggcgg atccaccaca 4321 ttcgcagcta agcaggcggg tagcgactcg atcacagttg ttaacagacc ttccgacggc 4381 tttgctcgtt cggtaagctc ctcgctgttt gttgtatcca // LOCUS sequence055 4413 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence055 VERSION sequence055 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4413 /mol_type="genomic DNA" /organism="" /note="sequence055" CDS 17..1867 /product="excinuclease ABC subunit UvrC" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963830.1" /transl_table=11 /codon_start=1 /translation="MRVTLSDNPRLEYLREKTQKLSTRPGCYIMKNKAGTIIYIGKSKH LRNRVSSYFRDNDPLTKVYKMVTNVYDYDFIVTDSEYEALVLESSLIKQHQPKYNILLK DDKGYTYIKVSNEDFPRITRAMQKKGDGKFIGPYTSGLTTKQTVEEVNRVFMLPTCKRV FPRDFGKQRPCLNYQIKRCIGLCRGCFTKDEYAKIIEQALDYIKSGSSLSCDELTREME LASENLEFERAAMLRDRIAAIKRAAETQKIFDKSLPDTDIIALAQNGENACISVLIYRG GRLYDKADYMLGELEDEEAMREDFLLQYYDRGVKIPKNIYIDFELADADNLVRYLREKS GHAVYIANPKRGDMLSLLKMAKANATEHLSLAVGRTGKEISALEDLATLIGLKNTPLYI ECYDISNIGSADMVGGMVVLDNGRPLKKNYRKFNIKTVYEQNDYASMREVLRRRFENYF DPEEKDESFKTMPDLIFLDGGRGHVAAVAPLLSEMGVPCPVYGLVKDNKHHTRAVIAPD GQEITVSKNRAVFSLLTRLQDEVHRYTITFQTKKHLSSMYETALTSVKGVGQAKAKALL STFKTKESLKNASVEDIAAVMKISFEKAEEVKRVFIDELK" /locus_tag="LOCUS_3010" /gene="uvrC" /note="WP_010963830.1 excinuclease ABC subunit UvrC (Clostridium) [pid:38.6%, q_cov:96.3%, s_cov:97.8%, Eval:3.4e-114]" /note="MGA_368" CDS 1945..2499 /product="16S rRNA (guanine(966)-N(2))-methyltransferase RsmD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003431108.1" /transl_table=11 /codon_start=1 /translation="MRVITGTARGKRLKTLEGLDVRPTSDKVKEAIFSIIQFDLPGASV LDLFAGSGQLGIEALSRGAKHCVFVDKSRASIAVVRENVQNCGFVNESRIVNMDSVDYL RSAKAGIDIALLDPPYEQGLILKALPLLEPKLSDGAIVICEHEAGLELPDEVARLEKWR TYNYGKHVALTTYKIKEADEE" /locus_tag="LOCUS_3020" /gene="rsmD" /EC_number="2.1.1.171" /note="WP_003431108.1 16S rRNA (guanine(966)-N(2))-methyltransferase RsmD (Clostridioides difficile) [pid:42.4%, q_cov:97.3%, s_cov:99.5%, Eval:2.5e-35]" /note="MGA_369" CDS 2496..2993 /product="pantetheine-phosphate adenylyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583503.1" /transl_table=11 /codon_start=1 /translation="MSERIAVCPGSFDPVTLGHLDIMTRASKLFDRVIVLVSVNPQKHP SFSAEERVEMIKAVTHDLPNIEVDILPGLLADYVREKKAVAIVKGLRAVTDFEYEFQQA LANKKLYPDAETVFLVTTSENMFLSSSVVKQIASFGGDIADFVPPEIKDKIQNRLRNVN NI" /locus_tag="LOCUS_3030" /gene="coaD" /EC_number="2.7.7.3" /note="WP_012583503.1 pantetheine-phosphate adenylyltransferase (Dictyoglomus turgidum) [pid:54.2%, q_cov:93.9%, s_cov:96.9%, Eval:4.4e-43]" /note="MGA_370" CDS 3009..3470 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTIDEILEMMDDLLDKSVTVPFSGKKCMVDTDQLREYIDNIRYNL PTEIKRAKEMVADRSVILTDANEQAEDIIKKAEEKAKILVSEEEIVKQAKAAADDLTAQ AKMMDSTIRKAMVEKLDSILGESEKALNKTLNELKAMREAVKSANKADE" /locus_tag="LOCUS_3040" /note="MGA_371" ORIGIN 1 agggacacaa aaacccatgc gcgtaaccct aagcgacaac ccgcgtcttg aatatctgcg 61 ggaaaaaacg caaaagcttt caacccgacc gggatgctat attatgaaga acaaggcggg 121 aacgatcata tacatcggca agtcgaagca cctgcgtaac cgagtttcaa gctatttccg 181 cgacaacgac cctctgacca aagtttataa aatggtcaca aatgtatatg attatgactt 241 catcgtcacc gactcggaat atgaagcgct ggttttggaa tcgtccctta tcaaacagca 301 tcagccgaaa tataacatcc ttctcaaaga tgacaaaggc tatacctaca tcaaggtgtc 361 aaatgaggat ttcccccgta tcacccgagc gatgcagaaa aaaggcgatg gcaagttcat 421 tgggccttat accagcggtt taaccaccaa gcagacggtt gaagaggtca accgtgtgtt 481 tatgcttccc acctgcaaac gggtattccc acgcgacttc ggcaaacagc gcccctgctt 541 aaactatcag ataaaacggt gcatcgggct ttgccgaggt tgcttcacca aagatgaata 601 cgcaaaaata atcgagcagg ctcttgatta tattaaaagc ggaagctctc tttcctgcga 661 tgagttgacc agagaaatgg aactggcttc ggaaaacctc gaattcgaac gtgcagcaat 721 gctgcgcgac agaattgccg caatcaagcg cgccgcagaa acacagaaga tatttgacaa 781 atcgttgccc gacaccgaca ttattgcgct ggcgcaaaac ggcgaaaacg cctgcatctc 841 ggtgcttatc tatcgtggcg gacgccttta cgacaaggcg gattatatgc tcggcgagct 901 tgaggacgaa gaagccatgc gcgaggactt tctcctgcaa tattacgacc gcggcgtgaa 961 gattccgaaa aacatatata ttgattttga acttgcggat gcggacaact tggttcggta 1021 tctgcgggaa aaatcggggc atgctgtata tatagccaac cccaagcgtg gcgatatgct 1081 gtcgcttttg aaaatggcaa aggcgaacgc aacggagcac ctttccctcg ccgtcggcag 1141 aacgggcaag gagatctccg cccttgaaga cctcgcgacc ctcattgggc tcaaaaacac 1201 accgctgtat atcgagtgtt atgatatttc aaacatcggc tcggcagata tggtcggcgg 1261 aatggtggtt ttggataacg gcagaccctt aaagaaaaac taccgcaaat tcaatattaa 1321 aacggtctat gagcaaaacg actacgcttc tatgcgcgag gttttgcgca ggcgttttga 1381 aaactacttc gaccccgagg aaaaggacga aagctttaaa acgatgcccg accttatctt 1441 cctcgacggc ggacgtggcc acgttgcggc ggtagctccg cttttaagcg aaatgggtgt 1501 tccttgccct gtatatggcc ttgttaagga caacaagcac cacacccgcg ctgtaattgc 1561 ccctgacggg caggagatca ccgtttcaaa aaaccgcgcg gtattctcgc tgttaacaag 1621 gttgcaggac gaggtgcaca gatacaccat cacattccag acgaaaaagc atttaagctc 1681 gatgtatgaa accgcgctga catccgtcaa gggcgttggg caagcaaagg cgaaagctct 1741 tttaagcacc ttcaagacca aggaatcgct gaaaaacgcg agtgttgagg acatcgcggc 1801 ggtgatgaaa atatcttttg agaaggcgga agaggtaaaa agagttttca ttgacgaatt 1861 aaagtgattt ttagtataga catttgctga tttttaagat ataatcagct tagtatgaaa 1921 taaatcggga aaggacaggc aaaaatgaga gtcattaccg gtactgcacg aggcaagcga 1981 ttaaagaccc ttgagggact tgatgttcgc cccacctcgg acaaggttaa agaagcaatt 2041 ttttcaatta tacagtttga tctgcccggt gcgtcggttc tcgacctttt tgcaggatcg 2101 ggacagcttg gcattgaagc gctgagccgc ggagccaagc attgcgtttt tgttgataaa 2161 tcccgcgcat caattgcggt cgtaagagaa aatgttcaga actgcggatt tgttaacgaa 2221 tcacgtattg tcaatatgga ttcggtcgac tatctgcgct cggcaaaagc gggaattgac 2281 attgcgcttt tggacccgcc ttatgaacag ggacttatcc ttaaagcact cccccttttg 2341 gaaccaaagc tgagcgacgg cgcgatcgtt atatgcgaac acgaagcggg acttgagctt 2401 cccgacgaag ttgcaagact tgaaaagtgg cggacatata actatggcaa gcacgttgcg 2461 ctgacaacat acaaaattaa ggaggcggac gaagaatgag cgaaagaatt gcagtctgcc 2521 ccggcagctt cgaccccgtt acactcggtc accttgacat tatgaccaga gcttcaaagc 2581 ttttcgaccg cgtgatcgtt ttggtgtcgg tgaaccccca aaagcacccc agcttttctg 2641 cggaagagcg cgttgaaatg attaaagctg tcacccacga cctgcccaac attgaggttg 2701 acattttgcc gggactttta gccgactatg tcagagaaaa aaaggctgtt gcaatcgtca 2761 agggccttcg tgcggtgacc gactttgaat atgaattcca gcaggcgctt gccaacaaaa 2821 agctctatcc cgatgcggaa acggtatttt tggtaaccac cagcgagaat atgttccttt 2881 cctccagcgt tgtaaagcaa attgcctctt tcggcgggga tattgcagat tttgtaccgc 2941 ccgagatcaa ggataagatt cagaacagac ttcgcaatgt aaataacata taaggagata 3001 gattatttat gactattgat gaaattttgg aaatgatgga cgacctgctt gacaagtcgg 3061 tcacggttcc cttctcgggc aaaaagtgca tggttgacac cgaccagctc cgcgaatata 3121 ttgacaacat ccgctacaat ctgcccaccg agatcaagcg tgcaaaggaa atggttgctg 3181 accgttcggt aattcttact gatgcaaacg agcaggcaga ggatatcatt aagaaggctg 3241 aggaaaaggc aaagatcctt gtttccgaag aggaaattgt taagcaggct aaggctgccg 3301 ctgacgacct gaccgcacag gcaaagatga tggattcaac catccgcaag gcaatggttg 3361 aaaagcttga cagcatcttg ggcgaatcgg aaaaggctct taacaagacc cttaacgagc 3421 ttaaagcgat gcgcgaggct gttaaatctg ccaacaaggc tgatgagtaa ttaaatgaat 3481 tatccgcact ttggcttcaa ggtgcgtatt ttttcggtaa tttacttgtt tttcaacaat 3541 gaaatgctct aaaatcgggg caatttcgtt ttttgtgtta attgactata ttttcaaaaa 3601 ataatataat gtagtacata acaacatata aggagaatca taccgtgttg acaaaagttg 3661 ttaaattcgg cggctcaagc cttgccgatg caaatcagtt tgttaaggtt gcaaacatca 3721 tccgcgctga tgaagcgaga agatacgttg tgccctctgc tcccggcaaa cgcgagccaa 3781 aggacacaaa agtgactgat atgctttacg cttgctatga cgtagcagtc agaggacagg 3841 actttttgcc catgttcgct gaaattgaaa agagatatac cgacattatt gaaggcctgg 3901 gacttgacct tagccttgca aacgagtttg aaaccatcaa gcacagcttc cgtgcaagag 3961 ccggacgtga ctatgccgct tccagaggcg aataccttaa cggtatcatt ctggcgaaat 4021 atttgggcta tgaattcatc gacgccgcag atgtgatcta tttcggtgag gacggcaagc 4081 ttcttttgga gcagaccttg aaggtgctca aaaagcgcct cgaaaaggtg agccacgctg 4141 tgatccccgg attctacggc tcgcgcccca acgacaccgt taagaccttc tcacgcgggg 4201 gctcggatat tacaggttcg atcgttgcgg cagcgtgcga agcagacctt tatgaaaact 4261 ggacagacgt ttcgggcttt ttggtatgcg acccgagaat cgttgcaaac cccgttccga 4321 ttcagacgat aacataccgt gagctccgcg agctttcata tatgggcgca ggcgttttgc 4381 acgaggaagc gatcttcccc gtccgcaagg cag // LOCUS sequence056 4395 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence056 VERSION sequence056 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4395 /mol_type="genomic DNA" /organism="" /note="sequence056" CDS 528..1337 /product="dipicolinic acid synthetase subunit A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003231888.1" /transl_table=11 /codon_start=1 /translation="MNEVFVLSGDMRQKALATELCARGIAIDTGTILDGIYKAVILPYV SFSGEYLNTVDGRLQLDDIVPYLRRGTVVFAGMYPSKFKDACEERQVRLIDWFADEELT VKNAYLTAEGALGIAIEKSPRAIKDSLVTIIGYGRVAKACARMFNLMGAHVRIMARSYA ARIDAYTHGYKSYEIENDAPLNDADIIINTVPSMILNAKRMANVNNNAMIIELASKPYG TDSAAAEKSGIPLYIAPGLPAKVAPLTAGRLMADMAMKYLKEVQSDG" /locus_tag="LOCUS_3050" /gene="dpaA" /note="WP_003231888.1 dipicolinic acid synthetase subunit A (Bacillus) [pid:32.8%, q_cov:85.5%, s_cov:79.1%, Eval:7.1e-29]" /note="MGA_374" CDS 1330..1902 /product="dipicolinate synthase subunit B" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003429956.1" /transl_table=11 /codon_start=1 /translation="MDKLKIGFALTGSFCTFKPAFDAAKALVAEGHELTPIMSFNAYNI STRFGSYEQNREILWEITGRDIIASIEDAEPIGPKSMFDILVVAPCSSNTLAKLATGVN DTPVTMAVKSHLRNARPVVIALSTNDALAAAAKNIGALQNYRNYYFCPYRQDNFTAKPM SMVADMTLLPQTIELAMKGEQLQPMVR" /locus_tag="LOCUS_3060" /note="WP_003429956.1 dipicolinate synthase subunit B (Clostridioides difficile) [pid:46.3%, q_cov:100.0%, s_cov:96.9%, Eval:3.5e-43]" /note="MGA_375" CDS complement(2118..2795) /product="tRNA (guanosine(46)-N7)-methyltransferase TrmB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001239380.1" /transl_table=11 /codon_start=1 /translation="MRMRRKKNLEERLAVCEAAGKLKIIWCEERNFEESIKTKDLFNFE AMFGNSNPVHLEIGCGKGQFAVDLAKQNPNINILAVEKTSNVIVDAAEKVIEEDIPNLM FLRCEAEYLEKFIPAHSIERIYLNFSCPFPKKSYAPHRLTHHRFLRIYEELLAPKAEIH QKTDNKGLFEFSINEFSEYGFTLKNVTLDLHASDFEGNIMTEYEKKFHEMGLPIYRLEA YLK" /locus_tag="LOCUS_3070" /gene="trmB" /EC_number="2.1.1.33" /note="WP_001239380.1 tRNA (guanosine(46)-N7)-methyltransferase TrmB (Bacillus) [pid:53.3%, q_cov:80.0%, s_cov:82.9%, Eval:2.6e-52]" /note="MGA_376" CDS complement(2810..4051) /product="galactokinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011263235.1" /transl_table=11 /codon_start=1 /translation="MPTRTLSELYEGKYDEQRKRYEDACVEFIKIYKEKPTRFFSAPGR TEVSGNHTDHNHGRVIAAAVDLDIIACVCPIDEPVVYLKSEGFPEDKVDLRELSVIESE KNTSASLIRGVAKGLVDRGYKIGGFKAYTTSDVLKGSGLSSSAAFEVLIGTILNELYNA PHIANPIEIAQIAQYAENVYFGKPSGLMDQMASSWGGFITIDFADTNEPEIDCLMFDLA KHNFSLCIVDTKGNHADLTPEYAAIPNEMKSVARFFGKDYLREITKDDVLSNIVALREK CGDRAILRALHFFEENERVAELCHFIDTDNFEWFLKYINASGNSSYKYLQNVFASSVPD EQGVSLALNVIERLLDGEGAHRVHGGGFAGTVQAFVPNKMLEKFKAGIEAVFGEGSCYV LNIRECGGTEVLFD" /locus_tag="LOCUS_3080" /gene="galK" /EC_number="2.7.1.6" /note="WP_011263235.1 galactokinase (Aliivibrio fischeri) [pid:28.4%, q_cov:90.6%, s_cov:92.7%, Eval:1.2e-34]" /note="MGA_377" CDS complement(4077..4394) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGQTLGFIGCLGLIILLGLIMLKIIYNGLRAADDLGKYICMGVFA YLFTHCVLNIGMVLGITPVIGIPLPFISAGGSAMLTSTVSIGLILSVYFHQSRFDTLFK K" /locus_tag="LOCUS_3090" /note="WP_011948344.1 rod shape-determining protein RodA (Clostridium botulinum) [pid:50.6%, q_cov:73.3%, s_cov:19.9%, Eval:7.0e-15, partial hit]" /note="MGA_378" ORIGIN 1 gactttctgt aagcgtcaat aaggcgcaga acatcgaggt cataggtgat gccgatatcg 61 ccgcggacct tgttttgttc aatgtcctca gcgttgataa caatgacgat ctctgcctga 121 tctttaagct gcaaaagcat ctggagctta ctgtccggct ggaatccggg aagtacgcgt 181 gaggcgtggt agtcgtcaaa aagcttgccg ccgaattcaa gatatagctt gccgccaaag 241 aattcgatgc gctttttaat atgctccgac tgtgtggaaa gatatttttc gttgtcaaac 301 ccctttgtaa acacaaaaat ccccctaaca aacaatatac actttagtat aacatttttt 361 gcgtgtgctt tcaagcgtga ctcccaaaaa actcatacag atttatcctg cctgttttat 421 tgattttgca taagtgcccc cgatttaccc tttcgcatat actgaactat gaaacctgtt 481 ttttggagcc tggctccgat tccatatacg aaaggaaagg tcaaaaaatg aatgaagttt 541 ttgttttatc gggcgatatg cgccaaaaag ccctggcaac cgagctttgc gcccgcggta 601 tcgctataga tacaggcacg atccttgacg gaatatataa agctgtaatc cttccctatg 661 tttccttctc gggcgaatac ttaaacaccg tcgatgggcg gttgcagctt gatgatattg 721 tcccatatct tcgccgcgga acggtcgtct ttgcgggaat gtatccctca aaattcaaag 781 acgcctgcga agagcggcaa gtgcgcttaa tcgactggtt tgccgacgag gagctgactg 841 ttaaaaacgc atacctgact gctgaggggg ccttgggcat tgcaattgaa aaatcgcccc 901 gagccattaa agacagcctt gtgaccatta tcggctacgg cagagttgca aaagcgtgtg 961 caagaatgtt taatcttatg ggtgctcacg tccgtattat ggcgcgaagc tatgccgcgc 1021 gaatcgacgc ctatacccac gggtataaat catatgaaat tgaaaacgac gcaccgttaa 1081 atgatgccga tataatcatc aataccgtcc caagtatgat tttgaatgcg aagagaatgg 1141 caaatgtcaa taataatgca atgataattg agcttgcctc aaagccttac ggcacagatt 1201 ccgccgccgc tgaaaaatcg ggcatcccgc tctatatagc ccccgggctg cccgcgaaag 1261 ttgcaccgct aaccgcaggc agacttatgg cagatatggc aatgaaatat ttgaaggagg 1321 tgcaaagcga tggataaact aaaaatcggc tttgccttaa caggctcatt ttgcaccttc 1381 aagcctgcct tcgatgccgc aaaggcgctt gttgccgagg gccacgagct gacacccata 1441 atgtcgttca atgcatataa catctctacc cgctttggtt catatgaaca aaatcgcgaa 1501 attttgtggg aaattacagg tagggatatt attgcatcca tcgaggatgc cgaaccgatt 1561 ggcccgaagt cgatgttcga tattctggtg gtggcgccct gttcgtcaaa cacgctggca 1621 aagctcgcaa caggcgtaaa cgacacgcct gtgacaatgg cagtcaaaag ccatttgcgc 1681 aacgcccgcc cagttgtcat cgccctttca accaacgatg cccttgccgc cgcggcaaaa 1741 aatatcggcg cactgcaaaa ctaccgcaac tactatttct gcccctatcg gcaggataac 1801 ttcaccgcca agcctatgtc tatggttgcc gatatgaccc ttctgcccca aacgatcgag 1861 ctggcgatga aaggggagca actccagccg atggtgagat gatagatagc cttccccttg 1921 aggggaaggc gccgaggaac gaggcggatg aagtgccctc tgttttcggc aggggagacc 1981 ctacgtggtc gcccgactcg gggcaggcac acagtcctgc ccctataaat tatcgccgaa 2041 ggcgattcca caatttttca ctattcatta agcgaagcaa taaaagaaaa aaacctcccg 2101 aaaagggagg tttttagcta tttcaaatac gcctctaacc tataaatcgg caagcccatc 2161 tcgtggaact ttttctcata ttccgtcatg atgttgccct caaaatcgct tgcgtgcagg 2221 tcaagcgtca cgtttttcag cgtgaaacca tattccgaga actcattgat cgaaaattca 2281 aacaaacctt tgttgtctgt tttctggtga atctccgcct tgggcgccaa cagttcctca 2341 tatattctta agaatctgtg gtgggtcaat ctgtggggag catagctttt cttcgggaat 2401 gggcaggaaa agttgagata tatcctctca atcgagtggg cgggaatgaa cttttcaaga 2461 tactccgcct cacatcgcaa aaacataagg ttgggaatat cctcttcaat taccttttcc 2521 gccgcatcga caatgacatt agaagtcttt tcaactgcaa gaatgttaat attcgggttt 2581 tgcttcgcca aatctaccgc aaactgtccc tttccgcatc cgatttcgag atgaacgggg 2641 ttactgttgc cgaacatcgc ttcaaaattg aagaggtctt ttgtcttaat tgattcttcg 2701 aagtttcgtt cttcgcacca gatgatttta agcttgcccg cggcttcgca gaccgccaaa 2761 cgctcttcaa gatttttctt tcttctcatt ctcatacggg tgcgtcctct caatcaaaca 2821 aaacttctgt gccgccacat tcgcggatgt tcaaaacata gcaggagcct tctccgaata 2881 ccgcttcaat gcctgccttg aacttttcga gcatcttgtt cggcacaaat gcctgaactg 2941 ttcccgcaaa gccgcctccg tgaacacggt gtgcgccctc gccgtcaagc aaacgctcga 3001 tcacattaag cgccaacgaa acgccctgct cgtcgggtac gcttgatgca aaaacattct 3061 gcagatattt atatgagctg ttgcccgatg cgttgatgta ctttaagaac cactcaaagt 3121 tgtcggtatc aataaagtgg caaagctcgg caacgcgttc gttctcctcg aagaagtgaa 3181 gcgcccttaa aatcgccctg tcgccgcatt tttctctcag ggcgacgatg tttgaaagca 3241 cgtcgtcctt tgttatctcc cgcagatagt ccttgccgaa gaagcgcgcc acactcttca 3301 tttcattggg aattgcagca tattcagggg taagatcggc gtggttgccc ttggtatcaa 3361 caatgcaaag gctaaagttg tgctttgcca aatcaaacat aaggcagtcg atttcaggct 3421 cattggtgtc agcgaagtca atggtgataa atccgcccca gctcgatgcc atctggtcca 3481 taagtcccga aggctttccg aaatatacat tctcggcata ctgtgcaatc tgtgcgattt 3541 caatggggtt tgcaatgtga ggagcgttgt aaagctcatt gagaatagtt ccgataagaa 3601 cttcaaacgc cgctgacgaa gaaagacccg agcctttaag cacatccgat gtggtatatg 3661 ccttaaagcc gccgatctta tatccgcggt cgacaagtcc ctttgcaaca ccgcgaatca 3721 aagatgccga ggtgttcttt tcgctttcaa tcacactaag ctcgcgcaga tcgaccttat 3781 cctcggggaa gccttccgat ttaagatata ccaccggctc gtcaatgggg catacgcagg 3841 cgataatgtc aaggtcaaca gccgctgcaa taactctgcc gtggttgtgg tcggtgtgat 3901 ttcccgaaac ctcggttctt ccgggagcag agaaaaatct cgtaggcttt tccttataga 3961 ttttgataaa ttcgacgcaa gcgtcctcat atctctttct ttgctcgtca tactttcctt 4021 cgtaaagctc gctaagtgtt cttgttggca taattttgtc atcctttcaa agatgtttat 4081 tttttaaaga gcgtgtcaaa tctgctttgg tggaaatata ccgacagtat caacccgatt 4141 gaaacggtgg aagtcagcat cgcagagccg cccgccgaaa taaagggcag gggaattccg 4201 attacggggg taattcccaa aaccataccg atattcaata cgcaatgcgt gaatagatat 4261 gcaaagacgc ccatacaaat atattttccc aaatcatccg ccgcgcgcaa gccattatag 4321 atgattttga gcataataag tcccaaaagt attatcagtc ccaaacagcc gatgaagccc 4381 agcgtctgtc ccaca // LOCUS sequence057 4338 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence057 VERSION sequence057 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4338 /mol_type="genomic DNA" /organism="" /note="sequence057" CDS 1422..1685 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDLTHNVIIENRARMSLSGVTDVENFDENEISLYTSMGDMVIRGK NLHVESVSIESGEMSISGEIKSLVWGDKDRTKKPTLWQKMTR" /locus_tag="LOCUS_3100" /note="MGA_380" CDS 1682..2086 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNGIGTFFGTDYELKLVLLAMLLGATLGSFFDIFRALRRTLKHHP AVVFLEDAFFAIVFGISYYSFSLSLCGGALRGFVLVSMLIGFLVYIYTLGKIICDFFSL TLQALVKIVKKCIRLLCVVQHFTKRKENLS" /locus_tag="LOCUS_3110" /note="MGA_381" CDS 2158..2460 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKGEKKRRSAFFDLVKLAVFTLLLLYSVSEIVSTQAEIAEQKTM IEKLHAEIEETKQENDEYLRILGSENEEEYMLTIAVERLGYAYPRERRFYAKPIG" /locus_tag="LOCUS_3120" /note="MGA_382" CDS 2494..3042 /product="S1 domain-containing RNA-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003703194.1" /transl_table=11 /codon_start=1 /translation="MQLEVGAVLEGKVTGILKFGAFVDLGGGKSGMVHISEVSNTFVND INEVLKVGQVVKVKILTIADDGKISLSIKKAQPAPERPQKDFKKREGDFKPKGGDNFRP QDKDKDAPPRNFNRPAPKKPVKKEPVMDITQAEYAYEPKTTVTDAGFEDMLAKFKSSSE DRMSDLKRTMDVKRRSRRK" /locus_tag="LOCUS_3130" /note="WP_003703194.1 S1 domain-containing RNA-binding protein (Ligilactobacillus) [pid:43.9%, q_cov:98.9%, s_cov:96.8%, Eval:4.1e-30]" /note="MGA_383" CDS 3126..3827 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKLNSTLLIIIVSLMALCLCSCEGEPVAGEDLILAARAEYVSLDS ARVDVINDETGQSEQIFIYKYDEKDMMTYSYIGIGEGLYIAQFNNGYEQFTEENGIIRI ENVGDDGFATYSRDVPYPYADEGLILFYKSAVNNELSYVASNEMATEVCHVYDISKLDG YDTAENMTGFMVKYYFDGDGKLLYLKEITTLTLESGEKKEYSYSIYITERNAIERVDNP IDVSFVEDSIM" /locus_tag="LOCUS_3140" /note="MGA_384" ORIGIN 1 ctcagaaaag tacggcagtg agatcgaatg gatcgaatgt acttacggtt caagattcga 61 tgaccttgca aaccttgttt tggcaggtac atctcccgac ttcaccacct gctccgttaa 121 caccttccct tattattgca ttaagggtat gttccagcct gtaaccgact atctcgatta 181 caccgatccc ctttgggcag gcagtgctga attcgttcag aactacttct ccatgggcgg 241 cgaaccctat atcattttgt gcgacgttaa ggctaccaac gtttgcggat ataaccgccg 301 tgtaattgaa gaatggggct tcgatgatcc cgctgagctt tactataacg acgaatggac 361 ttgggacgta ttctatgata tgtgccttga cttctccgat cccgatgacg acagatatgc 421 tcttgacggt tggtattggc agcaggcatt ggttgactcc accggtacaa ccatcattgc 481 aattgaagac ggccagttcg ttgccaacat tgatgcacct attttggaaa ctgttgaaac 541 cttgctttac gatatcaaca agaacgaagc caacttcccc atctgggcta acggctacaa 601 gccccgtaac gacactgtcg gcggcggtat caaggaaggc cagtgcttgt tctatctcgt 661 agagaagtgg ggcttcaccg acactgttga aactatcagc ggcatctggg gcgacatcac 721 cgcaggcgaa gttatgttct gcccgttgcc cagagcaacc gatggcgacg gtatctatta 781 cctcgcatct cagcctgtag gataccatat catcaccggc gctgaaaacc ccgaagcagt 841 agtattgttc tctatgtgcg aacgcttcaa gatcttggac cccactgttg tatctatcga 901 cagacgtcag cttgaagaag tttatatgtg gacagaagaa atgctcgcaa tggataccat 961 ttgctatgac cttgctgcag ctaacccgat cgttaacttc tctgtaggtt gccagcccaa 1021 cctccagtct gcagttgaca acctcattaa gggtacaacc ggcggcaacc cctccacttg 1081 ggcacagctc aaggaacagt attctgaaag cattgaatac tatgttgaag aactcaatgc 1141 aatgtacgct gaaatggatc agtaatacat agtttttgaa caaaatccct cgctgaaaag 1201 cgggggattt tttatgcctg cgatgaagcg attggtttaa aggtgtcggc tcagccgaca 1261 ttattttgaa tgcgccttcg gcgcataacg ctccggggca cctgccgtcc gcctcgacag 1321 gctcggcaca tcggcagacg cccctccgcg tgccgcggcc actcgcatat tcccgtcatt 1381 tccgccataa acttaaacaa aaaccgaaag gcgggcaaaa aatggacctg acccacaatg 1441 tgataattga aaaccgcgcg cggatgtccc tgtcgggcgt gacggatgtt gaaaacttcg 1501 acgagaacga aatctcatta tatacttcta tgggcgatat ggtcattcga gggaagaacc 1561 tccacgtgga gtcggtcagt atcgaatcgg gcgagatgag catctcgggt gaaataaaat 1621 cgctggtttg gggcgataag gacagaacaa aaaagcccac cctttggcag aagatgacaa 1681 gatgaacgga atcggaacgt ttttcggcac cgattatgag ctgaagctcg tcttgcttgc 1741 aatgcttttg ggcgcgaccc tcggctcatt ttttgatatt ttccgtgcac tgcgccgtac 1801 tctcaagcat caccctgctg tcgtctttct tgaggatgcg tttttcgcga tcgtcttcgg 1861 aattagctat tacagctttt ctttatccct ctgcggcggt gcgcttcgag ggtttgtttt 1921 ggtgtcaatg ctcattggct ttttagtgta tatttatact cttggtaaaa tcatatgtga 1981 ttttttcagt ttgacattgc aagcgcttgt taaaatcgtc aaaaagtgca taaggctttt 2041 gtgcgtggtg caacatttta caaaaagaaa agaaaattta agctaaccga cttgaaaagc 2101 ctaccacttg tgtagtataa tatttatgta tcattatgct caggaggagg tgcgaatatg 2161 gcaaaaggcg aaaagaagcg caggtctgcg ttttttgacc ttgtcaaact ggctgtattc 2221 acacttttgc ttctctattc ggtgagcgaa atcgtttcca cccaggctga aattgccgag 2281 cagaaaacga tgatcgaaaa gctccatgcg gaaattgagg agaccaagca ggaaaatgat 2341 gaatatttgc gtattttagg ttcggagaac gaggaagagt atatgctcac catcgcagtt 2401 gaaagactgg gatacgcata tccgagggaa agacgttttt acgccaagcc catcgggtga 2461 taatgaagtt gaaaagagga aaccaaaaga tttatgcagc ttgaagtagg agcagtttta 2521 gagggaaaag taacaggtat actcaaattc ggtgcgtttg ttgatttggg tggcggcaaa 2581 agcggaatgg ttcacatttc cgaggtttcg aacacctttg tcaacgacat caacgaagtg 2641 ttgaaggtcg gtcaggtcgt taaggttaaa attttgacca ttgctgacga cggtaagatc 2701 agcctttcaa ttaaaaaggc gcagcctgcg cccgaaagac cccagaagga tttcaaaaag 2761 cgcgaaggcg actttaagcc caagggcggc gataatttcc gtccccagga taaagataag 2821 gatgccccgc ccagaaactt taaccgtccc gcgcccaaaa agccggtgaa aaaggaaccc 2881 gtaatggata tcacacaggc ggaatatgcc tatgagccga agacaacggt taccgatgcg 2941 ggctttgagg atatgctggc gaagttcaaa tcctccagcg aggacagaat gagcgacctc 3001 aagcgcacta tggacgttaa gcgccgctca agacgcaagt aatacatata atagatagaa 3061 gaccccaagc tccttgtgag acccatgagg agctttttga tttaaaggat gttgaaagga 3121 aaaccatgaa gcttaactct acactcctta ttataatagt atcccttatg gctttgtgtc 3181 tttgctcctg cgagggcgag cctgttgcgg gtgaggactt gattttggcg gctcgcgccg 3241 aatatgtcag ccttgattcc gcaagggtcg atgtcatcaa cgatgaaacc ggccagtcgg 3301 agcagatatt catttataag tatgacgaga aggatatgat gacatattcc tatatcggca 3361 tcggcgaggg attatatatt gctcagttta acaacggcta tgagcagttc accgaggaaa 3421 acggcatcat ccgaattgag aacgtcggcg acgacggctt tgccacatac agccgcgatg 3481 tgccgtatcc ttatgcggat gagggactta tactatttta taagagcgcg gttaacaacg 3541 agctttcgta tgttgcctca aacgagatgg caaccgaggt ctgccacgtt tatgacattt 3601 caaagcttga cggatatgac actgctgaaa atatgaccgg ctttatggtg aaatactact 3661 tcgacggcga tggcaagctg ctctatttga aggagatcac aactctgacc cttgaatcgg 3721 gggagaaaaa ggaatattcc tattcgatct acatcaccga gcgcaacgcg atcgagcgag 3781 ttgacaaccc gatcgacgtt tcctttgttg aagatagcat aatgtaataa tttttgcaga 3841 ttataaccga tgattttgcc ctcggttata atctgtatat tttgaacaaa aacagcgccc 3901 gaaaacgcaa gaatttctac actaaaatga tgggacaaat ttgcaaaaat gcttgcaatt 3961 gcccatatag cgtgataaaa tataccttgc gtgactgcga agatatgcga tgaagctgaa 4021 ggttgctgac ggtatgtcag gtaatttcgg ccgagtatgt ccgattttaa accgggcgac 4081 tgtaataatg aacacggtat gtgcttttag catcttgcga gcagggattc ctgcggctgt 4141 aagtgcgtag attccatgtg tgttattatg tccaccgaaa aatgaaagtt tttcggtttt 4201 ttatatggga catcgtgaaa cacacggaag cgtgtttaaa aacagagaca gctaccaaat 4261 ctggagcttc cgcccccaac acacacaaac tataggaggc gttttaaaaa tggcagtcaa 4321 tgaaaaaatc agaatcaa // LOCUS sequence058 4305 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence058 VERSION sequence058 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4305 /mol_type="genomic DNA" /organism="" /note="sequence058" CDS complement(506..1072) /product="indolepyruvate oxidoreductase subunit beta" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965300.1" /transl_table=11 /codon_start=1 /translation="MSKNIMIVGVGGQGTLLTSRIIGNLLISEGYDVKVSEVHGMSQRG GSVVTYVKYGDKVSSPIIDKGEADIVLAFEMLEALRALPFVKDGGKLITNTQEIAPMPV IIGATKYPENIADTLSKNTELVAVNAVDMALEAGNIKAVNVVLIGVMAAKTDISYDKWV EALKMTVPPKFLEVNLKAFDLGYNS" /locus_tag="LOCUS_3150" /note="WP_010965300.1 indolepyruvate oxidoreductase subunit beta (Clostridium) [pid:51.4%, q_cov:96.8%, s_cov:95.3%, Eval:2.2e-50]" /note="MGA_386" CDS complement(1077..2813) /product="indolepyruvate ferredoxin oxidoreductase subunit alpha" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965301.1" /transl_table=11 /codon_start=1 /translation="MKKLLIGNAAVARGAYEAGARFCSSYPGTPSTEITEEIVKYNEIY AEWAPNEKVACEAAIGASLGGARAMSCMKHVGLNVMADPVFTVSYMGVNGGLVLCVADD PGMHSSQNEQDSRHYAKASKITMLEPSDSQECKDFTKMAFELSEQFDTPVFVRLSTRVS HSQSLVELCEREEVELKPYEKNIAKNVMMPANAIKRHVVVEERIKALREYAETTPINKI IDNGSKIGVITAGIDYEYSQEALGNEVNYLKLGMLYPLPEKLILDFVKGLDKVYVIEEL DPYIEEHCKALGIEVIGKDELTLLGEYTPAMIKKLVLNIDPPKSASIDSPLPARPPVMC AGCPHRATFYVLKKLGLTVCGDIGCYTLGAVAPLGAVDTVVCMGASIGAAFGMAKVRGE EFNKKLVAVIGDSTFVHSGITGLIDIVYNKGNNTVIILDNSITGMTGHQDNPTTGYTIR GEETKQLNLVALCKAIGVEHITVADPFDLKNFEEVVKRETERDEPSVIIAQRPCALLKT VKYSGHCEINEKCKKCRKCMGLGCPAIRNDDGVISIDATQCNGCGLCIGICPFGAIEKK EG" /locus_tag="LOCUS_3160" /gene="iorA" /EC_number="1.2.7.8" /note="WP_010965301.1 indolepyruvate ferredoxin oxidoreductase subunit alpha (Clostridium) [pid:57.2%, q_cov:99.5%, s_cov:98.6%, Eval:1.8e-191]" /note="MGA_387" misc_feature complement(2826..>4305) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011461744.1:class I adenylate-forming enzyme family protein" /note="WP_011461744.1 class I adenylate-forming enzyme family protein (Desulfitobacterium hafniense) [pid:34.0%, q_cov:97.0%, s_cov:90.7%, Eval:2.3e-70]" /note="MGA_388" /locus_tag="LOCUS_3170" ORIGIN 1 gcattgtcca agcagccgtg acgttttgta tacttacgct tgtaataaaa cggaatatga 61 ccgccgaatg cggttttcca tccatcgaga attccgtcca aatcgcgggt gaacaaaaac 121 gcaggagtgt tttcgggaat cgctttcaaa tacttcggct cggtgatgac ataagcatac 181 aaatcatccg aatcggtata ttctcccaaa tcgttgataa atctgctgat tccgagtgat 241 gcatcatgct tatttgcata gcattcctcg tcgacgagaa cttggaaata tgcgtatttt 301 ccaagctctt caatgaaatt gtcgataccc gtgttgactt cgccgataag tgcaaaaagc 361 atatttccat ctccttttca ctgattttac tgttccggcc acctgttcgg acggcctctg 421 atacaccttc agtagccttc cccttgaggg gaaggtgtcg gcggatgccg acggatgagg 481 tgaaagaaaa cctgttgatt tttacttacg aattataccc caaatcaaat gccttgaggt 541 tgacctccaa gaacttgggc ggaacggtca ttttaagcgc ttcgacccat ttgtcatagc 601 taatgtcggt ctttgccgcc atgacaccga tgagcaccac attaaccgcc ttgatatttc 661 ccgcttcaag tgccatatcg acagcattaa cagctaccag ctcggtgttc tttgaaagtg 721 tatccgcaat gttttcggga tattttgtag caccgataat gacaggcatc ggcgcaattt 781 cctgtgtgtt ggtgataagc ttgccgccat ctttaacaaa aggcaacgca cgcaaagctt 841 caagcatctc aaatgccaaa acaatatccg cctcgccctt gtcaataatt ggggagctta 901 ccttgtcgcc atacttaaca tatgtaacaa cgcttccgcc gcgctggctc ataccgtgaa 961 cctcgctgac cttaacgtcg taaccctcgc tgatcaaaag gtttccgata attctcgagg 1021 tcaaaagtgt gccctgtccg ccgacaccga cgatcataat gttcttagac atccctttag 1081 ccctccttct tttcgattgc accaaacggg caaattccga tgcaaagtcc gcatccgttg 1141 cactgtgttg catcaattga tataactccg tcatcatttc tgattgcggg gcaaccaagg 1201 cccatgcact tacggcactt tttgcacttt tcgttgatct cgcaatgacc cgaatactta 1261 actgttttca gcaacgcgca gggacgctgt gcgatgataa cgctgggctc atcgcgctcg 1321 gtctcgcgct taacaacttc ttcaaagttt ttaaggtcaa acggatcggc aacggtgatg 1381 tgctcaactc cgatagcttt gcaaagagca accaaattga gctgctttgt ttcttctccg 1441 cgaatggtat atcccgtggt cgggttatcc tgatgtcccg tcataccggt aattgagtta 1501 tctaaaatga taacggtgtt gttgcccttg ttgtaaacaa tgtcaataag gcctgtaatg 1561 cccgagtgaa caaatgtgga atctccgata acggcaacga gctttttgtt gaactcctcg 1621 cctctgacct ttgccatacc gaatgccgcg ccgatagatg cacccataca tacaaccgta 1681 tcaactgcgc ccagaggagc aactgcgccg agggtatagc aaccaatgtc gccgcaaacg 1741 gtcaggccca gctttttgag tacatagaat gtcgctctgt gagggcatcc tgcgcacata 1801 acgggaggtc ttgcaggcag gggagagtcg atgctagccg acttcggcgg gtcaatgttc 1861 aaaacaagct tcttgatcat tgcaggggta tattcgccca aaagtgtcag ctcatccttg 1921 ccgatgacct caatgcccaa tgccttgcaa tgctcttcaa tataagggtc aagctcttca 1981 ataacgtaaa ccttatcaag ccccttgaca aagtccaaaa tcagcttttc gggcagggga 2041 taaagcatac cgagctttaa gtagttgacc tcatttccca acgcttcctg agagtattca 2101 taatcgatac ctgcggtgat gacaccgatt ttcgagccgt tgtcaataat cttgtttatc 2161 ggtgtggttt ctgcatattc gcggagtgcc ttgattcgct cttcaacaac aacgtggcgc 2221 ttaattgcgt tcgcaggcat cattacgttc tttgcaatgt tcttttcata tggtttaagc 2281 tcaacttcct cgcgttcgca aagctcaacc aagctctggg aatgggaaac tcttgttgaa 2341 aggcgcacga aaacaggtgt atcaaactgt tccgaaagct cgaatgccat ttttgtgaaa 2401 tccttgcatt cctgggagtc agaaggctca agcatcgtaa ttttggatgc ctttgcatag 2461 tgacgggagt cctgctcgtt ctgcgaggag tgcatacccg ggtcatcggc tacgcacaaa 2521 accaatccgc cgttaacgcc catatagctg acggtaaaca cagggtcagc cataacgttc 2581 aagccaacat gcttcataca gctcattgct ctcgcgccgc caagtgatgc accgattgcc 2641 gcttcgcagg cgaccttttc gttgggtgcc cattcggcat atatctcatt atattttaca 2701 atttcttcgg ttatttccgt cgaaggtgtt cccggatatg acgagcagaa tcttgcgccc 2761 gcttcatatg cgccccttgc aacggcggca ttgccgataa gaagtttctt catttactaa 2821 tctccttaaa gtgtaatttc attctgcatt gcaaccaagc tgtcgccgca gtagatcttt 2881 ctaagcttcg gtttttcaat cttgcctgtc gcgtttctgg gaatgtctgc aaagatgatc 2941 ttcttgggtc gcttatatct gggcaggctc atgcagaaac gctcaagctc gtcttcgctc 3001 agcttataac cttccttgac ctcgacaata gctgcggcaa tttcgcccaa acgcgggtcg 3061 ggaagaccga taacagcaac gtccttgacc ttgaagttct ggcgaatgaa gttctcgatc 3121 tgaacaggat aaaggttttc gccgcctgta ataataacat ccttcttgcg gtcaacaaga 3181 taaatgaagc cgtcctcgtc catttccgcc atatcgcctg tataaagcca accgtcgggg 3241 cttaatgttt cggcagttgc cttttcgtcc ttataataac attccattac gccggggccc 3301 ttaactgcaa gctcaccgac atcgcctttt tgaacctcat tcttgttttc gtcaactatc 3361 ttaacttccc agccatatcc gggaatgccg atcgcgccga ccttgtgaat gttttccata 3421 ccaaggtgaa cacagccggg accgattgat tcgctgaggc cgtagttggt gtcatatgcg 3481 tgattgggga agatctcctt ccaatatttg atcagcgacg gaggaacggg ctgtgcaccg 3541 atatgcatca ggcgccactg tgaaagctca tagtcgtcaa ggttgatttc gcctctgtca 3601 atggcatcca aaatatcctg cgcccacgga accaaaagcc aaacgatagt acacttttcc 3661 tcgcttacgg tcttaattac ccactcgggc ttgacacctt taagcaaaac agccttgccg 3721 ccgacaagga agcttccgaa ccagtgcatc tttgcgcccg tgtgataaag cgggggaatg 3781 caaaggaaaa cgtcgtcctt ggtctgatgg tggtggttct gctcaacctt gcaggaatgc 3841 atcagcgagc ggtgcttatg tataatagcc ttggggaagc ctgttgttcc cgaagagaag 3901 tagattgcgg catagtcgtc atccgaaatc tcaatgctgg gacgctcggt actgtaatat 3961 tgcagcatct tgttatagct ttccgcaaag gtggggcaat cctcaccgac atagtaacag 4021 gttttaactc tgggaaccat atcaatgatt tcttctacac gtccgataaa ttcggggccg 4081 aaaaccaaag cgtcaacatc cgcaagctcc aaacagtaac gaatttcatc tgcagcataa 4141 cggaagttca gcggtaccgc cattgcacct gttttcaaga ttccgaagta tatgggaagc 4201 cattcgatgc agttcattaa aagaattgca accttgtcgc ccttcttaat gccgtgggca 4261 taaagcatat ttgaaaatct gtttgccttt ttgtcaaatt caagc // LOCUS sequence059 4272 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence059 VERSION sequence059 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4272 /mol_type="genomic DNA" /organism="" /note="sequence059" CDS 403..1389 /product="bifunctional oligoribonuclease/PAP phosphatase NrnA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010989747.1" /transl_table=11 /codon_start=1 /translation="MSLEVMNKILDKIKEYDRILLFRHFRPDGDAVGSTKGLQAILRAT YPEKKILLQNCDFASYLEFMGKEDELLADEEYTNALGIVIDCGTADRVSNEKFKLCKEV VKIDHHIDIKPYGNYSWVEEEKSSACEMIVKFYDTFKDELKITKEAATYLYIGMVTDSG RFKFSCVSGDTLRYAAILLDQKIDTDVIFANLYLEEFSNLKFKAYVYENMQMSENGVAY LYVNKEMQDRFGLSQEDASASISYLEAIKGCLCWIVFIATNDGAGTIRVRLRSRFAEIN KIAENFRGGGHACASGATIYNEEEMRALIDEADAHIKNYKETHEGWL" /locus_tag="LOCUS_3180" /note="WP_010989747.1 bifunctional oligoribonuclease/PAP phosphatase NrnA (Listeria monocytogenes) [pid:41.6%, q_cov:92.4%, s_cov:95.8%, Eval:9.4e-61]" /note="MGA_390" CDS 1386..2099 /product="5'/3'-nucleotidase SurE" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004082178.1" /transl_table=11 /codon_start=1 /translation="MRILITNDDSVSSTVLIPLVRWAMKHGDVTVCVPKFEQSAKSHAI ELRHAFEVKKIDLVEGADCYTVDSTPADCVRYAVLGLDKEYDLVISGINKGYNMGQDII YSGTVSAVMEGAYLGIKGVAVSTDVGTFTEAMAKLDEVYYYFKERRLFDLNMVYNVNIP PRAEGILITRQGGAFYTDSFEPIGNDMYQPTGRCVYEDTGDDTIDTNAVMHGHISITPL SLNRTEMTVFEGLKG" /locus_tag="LOCUS_3190" /gene="surE" /EC_number="3.1.3.6" /note="WP_004082178.1 5'/3'-nucleotidase SurE (Thermotoga maritima) [pid:37.2%, q_cov:93.7%, s_cov:92.7%, Eval:1.6e-31]" /note="MGA_391" CDS 2104..2538 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKDTDTKVPAMFGIFFSILSFAFVINAWVLSMTEIATESVHGPGF GSWMISVILALMSTLCYAFDGIISLIKALHKISPRFNIALAVVTLISVPMVLFVGGGLG INILIWNTYHLAIVIMEIISIVMHLKAERCEEESPQLSER" /locus_tag="LOCUS_3200" /note="MGA_392" ORIGIN 1 attgacacca acgagatata tcgaaatctt tatgccgaca gctttgagag caagaagcta 61 agagctcact ttaccctcaa aatcaacctg accggcaagg gagttgcata tatctataca 121 actcttgacg aggttaagga gctcggtgtt gatacattca cgatttcccg cggaatggtc 181 ggaacaatgg cagacaccaa gggtgttgac atttgggcca acttcaccga aacagaaaac 241 ggcattcttt gtgagcttcg ctcatcaaaa tataacatta acccaatcgc tgtgaaatat 301 ggcggcggcg gacacgaaaa ggcaagcggt gcaaccgtaa tgactaagga agaagcattt 361 gcaatgctcg ccgaccttga tgatatgatg gagggaaaat aaatgagcct tgaagtaatg 421 aacaaaattt tagataagat taaggaatat gaccgcattc tccttttcag acattttcgt 481 cccgacggcg atgctgttgg ttcaacaaag ggcttgcagg caattctaag agccacatat 541 cccgaaaaaa aaattctgct tcaaaactgc gactttgcaa gttatttgga atttatgggc 601 aaagaagacg agcttttggc ggatgaagaa tatacaaacg ctttgggcat tgtaatcgac 661 tgcggcacag cggacagagt ttccaacgag aagttcaagc tctgcaaaga agtcgttaaa 721 attgaccacc acattgacat taagccttat ggcaactact cctgggtcga agaggagaag 781 tcttccgcct gcgagatgat cgtcaagttt tacgacacct tcaaggacga gctgaagata 841 actaaagagg cggcgacata tctttacatc ggtatggtca ccgactcggg cagatttaaa 901 tttagctgtg tttcgggaga tactttgcgt tatgcggcaa ttctgctcga tcagaaaatt 961 gacaccgacg ttatttttgc aaatctatat ttggaggaat tctcaaacct caagtttaag 1021 gcatatgttt atgaaaatat gcagatgagc gaaaacggcg tggcgtatct ttatgtcaat 1081 aaggagatgc aggatagatt cgggctcagt caagaggatg caagtgcctc gatctcttat 1141 cttgaagcga ttaaaggctg cctttgctgg atagttttta ttgctacaaa tgacggcgcg 1201 ggcactatca gagttcgttt gcgttcgaga tttgccgaga taaacaagat tgccgaaaac 1261 ttccgcggcg gaggacacgc ttgtgcaagc ggagcgacga tctataatga agaagaaatg 1321 cgcgcgctga ttgatgaagc ggatgcacac attaaaaatt ataaagaaac ccacgagggc 1381 tggctatgag aatacttatt acgaatgacg acagcgtaag ctcgacggtg ttgattccgc 1441 tggtgcgctg ggcaatgaaa cacggcgatg tgaccgtttg tgtgccgaaa tttgaacaga 1501 gcgcgaaaag ccatgcaatt gagcttagac acgcatttga agtgaagaaa attgaccttg 1561 tcgagggcgc agattgctat actgttgatt cgacacctgc cgactgcgta agatatgcgg 1621 tcttgggact tgataaggaa tatgacctgg ttatatctgg aatcaacaag ggatataaca 1681 tgggtcagga cattatatat tcgggtacgg tcagcgctgt tatggagggc gcatacctcg 1741 gaattaaggg cgttgctgta tcgacagatg tcggcacatt cacagaagcg atggcaaagc 1801 tcgacgaggt gtattactac ttcaaagagc gcaggctgtt tgatttgaat atggtttaca 1861 atgtgaatat tcccccgcgg gctgagggaa ttcttatcac ccgtcagggc ggagcgtttt 1921 ataccgacag ctttgagcct atcggcaacg atatgtatca gcccacaggc agatgcgttt 1981 atgaggacac gggcgatgac acgattgaca ccaatgcggt tatgcacggg catatatcca 2041 ttacacctct ttcgctcaac agaaccgaga tgacggtgtt tgagggattg aagggatgaa 2101 gatatgaaag acacagatac caaagtacct gcaatgtttg gaatattctt cagcattctc 2161 agctttgctt ttgtgattaa tgcttgggtt ctttctatga ctgagattgc aaccgaaagc 2221 gtacacggtc caggattcgg ttcttggatg atcagcgtta tacttgcttt gatgagtacg 2281 ttgtgctacg cttttgacgg catcatttcc ttgataaaag cccttcacaa aatcagcccg 2341 agatttaaca ttgccttggc agttgtaaca ttaatcagtg tgccgatggt cttgtttgtc 2401 ggcggaggac ttggaattaa cattctgatt tggaatacct atcaccttgc aatcgttatt 2461 atggagataa tttcaatcgt gatgcattta aaggctgaaa ggtgtgaaga ggagtcccct 2521 cagctctccg agcggtaaaa tagcgcaaaa aacaaacata aaaaaagacc ccacagatgt 2581 gaggtctttt tattatgcgg ttaggtatga attatcccaa ggtgcagccg gcatcgaatt 2641 cgatggtgcc cttgtagttc ttcaaagtac cggtaacggt gatggtgtcg ccaactgcga 2701 gagtagcagc gccttcgccc ttgaggcggt agcactggat tgccttgcct tcaacttcga 2761 tggtaacggt gatgttgccg tactgttcgc tgtattcggt gtcgatagag gtgatagcac 2821 cggtgagggt tgcttcctga ggcaaagatg cgccgtcagc aagtgcatat gcagcttcaa 2881 cgatagcagc gggctcggtg ggcatcacaa agagagtgca accagcgtca aattcgatgg 2941 tgcccttgta attcttcaag gtaccggtaa cggtgataac gtcgccaaca gcgatggtat 3001 cagcgccttc gcccttgagg cggtagcaca taatgggctt gtcttccttg cctgcaacag 3061 cgatggtaac ggtaacgttg ccgtagtcag cgctgtattc ggtatcaaca gaaacgattg 3121 cacaggtaag ggttgcggtg taaggcaagg ttgcgccgtc ttcaagagcg taagcagcat 3181 caacgatctc ccaaggatcg gaaggagctt caacaactac ttcttcagca gcgtcgtcgg 3241 tcttagcctt aacaacgttg tcaagtgtgc agccggcatc gaattcgatg gtgcccttat 3301 agttcttcat gatacctgta acggtgatgc agtcgccgac agcgagctcc ttagcgcctt 3361 cgcccttgag gcggtagcac ataatgagtc tttcgggatc gccgcagtcc atggtaacgg 3421 tgatgttctg gtagtcttcg ctccaagcgg tatcgatctt aacgatagta cctacgagag 3481 tgcagggatc ggtaaatgca aggccgtctt caagtgcata agcagcatca agcaaagcgg 3541 tctggtcctt aacttcgcca tagccaacga ggatgcatcc tgcatcgtat tcgatggtgc 3601 ccttgtagtt cttgaaggta ccttcaacgg tgatagcatc gcctactgcg aggtccttag 3661 cgccttcgcc cttgaggcgg tagcacatga tgggcttgtc ttccttgccg gcaacggcaa 3721 tggtaacggt gatgttctta taatcggcgc tccagggagt gtcgatgttc acgatcttac 3781 cgaacagacg gaaggtgttc tcgttcttct cgccgtctgc cagagcgtaa cccatatcta 3841 cgatctgcgc ataggtcagg ccatctacgt tcaggcctgc gggcagaatg tgattccagg 3901 agtgggtcgc aacattgccg ttctcatcgg tgatggtagc agtcagaacg tagggagtat 3961 ccgcctctgc gccctcgttt acgattacgg taaccaggcc gtcctcggcg acctcgatct 4021 taacgagatc ctcggatacg tcggtggtcc aaacaacggt gtacacggta tcgccaacgg 4081 gaaccttacc aacgcgctgg taatccttgg cggtgttctc agccgctttc ttataagcgg 4141 tctttacgta tgcgatcgca ttgtccaggc cgttttcagc gggctcgact acatcggggg 4201 tatcgttggg aggggtggtt tcgttgcagc ctgcatatac acacacgctc attgccagaa 4261 gcaagaggca ag // LOCUS sequence060 4252 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence060 VERSION sequence060 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4252 /mol_type="genomic DNA" /organism="" /note="sequence060" CDS 181..1512 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKLERIVIVLLSAVFIIVSLAIALGRDRADIPTSVTDDTPVSTMD TTVNDPPATSETTTEEPEITEPSQTEPSQLAETPTEPPASEAEPEPEYPIDATVRICIG GDTSIDGEFADVCYDKGIDYPWRQVSEILNAADLSILNLETCVSDAGVSEKKEGFGFRT PPEMLEGFVDAGIDMVNLANNHVRDFGYDALLATFDNLEAYGIDYFGAGRDLNQAGGLV IKEVNGVKIGFTGCNRVWLTDDCEAAEGHAGVNQVHSLNKPSTQAYLERIREYDSQVDV LICFMHYGTEEVFEVTSYQEDMSRALIDNGVDIFVGGHSHTLQPIEFYKEKLIIYSIGN FIFWHVDDDIDGLSAIFDITVDREGFVSLKLHPVFIKRYRANLVEKGSDRYDQIIALSN TLCNPYGLAFDEDGNMIEYVPPLPEETVATDMTDTIAETEIIPE" /locus_tag="LOCUS_3210" /note="WP_009930706.1 CapA family protein (Listeria monocytogenes) [pid:31.9%, q_cov:69.8%, s_cov:81.2%, Eval:7.1e-36, partial hit]" /note="MGA_395" CDS complement(1634..2491) /product="HAD family hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012027122.1" /transl_table=11 /codon_start=1 /translation="MSVFDTFEKKHDYLICVDSDGCAMDTMKCKHERCFGPCMVKRWEL DEWKDDILYRWDYINLYSMTRGINRFKGLAMALEEIDKQYKKIIGVKTLVEWANNAPKL SNDALLEAVEECDDLDGKQCLYMAYLWSVAVNESIEKLHDSLKVPFVGALEGLREAHEF ADVAVVSSANRDAVEKEWADHGLVDHVDILLTQDCGSKAHCIAEMLKKGYSLDHVLMVG DAPGDLDAADKNGVLCFPILVGAEMTSWADFRRVALENLKNGKYAGEYQADVKEKFYKN LGAR" /locus_tag="LOCUS_3220" /note="WP_012027122.1 HAD family hydrolase (Streptococcus suis) [pid:40.7%, q_cov:95.8%, s_cov:98.5%, Eval:2.9e-52]" /note="MGA_396" misc_feature complement(2504..>4252) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012775581.1:glycoside hydrolase family 3 N-terminal domain-containing protein" /note="WP_012775581.1 glycoside hydrolase family 3 N-terminal domain-containing protein (Streptococcus suis) [pid:42.8%, q_cov:100.0%, s_cov:97.5%, Eval:2.3e-133]" /note="MGA_397" /locus_tag="LOCUS_3230" ORIGIN 1 cgcgcccgca gggcgcgggg acaccgacag caatgctgtc ggtgtggcgg cgcttcgcgc 61 aaacgccacc gaaatcgcaa ccgttcaaac agcaatttcc tgctttgcta tatagacaaa 121 cagctacggt tagtatataa taatagttaa caaagataac tgatgaaacg aggtgctacc 181 ttgaagcttg aacgaatcgt aatagtcctg ctcagcgcag ttttcataat tgtttcgctt 241 gcgattgcct tgggccgcga ccgcgcggac attcccacat ccgttaccga tgacactccc 301 gtgtcaacga tggacacaac cgtaaacgac ccgcccgcca cgagcgaaac caccaccgaa 361 gaaccggaaa ttaccgagcc ttcgcaaact gagccatctc agctcgctga aacacccacc 421 gagccgccgg catctgaggc agagcctgaa cctgagtatc cgattgatgc aactgttcgc 481 atctgcattg gcggtgacac ctcgatcgac ggcgagttcg ccgacgtttg ctatgataag 541 ggcatcgact atccttggcg gcaggtaagt gaaattttga acgctgcaga tctgtcgatc 601 ctcaacctcg aaacctgtgt cagcgatgca ggtgtatccg aaaaaaagga gggcttcggt 661 ttccgtaccc cgcccgaaat gcttgagggc tttgttgatg cgggaattga tatggtcaac 721 cttgcaaata accatgtccg cgacttcggc tatgatgcac ttttggcaac gtttgacaac 781 ctcgaagcat atggtattga ctacttcggc gcaggccgcg accttaatca agcaggcgga 841 cttgtgataa aagaagtcaa cggcgtgaag attggtttta caggctgtaa ccgtgtttgg 901 ctgaccgatg actgtgaggc ggcagaaggt cacgcaggag taaatcaggt acactccctc 961 aacaagccct caacccaggc atatcttgag cgtatccgtg aatatgattc acaggtcgat 1021 gtcctcatct gctttatgca ctatggtacc gaggaagttt ttgaagtcac ctcttatcag 1081 gaggatatgt cccgcgcact tattgataac ggtgttgata tttttgtcgg aggacactcc 1141 cacactctcc aacccatcga gttttataaa gaaaagctga ttatttacag tatcggcaac 1201 ttcatcttct ggcatgttga cgacgatatc gacggacttt cagcgatttt tgatatcact 1261 gttgaccgag agggctttgt gtcgctcaaa ctccaccccg tatttatcaa acgctaccgc 1321 gcaaaccttg ttgaaaaggg gtcagataga tacgaccaga taatcgctct ttcaaacacc 1381 ctttgcaatc cttatggtct cgcattcgac gaggacggca atatgataga gtatgttccg 1441 ccattgcccg aggaaactgt tgcaacagat atgacagaca ccatcgccga aacggagata 1501 attcccgaat agacataaaa acccagccct tacaaaccat cgccgaaggc gatatcgcaa 1561 ttattcacta ttcattaagt cataaaaaac caagcctcgc ttattttcat aagcgaggct 1621 ttttgctgtt aatttatctt gcgccgagat tcttataaaa cttctcctta acgtctgcct 1681 gatattcacc ggcatatttg ccgtttttga gattttcaag tgcaacgcga cggaagtctg 1741 cccagcttgt catctccgcg ccgacgagga tggggaaaca gagcacgccg tttttgtcag 1801 cggcatccaa gtcgccggga gcatcgccaa ccatcagcac atggtcaaga gagtaaccct 1861 ttttgagcat ttctgcgatg caatgcgctt ttgaaccgca atcctgagtc agcaaaatgt 1921 caacgtggtc aacaagtccg tggtctgccc attctttctc aactgcatct ctgtttgcgc 1981 tggatacgac cgcaacgtcc gcaaattcgt gagcctcgcg caagccttca agtgcgccga 2041 caaagggaac cttcagcgaa tcgtgaagct tctcaatact ctcatttact gcaacgctcc 2101 acagatacgc catatataag cactgcttgc cgtcaaggtc atcgcactct tcaactgctt 2161 caagcaaagc atcgtttgaa agcttgggcg cattgtttgc ccattcaacc agcgttttaa 2221 cgccgataat tttcttatac tgcttgtcga tctcctcaag cgccattgca agtcctttga 2281 aacgattgat tcctcttgtc atcgaataga ggttgatgta atcccagcga tagaggatat 2341 catccttcca ctcatcaagc tcccaacgct tcaccataca agggccgaag catctttcgt 2401 gcttacactt cattgtgtcc atagcacagc cgtccgagtc tacgcagata agatagtcgt 2461 gcttcttttc gaaagtatca aatactgaca tattgatttc accttacagt cttgtatccc 2521 aaagtccgca gaagctgtca atagggtcag ttcccttaaa tgcctcgggg cctgtaacaa 2581 gggcatcaac caaagcatca agagtgctgt cggtcgagtc gtaagcgttg atatatgttc 2641 tgagcatagg tacgtcagcg agcattgtgg gcgcatttac gctgatgccg ataacatcct 2701 gctcaaatac ataccacgga atttctccgc cgcccttaga cattccgaag caaggtctgc 2761 cggtcatacc gtcataaagc gagatgataa catcctggcc tgcaacgaat tcggaaatag 2821 cgttcttacc catgaagtat acgttgaggt tgaacttttc gcctgcggcg atctgcttct 2881 taattctgtc aatggggctc tcataaatga aagcatcaaa gccctttgca ataagtctgt 2941 cgcggagctt ttcagcgggg ttttgcttgc ctgcgcccat acccatagca agagctgcaa 3001 gctgcatcat cgggctgtca tatcccttga tgtaaacgat catgactctc tttgtctttt 3061 cggggttgat gggcaatacg ccttcgtcct tatacttaac aagagtcaaa gcatcgcggc 3121 tgattgcatt tgcaacctca gcaccttcgg ggtttctcat acaagcaaga gcagcctcat 3181 cgggaacgag gtcttcctta gccttcttgt taagacccat atgtgccttg aggcccaaga 3241 ttctggtcaa agcttcgacc attctttcct cgctgataac gcctgtcttg taagcatcga 3301 gcattgttgc gaagtcctcg tcggggtcat tgaagaacag gaacatatcg cagcctgcat 3361 tgatagcagc agggagcatt tcctttcttg tcattctgtc ggtcatacca accatatggg 3421 aagcgtcggt aactaccata ccgttgaagc cgagcttttc gcgcaaaagt cctgtcataa 3481 tttcggggca gagggttgcg ggcaaaagct cttcgtcctt aatgtccggc ttaacgtcgc 3541 gcatatagtt tctcatcata atgtgtccgc ccatgattgc atcaaggtcg gcgtcaatga 3601 gagtcttata tacatggccg aatgtttcca tccattcctt ttcgttaagg tcgttaatgt 3661 tgtttgatgt gtgtgcatct ctaaagtcaa gaccgtttcc ggggaagtgc ttagcggcac 3721 aagcgaatcc atcaatggtg tgtgcaccct tgagatattc gcggctcata agtgcaactc 3781 tttcggggtc attaccgaat gcacgggaaa cgacttcggt gttttcccag ttcatatgaa 3841 tatcgcaaac agggctgaat gccatattac agccgattgc agcagcctgt tcgtttgcaa 3901 ttctgccaag gtcattagca tactgcaaat tgcctgttgc accgatcttg atgcccgaag 3961 cgataggtgt gccgtcggcg caagcaccgt tgccgcctgc ttcggtattg caagcgatga 4021 tgagaggaat tttagcatac tcctgcaaaa ttctgttctg atcctgaacc atttttgaag 4081 gcataccgtt atagcggcat ccgccgaggt gatatttctc cataagctcc ttgagataat 4141 cctcgcttac acctgcggtg agctggaaga agagctgtcc gaccttttcc tcgtcggtca 4201 tagaagcgat agtgctttcg acccacttga tatcctcatc gttaagataa ta // LOCUS sequence061 4249 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence061 VERSION sequence061 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4249 /mol_type="genomic DNA" /organism="" /note="sequence061" misc_feature <1..1039 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003433873.1:AI-2E family transporter" /note="WP_003433873.1 AI-2E family transporter (Clostridioides difficile) [pid:41.6%, q_cov:87.5%, s_cov:77.6%, Eval:2.0e-61]" /note="MGA_398" /locus_tag="LOCUS_3240" CDS complement(1078..2763) /product="glycoside hydrolase 43 family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010992104.1" /transl_table=11 /codon_start=1 /translation="MKTNLIFRLLALILCLVTLLSMLAGCGNAPAVNNNGSKVEESKNT NKITLTNPLIWSDIPDPDIIRVGDTYYMVSTTMFYNPGIPIMKSTDLAHWELIGYAYDV LEHNPRTDLYGDNHSYASGTWASCIRYNDGYFYILSFAYDTGKSYIFKTADIENPDWTV YEFDRIFHDPSLLFDDDGRVYVVYGVGDVWITELEPDCSKVKAGGVNQKLFNSGLAEGL SGAEGSHIYKIDGTYYITMISYATNGDCARCELCFRSDNLLKGWEGKVVLCDSMGYYGA GVAQGGIVDTPEGDWYALLFQDHGAVGRVPALQPVTWEKGWPMMGENGDAAANVKVLSD KSEWTESSLMSNDEFDYTENKLSLYWQFNHNPDNKYWSVTERPGYYRITTSEIDTDIFH ASNTLTQRAEGPYSTTEVKLDVSGLNVGDYAGISAFQTWAGVIGVYVDDDGAKKVYFET RHRKNGGEIINEEVIEQDEIYLKIEYKFSEIDEDGKITTQDQARFYYSLDGEKWIKFGK GFTMTYDLDLFTGYRTGLYCYSTVEAGGHADFDYYHIYKGANPN" /locus_tag="LOCUS_3250" /note="WP_010992104.1 glycoside hydrolase 43 family protein (Bacteroides fragilis) [pid:36.4%, q_cov:89.8%, s_cov:93.0%, Eval:3.9e-82]" /note="MGA_399" misc_feature complement(2938..>4249) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_001973414.1:2,3-bisphosphoglycerate-independent phosphoglycerate mutase" /note="WP_001973414.1 2,3-bisphosphoglycerate-independent phosphoglycerate mutase (Leptospira interrogans) [pid:52.0%, q_cov:99.8%, s_cov:81.4%, Eval:2.5e-126]" /note="MGA_400" /locus_tag="LOCUS_3260" ORIGIN 1 attctcaaga gtcattggca ttttctgtgc ctctgttgtt ttaatagcaa tcatcgcact 61 ggtaatctta tcggtaatcc ctgaattgat ttcaagtatc cccgggattt acgatggcat 121 tacaaatgag cttatacccg gaattcaaac atgggtaaat aagctccttg aggataatcc 181 cagcatatca aatattgtca gcaatgagtt gaacgatatt tacaaaggca ttcaatcgct 241 tgtttcgtca attattcctc agttgacaaa tgttttaaca gagattttgg actttgcaaa 301 ctctgttaaa aacttcgttt ttggatttat cctggcaatt tacttcctat ttactaagga 361 aattttgcag gcacaaacca aaaagcttat tgtggcgctg ttcagtgtgc agacatatac 421 aagaatattt gcaattacat caaacaccaa caatgctttg cttaacttct tttatggaaa 481 tataatcgac tccaccatca tcggacttat ctgtgctgta tttatgcttg tgacaaagat 541 gccttacgtg ttgatcattt cgctgattat cggaatcaca aacataatcc ctgtatttgg 601 accgttcatc ggtgcaatcc cttcagcaat acttgtttta attgctgacc ctccaaaaac 661 aatttggttt gtaatattta ttgtcgtgct tcagcaaatt gacggcaaca tcattggtcc 721 taaaattttg ggcgacaaaa tcggtatatc ttccttctgg acactgttct caattttggt 781 attcggttca atgttcggaa ttgttggaat gattatcggt gtaccgatat ttgcagttat 841 catggatatt gtcaagacca ttgttaacag caagctcaga tcaaaggata tgccaaccga 901 cagggattac tattctattc cgggaaagca gatcggttcc ggtggcgcgg cagttcaaat 961 taacggcgtc gtaaaggtaa ttgagggaac ggatgagcaa gacgaaaacc agtttaactt 1021 ttttgagagt gacaaataaa aaaacggccc actgtgaagt gggctgtttt tattatatca 1081 gttgggattt gcgcctttat agatatgata atagtcgaaa tcagcgtggc ctcctgcctc 1141 aacagttgag tagcaatata gacctgtgcg gtaacctgta aaaagatcaa ggtcataggt 1201 cattgtgaat cccttgccga acttgatcca tttttcacca tcgagggaat aatagaatct 1261 cgcctgatcc tgcgtggtga tttttccgtc ttcgtcgatt tcagagaatt tatattcaat 1321 cttgagatat atctcatcct gttcaatgac ttcctcattg atgatttcac cgccgttttt 1381 gcgatgacgt gtttcaaagt ataccttttt ggctccatcg tcatcaacat atacgccgat 1441 cactcctgcc catgtctgga atgctgaaat gcctgcgtag tcaccaacat taagacccga 1501 aacatcaagc tttacctcag ttgttgaata aggaccctcg gcgcgctgag taagggtgtt 1561 tgaagcgtgg aagatatctg tatcgatctc gcttgttgtg attctgtaat agccgggacg 1621 ctcggttaca gaccaatatt tgttgtcggg attgtggtta aactgccaat ataggctgag 1681 cttattctct gtataatcga attcatcatt agacataagc gagctttcgg tccattcgga 1741 tttgtcagat aaaaccttca catttgctgc agcatcgccg ttttcgccca tcattggcca 1801 gcccttttcc caagttacag gctgaagcgc aggaactctg ccaacagcgc catgatcctg 1861 aaacagcaat gcataccaat caccttcggg agtgtcaaca ataccgcctt gagcaacacc 1921 tgcgccgtaa tagcccatag agtcgcacaa aacgaccttt ccttcccaac ccttcaaaag 1981 attatccgag cggaagcaaa gctcacatct tgcgcaatct ccgttggtgg cataggatat 2041 catcgtgata taataagtgc cgtcgatctt atagatatgc gagccctcag caccgctgag 2101 gccctcagcg agtcctgaat tgaatagttt ttgatttacg cctcccgctt taacctttga 2161 gcagtcgggt tcaagctctg tgatccagac atcacccaca ccgtaaacaa catatactct 2221 gccgtcgtca tcaaacaaaa gcgaggggtc atggaagatc cgatcgaatt cataaacagt 2281 ccaatcggga ttttcaatat cggcagtttt aaagatatag ctctttcctg tgtcataagc 2341 aaaggagaga atgtaaaaat atccatcatt atatcggatg caggatgccc aagtgcctga 2401 ggcataagag tggttatcgc catagaggtc ggttctgggg ttgtgttcca aaacatcgta 2461 ggcatagccg ataagctccc aatgtgcaag atctgtcgat ttcattatcg gaatgccggg 2521 gttatagaac atagttgtac ttaccatata gtaagtatcc cctactcgta taatatcagg 2581 gtctggaata tccgaccaga tcaatggatt tgtaagcgtg atcttattgg tgtttttgga 2641 ttcttcgact ttactaccgt tattattaac agcaggagca ttgccgcaac ccgcaagcat 2701 agacaataag gttacaagac aaagaattaa tgctaaaagc cggaaaataa ggttagtttt 2761 cattagcgca cctcttttgc gaaatgttcc aagtttatta taattatata ataacacatc 2821 aatttaaaaa ttgcatctgt tttgagtaaa gatgttacga tatatcaatc atatcaaaat 2881 atatgtaaat aaggcacgca aaaacgcgtg cctaattttt gatttaatgt gaaattatca 2941 gatcatgctg tcttcccagc agtcgggagc ggtaagaccg aagatggttg caacggtagg 3001 tgcaacgttt gcaaggccat attcgccgtc cttaattaca aactcgcgct cggtatcata 3061 aataatgaaa ggtacgcggt tgagagagtg agcagttctt actgcaacat tgcccttctt 3121 gtccttttcg agcatttcat cagcattgcc atggtcagcg gtgataagta cggttgcacc 3181 gacttcatca gcagccttga gcactcttgc aagacccaaa tcaactgctt caacgccaac 3241 gatagtggca tccagattgc ctgtgtggcc aaccatatcg ccgttggggt agttgcaacg 3301 aatgaaatca tactttccac tcttgagagc ggcgataaca tcgtctgtaa cctctgcagc 3361 cttcatccag gggcgttcat caaatgaaac cttgtcggaa ggaatttcgt tgaaggtttc 3421 aagctcttcg ctaaactttt ctgacttgtt gccgttccag aagtaggtta cgtggccata 3481 tttctgggtc tcggaaacag catactgacg caaaccgttt tcaacaagaa gctcggaaag 3541 agtgttcttg atttcagggg gatttacaag gtacttctca ggcaacttga ggtcgccgtc 3601 atactgaagc atacctgcat agataacctt gggcattgct cccctgtcaa atgcagtgaa 3661 gtcagcctgg tcgaatgcca tggacatttc gattgctctg tcgccgcgga agttgaaaag 3721 aactacgcta tcgttatcca cgattttgcc gacaggctcg ccgttcttgg cgattacaaa 3781 tgcagggaga tcctggtcaa ttacatcaag ctctgcgcgg taggtttcaa ttgcttcggt 3841 tgcagtttca aactgtctgc caagaccgtg aacgtgggta tcccagccga gcttgaccat 3901 atcccagtta gcctggtatc tgtccattgt taccttcatt ctgccgccgc ccgaagcgat 3961 taccgcgttg aagttatcat cattcaagga agccatatga gcttcaaggt cgttaacata 4021 tatcaaagca gaggttgcgg gaacgtcacg tccatccaaa agaacatgac atttaacgct 4081 cttaacgccc atttccttag cttttgtaat catctgcttg aggtgggaaa tgttggagtg 4141 tacgttaccg tcggaaagaa ggccgataaa gtggagagat gagccgttgg caacacagtt 4201 gttaacaagc tcgttccaag tgcttgatgc aaacatcttg ccagattcg // LOCUS sequence062 4224 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence062 VERSION sequence062 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4224 /mol_type="genomic DNA" /organism="" /note="sequence062" CDS 1..486 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGDMLTLIEKAQTTFDDKQAEKLADRMSEGKFDFNDLLEQTKQIK KMGSLQSILSMMPGGNQVDPSQIDEKQIPRMEAMILSMTPAEREKPSLINPSRKRRIAA GSGTRVEDVNRLIKQYEQMQKLMKQMGITGSGRNGKGKRKKFGAGLPKDFLKNFEGM" /locus_tag="LOCUS_3270" /note="WP_002293709.1 signal recognition particle protein (Enterococcus) [pid:51.0%, q_cov:93.2%, s_cov:32.0%, Eval:1.2e-37, partial hit]" /note="MGA_401" CDS 565..729 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAVKIRLRRIGAKKAPFYRIVVADSRYPRDGRFIEELGYYDPTTE PTTLQVDAE" /locus_tag="LOCUS_3280" /note="WP_004451027.1 30S ribosomal protein S16 (Clostridium) [pid:75.9%, q_cov:100.0%, s_cov:65.9%, Eval:2.7e-19, partial hit]" /note="internal stop codon at [727:729](+)" /note="MGA_402" CDS 924..1157 /product="KH domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965063.1" /transl_table=11 /codon_start=1 /translation="MKELLKTIVTGLVEDKDAIEITADEPNAEGVVVYHLHVAPSDMGR VIGKQGRIAKAIRVLMRAGAARTNEKIMVEID" /locus_tag="LOCUS_3290" /note="WP_010965063.1 KH domain-containing protein (Clostridium) [pid:48.7%, q_cov:98.7%, s_cov:98.7%, Eval:1.0e-13]" /note="MGA_403" CDS 1425..1928 /product="ribosome maturation factor RimM" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003384687.1" /transl_table=11 /codon_start=1 /translation="MRKYLDIGKIVTTHGIKGEVKIQPWCDSPEVLCEFDTLYNKDGSK SYKISARPHGNMVIAKIKGIDTIEQAQELRNKVLYMDRDDAELPEGTYFVADLLGLEVY DEAGKLYGKLTDVSSAGGANDVYEIKNGDKAYYIPAIPSVVLKTDIEGGKMIIYPMEGL FDED" /locus_tag="LOCUS_3300" /gene="rimM" /note="WP_003384687.1 ribosome maturation factor RimM (Clostridium) [pid:40.1%, q_cov:96.4%, s_cov:97.0%, Eval:7.7e-27]" /note="MGA_404" CDS 1918..2673 /product="tRNA (guanosine(37)-N1)-methyltransferase TrmD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003384686.1" /transl_table=11 /codon_start=1 /translation="MRIDIATLFPDVCESYLSTSIVGRARAKGTFELKCHQIRDWAFDK HHRVDDTPYSERQGMLLMAEPIYRCYLDVAGERKPHVIYMSPKGKTLTQQRARELSQMS DIFILCGHYEGVDQRVLDKIVDEEISIGDYVLTGGELPAMVLVDSVVRMLDGTLSQPDC YEDESHYNGLLEYPQYTRPEVWEGERVPEILLSGHHANIMKWRREKSLEETYLKRPELL EKRELDDVDKSILSAIKARYEDLEEFLKK" /locus_tag="LOCUS_3310" /gene="trmD" /EC_number="2.1.1.228" /note="WP_003384686.1 tRNA (guanosine(37)-N1)-methyltransferase TrmD (Clostridium botulinum) [pid:50.2%, q_cov:93.6%, s_cov:97.1%, Eval:6.7e-63]" /note="MGA_405" CDS 2866..3135 /product="HPr family phosphocarrier protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011391564.1" /transl_table=11 /codon_start=1 /translation="MFVKDVVVKNQVGLHARPATFFIQKANEFKSSIWVEKEERRVNGK SLLGVLSLGIIGGTSIRIIADGADEVAAVSDLVALIEGDFAEEA" /locus_tag="LOCUS_3320" /note="WP_011391564.1 HPr family phosphocarrier protein (Moorella thermoacetica) [pid:40.2%, q_cov:97.8%, s_cov:93.5%, Eval:3.2e-12]" /note="MGA_406" ORIGIN 1 atgggcgata tgctcaccct gatcgaaaag gcgcagacca cgtttgacga taagcaggcg 61 gaaaagcttg ccgatcgaat gagcgaaggc aaatttgact ttaacgacct tttggagcag 121 accaagcaga tcaagaaaat gggctcgctc cagtcgattt tgtcgatgat gccgggcgga 181 aaccaggtcg accccagcca gatagatgaa aagcagattc cccgcatgga agcgatgatt 241 ttgtcgatga ctcctgcgga gcgagaaaag ccatcactca tcaacccatc aagaaaaagg 301 cgaattgccg caggctcggg cacaagggtt gaggatgtca accgcttgat caagcagtat 361 gagcagatgc aaaagctgat gaagcagatg ggcattacag gctcgggcag aaacggcaag 421 ggtaagcgca agaaattcgg cgcaggattg cccaaagact tcctcaaaaa ttttgaggga 481 atgtaaacca aagttgatta acctatagca tatgtcaaaa ggttaatata tattgtgaaa 541 tttcaatttg gaggtgaaac aaacatggca gtaaagatca gactcagaag aatcggcgct 601 aagaaggctc ccttctacag aatcgtagtt gctgattcca gatatcccag agacggtcgt 661 ttcatcgaag agctcggcta ctatgatcct accaccgagc ccactaccct ccaggtagac 721 gctgaatagg ctcagaagtg ggtatccacc ggcgcacagc ccaccgacac cgttaaggct 781 ctcttcaaga agaacggcat cctctaattt ttcaaattat gatccatcct ttcagcaagg 841 cgaccactac aattacccct gccttgctga atataacggg atcaaaatgg ggaaaagctt 901 aactttaagg agtattacaa gctatgaaag agcttttgaa aacaatagta acaggtcttg 961 ttgaggataa ggacgctatt gaaattacag cggacgagcc caacgcagaa ggcgttgtgg 1021 tatatcatct tcacgttgcc ccctctgaca tgggcagagt tatcggcaag cagggcagaa 1081 ttgccaaggc aatcagagtt ttgatgcgtg caggcgctgc aagaaccaac gagaagataa 1141 tggtcgagat cgactaagga ccttttggca gcctgacggg tagtcgggct gtttttattt 1201 gtgatgaata taggggcggg cctatgtgcc cgcccattaa ggcgcattct tcgggcaggc 1261 acataggcct gcccccatac agcaaaatcg caatttatgt tgaatttgct gttattgtct 1321 tttccgcgtt tgcctgcgcg gacctatgtg tccgcgcaaa cagcaacgcc ggcagggcgg 1381 ccacgcaggg ccgcccctaa caatccccca tcggaggtta acaaatgcga aaatatcttg 1441 atatcggaaa aatcgtcacc acccacggaa tcaagggcga ggttaaaatc caaccctggt 1501 gtgactcccc tgaggttctg tgcgagtttg acacattata taataaggac ggctcaaaga 1561 gctataaaat ttccgcgcgc cctcacggca atatggtaat tgcaaaaatc aaaggcattg 1621 acaccattga gcaggcgcag gaattgagaa ataaggtact gtatatggac cgcgacgatg 1681 ccgagttgcc cgagggcaca tattttgtgg ctgatctttt gggccttgag gtatatgacg 1741 aagcgggcaa gctctatggc aagctgaccg atgtcagctc tgcgggcggt gccaacgatg 1801 tatatgagat caaaaacggc gacaaggcat actatatccc tgcgattccc tcggtcgtgc 1861 tgaaaaccga tatcgagggc gggaagatga ttatttatcc catggaggga cttttcgatg 1921 aggattgaca ttgcgaccct tttccccgac gtctgcgaaa gctatctttc gacaagcatt 1981 gtcggcagag caagagcaaa gggcacattc gagcttaaat gccatcagat ccgcgattgg 2041 gcgtttgaca agcaccaccg cgttgatgac accccttaca gcgaacgaca gggaatgctt 2101 ttaatggcgg agccgatcta ccgttgctat ctggatgttg cgggcgagcg caagccccac 2161 gttatctata tgtcccccaa gggcaagaca ctgacccaac agcgcgcccg cgagctttca 2221 caaatgagcg acattttcat tctctgcggg cattacgagg gagtagacca gcgagttttg 2281 gataaaatag tcgatgagga aatttccatc ggcgattatg ttttaacggg cggcgagcta 2341 cctgcaatgg ttttggtcga ttctgttgtg cgtatgcttg acggcaccct ttcccagccc 2401 gattgctatg aggacgagag ccactataac ggccttttgg aatatcccca gtatacccgt 2461 cccgaggttt gggagggcga gcgtgtgccc gaaatattgc tttccggtca ccacgcgaat 2521 ataatgaaat ggcgacggga aaaatctctt gaggaaacat atttaaagcg cccagagctt 2581 ctggaaaagc gggagcttga cgatgtggat aagtcaatct tgtccgcaat taaggcaaga 2641 tatgaggact tggaagaatt tttgaaaaaa taaggtaaaa acccattgtg attttgcaca 2701 agtttgttga ttacatttgg gtagactgtc ggtataaagt agaattttgc ccgaaaagcg 2761 gtgttttggc caatttgtcc gttgacttcc ttcgccaaag ttgatatact gctaacagtt 2821 acgttgggcg ttatgcctta ttgaatgaaa tggagagtat ttaatatgtt cgtaaaagat 2881 gtagttgtta agaatcaggt tggtttgcac gctcgtcccg ctaccttctt catccagaag 2941 gctaacgaat tcaagtccag catctgggtt gaaaaggaag aaagacgtgt aaacggcaag 3001 tcccttttgg gcgttctttc cttgggcatc atcggcggca catccatcag aatcattgct 3061 gacggtgctg acgaagttgc tgctgtaagc gaccttgttg ctcttatcga gggcgacttt 3121 gcagaagaag cttaattttt aggcttttta acaacagata caaaatatag cggtcatacc 3181 ttgcggtgtg gccgcttatt ttgcgtataa caatgggaaa tttgtgctca tatctgcggt 3241 ttccataaca attatgacga aaaaattgga tatttttgac ttgattttta gcacgcttag 3301 taattgtgta taaaaaaaca tcatttgttt tgacttgttt acaatttctt aacactttcc 3361 gctataaaat gtgctacaat ttgtataaat gaggtgcact ctttttgtgt agtattctca 3421 ttcggttaaa ataaccacaa tcaaacagat aattgtgtca aaaattgcga aagcgggatt 3481 taaaaatgtc aaacagatta ttccaaggta taattcatca gatgagtgag accatcggct 3541 gcatgtgcgg tgttatcgac gagaattctc agatagttgc ctgcagcgac ctttcaagac 3601 tcggcaccag acttgacagc atttccttcg acggcgttga ttcctttgag cgctttgtgc 3661 gcgacggtta tgccttaagg cccatcggct caaaatccaa gcccgaatac cttgtattcg 3721 tcgaaggtac cgacgaggtc gcccgcagat atgcggatat gatcggcgtg acattatcca 3781 gccttcagca gttctatgac gaaaaatatg acagaaacaa cttcattaaa aacgttgttc 3841 tcgataacgt tttgcccgga gatatccaga tcaaggccag agagcttcac ttcaattctg 3901 atgtcagccg agttgtgttc ttaatcagaa tcgttgcctc gaacgaagtt tctgcctttg 3961 aagttattca gaatctcttc cccgacaaga acaaggactt tgttttcaac atcaccgagt 4021 cggatatcgt tcttatcaag gaagtcagac ccaacattga gatgcacgac cttgaaaagc 4081 ttgcatattc aatttccgac actctttcaa gtgagttcta taccaaggtc aacatcggta 4141 tcggcaccgt tgtcgacaat atccgcgcac ttgccgtatc cttcaaggaa gctcagatct 4201 cccttgaagt aagcaaggta tttg // LOCUS sequence063 4222 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence063 VERSION sequence063 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4222 /mol_type="genomic DNA" /organism="" /note="sequence063" CDS complement(952..2118) /product="NAD-dependent epimerase/dehydratase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011107232.1" /transl_table=11 /codon_start=1 /translation="MKILVTGARGFVGKNLCAALAAIKDGKRRLDGITVTEIFEYDINS TVDKLDEYCAKADFVFHLAGVNRTDNAADFMAVNGGLTQRLVNALENCGNNCPIMLSSS IQASLDGRFANSEYGKSKLESERIVFNHAEKTGAPAYVYRLANLFGKWCKPDYNSVVAT FCHNIARDLPIRIDNRETELELIYIDDLVDELLRALCGNANKSGEFCAAPTTHKTTVGD LADMIYKFAEYPKTFTIPEIPENSLEKKLYSTYVSYLPSDKVCVPLKMNCDDRGSFTEL IKTANCGQISVNISKPGITKGNHWHDTKWEFFMVVSGIGLIEMRRLDCDEVLRFEVSGE KLEAVYMLPGYTHSITNLSDTDDLITVMWANEQFDPNDPDTYFEKVNE" /locus_tag="LOCUS_3330" /note="WP_011107232.1 NAD-dependent epimerase/dehydratase family protein (Bacteroides thetaiotaomicron) [pid:57.4%, q_cov:100.0%, s_cov:100.0%, Eval:7.3e-135]" /note="MGA_409" CDS complement(2119..3162) /product="polysaccharide biosynthesis protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011107231.1" /transl_table=11 /codon_start=1 /translation="MNNFSGAKLLITGGTGSFGNAVLNRFLETDIGEIRIFSRDEKKQD DMRHEFQAKMPHVANKIKFYIGDVRDIQSVKNAMHGVDYVFHAAALKQVPSCEFFPLEA VKTNVLGTDNVLTAAVEAGVKSVICLSTDKAAYPVNAMGTSKAMMEKVVVAKSRTSGDT KICCTRYGNVLCSRGSVVPLWIDQIKAGNPITVTEPAMTRFVMSLEEAVELVLFAFEKG ESGDILVQKAPACTIETLAKAVCELFEVDCEIKTIGIRHGEKMYETLLTNEECSGAVDL GGFYRVPCDKRSLNYDKYFKDGDTKRNPLTEFNSSNTAQLDVDEVKAKLLELDYIREEL SSWKAGR" /locus_tag="LOCUS_3340" /note="WP_011107231.1 polysaccharide biosynthesis protein (Bacteroides thetaiotaomicron) [pid:76.9%, q_cov:98.3%, s_cov:98.0%, Eval:8.7e-153]" /note="MGA_410" ORIGIN 1 ctcggtcgag gtgcggatgc atatagcggg gaatgactta ccgattgagg tataatagct 61 cgattcctca ggcagagttc cgctgtcaga tacaacagca aaggcgttca tctgcaggca 121 gttatagtca gtaaagccga gaggctcgtg cataattacc cgctcgtcaa gcttgaattc 181 gcttgcatcc aaacgctttt tgcttctggg atggcaggag taaagaatcg gcatatcata 241 ctttttcgcc atttcattga tcgcggtaaa gagtgaaaca aagttctttt cggtgtcgat 301 attttcctca cggtgggcag aaagaaggat atattttccc ttttcaaggc cgaggcgaga 361 gtgaatatcg cttgaaagaa tcttttcaat gtgagcattc agcacttcag ccattggcga 421 tcctgtgaca aaggtgcgct cctccggcaa accgcattcg tcaagatatc ttcttgcgtg 481 ctcggaatat gccatattaa catcggaaat gatatcgacg attcggcggt ttgtttcttc 541 gggcagacat tcgtccttgc aacggttgcc cgcttccata tggaatatcg gaatatgcag 601 acgcttcgca ccaattaccg acagacagga gtttgtgtcg cccaaaacaa gaactgcatc 661 gggctttgtt tttaccataa gctgatagct cttcgcaatt atattgccca ttgtttcgcc 721 aagatcggca ccgacagcat caagatatac ctcgggcgcg tcaagcccca aatcgtcaaa 781 gaaaatgccg ttgaggttat agtcataatt ctgacctgtg tgcgcaagca gggtgtcaaa 841 atatgtgcgg cactttttta tcacctcgga tagcctgatg atttcagggc gcgttccgac 901 gattattaaa agcctaagct tgccgttgtt tttaaaggag ggggtgttca tttattcatt 961 caccttctca aaataagtat cggggtcgtt ggggtcaaac tgttcatttg cccacatgac 1021 cgttattaaa tcatctgtat cgctcaggtt tgtgatgctg tgggtatagc cggggagcat 1081 atataccgcc tcgagctttt caccgctgac ttcaaagcga agcacttcgt cgcagtcaag 1141 tcggcgcatt tcaattagtc ctattcccga cacgaccatg aagaattccc acttggtgtc 1201 atgccagtgg ttgcccttgg tgatgcccgg ctttgaaata ttcacactta tctgtccgca 1261 gtttgcagtt ttaatcaact cggtgaagct tccgcggtca tcacagttca ttttcagcgg 1321 aacgcagacc ttatcgctcg gaagatatga aacataggtc gaatacagct tcttttcgag 1381 ggagttttcg ggaatctcgg gaattgtaaa ggtcttggga tattccgcga atttatatat 1441 catatccgca aggtcgccca ccgtcgtttt gtgggtggtc ggggcggcgc agaactcgcc 1501 cgacttattg gcgttgccgc aaagcgcacg aagaagctcg tccaccagat cgtcgatata 1561 tataagctca agctcggttt cgcggttgtc gattcttatg ggcaggtcgc gggcgatatt 1621 gtggcaaaat gttgcaacaa cgctgttata gtccggcttg caccacttgc cgaaaaggtt 1681 tgcaaggcga taaacatatg caggtgcgcc tgttttttcg gcgtggttaa aaacgattct 1741 ttcgctttca agcttgcttt ttccatattc ggagtttgca aatctgccat caaggcttgc 1801 ctgaatgctg gacgacagca tgatcgggca gttgtttccg caattttcaa gggcgttgac 1861 aagtctttgt gtcagaccgc cgtttacggc cataaaatca gccgcgttat ctgtgcggtt 1921 gactcccgca aggtggaaga caaaatccgc cttggcgcag tattcatcaa gcttgtcaac 1981 agtcgagttt atgtcatatt caaaaatttc ggtgacagta atgccgtcaa gcctgcgctt 2041 gccgtcttta atggcagcca gcgcggcgca taggtttttc ccaacaaatc cgcgggcgcc 2101 tgtaacgaga attttcattt atcttcccgc cttccaagat gaaagctctt cgcggatgta 2161 atcaagctcc agaagctttg ccttgacttc atcaacatca agctgcgcgg tgttggagct 2221 gttgaattcg gttaaaggat tgcgctttgt gtcgccgtcc ttgaaatatt tatcatagtt 2281 aagacttctc ttatcgcagg gtacacggta gaagccgccc aaatcaactg cgcccgagca 2341 ttcctcattg gtcaaaaggg tttcatacat cttttcgccg tggcgaatgc cgatggtttt 2401 aatttcacaa tcaacctcaa acagctcgca aacagcctta gccagcgttt caatggtgca 2461 ggcaggggct ttctgaacaa gaatatctcc gctttcgccc ttttcaaagg caaagagcac 2521 aagctccacc gcctcctcaa ggctcataac aaagcgggtc attgcaggct cggtgacggt 2581 aatggggttg ccagccttta tctggtcgat ccacaggggc acaacagagc cgcggctgca 2641 caaaacattg ccatagcggg tgcaacaaat tttggtatcg cccgaggtgc ggctttttgc 2701 aacaacgacc ttttccatca tcgcctttga ggttcccatt gcattgacag ggtatgccgc 2761 cttgtcggtg gataagcaga tcacgctttt aacgcccgct tcaacagcgg ctgtgagaac 2821 attgtcggtg cccaaaacat tggttttaac tgcttcaagg gggaagaatt cacaggaagg 2881 aacctgcttc agggcggcgg catggaaaac atagtccaca ccgtgcatag cgtttttgac 2941 cgactgaata tcccttacat cgccgatata gaacttgatt ttgtttgcaa cgtggggcat 3001 cttcgcttga aattcatggc gcatatcatc ctgctttttc tcatcacggg agaaaatgcg 3061 gatctcaccg atatccgttt cgagaaagcg gtttaaaacc gcgtttccaa atgaaccggt 3121 accaccggtt atgagcagct tcgctccgga aaaattattc attgcgtttt gcctcccctt 3181 cttaaaagcg ccgaaaagcg gcgttttcgc tcatattgcc gtcaacatgg catacgaata 3241 caattatagt ttattttatc ataattcttc cttctttgca atatccctcg acaaaaaagt 3301 ggttgtttgt cggaaaatgg ttggcggggc ggaggccgtc gtacctccga aggaggtgtg 3361 acggagggga cccgcatccc cgacgctcaa actttacggc cgcttctccc ctttttcgct 3421 tcgcaaatac cgcaaaatag cacgcaaaaa cgacccaccg attgctcggt aggccgtttt 3481 gttttagatt atcagtccaa agggtatctt gcttcgccga agagcgcgtg atacaacaga 3541 tagatcgcat cgttcttgtc gagcgagccg tcgccgttga agtcagcatc ctggttcaaa 3601 ggatatctta cttcgccgaa gagcacgctg tacaagcaat agatagcgtc gttcttgtca 3661 acatcgccgt cgtcgtcgag gtcgccgcga agaacaaatg tgagtcgtcc ctgcttgtcg 3721 aatctataag tatcggcagg caagaggtcg tttgttctta taacttcata cttgccgtcg 3781 gcaaccatta ctccttcgtt gttgaagtaa tagtaatact cgccatcaaa gacaagaccc 3841 atatatgcct tgacaccgtc aacgtaatag tatgtcacac cgtcagcttc ggtgatcttg 3901 ccgttcttcg aggtatcctc atcgtggagg atgacgccga attcgtcgaa gacatagtta 3961 ttggtgggaa gcaacagaac gttggtcttt tcaaccgatg cggtagtgcc cttaacagcc 4021 ttgccggaaa cgaagtaata gtaattaacc tcgccgtcgg gcttgacgat tcttacaagt 4081 ccttcggtat tcttgatctc accgttttca gccatatagg tgtctgcgcc gtgatcataa 4141 agtcccgaat aatcagcagc gaacgcacct gtggtttcat cgaagatgaa cttggcaatg 4201 cgtgtgccgt acttggcggg aa // LOCUS sequence064 4213 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence064 VERSION sequence064 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4213 /mol_type="genomic DNA" /organism="" /note="sequence064" CDS 204..803 /product="HD domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965241.1" /transl_table=11 /codon_start=1 /translation="MDNNLFKQRYIEIFKEHIKRDGADRLLDYLMSEKCDFFTAPASTK FHCAYEGGLCEHSLNVYDCLKSYLESDRVKEKFGLEYSDETIAIVALLHDVCKINTYKV SMRNTKNEKGVWVQVPYYDYNDTLPYGHGEKSVYIVSGFIRLTRDEAMAIRWQMGFSGQ EDQKLIGNALHAYPLALALNIADCEASTFIEERKSN" /locus_tag="LOCUS_3350" /note="WP_010965241.1 HD domain-containing protein (Clostridium) [pid:33.2%, q_cov:89.4%, s_cov:92.1%, Eval:3.4e-15]" /note="MGA_413" CDS complement(848..1750) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKKEFLEIAAQMQNIYSGILYNYRSFEGKRADNVTYNFSCPEYT ELRDKYELVKIAGKGSDFKKAKRLLHYFAPKLTHSSWYDNHVECNALKLLEYSFDNPKQ GINCLNKSKILEECCLALGIYSRRVRIMPFSPYDFDNHVVNEIFDKKLNKWIMLDMTTD GYFVDENKTPLSLLEIREKFALDEFVTFVKSTDRLSNLEKSRDNNVDKNYYICKNLFWF SIGAECKFGEPSKWYDICSAGYSIKDNKIANIKYRINHLPKEYSDWVPQYEERLKNAES AEYTVYDAEIMMRCPLGRR" /locus_tag="LOCUS_3360" /note="WP_010965665.1 hypothetical protein (Clostridium) [pid:42.9%, q_cov:37.3%, s_cov:82.0%, Eval:9.6e-17, partial hit]" /note="MGA_414" CDS complement(1832..3223) /product="asparagine--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011462263.1" /transl_table=11 /codon_start=1 /translation="MSKYLIDEIYKSVKGLCPNDELTEGALVTVEGWIRTNRSNNKIGF ISLNDGSCFSCCQIVYEDEKINNFADISKLLTGCAVKITGKLIITPEAKQPFEINATEA ELLGACDSAYPLQKKRHSLEFLREIPHLRPRTNTFMAVFKIRSVISQSLHEFFRSNGFT YIHTPLITGNDAEGAGETFTVTTREDANYAEDFFGKHACLTVSGQLHVEPFALALGKVY TFGPTFRAENSNTPYHASEFWMIEPEMAFCDLKGDMAVMEAMLKYVIKDVMNTCPDELK FLNDFVDKDHTLIEKLDRVVNSDFKVITYTEAVDYLKNSGEKFEFPVEWGMDFAKEHEI YICEKVAKGPVFLIDFPKDIKAFYMKINPDGKTVAACDLLVPGVGELIGGSQREENYDV LVKKMDDMGMEKESLEWYLDLRKYGGVVHSGFGLGLERLLMYVTGVANIRDVSAYARTP KNLKF" /locus_tag="LOCUS_3370" /gene="asnS" /EC_number="6.1.1.22" /note="WP_011462263.1 asparagine--tRNA ligase (Desulfitobacterium hafniense) [pid:56.0%, q_cov:100.0%, s_cov:100.0%, Eval:1.1e-151]" /note="MGA_415" CDS complement(3347..4042) /product="DNA repair protein RadC" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_133415038.1" /transl_table=11 /codon_start=1 /translation="MKEENLHKGHRARMKKQFLDMGIETFEEHQILELLLFFAIPQHDT NEYAHNLINRFGDLHSVFSARYEDLKTVDGIGDNAATLLKLIPELCVKLNAEKRLGTVL NTAESLVDFFKTQFFGVPDEEIKLACFDDRLKLLDIVLINKGDIGSVRLDARKVFQELL RTNCSQIIISHNHPIGNAQPSPADMLITKTVQDMIKPMDVTLLDHIVVGTDGVHFILAN KFYPHKSKD" /locus_tag="LOCUS_3380" /gene="radC" /note="WP_133415038.1 DNA repair protein RadC (Bradyrhizobium diazoefficiens) [pid:30.5%, q_cov:90.5%, s_cov:88.8%, Eval:1.5e-26]" /note="MGA_416" ORIGIN 1 gataccggtg tcggtgacaa atggcgagat attgctttgt gctaccgaag tcttaagcac 61 aactttgatg gcacatatgg cggaaaggtt tacacggact ttgatgccga tatgctgttt 121 gatgctctgg gaattgagaa aaacgaagaa aaatttcggt attacatcct tttggatgaa 181 ctattttgat atgggaggat actatggata acaatttgtt caagcaaaga tatattgaga 241 ttttcaagga gcatatcaag cgcgacggag ctgacagatt gctcgactat ttgatgagcg 301 agaaatgtga cttcttcaca gctcccgcat cgacaaaatt ccactgtgca tatgaaggcg 361 gactatgcga gcatagcttg aacgtttacg actgcttgaa gtcatatctt gaatcggaca 421 gagttaaaga gaaattcgga cttgaatatt ctgacgagac cattgcgatc gttgcgttgc 481 tgcacgatgt ctgcaagata aatacatata aggtcagcat gagaaatacc aagaacgaaa 541 agggcgtttg ggtgcaggtt ccgtattatg actataacga cactctcccc tacggtcacg 601 gtgaaaagtc agtatatatc gtcagcggat ttattcgttt gacccgtgac gaagcgatgg 661 caattcgctg gcagatgggc ttctcgggtc aggaggacca gaagcttatc ggcaacgctt 721 tgcacgctta tcctttggct ttggcgctta atattgccga ctgcgaagct tcaacattca 781 ttgaggaaag aaaatcaaac tgatataaaa taatcccacc tgtgagggtg ggatttgttt 841 tatgtattta cctgcgtccg agaggacatc tcatcattat ctccgcatcg taaaccgtat 901 actccgctga ttcagcattt tttaaccgtt cttcatactg cggtacccag tcactatatt 961 cttttggaag atggtttatc cgatatttaa tatttgcgat cttattatcc ttgattgaat 1021 aacctgctga acaaatatca taccatttgc tcggctcgcc gaatttgcat tctgctccaa 1081 tgctgaacca aaacagattt ttgcagatat aatagttttt gtcaacatta ttatctcttg 1141 atttttccaa atttgacaga cgatcggtcg atttgacaaa tgtaacgaat tcatcaagcg 1201 caaacttttc gcgaatttca agaagcgata acggtgtttt attctcgtcg acaaaatatc 1261 cgtctgtggt catatccagc attatccact tgtttagctt tttgtcaaaa atctcgttga 1321 caacgtggtt gtcaaaatcg tatggcgaga atggcataat tcgtactctt ctcgagtaaa 1381 ttcccaaggc tagacagcat tcttccaaga tctttgactt attaagacag ttgatcccct 1441 gcttagggtt atcaaagcta tattccaaga gcttcagcgc gttgcactcg acgtggttat 1501 cataccagga gctgtgcgtg agctttggcg caaaataatg gagcaagcgc tttgcttttt 1561 tgaagtcgct gcctttcccc gcaattttca caagctcata tttgtcccga agctctgtat 1621 attcagggca tgaaaaattg tacgtaacat tgtctgctcg ttttccttca aatgaacggt 1681 aattataaag tattccgctg taaatattct gcatttgagc tgctatttca agaaactctt 1741 tcttcttcat tctatctacc tcgttacaaa atcaagtgtt gtttgattat gttttattaa 1801 aaatccccga ccgaagtcag ggattttaat tttagaactt gagattcttt ggggttcttg 1861 catatgcaga tacgtcacgg atatttgcaa cgcctgttac atacataaga agtctttcaa 1921 ggccaaggcc gaaaccggag tgtacaacac cgccgtactt tctaaggtca agataccact 1981 caagggattc cttttccata cccatatcgt ccatcttctt gacgaggaca tcatagtttt 2041 cttcacgctg agaaccgccg ataagttcgc cgacgccggg aaccaaaagg tcgcaagcag 2101 caacagtctt tccgtcgggg tttatcttca tatagaatgc cttgatatcc ttcgggaagt 2161 caatgaggaa tacggggccc tttgcaacct tctcgcaaat gtagatctcg tgttccttag 2221 cgaagtccat gccccactca acggggaatt caaacttctc acctgagttc ttcaaatagt 2281 caacagcttc tgtataggtg ataaccttaa agtcggagtt aacaaccctg tcaagctttt 2341 caatgagagt gtgatccttg tcaacaaagt cgttaaggaa cttgagctca tcgggacagg 2401 tattcataac atccttgatt acgtatttga gcattgcctc cattacagcc atatcgccct 2461 tgaggtcaca gaatgccatt tcgggctcga tcatccagaa ctcggaagcg tggtaaggcg 2521 tgttggagtt ttccgctctg aaggtagggc caaaggtata taccttgccc aaagcaagag 2581 caaaaggctc aacgtggagc tgacccgaaa cagtcagaca agcgtgcttg ccgaagaagt 2641 cctcagcata gtttgcatcc tcgcgtgttg taacggtgaa cgtttcgcct gcgccttcag 2701 catcgttacc tgtgatgaga ggagtatgaa tataggtgaa accgttggag cggaagaatt 2761 cgtggagcga ctggctgatt actgaacgaa ttttaaatac agccataaag gtgttggttc 2821 tggggcgaag atgagggatc tcgcgaagga attcaaggga gtggcgcttc ttctgcaagg 2881 gatatgcaga gtcgcaagca cccaaaagct cagcttcggt ggcattgatc tcaaaaggct 2941 gctttgcctc gggagtgatg ataagcttac ctgtgatctt aacagcacag cctgtcaaaa 3001 gctttgatat atcagcaaaa ttatttatct tttcatcttc atatactatc tggcagcagc 3061 tgaagcagga gccgtcatta agtgaaatga agccgatttt attattggaa cggttggttc 3121 ttatccagcc ttcaacggtg accaaagcac cttcggtgag ttcgtcatta gggcaaaggc 3181 ccttgacact cttatagatt tcgtcaatta aatacttgct catgttttac aatctccttt 3241 aaagagttaa gtattcttta attatattac tgcaaagttg caaagtcaag tttaattgaa 3301 ataatagcta caaaaaggca cccgaaactg agtgccgttg aaattatcaa tctttagatt 3361 tatgaggata gaatttattt gcaaggatga aatgcacacc gtcggttccg acgacaatat 3421 ggtcaagcag agttacatcc ataggcttga tcatatcctg tactgttttt gtgataagca 3481 tatccgcggg cgaaggctgt gcattgccaa ttggatgatt gtgagaaata atgatttgtg 3541 agcaatttgt gcgtaaaagc tcctgaaaca cttttcttgc atctaatctc acagaaccga 3601 tatcaccttt attgatcaat acgatatcca aaagtttgag cctgtcatca aagcaagcaa 3661 gcttgatttc ttcgtcaggc acgccgaaga actgagtttt aaagaagtcg acaaggcttt 3721 cagcggtatt taaaactgtt cccaagcgct tttcggcgtt aagcttcaca catagctcgg 3781 gtatcagttt taagagagtt gcggcgttgt ccccaatacc gtcaacggtc ttaagatctt 3841 cgtatcgtgc agaaaaaaca gagtgaagat cgccaaagcg atttataagg ttgtgagcat 3901 attcattggt gtcatgctga ggaatagcaa aaaacaaaag aagctcaaga atttggtgtt 3961 cttcaaaggt ttcaattccc atatcgagaa actgcttttt cattcttgct ctatgacctt 4021 tgtgaaggtt ctcttctttc attttaaatc acttccctgc cgcttgatat attatatatt 4081 agctgatatt tagatttatg tcaacataat tcgacataga ggctgttttg aaaactaaaa 4141 gataaacaaa taaaggtcgg gagaaatccc gacctttttt ctgcagtaaa ttatttaatt 4201 atttctttgc taa // LOCUS sequence065 4212 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence065 VERSION sequence065 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4212 /mol_type="genomic DNA" /organism="" /note="sequence065" misc_feature <1..695 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003432446.1:glutamine--fructose-6-phosphate transaminase (isomerizing)" /note="WP_003432446.1 glutamine--fructose-6-phosphate transaminase (isomerizing) (Clostridioides difficile) [pid:47.8%, q_cov:100.0%, s_cov:37.7%, Eval:5.0e-51, partial hit]" /note="MGA_417" /locus_tag="LOCUS_3390" CDS 723..1460 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSKSKTYKSKKSGVNIFILLPIILVALIAVILVVNGVQNAKIKNL MGDYTEYAYGERANVKMTHAIGEGYDIWQNEKYVYDVLNGLIYDYAANEADASYVSAGI QNAVTALEDGSTLSNLQYVTYSDANDFSKKYNGVVFTLANSENTTDSADAAAEKIWNII NSIEGMTYTGIEVGMFDRENEYNIFIDAMSGETLTLETIKENITVPEEHSPLYGYWLSG VEAADNAVVENAEGETAENTTEE" /locus_tag="LOCUS_3400" /note="MGA_418" CDS 1577..2584 /product="aspartate--ammonia ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003549578.1" /transl_table=11 /codon_start=1 /translation="MSKLYVPKGYTSSLTAYETQTAIGLIKRSFEINLCQSLNLKRASA PLFVDGHRGLNDDLNGYERPVSFDLLETGENAEVVHSLAKWKRMALKEYGFHIGEGLYT DMNAIRRDEEMDNLHSVYVDQWDWERIITKEDRNLEFLKDIVTKIVSAVCDTQELVSKV YPNVKCRLSREIKFVTTQELEDMYPDLTGKERENEIVKEHKTVFIMQIGDKLRSGNKHD GRAPDYDDWSLNGDIMFWDDTLECAMEISSMGIRVDEKELTDQLKKAECEWRSGLEFHK KLLAGELPLTIGGGIGQSRLCMLLLGKAHIGEVQVSVWDKKTIDGCKEAGIMLL" /locus_tag="LOCUS_3410" /gene="asnA" /EC_number="6.3.1.1" /note="WP_003549578.1 aspartate--ammonia ligase (Lactobacillus acidophilus) [pid:59.7%, q_cov:99.4%, s_cov:99.7%, Eval:1.2e-111]" /note="MGA_419" CDS 2713..4200 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAENIINEEIHLVDLLYPSETKRRECLDRGLAIAKLPQDYVTNLE LEMLSRLICPENSLNALRIFTQLTDDPEVLNYRLDILEDFLNVPSLEAVLYENVHKLYI NEHVNIQKLGLADSFFALNTRLNSLKTYIDCITACHQFCDKNQDKFKSQALKNLVGYFA SVYNSEYFDEVKRETDECLKILAKGVKSVTVGINFDDMMRPVEAMLLSVSTDLIKKKGR FDWIFKHIDQSSSRAIGKTHSLYNENGGTNDLEAPLFRELKEINSEYIAHLDTAIRAYF KKSTEDILTFESQMSFYIGAKKIVEAVRSRGLDMCRPKYLPAEERKFKADGIFDLSFYI QMVGSDPMAKLNDKIIRNECTMDDDGRFYVLTGANNGGKTTYTRAIGIIQVLAQAGIYV PATSCELSPVDFIYTHFPKEEEVGLNSSRFTQECKQFKETLDTATSHSMLLLNESIQST TPTECVYIATELAKIFRCVGVRGVYATHLLELARSLD" /locus_tag="LOCUS_3420" /note="WP_011058073.1 DNA mismatch repair protein MutS (Thermosynechococcus vestitus) [pid:33.8%, q_cov:27.3%, s_cov:15.6%, Eval:9.8e-13, partial hit]" /note="MGA_420" ORIGIN 1 catcaattgc acgtgaagca gatatggtta tctacaccaa tgcaggccct gagatttccg 61 tttgctcaac aaaggcatac actgttcaga cggcgactct ttgcgccttt gcatttaact 121 tggcgtatgt taaaggaaaa atcagccatg ataagctggt aagcctttca acggttctaa 181 tgaaccgact cggcaccgtt attgcagagg tcatctcgga tgagccgatg cttgcggaca 241 ttgccagcga gctttataag caggaggaca ttttcttcat cggtcgcgga ctggacagct 301 tcattgttca ggaagcatcg ctgaaactga aggagatctc ctacatccac tcggaggcgt 361 atgccgccgg cgagcttaag cacggaacta tctcgcttat taccgaggac acccctacct 421 gcgctttggc gactctgccc gagctttacg aaaagacccg ctcgaacatc cgtgagattg 481 aaacaagagg cggtaaggtc tttttgatct gcggtcctga ttatcccaag gaccctgaca 541 ccgcttatga atatcgtctg ccggaaattg acagactatt catgggaatt gcggcatcaa 601 cagcttatca gctgtttgca tatcacgttg cggcactcag aggctgtgac atcgacaagc 661 cgagaaattt ggctaagtcg gtaactgttg aataattatt tatatgaaag aggattttta 721 aaatgagcaa aagcaagact tacaaaagca aaaagagcgg agttaacatt tttattcttc 781 tccctataat tttggtggca cttattgcag ttattcttgt agttaacggt gtacagaacg 841 ctaagatcaa gaatcttatg ggcgactata ctgaatatgc atacggcgaa agagcaaatg 901 ttaagatgac ccacgctatc ggcgaaggat atgacatttg gcagaacgaa aaatatgttt 961 acgatgttct taacggcctt atctatgact atgctgcaaa cgaagcagac gcttcttacg 1021 ttagcgctgg cattcagaat gcagttaccg cgcttgagga cggttctact ttgagcaatc 1081 tccagtatgt aacatattca gatgcaaacg atttctccaa gaaatataac ggcgttgtat 1141 ttacacttgc aaacagcgaa aacaccaccg attcggctga tgccgccgca gagaagatct 1201 ggaacatcat caactcaatt gagggtatga cctataccgg aattgaagtc ggtatgttcg 1261 acagagagaa tgaatataac atctttattg atgctatgag cggtgagacc ttgacccttg 1321 aaacaattaa ggaaaacatc acagttcccg aagaacactc tcctctttac ggctactggc 1381 tttccggtgt tgaagcagca gataatgctg tggttgaaaa tgctgaaggc gaaactgcag 1441 agaatactac ggaagaataa aataattagt ttagcgcagt attgacataa agcattaaaa 1501 cgagtataat ttttaggtaa gcatcgtaaa cttacggtgc ttacctttat tttgacgcag 1561 gaaaggactg acaaagatga gcaagcttta cgtgcctaag ggttatacat caagcctgac 1621 ggcatatgaa acacaaacag caatcggact tattaagagg agctttgaaa ttaatttgtg 1681 tcagtcgctt aatttgaaga gagcttctgc tcccctattc gttgacggac acagaggcct 1741 taatgatgac ctcaacggtt atgaacgccc tgtcagcttt gaccttttgg aaacaggcga 1801 aaatgccgag gtcgttcatt cgctggcaaa gtggaagaga atggcactta aagaatacgg 1861 cttccacatc ggcgagggac tttatacgga tatgaacgcg attcgccgcg acgaagagat 1921 ggataatctg cactcggtat atgttgacca gtgggattgg gagagaatta ttacaaaaga 1981 ggacagaaac ctcgaattcc taaaggatat tgttacaaag atcgtcagcg cggtatgcga 2041 tacgcaggag ctggtttcaa aggtatatcc gaacgttaaa tgccgcctca gccgcgagat 2101 caagtttgta acaacccaag agcttgagga tatgtatccc gatttgacgg gaaaagagcg 2161 tgaaaacgaa attgtcaagg agcataagac cgttttcatc atgcagatcg gcgacaagct 2221 tcgctcggga aataagcacg acggcagagc acccgactat gacgactggt cgctgaacgg 2281 cgatattatg ttctgggatg atactcttga atgcgcgatg gagatctctt caatgggcat 2341 cagagttgat gaaaaggaac tgaccgacca gcttaaaaaa gccgagtgtg agtggcgctc 2401 gggccttgaa ttccacaaga agcttttggc gggcgaattg ccgttaacta tcggtggagg 2461 tattggacag tcgcgccttt gtatgctcct tttgggcaag gctcatatcg gcgaggtgca 2521 ggtttcagtt tgggataaga agactattga tggctgtaaa gaagccggaa ttatgctttt 2581 gtgatattaa ctcaaaaaag attgattatt taaaacattc gcacaaaaaa gtagtgcaaa 2641 aatatgtcct atgatgttat actgacatca taggacattt ttgttcaatg acccaagaaa 2701 ggtaaattaa ttatggcgga aaatatcatc aacgaagaga tccatttggt agacctgctt 2761 tatccctcgg aaactaaaag gcgcgaatgc ttggaccgcg gtctggcaat tgcaaagctt 2821 ccccaggatt atgttacaaa ccttgagctt gaaatgctct cccgtttaat ctgtcccgaa 2881 aattcgctga atgctttaag aattttcaca cagctgacag atgacccgga agttttaaac 2941 taccgtcttg acattttgga ggactttttg aatgttcctt cgcttgaagc tgtgctttat 3001 gaaaatgtac acaagctata tattaacgag cacgttaaca ttcagaagct cggtcttgct 3061 gacagcttct ttgcgctgaa tacaagactc aactccctta aaacatatat cgactgtatt 3121 actgcttgtc atcagttctg cgacaagaac caggataagt ttaagtcgca ggcactcaaa 3181 aacttggtcg gatacttcgc cagtgtttat aattcggaat atttcgatga ggttaagcgc 3241 gaaacagatg aatgcttaaa gattttggca aagggcgtta aaagcgtcac cgtcggcatc 3301 aactttgacg atatgatgcg ccctgttgag gcgatgctcc tttctgtatc cacagatctt 3361 atcaagaaga agggccgttt cgattggata ttcaagcaca ttgatcagag ctcctcaaga 3421 gcgatcggca agacccactc gctttacaat gaaaacggcg gcaccaacga ccttgaggct 3481 cccctcttca gagagcttaa agagatcaac tcggaatata tcgcacacct tgacaccgct 3541 atcagagcat atttcaagaa gtcgaccgaa gatattttga catttgaaag ccagatgagc 3601 ttctatatcg gcgcaaagaa gatcgttgaa gcggttagaa gccgcggact cgatatgtgc 3661 agaccgaaat atttgcctgc tgaagaaaga aagtttaaag cagacggcat tttcgacctt 3721 tccttctata ttcagatggt tggctccgac cccatggcaa aactcaatga caagatcatc 3781 agaaacgaat gcacgatgga tgatgacgga agattttatg ttcttacagg cgctaataac 3841 ggcggtaaga ccacatatac aagagctatc ggcattattc aggttttggc gcaggcgggt 3901 atttatgttc ctgcgacaag ctgtgagctt agccctgttg acttcattta cacccacttc 3961 cccaaggaag aagaggttgg tctgaactcc tccagattca ctcaggaatg caagcagttt 4021 aaggagacct tggacaccgc caccagccac agtatgctcc ttttgaatga gtcgatccag 4081 tccaccactc ccaccgagtg tgtatacatt gcgacagagc ttgcaaagat cttccgctgc 4141 gtgggtgtca gaggtgtata tgccacccac ttactcgagt tggcacgcag tcttgactga 4201 ctcaacgaag ag // LOCUS sequence066 4200 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence066 VERSION sequence066 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4200 /mol_type="genomic DNA" /organism="" /note="sequence066" CDS complement(395..2413) /product="ribonuclease J" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964990.1" /transl_table=11 /codon_start=1 /translation="MANKKLDEKLTVSASKKSKKQPNTESALDAAIAAAISAPKPPKKA ASYSAKNQKPKSAKKSSPKAQEKKNAPKSEPKAEPKKKTPKVQETEPAEPKSAKKSSKK QTQKTPAPEVYVPTNFAKGEKLKIIPLGGLNEIGKNMTLIEFGNDIIIIDCGMTFPDAE MPGVDIVIPDFTYVEKNADRIRGVLLTHGHEDHIGGVPYLLKKLNVPVYGTKLTIGLVN SKLKEHNPGKVTLHTVVPGETVRLGCFTAEFIRVNHSIPDAVAIAVHTPLGNLLHMGDF KVDYTPIEGGIIDLARIAELGKEGILALMSDSTNSERPGFTPSERVVGSTFENLFVKAE GKRIIIATFSSNVHRVQQIINYAARYGRKVAVFGRSMINVIRMGTELGYLKNVGDVLID IDKMKNYTDGEIVLVTTGSQGEPMSALTRMALNDHRQVSITSNDFIIISARPIPGNEKF VGKVVNELLKLGAEVVYEDMYEVHVSGHACQEEQKLILALSQPKFFIPVHGEYKHLSHH AETAISIGIPEHRVIIADIGNIIETDGEVMRINGTVPAGKVLVDGYGVGDVGAVVLRDR KHLAEDGVIVVTLTIDRIARRLLSGPDVVTRGLVYEKESEEFLSKLRELAREVSLSELD TRHDYKAISNKLRDELGDYVFSKTKRRPMVIPVIMDI" /locus_tag="LOCUS_3430" /note="WP_010964990.1 ribonuclease J (Clostridium) [pid:55.3%, q_cov:81.7%, s_cov:99.1%, Eval:2.6e-184]" /note="MGA_422" misc_feature complement(3000..>4200) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012583098.1:ASKHA domain-containing protein" /note="WP_012583098.1 ASKHA domain-containing protein (Dictyoglomus turgidum) [pid:36.2%, q_cov:96.7%, s_cov:70.7%, Eval:4.7e-60, partial hit]" /note="MGA_423" /locus_tag="LOCUS_3440" ORIGIN 1 aggtgaatac cgtatgcgcg gtcttcaccg aaaatatgct cttcaaagct ggcattatac 61 cagatgacct tttcgtcttc atccacaatg acgatcggct cgggatagtc ataaaacgtt 121 tctctgccga cggtgataat gtctttatcc attgtagtga cataacgggt caggttgtag 181 ttgaaaacaa gggtgacaat taaaagaacc aacgcgcaaa gcccgcaaag tcccgaggca 241 attggcacat atttggttaa gtcagcagaa gcaagtgaga gcgcgcaaga tatcagggaa 301 aacacaatca aaagcgcaag cggaattata aatgcgggag cacttcgctt tttcattact 361 tatccgtcct ttcttggctg ttattttaaa aatgtcagat gtccattatt acgggaatga 421 ccatcgggcg gcgcttggtt tttgagaaaa catagtcgcc aagctcatcg cggagcttgt 481 tgctgatggc tttataatcg tgacgggtgt caagctcgct taaagatacc tcgcgggcaa 541 gctcgcggag cttggaaagg aattcctcgc tctctttttc atatacaagt ccgcgggtaa 601 caacatcggg accggaaaga agccgtcttg caattctgtc aattgtgagg gtaacaacga 661 ttacgccgtc ctcagcaaga tgcttgcggt cacgcaaaac aaccgctccg acgtcgccga 721 caccgtaacc atccacaagt accttgcctg cagggacagt gccgttgatg cgcattactt 781 cgccatcggt ttcaattatg ttgccgatat cggcaattat taccctatgc tcgggaatgc 841 cgatgctgat tgcagtttcg gcgtgatggg aaaggtgttt atattcacca tgcacgggaa 901 tgaagaactt gggttgagaa agagccaaaa tcagcttctg ctcctcctgg caggcgtggc 961 cggaaacgtg aacttcatac atatcttcat atacaacctc ggcgcccagc tttaaaagct 1021 cgtttacaac cttgccgaca aacttttcgt tgccgggaat ggggcgtgcg gagattatga 1081 taaagtcgtt agaggtgatg ctaacctgac ggtggtcatt aagcgccata cgggtaagag 1141 cactcatagg ctcgccctga gaacctgtgg tgaccaaaac gatctcgccg tcggtatagt 1201 ttttcatctt atcgatgtca atgagtacgt cgccgacgtt tttaagatat ccaagctcgg 1261 tgcccattcg gattacattt atcatgcttc ttccgaaaac ggcaaccttt ctgccgtaac 1321 gggcggcata gttgattatc tgctgaacgc ggtggacatt tgaggagaag gtcgcaatta 1381 taatgcgctt gccctcagcc ttaacaaaca gattttcaaa tgttgatccg acaactcgct 1441 cactcggtgt aaaaccgggg cgctccgagt tggtggagtc actcataagt gccaaaatgc 1501 cttcttttcc aagctcggca attcgggcaa ggtcaatgat tccgccctcg atgggggtat 1561 aatcgacctt gaagtcgccc atatgcaaaa gattgcccag aggggtatga acagcgattg 1621 ctacggcatc gggaattgaa tgatttactc ttatgaactc agcggtgaag catcccaagc 1681 ggacagtttc tccggggaca acggtatgaa gtgtcacctt gccgggatta tgctccttga 1741 gctttgaatt tacaagacct atggtcagtt tagtgccata tacaggaaca ttcagctttt 1801 tgagaagata aggaacgccg ccgatatggt cctcgtggcc atgggtaaga agaactccgc 1861 gaatgcggtc ggcattcttt tcaacatagg tgaaatcggg aatgacgata tcgacaccgg 1921 gcatttcggc atcggggaag gtcataccgc agtcgataat tatgatatcg ttgccgaact 1981 caatgagggt catatttttg ccgatctcat tgagtccgcc gaggggaatg attttaagct 2041 tttcgccctt tgcaaagttt gtgggaacat aaacctcggg agcgggagtc ttttgggtct 2101 gcttctttga agatttcttt gcagacttag gctctgcagg ctcggtttcc tgtaccttcg 2161 gggttttctt tttaggttct gccttcggtt cggacttagg tgcgttcttt ttctcctgcg 2221 ccttgggcga agacttcttc gcagatttgg gtttttgatt ttttgcggaa tatgaagctg 2281 cctttttcgg gggcttgggt gcagagatcg cagcggcgat agcggcatca agcgcagact 2341 cggtgttggg ctgcttcttg gattttttag atgctgatac ggtcagcttt tcatcaagtt 2401 ttttattagc catgaaatac ctttcttttc tttgaaattg cttagagata tgtatccgac 2461 agtgcccgat atgttgtcgg gatttgtgca ggataaaaca tttatccgca cgggggcaca 2521 ataatccata attaaagata atactatatt actacaaagc aagaataatg tcaagttcgg 2581 agtgttgttc gcaaacgttt ggaattcatc ggtttctgcg aggaaatccg aaacttgagt 2641 ttcggaagat gaattcatag caaccgcaat gataattgcg tttgcttgtg gccaggcaca 2701 aacgtggcct atattgcaaa cttcggcggc cgcttggagc gaggcgtctg cgggcgcgtt 2761 cccgaatggg aacagtgccg caggtgccga gcggagcgga aaagatgcac aaaggttgga 2821 ttcattgcct actttaacct catccttcgg cgtttgctga caccccgcca tcaagggaag 2881 ggctttcacc gcttgttatt gattattcac cgcaaaccca gtttatatcc aatttacggc 2941 gaaatatgat aaaaccgcgc actgccaaag caatgcacgg ttcaaaaaag ttgttaagtt 3001 taaagttctt cgccgaagaa catattgttg acatagctat cgttgaactt ggggtttcca 3061 ccgagattga cgtgccttga aacagaagcg atccgttcaa gctctgcttt ttcgtcttca 3121 ttcaaaagaa ccattgcaca tcctgcgaga gcggcgttgc ccaaaatttc ggttttatcg 3181 gcaagctcgt ttggtatcag tccaatatat gcggcgctct caacgttgag gtgacttccg 3241 aatccacctg caatgtaaag cttattaact tcgctcagtt ttacatcagc ttccgaaagc 3301 attgtttcaa tgcctgcggc gatcgccgcc tttgcaagct gaacagctcg gatatctcga 3361 ggctgaagcg aaacattttc ggcaagacaa agctcatctt ccatagcgcc cgtttcttca 3421 atatctcccc tgttgagtcc gacggcaacg gcatccaaaa ggcccgagcc gcagatgcca 3481 actgcaggag catcagcgat agtgtggatt ttgatgtcat cgccttcaag ccagactttg 3541 tcgatcgctc cgctgatact tcccgttccg caggagattc cggcgccttc aaatgcaggt 3601 cccgcagcag tagaggtgac gtaaaggcga tcgcctttcc acagggccat ttctccgttg 3661 gtgccaatgt cgcaaagaag ggatatttca tccgacttac acattccgct tgcaagcaca 3721 gcacaggtta tatctgcgcc cacaaaggcg ttcatacacg gcggaaggta tgtattgatg 3781 cccaaaatct cggtttgatt tccaaagagt gtgtctgcca aaaacggagc acgggataag 3841 cacaacggcg atctttccgt caaaagatag agcattgtgg tgtttcccgt tattacagcg 3901 cggtctggta cataaggggt actgtcaatc agctctttga tgcagtcatt tatcagcatg 3961 caaagatgct caagtctgcc gttaattgca gagtctattc tgcccataac atcagcggcg 4021 atttccgttt gaggattgag tttcgcgcaa gtggcgatgc atttgccgtc tgtcaagtta 4081 tacagcttta cagcaacggt tgtggtgcca atatcaatcg cggcaccgat cttgccattc 4141 atcggcttca gattgtcgat aatttcgttg aatcccgttt caatctgtct gactgtgccg // LOCUS sequence067 4191 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence067 VERSION sequence067 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4191 /mol_type="genomic DNA" /organism="" /note="sequence067" CDS complement(1001..1867) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MATVNSETLAKINKFTRRELTADEVFCFSVILCDNEIDRDNEKFS VDALNKLAQLYVGKTGIFNHDPKGENQTARIYDTAVIKDETRKTADREVYTYLQAEVYM VKTEKNADLIKEIDGGIKKEVSVGCAVEREICSICGKDRRTNPCNHRKGASYGGKKCFG ILNSPTDAYEWSFVAVPAQRNAGVTKRYGEDYASKGAFPEEVRLEAELYNELTEDLKRE IIRLSYLEGDSVPVALTKAAIERMDISELITLKKALVSEANEAQECEISAALEKKQESE NNKSFKL" /locus_tag="LOCUS_3450" /note="MGA_425" CDS complement(1888..3048) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAIFRKNKDIPVLDSGAVMPARVGDKEIFKISPAMGESERELYGV LREQVPIVDACIGKIIRLVGGFKPVALDPNFQPQLDAFAQNLKVGASGQSLNTFIDCYL DSLLTYGCALAEVVYDKSHRNIAGVYVAPVKKLDIREGKKPFTRDYYVGRGKNAVKIKH AENLLFTALSPTAENPMGVSVLRGLPALSKILLRIYESVGQNFDRVGSVRYAVTYKPSS DGDKAFARERAMQIAREWSSGMQMAKNGEIRDFVAVGDVDIKVIGADNQIIDTEVPVRQ LLEQLISKLGIPPFLLGLSWSTSERMSIQQCDILTSELEYYRRLLEPAIKQLCCSYLRL IGCADGVAIEWDDIDLMDTEALSKARLNNAQARAIELENLKLEQTA" /locus_tag="LOCUS_3460" /note="MGA_426" misc_feature complement(3068..>4191) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011674653.1:PBSX family phage terminase large subunit" /note="WP_011674653.1 PBSX family phage terminase large subunit (Lacticaseibacillus paracasei) [pid:47.1%, q_cov:96.0%, s_cov:86.1%, Eval:5.9e-94]" /note="MGA_427" /locus_tag="LOCUS_3470" ORIGIN 1 gtaagaatat ttacagcttc gggataaacc ttggtaaagc ctgcgctgat gcttacaacg 61 attctgtcga tctgagtgga gatgagctta tcgtggtcaa caatgacgtc ggagccgaga 121 accatttcaa gtgtgctggt ggaatccaaa ccgataaggg tattgtcatc cataccgggg 181 cacttgacca aggtcacgcc gtaaggagtc ttgacgatgt tgccgttaat aacctcggtg 241 tcgttatagt gcatttcttc catcgagaga ataattgcca taactgtggg ggagcagatc 301 attgcgttca tattgtgacc cttgagggat gcccagaaca atgcaaggtc gatgaaggta 361 aggctgtcgc cgatagtatc ggtaatggct gcgttcttct taattgcttc cattgcatcg 421 atattgaggg ttctggaaat atttgcgccg atgctcttaa gaacaactgc aaatacgtca 481 aggcgctgct ttctgagcac ttcataggaa gtgttgatct ctctgccata cttggagatc 541 tcaacaatgt tctcggagta tgcgatttcg gtgttgggga attctgcgcc gacgccgaca 601 gcagctgtgt cttcgtcgtt tacgatggta agtcctctgt aatcaatacc gtcggtatat 661 gtggttgctg caaccaaata aggcaaaatt gaagcctcat ccataccctg cttgatcata 721 cgtctgatga attcggggaa cagaactgca gactgggttg ttttgaagaa cttttcaact 781 ctgtcggaat tcgcgccgct gatcttaatg tcaaagcgct tgagctgacg ctcataagcg 841 tccaagcctt caagctctgt gccgatgtag ttttcatcgt ggtcaagctc tgcaagtgct 901 tctgtgaagg ttttgccgga gatgttgtaa agtccctttt caagtgtaat attatcgtac 961 atatttttta tcctttctgt tataaagtga ttttgattgt ttaaagctta aagcttttgt 1021 tgttttccga ctcctgcttc ttttcaagag ccgctgaaat ttcgcattcc tgcgcttcgt 1081 ttgcctcaga taccaacgcc tttttaagag ttataagctc gcttatgtcc atccgttcaa 1141 tggcagcctt ggtgagcgca acgggcacgc tgtcgccctc aagatatgaa agtcgaataa 1201 tttcgcgctt cagatcctcg gtcagctcat tataaagctc tgcctcaagt ctgacctctt 1261 cggggaatgc tcccttgctt gcataatcct cgccatagcg ctttgtgacg cctgcgtttc 1321 tctgggcagg taccgcaaca aagctccatt cataggcatc tgtggggctg ttcaaaatgc 1381 cgaagcactt ttttccgcca tagcttgcgc ccttgcgatg attgcaaggg tttgtgcgtc 1441 tgtccttgcc gcagattgaa caaatttcac gctcaaccgc acagccgacc gacacttcct 1501 ttttgatgcc gccgtcaatt tccttgatca gatcggcgtt tttctcggtc ttgaccatat 1561 atacctctgc ctgaagatat gtatatacct ccctgtcggc ggtctttctg gtttcgtcct 1621 tgataactgc ggtgtcataa attctcgcag tctgattttc acccttgggg tcgtggttga 1681 aaatgcctgt cttgccaaca taaagctgtg caagcttgtt aagcgcatca accgaaaact 1741 tctcgttatc tctgtcgatc tcgttatcgc aaaggatcac cgagaaacaa aaaacctcat 1801 ctgccgtcaa ttcacggcgg gtgaacttgt ttatctttgc aagtgtttcg ctgttaactg 1861 ttgccaaatt cttacctcct tttgtgttta tgcagtttgc tcgagcttaa ggttttcaag 1921 ctcaattgct cttgcctgtg cgttattaag gcgtgccttg ctcaatgctt cggtatccat 1981 aaggtcgatg tcgtcccatt cgatcgcaac gccgtcggca cagccgatga gtcttaaata 2041 tgaacagcag agctgtttga ttgcaggctc aagcaagcgg cggtaatatt ccagctcgct 2101 ggttaaaatg tcgcactgct gaatgctcat tcgttcgctt gttgaccagc tcaggcccaa 2161 gaggaaaggc ggaatgccca gctttgagat aagctgttcc aaaagctgac gtacaggcac 2221 ctcggtatcg ataatctggt tgtcggcacc gatcaccttg atgtcaacat cgccaacagc 2281 cacgaaatct cttatctcac cgtttttcgc catctgcata ccgcttgacc actcgcgtgc 2341 gatctgcatt gcgcgctcac gggcaaatgc cttgtcgccg tccgatgaag gcttataggt 2401 tacagcatag cgcacacttc ccacgcggtc gaagttctga cccaccgatt cataaattcg 2461 caaaagaatt tttgaaagcg caggcaagcc tctgagcacc gatacaccca tggggttttc 2521 cgctgtggga gaaagtgcgg tgaacaaaag gttttccgcg tgcttgattt taacggcgtt 2581 tttacctctg ccgacataat aatcgcgggt gaagggcttt ttgccctcgc ggatgtcaag 2641 cttcttaacg ggtgccacat atacccccgc gatgtttcga tgggatttgt catatacgac 2701 ctctgccaag gcacagccat aagtcaaaag cgagtcgaga tagcagtcga taaaggtgtt 2761 cagcgactgt cccgatgcac cgactttaag gttttgcgcg aaggcatcca gctgaggctg 2821 gaaattcggg tcgagggcaa caggcttgaa tccgcccaca aggcgaataa ttttgccgat 2881 gcaggcatcg acgatcggca cctgctcgcg caagactccg tatagctcgc gctccgattc 2941 gcccatcgca gggctgattt tgaagatttc cttatcccct actcttgcag gcattacagc 3001 acccgaatcg agaacgggga tatctttgtt tttacgaaat atcgccaata tttcacttcc 3061 tttcgattta gcggctgacc gacagggcga agaagcagtc ttcctttgcc gagccgataa 3121 actcgctgac aaaatagcga atgtcgtcca tcgcgtggtc gttttcttta ataacggtgt 3181 cgttgcccga gcgctcatcc cagcgatata gcgagaactc gcggatagcg tccttacatt 3241 cgggtgagaa ttttatcttt cccgatttaa gggcatcgct tacccgacgg atgcccgaga 3301 tgacatcgtt ttttgcaggc aaaaccttga atttaccgtg ccgacggata cattcgatga 3361 agctggctgc cgacggatcg cagacaacag cttcgggttt aaggttttcg caaagctctt 3421 ccaaagcctt gtaatgctcc tcatcggtgc gaagtgtccc ctcacgcttt gaggaaaaat 3481 aatattcgcg aaggcgatac cacacgccgt caaggtatcc ccacagaccg aaggatgcgg 3541 ggttgacggt gccgtagtcg caactaacgg catagcgggt gcagcattgc ggtgcaggga 3601 caacgtgggt cgcttctgaa aacatcgggt ataccgcacc gctgacagcg caccatttgc 3661 ccaaaacgta gcgctcataa aacgcaccgc tgtataggct ttcataacgt tttaataccc 3721 tttgggaaag gctggggttg tcgctcatat caaagtggat atacagcgca tttttttgct 3781 tcgccttttt gatccattcg gtataaaacc agtgtgcggg gttgtcgggg ttgcagttga 3841 accagagctt tgagccttca agagagcacc ttgctattgc ctgctcaaca aaggagcggg 3901 gcattaacac gacttcatca agcaaaactc cgcccagggt cataccctga atcagcgagg 3961 cacttgattc gtccttgccg ccgaaaatat aaaaccgatt ggtgactccg cgaaaggaaa 4021 catcgaagtg gttgcgggat gctttttcgc gtacatcgaa gccaagcgtt ttaaggtcgg 4081 caacaaggcg atcggtaaga ttgcgccgcg cagaggttaa ggtctttccg caaattgcaa 4141 agtcggtatt tctaaaactt cgcatcgccc acgccgcaaa ggaaaggctc a // LOCUS sequence068 4145 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence068 VERSION sequence068 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4145 /mol_type="genomic DNA" /organism="" /note="sequence068" CDS 31..156 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTRGDEQNALADTAYTRNFLLPAHVNRAIIIKDTIAKDKSP" /locus_tag="LOCUS_3480" /note="MGA_428" CDS 153..674 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTLKEILTLHAKTYPEMTPTDAVKLIYQNEFCPGHLIRNRDRAFE YLKAEYDCTDSTADCLIEHIGNGIVRVYLSEFKARGLDLNVLFDAFCESAEEVKGNVES LKEKLEILKELAEENIFKFSVSELCDYLCAYEAAGYPMVSHSEVYKEHYHPSYRIVTEN LFNTYFKEEE" /locus_tag="LOCUS_3490" /note="MGA_429" CDS 676..2175 /product="carboxypeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004398513.1" /transl_table=11 /codon_start=1 /translation="MELSTAIQNLKDLQIKMYAFNAASSALYLDGVTVAPKETSEGRGV ALGILAGESHKLFANEEVGALLKFLGENKAELDRETVRQVELLQRSYDQLSKIPAEEYM EFAQLTNDADDVWHKAKKTSNFDLFRPYLEKIVAFNIKFAGYYDPNKKPYDALLNEFER GVDMEYLDGFFADVRENLVPIIKKINEGEQIDDSFLHKHYPIEIQRKFSDWLMEIMGMD RNHSTIGETEHPFTLNFNSQDVRITTNYKEDNLVDSMYSVIHEGGHALYELGVNPEYDY NCLAGGASMGVHESQSRFYENIIGRSEAFAKAIFPKVKEFFPEQLEGVDADMFYRAINK AQPSLIRTEADELTYAFHVMVRYEIEKQLIGGTLEVKDVPAEWNRLYKEYLGVDVPDDK RVCLQDSHWAGGSFGYFPSYALGSAYGAQMLAQMEKDFDVWGAVEKCDLSPVTAWLKDK VHKYGCLLEPSEIVENACGGKFDPSYYTEYLKNKFTRLYNL" /locus_tag="LOCUS_3500" /gene="ypwA" /EC_number="3.4.17.19" /note="WP_004398513.1 carboxypeptidase (Bacillus) [pid:39.5%, q_cov:100.0%, s_cov:100.0%, Eval:9.5e-109]" /note="MGA_430" CDS 2189..3067 /product="carbon-nitrogen hydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002679543.1" /transl_table=11 /codon_start=1 /translation="MTDLKIALLQIMPAGSQEANLAKGISACREAKKMGAHIALFPEMW NTGYDIPQNATVLEAMAISHDSEFINAFADLARELDMAIGITFLESHSPRPRNSLCLFD RKGNLALHYAKVHTCDFGDECMLDGGGDFYVCDLDVGDDTVKVGAMICYDREFPESVRI LMLKGAEIILVPNACPMEINRLSQLRGRAYENMLGIATCNYPSPKPDCNGHSSAYDGIA YREDVVGSCDTEILLAPETEGIYIADFALDDIRDYRNREVHGNAYRRPQMYNKLIDEEI LPPFVRHDRKK" /locus_tag="LOCUS_3510" /note="WP_002679543.1 carbon-nitrogen hydrolase family protein (Treponema denticola) [pid:63.0%, q_cov:100.0%, s_cov:99.0%, Eval:2.5e-102]" /note="MGA_431" ORIGIN 1 ccgaaaggtg aacgatggag gggacccgca atgacgcggg gcgatgagca aaacgcctta 61 gctgacaccg catatactcg caatttcctg ttgcccgcgc acgtaaaccg tgctataatt 121 ataaaagaca ctatcgcaaa ggacaaatcg ccatgaccct caaagaaatt ctcactcttc 181 acgcaaaaac ataccccgaa atgactccaa ccgatgccgt caagctcatt tatcaaaacg 241 agttctgtcc ggggcacctc attcgcaacc gagatcgagc ttttgaatat ctcaaagcgg 301 aatatgactg cacagattca actgccgatt gcctgattga acacattgga aacggaattg 361 ttcgtgtgta tctttcagaa tttaaagctc gcggacttga tttgaacgtt ctgttcgatg 421 ctttttgcga gtctgccgaa gaggtaaaag gaaatgtcga gtcgctcaaa gaaaagcttg 481 aaattttaaa agagcttgcc gaagaaaaca ttttcaaatt ctcggtttcg gagctttgcg 541 attatctttg tgcatatgaa gccgcgggat acccgatggt atcgcacagc gaagtatata 601 aagagcacta tcacccgtct tacagaatcg taaccgaaaa tcttttcaat acatatttca 661 aggaggaaga ataatatgga attatcaacc gcaattcaaa atttgaagga cttgcagata 721 aaaatgtatg cctttaacgc cgcatcaagt gcgctttatc ttgacggcgt gaccgtcgca 781 cccaaggaaa caagcgaggg cagaggtgtt gcgctcggaa ttttggcagg cgaatcccac 841 aagctttttg caaacgaaga ggtgggagca cttttgaaat tccttggcga aaacaaggcc 901 gagcttgacc gcgagaccgt ccgccaggtt gagcttttac agcgctcata tgaccagctt 961 tcaaagattc ctgcagagga atatatggaa tttgctcagc taacaaacga tgccgatgat 1021 gtttggcata aagccaagaa aacaagcaat tttgatcttt tcagacccta tcttgaaaag 1081 atcgttgcgt tcaacatcaa gtttgcagga tattacgatc caaacaagaa accatatgac 1141 gctttgctca acgagtttga gcgcggtgtg gatatggaat atctcgatgg tttctttgcg 1201 gatgtgagag aaaatctcgt tcccatcatc aaaaaaatca acgaaggtga gcagatcgac 1261 gacagcttcc ttcacaaaca ctaccctatt gaaattcagc gcaaattctc cgactggctg 1321 atggaaatta tgggtatgga cagaaaccac tccaccattg gtgagaccga gcaccccttc 1381 actctcaact tcaactcgca ggatgtaaga attaccacca actacaagga agacaatctc 1441 gttgattcga tgtattccgt tattcacgag ggcggccacg ctttgtatga gctgggtgta 1501 aatcccgaat atgactataa ctgccttgcg ggcggcgcat ccatgggtgt tcacgaaagc 1561 caatcgagat tctatgaaaa catcatcggc agaagcgaag cttttgcaaa ggcgatcttc 1621 cccaaggtca aggaattctt ccccgaacag cttgaggggg ttgatgcgga tatgttctat 1681 cgcgcaataa acaaggcaca gccctcgctc ataagaacgg aagccgacga actcacctat 1741 gctttccacg ttatggtgcg atatgaaatc gaaaagcagc tcattggcgg cacccttgaa 1801 gttaaggatg tccccgcaga gtggaaccgc ctttataagg aatatttggg cgttgatgtt 1861 cccgacgaca agcgcgtatg cttgcaggac agccactggg cgggcggctc attcggatac 1921 ttcccctcat acgctttggg ctcagcctac ggcgcgcaga tgctggcgca aatggaaaaa 1981 gatttcgatg tttggggcgc tgttgaaaag tgcgacctct ctcctgtcac cgcttggctg 2041 aaggataagg tgcataaata cggttgcttg cttgaaccct cagaaattgt tgaaaatgcc 2101 tgcggcggaa agtttgaccc aagctactat accgagtatc tgaagaataa gtttaccaga 2161 ctttataatc tttaattgga gttacaaaat gaccgatcta aaaatcgccc tcctgcagat 2221 aatgcccgca ggctcgcagg aagctaacct tgccaaggga ataagtgcct gccgtgaggc 2281 aaagaaaatg ggggcgcata tcgccttgtt ccccgaaatg tggaatacag gatatgacat 2341 tccgcagaat gcaaccgtgc ttgaagcgat ggcaatttcg catgatagcg agtttataaa 2401 cgcatttgcc gacttggcgc gggagcttga tatggcgatt ggcattacat ttttggagag 2461 ccactcccct cgcccgcgca actcactctg tttgtttgac cgcaagggca acctcgcatt 2521 gcattacgca aaggtgcata cctgcgactt tggggatgaa tgtatgcttg atgggggcgg 2581 tgatttttac gtttgcgatc tggatgtggg tgacgacaca gttaaggtcg gcgcgatgat 2641 atgctatgac cgcgaattcc ctgaaagcgt gagaattttg atgcttaaag gagcggaaat 2701 aattttggta cctaatgcct gcccgatgga gattaaccgt ctttcgcagc ttcggggcag 2761 agcatatgaa aatatgctgg gtattgcgac ctgcaattac ccctccccca agcccgattg 2821 caacggacat tcatcagcat atgacggcat tgcatatcgc gaggacgttg tcggctcctg 2881 cgatacggag atacttttgg cacccgaaac cgagggtatt tatattgccg attttgcgct 2941 tgacgatatc agagattacc gcaaccgtga ggtacacgga aatgcatacc gcaggccgca 3001 aatgtataat aaactgatcg acgaggaaat attgcctccg tttgtaaggc atgaccgcaa 3061 gaaatagagc gattaacact atcggcatac agccgatagt gttattttta acaaaaaact 3121 ccgcgatgaa agacaatatt tctaaaagaa atatctgcaa acatattgaa atatgaaatg 3181 gggcatgata taattaactg taatttggct tttgccgttg caattccatt ttttaaaaag 3241 aggtaatcag catgaacaat catgagcgca gagtaggtac ggtttcacgc ggaatccgct 3301 gtcctatcat tcgtcagggc gatgaccttg cagagcttgt aaccgtcagt gtattggaag 3361 ctgcataata tgaaggattt gaacttcgtg acagagatgt tatctctctt accgagtcta 3421 tcgttgcacg tgcacagggc aactatgctt ctgttaatga tattgccgag gacattaagg 3481 ctaaggttgg cgcagacact gtcggcgtta tcttccccat tctttcaaga aaccgcttcg 3541 caatttgcct taaaggtatt gcaatgggcg ttaagaaagt tgtattgatg ctttcttacc 3601 cttctgacga agttggcaac gagcttgtaa gcttggataa gatcgacgaa gcaggcgtta 3661 acccctatag cgatattctg actcttgaaa gataccgcga actgtttggc ttcaataagc 3721 acgagttaac aggcgttgac tatgttgatt actattccga tataattaag gaagcaggcg 3781 ctgaggttga ggttatcttt gcaaaccagc ccagagcaat tcttaactat accaagaacg 3841 tcatcacctg cgatattcac acaagagcaa gaaccaagag aatccttaag gctgcaggag 3901 ctgagatcgt tttgggactt gacgatattc ttaacgctcc cgttaatggc agcggatgca 3961 acgaagctta cggtctttta ggctcgaaca aatccaccga ggatcagatc aagctcttcc 4021 ccagagaatg cacacagctt gttttggata ttcagcagaa ggttttggaa aaaacgggca 4081 agcacgttga agttatggta tacggcgacg gcgcatttaa ggatcccaag ggcaagatct 4141 gggag // LOCUS sequence069 4116 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence069 VERSION sequence069 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4116 /mol_type="genomic DNA" /organism="" /note="sequence069" CDS complement(198..1757) /product="polysaccharide biosynthesis tyrosine autokinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011068360.1" /transl_table=11 /codon_start=1 /translation="MNENITERKEDIEVDLQRLVKALWKKLWVIVFSCIFGAVIALLVS TLLITPLYQSSAMFYVNNGSLSVGDAALSLTTGDISAAKNLVDSYIVILNTRTSLNDVI DYAEVDRTYEEVREMISAAAVNSTEIFEVVVTSSDAEEAEKIASAIAYILPKRISGIIE GTSAEVVDSAIIASKPSFPNHLTNTVIGFVLGMVLSAAIIVLKEVSNITIRNEEDVASV CKHPILAAVPDMTAHSKGGYYYYSHDKQKQKIQRPGVANQPVLIGRDISFAASEAYKLL RTKLQFSFADDSNSHVIGLSSALSGEGKSLTAVNLAYTLSQLNKKVVLIDCDMRRPTLA EKLEIQKKPGLSEFLSGQSKGELTCQKCGIKNDEDAFDVIAAGQNPPNPVELLSSARME KVVNRLRDIYDYVILDLPPVEEVSDALAVAKMTDGMLLVVRQNYCNRPALSDTSHQFEF INARVLGIVFNGTSESDGKYGKKYYKKYGKYGKYYGRYESSYEAAAKKAEPVNKSTESK DE" /locus_tag="LOCUS_3520" /note="WP_011068360.1 polysaccharide biosynthesis tyrosine autokinase (Bifidobacterium longum) [pid:26.4%, q_cov:85.0%, s_cov:88.3%, Eval:8.7e-36]" /note="MGA_434" CDS complement(1918..3840) /product="nucleoside-diphosphate sugar epimerase/dehydratase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009897930.1" /transl_table=11 /codon_start=1 /translation="MKFIDIMDKILDGNYRHRLVLVLFDLICFIAVDIFYYFVAANVAN SMPVEEKEVFLINSLAQVVFVFAFRFALGIYNTVWRYSNNRAYFSLVVADALGSMAGLI IIRFADLFFDGVYYGVWHASTVGALTALITLMSRFTYSLAYKARSKSKVVKSKIPVVIV GAGRLGSYLAGDLRNNPKSQFEPQFFIDKNPTKVGNRVSALKVYSPEDGVELIEKLGIR EVIIAIVNRDGEDLSKLYYEYHNLGCNVRVYDSLVSGNEVKKGVLREFSIEDLLFRNTV DVSDERELEFYSGKTVLVTGGGGSIGSEICRQIAKCHPKKLVVLDIYENNAYDIQQELI RKYGDRLDFAVEIGSVRDYDRLDEIFNTYRPDVVFHAAAHKHVPLMESCGAEAIKNNCI GTYNTANAAEKYGAEKFILISTDKAVNPTNIMGATKRICEMIVQCRADSKTSFAAVRFG NVLGSNGSVIPLFKRQIAEGGPVTITDKRIIRYFMTITEASQLVILAGAMAKKGELFVL NMGKPVKIYDLAVNMIKLSGLEPDKDIKIEEIGLRPGEKLYEELLMKTEVLDKTENNMI FIERDASYTREEVDKKLEMLIGALGDNNRIKEAVAAAVPTYRAPDEINKDAEKSEEMKL AETTI" /locus_tag="LOCUS_3530" /note="WP_009897930.1 nucleoside-diphosphate sugar epimerase/dehydratase (Clostridioides difficile) [pid:44.0%, q_cov:95.3%, s_cov:95.1%, Eval:2.3e-129]" /note="MGA_435" ORIGIN 1 attcaaggcg ttcctgcgcc attttgcggc gttccaggaa tgcctcgggc gaatcgtgat 61 tcgcgtaaaa atgaggggtc gcaaccaccg tttcaatccc ctgctccgct tcaagccgaa 121 gcattccgat tgactcttta agcgaagagc ttccgtcgtc aattttgggg agaacgtggg 181 tgtgaaaatc aatgatctta ctcatctttg ctttccgtcg atttattaac gggttcggct 241 ttctttgcgg cggcttcata gctgctttca tatctgccgt aatacttgcc gtacttacca 301 tactttttgt aatacttctt gccgtatttg ccatcgctct cggaggtgcc gttgaagacg 361 atacccaaaa cgcgggcgtt gataaattcg aactgatgcg aagtgtccga aagagcggga 421 cggttgcaat agttctgtct gacgacaaga agcattccgt cggtcatctt tgcaactgcc 481 aaagcatcgc ttacttcctc aacaggagga aggtccagaa ttacgtagtc atatatatca 541 cgcaggcgat taacgacctt ttccattctc gcagagctta aaagttcaac agggttggga 601 ggattctgtc ccgcggcgat gacatcgaat gcgtcctcat cgtttttgat tccgcatttc 661 tggcaggtca gctcgccctt gctctgtccc gaaaggaatt cagaaagtcc gggctttttc 721 tggatctcaa gcttttcggc aagagtgggt cggcgcatat cgcagtcgat aagtacgacc 781 ttcttgttga gctgagaaag ggtgtaggca aggttaacag cggtcagcga tttgccttcg 841 cccgaaagag cactcgataa accaattacg tggctgttgc tgtcatcggc aaaggagaac 901 tgaagcttcg ttcttaaaag cttatatgct tcagatgcgg caaagctgat atccctgccg 961 atcaaaacag gctggttcgc aacgccgggg cgctggatct tttgcttctg tttgtcgtgg 1021 ctatagtaat aatatccgcc cttgctgtgc gcggtcatat cgggtacagc ggcaagaatc 1081 ggatgcttgc aaacggacgc aacatcttct tcgttgcgga tggtgatgtt ggatacttcc 1141 ttgaggacga ttatcgcggc gctcagcacc atgccgagaa caaaaccgat gacagtattg 1201 gtcaagtggt tggggaagct gggctttgaa gcgattattg cagaatcgac gacctcggca 1261 gaggtgcctt caataatgcc ggaaattcgc ttgggaagta tgtatgcaat tgcgctggcg 1321 atcttttcag cctcttcagc atcggagctg gtgacaacga cctcgaaaat ttccgttgaa 1381 ttaacagcgg cagcagagat catttcgcgg acttcttcat atgttcggtc cacttcagcg 1441 taatcaataa catcgtttaa ggatgttctg gtgtttaaga ttacgatata ggagtcgacc 1501 aagttcttag cggcggaaat gtcgccggtt gtcaggctca gggcggcatc acctaccgag 1561 agcgaaccgt tgttgacata aaacatcgca gaggactggt ataagggtgt gatcaacagg 1621 gtcgatacca aaagcgcaat caccgcaccg aagatgcagg agaagacgat cacccaaagc 1681 tttttccaaa gcgctttgac cagcctttgt agatcaactt cgatatcttc tttacgttct 1741 gttatatttt cattcatttg tgtaaacctc cgaaagggct gtgccaaacg gcacaatccc 1801 taattaaagt ataacacgag gattttcgta tgtcaataca gttaaacaaa cttgtgttgc 1861 caaacagtta gaaaaatgag cgatttaagg ttttttcatt gtgcaatcga acgataatta 1921 aatcgttgtt tcggcaagct tcatttcttc cgatttttcg gcatccttgt taatctcatc 1981 gggtgcgcgg tatgtgggta ccgctgccgc aacagcctct ttaattcggt tgttgtcacc 2041 caaggcaccg atgagcatct caagcttttt gtccacctct tcgcgagtat atgaagcatc 2101 cctctcgatg aagatcatgt tgttttcggt cttgtcgaga acttcagtct tcatcaaaag 2161 ctcctcatat agcttctcgc ccggtcgcag gccgatctct tcaatcttaa tatccttatc 2221 gggctcaaga ccggaaagct ttatcatatt gacggcaagg tcataaatct taaccggttt 2281 gcccatattc aaaacaaaca gctcgccttt ttttgccatt gcgcccgcca gaattacaag 2341 ctggcttgcc tcggtaatgg tcataaaata gcggatgatg cgcttgtcgg ttattgtgac 2401 aggaccgccc tcagcaatct ggcgcttaaa cagcggaatt accgagccgt tggagcccaa 2461 aacatttccg aaacggacag ccgcaaagct tgttttgctg tcagctcggc actgaacgat 2521 catttcgcag atacgcttgg tagcacccat aatgttggtt gggttgaccg ccttgtcggt 2581 ggagatcaaa atgaacttct ccgcgccgta tttctcggca gcgttggcgg tgttgtatgt 2641 tccgatgcag ttgtttttaa ttgcctctgc gccgcaactt tccatcaagg gaacgtgctt 2701 gtgtgcagca gcgtggaata ctacgtcggg acggtaggta ttaaatattt catcaagcct 2761 gtcataatcc ctcacagagc cgatctctac ggcgaagtcg agcctgtcgc catattttct 2821 tataagctcc tgctggatgt cataggcatt attttcataa atatcgagaa caacgagctt 2881 tttcggatgg cattttgcaa tttgtcggca aatttccgag ccgatcgaac cgcctccgcc 2941 tgttacaaga acagtcttgc ccgaataaaa ctcaagctcg cgctcatcgc tgacgtcaac 3001 ggtgtttcgg aaaagcaaat cctcaattga aaattcacgc aatacacctt ttttaacctc 3061 atttccgctg acgagcgaat catatacacg gacattgcaa cccaggttgt gatattcgta 3121 atatagcttt gaaaggtcct cgccgtcgcg gttgacaatt gcgattatga cctcgcggat 3181 gcccagcttt tcgataagct ccacgccgtc ctcagggcta tataccttta aggcggaaac 3241 gcggttgccg accttagttg ggtttttatc aatgaaaaac tgtggctcaa actgggattt 3301 cggattgtta cgcagatccc ccgccaaata tgagccaagt ctgcccgcac cgacaattac 3361 aacgggtatc ttcgatttta cgaccttcga cttcgacctc gccttatatg ccaagctgta 3421 tgtaaaacgg gacataaggg tgatgagcgc agtcagcgca ccgacggttg aagcgtgcca 3481 tacaccgtag tatacgccgt caaagaacag gtctgcaaaa cgtatgatta taagtcccgc 3541 catactgccc aaggcatctg ccacaacaag gctgaaatat gcacggttgt ttgaatatct 3601 ccagacggtg ttataaatgc ccaaagcgaa tcggaaagca aacacaaaca cgacctgtgc 3661 caaagagtta atgaggaata cttccttttc ttcaacaggc atactgtttg caacatttgc 3721 cgcaacaaag taatagaata tatcgacagc gataaaacat atcaggtcaa acagcaccag 3781 aacaagtcgg tgccgatagt taccgtcgag tattttatcc attatatcaa tgaatttcat 3841 taaatagcca acttcctaaa aagtatatgt ccctgagggt ttagaattta cgccaaacgt 3901 ttttgttcac cacgtttgta tacgactgaa taagcttgac gaccttggtt gaaacgttag 3961 tgtccacata atcgggcacg ggaatgccta tgtcggcgtt tttgttcatt aaaacagcgg 4021 tgtcaacagc ctgcaaaagt gaaactgtgt cgatacctgc aagaacgaag caggctttat 4081 ccaacgcttc ggggcgctcg gtcgaggtgc ggatgc // LOCUS sequence070 4060 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence070 VERSION sequence070 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4060 /mol_type="genomic DNA" /organism="" /note="sequence070" misc_feature <1..542 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000453154.1:deoxyribose-phosphate aldolase" /note="WP_000453154.1 deoxyribose-phosphate aldolase (Streptococcus) [pid:68.0%, q_cov:96.1%, s_cov:77.1%, Eval:1.5e-61]" /note="MGA_437" /locus_tag="LOCUS_3540" CDS 532..1254 /product="purine-nucleoside phosphorylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000160304.1" /transl_table=11 /codon_start=1 /translation="MATNYPTPHINATPEDFAKVVLMPGDPLRAKFIAENFLENARLVN NVRGIHGYTGTYKGVPVSVMASGMGMPSIGIYSYELFNFFGVETIMRIGSAGSMQKDIH IRDIVFGQAACTDSNYVNQFCLAGHYAPICSYDVLKIAIEEAEKVGARYHVGNLLSSDC FYGDNPNASPAWQKMGVMAVEMEAAALYMNAARAGKKALALCTISDSLVSGEATSAEER QNSFTQMMEIALNTAIRL" /locus_tag="LOCUS_3550" /gene="deoD" /EC_number="2.4.2.1" /note="WP_000160304.1 purine-nucleoside phosphorylase (Staphylococcus) [pid:58.0%, q_cov:96.2%, s_cov:97.9%, Eval:9.2e-75]" /note="MGA_438" CDS 1251..2831 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIIMDKRVFLIVLDSVGAGALPDAELFGDAGTNTLRSCYNTGKLN ILNMLKMGLGNIDGLEFLGICENPCASYGRLRERSMGKDTTIGHWEISGIVSEKPLPTY PDGFPQEILDEFSRQTGRGVLCNQPYSGTDVIRDYGDEHVKSGDLIVYTSADSVFQIAA HEEIVPVETLYEYCRIARKILAGEHAVGRVIARPFIGESGNYTRTSNRHDFSLEPYGET MLDAIKTGGKDVIAVGKITDIFAGRGVTETIFTHGNTEGMKITSDVANRDFNGLCFTNL VDFDMLYGHRNDAVSYAEALNEFDAWLGEFVKTLRDDDVLIITADHGCDPGDISTDHTR EYTPILVYGKGINPVKLNTLTTFSDIAATVCDYLDVDFDCPGTSFLENMTYEPEKLATF AKEAMMKAYAPYSGYKVGAALLCADGSVYTGCNIENAGYSATNCAERTAIFKAVSEGKR NFVAIAVCGGKDGVLADEPFPPCGICRQVMREFCRDDFRIHMVTADKLKDFTLSEILPM SFGPDHIDK" /locus_tag="LOCUS_3560" /note="WP_011393009.1 phosphopentomutase (Moorella thermoacetica) [pid:55.1%, q_cov:72.1%, s_cov:97.4%, Eval:2.6e-120, partial hit]" /note="MGA_439" ORIGIN 1 catattacgt taaacaggca aaggaatacg tcggcgataa gcttgcaatc tgcaccgtca 61 ttggttttcc taacggatat tcaacaaccg aaacgaaggt atatgaaaca gcagatgctg 121 ttaaaaacgg tgccgatgaa attgatatgg tcatcaatat cggtatgctc aaggacaaaa 181 agtatgacga attgctcgac gagatcaagc gtattaaagc ggcttgtgat gacagaattt 241 tgaaggtcat aattgaaacc tgcctgttaa cagatgatga gaagatcaaa atgtgcgaaa 301 tcgtttccgc ctcgggcgct gattatatca agacatcaac cggcttctca actgcgggag 361 ccacaaagga agatgttaaa ctctttgctg aacacgttgc accacactta aagatcaaag 421 ctgcgggcgg aatatcatcc attcaggatg ctgaggactt cataaatctc ggagcatccc 481 gacttggaac tagcagaatc gttaaaattg taaaacagga ggacaaagga tatggctact 541 aattatccaa ccccgcatat taacgcaaca cccgaggatt tcgcaaaagt tgttttaatg 601 cccggagatc ccttgagagc aaaattcatt gctgaaaatt tccttgaaaa cgcgcgcctt 661 gttaacaacg tccgcggaat tcacggatac acaggaacat ataaaggcgt tcctgtttcg 721 gttatggcca gcggtatggg tatgccttca attggtattt attcttatga gcttttcaat 781 ttctttggag ttgaaacaat tatgcgaata ggctctgcag gctcgatgca gaaggatatt 841 cacattcgcg acatcgtttt cggacaggca gcttgtaccg attctaacta tgtaaatcag 901 ttctgtttgg cgggtcatta cgcacctatt tgctcatatg acgttttgaa aatagcaatt 961 gaagaagctg aaaaggtcgg cgcacgttat catgtcggca accttctttc gtccgattgc 1021 ttctatggcg ataatcccaa cgcttctcct gcatggcaga agatgggcgt aatggctgtt 1081 gaaatggaag ccgcggcact ttatatgaac gccgcacgcg caggcaaaaa ggcacttgca 1141 ctttgcacta tctccgattc gcttgtatcg ggcgaggcaa caagcgccga ggaacgccag 1201 aattcattca ctcagatgat ggaaattgcg cttaacaccg caataagatt gtgataatta 1261 tggataaaag agtattttta atcgttttgg acagtgtcgg cgcaggggct ttaccagatg 1321 ctgagctgtt cggtgacgca ggcacaaata ccctgcgaag ctgttataat acaggcaagc 1381 tcaatattct caatatgctc aaaatgggac ttggaaatat tgatgggctg gagtttttgg 1441 gcatttgtga gaatccctgc gcttcatatg gtcgacttcg cgagagaagt atgggcaaag 1501 acacaacaat tggtcattgg gaaatttcgg gaatcgtttc cgaaaaacct ttgcccacat 1561 atcctgatgg cttcccgcag gagattttag atgagttttc ccgtcaaaca ggccggggag 1621 ttctttgcaa tcaaccttat tcgggtaccg atgtcattcg tgactatggc gatgagcacg 1681 ttaaatcggg cgatttaatt gtttacacct ccgcggacag cgtatttcaa attgcggcgc 1741 atgaggaaat cgtgcccgtt gaaacgcttt atgaatattg cagaattgca agaaagattc 1801 ttgcgggtga gcatgctgtc ggaagagtga ttgcaagacc gtttatcggt gaaagcggaa 1861 attatacaag aacctcaaat cgccacgact tctcgctgga gccttacggc gaaacaatgc 1921 tcgacgcgat taaaactggc ggcaaggatg tcatcgctgt tggaaagatt actgatatat 1981 tcgcaggcag aggagttacc gaaacgatct tcacacacgg caacaccgag ggaatgaaga 2041 ttacaagtga tgtcgcaaat cgcgatttca acggtctttg ctttaccaat cttgtcgact 2101 ttgatatgct ctatggccac cgcaacgatg ctgtttccta tgcagaggca ttgaatgaat 2161 ttgatgcttg gctgggcgag tttgtcaaaa cattgcgtga tgacgatgtt ttgataatta 2221 ccgctgacca cggctgtgat cccggagata taagcaccga tcacacacgt gaatatacac 2281 ctattcttgt ttacggaaag ggaataaatc ccgtaaagct taacaccttg acaacatttt 2341 cggatatcgc tgcaactgtt tgcgactatt tggacgtcga ttttgactgt cctggtacaa 2401 gctttcttga aaatatgaca tatgaacccg aaaaacttgc aacttttgca aaagaggcga 2461 tgatgaaagc atatgcacca tattctggat ataaggtggg tgctgcgctg ttatgcgccg 2521 acggttcggt atatacaggc tgcaatatcg aaaatgcagg ttattctgca acaaactgcg 2581 ctgagcgtac agcgattttt aaggctgtca gcgaaggcaa gcgcaatttc gttgcaattg 2641 ctgtatgtgg cggcaaggac ggcgttttag ctgatgagcc cttcccgccc tgcggaattt 2701 gcagacaggt aatgcgtgaa ttctgtcgtg atgactttag aatccatatg gtgacagctg 2761 acaagcttaa agactttaca ctttccgaga ttcttccgat gagctttgga cccgaccata 2821 tagacaaata acgaatacag gtgatcaata tatgagaatg tacgatatca tctataaaaa 2881 acgcgcaggt ggagagctta gcgatgctga aattcgcttt gcgattaaag gtttcaccga 2941 tggctcaatt cctgactatc aaatgtcagc acttgcaatg gccattctgt ttgtcggtat 3001 gaccgacaga gaaactgcaa ccctcacaga tgccatggca atatcgggtg atacggttga 3061 tttgagcgaa ttcggaaacc tatctgttga taagcattca acaggcggcg taggagataa 3121 aacttcgctg atcgtcgcgc cgatcgttgc atcctgtggt gcgaagattg caaaaatgtc 3181 cggtagaggc ttgggacata caggcggaac cgttgataag ctcgagtcaa ttaagggata 3241 taaaactgag cttccgataa gcgatttctt tgaacaggtg cggaatatcg gtatttctgt 3301 catttgtcat agcggaaata tgaccccggc ggacaaaaag ctttacgctt tgcgcgatgt 3361 caccgcaact gtcgattcga ttccgctgat cgtttcaagc attatgagca agaaacttgc 3421 ggcgggtgct cgttcaattg ttttggatgt caaggttgga agcggcgcgt ttatgcccga 3481 tcttgaatct gcgacaactt tagcggaaaa tatggtcagc attggcaagg cttgcgaaag 3541 gaacatatct gcactgataa ccaatatgga cttgccattg ggcaatgccg tcggaaactc 3601 ccttgaggtt attgaagcaa tcaatgtgct taaaggcgtg gatgtcggtg accttaaaga 3661 gatatgtctt gcgctttcat cgtcaatttt ggagctttgc tttggcttgt ccgacaaaga 3721 agcacacgat atggcatatg atgctctgca aagtggaaag gcgtatgaaa aattcaagga 3781 atggatctca tatcaaggcg gcgacatttc ttgggtcgag gaaacttcaa aatttcctaa 3841 ggctaaatat tgcttagatg ttttagctga agctgacggt tggatttccc atatgaacac 3901 cgctaaaatc ggtaatgttt catctcattt gggagccgga cgaatcaaaa aggatgatgt 3961 tatcgacttt gatgcgggaa taataatctc aaagaaaaca ggggactacg tcaaatcggg 4021 cgaagccctt gcaacgcttt attcaaacaa tgaatctgtc // LOCUS sequence071 4057 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence071 VERSION sequence071 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4057 /mol_type="genomic DNA" /organism="" /note="sequence071" CDS complement(34..1488) /product="glycerol kinase GlpK" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011015864.1" /transl_table=11 /codon_start=1 /translation="MKCVIGIDQSTQGTKALLIDENARIIAKAYMAHRQIITPEGYICH DPEEIYENVKSVVKDVIRQVTDAEVTAIGISNQRETTVAWDAFSKKPIMDAVVWQCTRA KDVCKQISDSNGEYIRRVTGIPLSPYFPAAKMKWILENSSQTSDLSKDGRLKFGTVDSW LIYKMTGEHLTDTSNASRTQLMNLETLDWDEKALEIFGVERASLAKICPSDGDFGETDL GGIFEHKVPIYAVMGDSHAALFAQRCHSAGELKVTYGTGSSVMMNTGDDIISSNHGLAS SVAFSFMGKTSYALEGNVNYSGAVISWLKSDLELIKSADETEALALMANKQDKTYLVPA FSGLGAPYWKNDVRAVIVGMTRLTGKAELVRAALDSIALQINDVLVAMSEDSGTKIMTI ATDGGPTKNKYLMQFQSDIAMAEIRVSKTEELSGMGAGLMAGIKSGVFDAKIAFKGIEY SRYAPKMSATRRNEIIAGWKEAVEKV" /locus_tag="LOCUS_3570" /gene="glpK" /EC_number="2.7.1.30" /note="WP_011015864.1 glycerol kinase GlpK (Fusobacterium nucleatum) [pid:41.1%, q_cov:99.8%, s_cov:98.8%, Eval:3.7e-110]" /note="MGA_441" CDS complement(1485..2423) /product="transketolase C-terminal domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003732677.1" /transl_table=11 /codon_start=1 /translation="MNRIANRAVICEVLMKHAKSDQDIVVLCSDSRGSASMTPFANAYP QQFVETGIAEQNLVGIAAGLAKCGKKAFACSPACFLSTRSYEQIKIDCAYSRTGVKLIG ISGGISYGALGMSHHSLQDIAAISAIPNIKIYLPSDRHQTKFLTEKLLDEPISAYIRVG RNPVEDVYNETQKFEYDKAVWIKQGEDVAIIACGEMVKPAVEAAEILEIEGISVSVIDM YCLKPLDEEAIIRAAKDAKVVITVEEHSPFGGLGSMVSSVVSRHCPKRVMSLSLPDAPV VTGASKEVFRHYGLDGEGIAKSAKMLLEEVL" /locus_tag="LOCUS_3580" /note="WP_003732677.1 transketolase C-terminal domain-containing protein (Listeria monocytogenes) [pid:54.6%, q_cov:96.2%, s_cov:95.0%, Eval:6.5e-88]" /note="MGA_442" CDS complement(2416..3246) /product="transketolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010989643.1" /transl_table=11 /codon_start=1 /translation="MNYNAFSFDLRRDIVDIIMAGNGGHIGGDMSVIDTLMTLYFRVMN ISPENDDSPDRDLFVLSKGHCVEALYAVLAAKGFFSLDEVKANFSRFGSQFIGHPNNKL KGIEMNSGSLGHGLSVCVGIALASKMNKTNNRIYTVMGDGELAEGSVWEAAMAASHYGL DNLCAVVDRNRLQISGNTEDVMHHDDLGARFESFGWNVIDVKNGNDSNCLFEAFMIAKE GKGKPTVIIANTVKGFGSAVMENKDEWHHHVPSDEEYERIIKDFAKRKEALLSE" /locus_tag="LOCUS_3590" /note="WP_010989643.1 transketolase (Listeria monocytogenes) [pid:55.2%, q_cov:97.8%, s_cov:97.4%, Eval:2.7e-79]" /note="MGA_443" misc_feature complement(3248..>4057) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010989642.1:L-fucose/L-arabinose isomerase family protein" /note="WP_010989642.1 L-fucose/L-arabinose isomerase family protein (Listeria monocytogenes) [pid:64.8%, q_cov:100.0%, s_cov:57.8%, Eval:1.1e-101, partial hit]" /note="MGA_444" /locus_tag="LOCUS_3600" ORIGIN 1 gatacccaag ccgaacgggt atctgctttt ttgttatact ttctcaaccg cttccttcca 61 gcctgcgatt atttcatttc gccttgtggc actcatcttc ggcgcatatc gggagtattc 121 aatcccctta aatgcaattt ttgcatcgaa aacgcctgac ttgattcccg ccatcagccc 181 agcacccatt cccgaaagct cctctgtttt ggaaaccctt atttccgcca tcgcaatatc 241 gctctggaac tgcataagat acttgttttt ggtagggcca ccgtctgtgg caatggtcat 301 aatcttagtg cccgaatcct cactcatcgc cactaaaaca tcgtttatct gtaacgcaat 361 cgaatcaagt gccgcgcgaa caagctccgc tttgcccgtc agccttgtca ttccgacgat 421 aactgctctc acatcgtttt tccaatatgg tgcacccaga ccgctgaacg caggcaccaa 481 ataggtttta tcctgcttat tcgccataag cgctaacgct tcggtttcat ctgccgattt 541 aataagttca aggtcgcttt ttagccacga gatcacagcg cccgaatagt tgacattgcc 601 ctccaaggca tatgatgtct tacccataaa gctgaatgcc accgagcttg ccagcccgtg 661 attggaactg atgatatcat cacctgtatt catcatgacc gatgagcctg tgccgtaggt 721 caccttcagt tcgcccgccg agtggcatct ttgcgcaaac agcgccgcgt gggagtcgcc 781 cataaccgca tatatgggca ccttatgttc aaaaattccg ccgaggtctg tttcgccgaa 841 atcgccgtca gaggggcata tcttcgcgag cgatgccctc tcaacgccga atatttcaag 901 cgctttttca tcccaatcaa gcgtttcaag attcataagc tgtgtgcgcg aggcgtttga 961 ggtgtcggtc agatgctcgc ctgtcatctt gtagatcaac caggagtcaa ctgtgccgaa 1021 tttaagcctg ccatcctttg ataaatcact tgtctgcgat gaattctcca agatccactt 1081 cattttcgcg gcgggaaaat acggcgacag gggaataccc gtgacacgcc taatgtattc 1141 gccgttgcta tcgctgattt gcttgcaaac atccttcgct cttgtgcatt gccacacaac 1201 ggcatccata atcggttttt tgctgaatgc atcccaggca acggtggttt cacgctgatt 1261 tgatataccg attgccgtaa cttcggcatc cgtcacctgc ctgatgacat ctttaacaac 1321 cgattttacg ttttcatata tctcctcggg gtcatggcag atatacccct cgggggtaat 1381 tatctggcgg tgagccatat atgccttggc gatgatcctt gcgttttcgt cgatcagcag 1441 agcttttgtt ccttgggtcg attggtcaat tcctatcacg catttcatag aacttcctcc 1501 aaaagcattt ttgcgctttt tgcaatgcct tcgccgtcaa gaccgtagtg ccggaaaact 1561 tcctttgatg cgcctgtgac tacaggcgca tcgggcagcg acaggctcat aaccctcttg 1621 gggcaatgcc ttgaaacgac cgatgatacc atcgagccga gcccgccaaa gggcgaatgc 1681 tcctcgacgg tgatgacaac ttttgcgtcc ttcgccgccc tgatgattgc ctcctcgtcg 1741 agaggcttta agcaatacat atcaataacg ctcacgctga tgccctctat ttcgaggatt 1801 tcagccgcct caaccgcagg cttgaccatc tctccgcagg cgatgattgc aacgtcctcg 1861 ccttgcttta tccatacagc cttgtcatat tcaaacttct gcgtttcatt gtaaacatct 1921 tcaacgggat ttcgtcccac gcggatatat gcagatatcg gctcatctaa cagcttttca 1981 gttaagaatt tcgtctgatg cctatcgctg ggcaggtata ttttgatgtt cggaatcgcc 2041 gaaatcgcgg cgatgtcctg caaagaatgg tgactcattc cgagcgcgcc gtagctgatc 2101 cctccgctga ttccaatcag cttgacgcct gtgcgcgaat atgcgcagtc gatcttaatc 2161 tgctcatagc ttcttgtcga gaggaagcag gcaggcgagc aggcgaacgc cttctttccg 2221 catttcgcaa gccctgccgc aataccaaca aggttttgct cggcaattcc cgtttctaca 2281 aactgctggg gatatgcgtt cgcaaaaggt gtcatcgaag cgcttcctct tgaatcggag 2341 caaagcacga caatgtcctg atcactcttc gcgtgcttca tcagcacttc gcagatgacc 2401 gctcggttag caattctatt cactcaaaag cgcctccttc cttttcgcaa aatctttgat 2461 tatccgttca tattcctcat cgctcggtac gtggtgatgc cactcgtcct tgttctccat 2521 aaccgctgag ccaaagccct taacggtgtt tgcgatgata actgtcggct tgcccttgcc 2581 ctctttagca atcataaatg cttcgaaaag gcagttggaa tcattgccgt ttttaacatc 2641 tatcacgttc cagccgaagc tctcaaatct cgctccaagg tcatcgtgat gcataacgtc 2701 ctcggtattg cccgaaatct gcagacggtt gcggtcaaca acagcgcaaa ggttgtcaag 2761 cccatagtgg cttgccgcca tcgccgcctc ccaaacggag ccttccgcca gctcgccgtc 2821 acccataacg gtgtaaatgc ggttgtttgt cttgttcatc ttggatgcca gcgctatacc 2881 cacacagacc gagagcccat gaccgagcga gcccgagttc atttcaattc ctttaagctt 2941 gttgtttggg tgaccgataa actgcgaacc gaagcgggaa aaattcgcct tgacttcatc 3001 aagcgagaag aacccctttg ccgccaaaac tgcataaagt gcctcgacac agtggccctt 3061 gcttaaaaca aacaaatctc tatcgggaga atcgtcgttt tcggggctta tgttcatcac 3121 acggaaatat agcgtcataa gcgtatcaat aacgctcata tccccgccga tatgtccgcc 3181 attgccggcc ataattatgt cgacaatgtc ccttcttaaa tcaaacgaaa acgcgttata 3241 gttcatatca ctcactccaa agccttgctt taacgcttgc ttcatctgca tcaaacaaat 3301 ctgcctgtat gcctatatat ttgcaggctt cgtaaagcac ggggacaaca tccgcatgga 3361 tgcccacgca atggtggata tacggcccct caacgatctt tgcttcaagg ctcggccaat 3421 ccttgacctc gatccacata tatgtgccct tggtataagg cccgtcgatg gtcttggcat 3481 tgcccaaaag caaggaatat tcgcctttgt cgccgtcaaa gcgcgcaatt gtcagctcgc 3541 ccgattttgc caacgcttca actgcacccg ggtggtcaaa tgccaacgga tagccgatag 3601 tcggtttctc ggatgccaca gaaatcggcc aaggtccgca atgctgcaaa agctcgccgt 3661 tgtcattaaa cggatgacgc accgtccaat cggcaaagaa actgcggtac tcgcccaaat 3721 ctgctgcctc gaccattagc gaagttatcg ctccgtgaat gtctgtctcg cagacaacgg 3781 gcagaccttc ctcgttcaaa agcgaatttg ccgcacaagg cataattccc aattcattct 3841 gcagggcgtt ccagcactga attgccacag cattgcaacc gtatttatcc gcaagcgttc 3901 tcatcgcgac tttgagcgca caaatacttt caagttcgct gtccttaacg gcaatattaa 3961 agttttccct gcaatatttc atgacttcag cagctcttat gccttcggcc tttgcaaatt 4021 tcacctcact gcaaagctct gataggggaa tgggcgc // LOCUS sequence072 4057 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence072 VERSION sequence072 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4057 /mol_type="genomic DNA" /organism="" /note="sequence072" CDS 52..966 /product="glycosyltransferase family 2 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005816612.1" /transl_table=11 /codon_start=1 /translation="MLSIILPSFNEEDNILNTASVLEELLCGQNIAYELLFVDDGSRDA TWQRICEASEKDKNVRGLRFSRNFGKESAIFAGLEASKGDACLVMDCDLQHPPKTIIEM YKLWQDGAQVIEGKKSSRGKENALYGGFSKLFYKLIKKASGIDMLDASDFKLLDRKAVD ALLSMPERVTFFRAMSAWVGFESKNVYFDVDERAYGTRKWSTRGLIKYAINNLSSYTNL ALLLPVFLGGFVSLCALILIILNIIGLPLGSLTLGINLLMLIGGMILVSVGVVGYYLWR VFDETRNRPRYIIAKTVGGKNDR" /locus_tag="LOCUS_3610" /note="WP_005816612.1 glycosyltransferase family 2 protein (Desulfitobacterium hafniense) [pid:40.4%, q_cov:97.4%, s_cov:95.6%, Eval:1.2e-62]" /note="MGA_445" CDS 956..3784 /product="YfhO family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011674564.1" /transl_table=11 /codon_start=1 /translation="MTDNIDGINENINTPEQASDPAPESVKKENRFTAFCEKLGNTRFG KWCYKNRLYLGAFFLPVFIMYVVYSVFGVHPYGDLSVLVLDLNGQYVSYYEMLRDAIWG DGSLIYNWSRNLSGETMGMFGYYLASPFMWIIVLLPRTMMCGSIEIMELAKVGCCGLAM AYYLTDRKNAKKLSALLFSVCYALMTYIVVELMNPMWIDGMIWLPMILLGIERLVDEGK MLPVILPMTIMFISHFYIGYMTAFFSIIYFIYYVFSRPNHIIAPHWFKGGLKFAISGIV SALSSCIVIIPVYCSLRLGKLSFSEPDFSPETQFNIFEFLSKLFQNSYDTVRPEGLPMI ACGTVVMLLVPLFFLNNKISPKEKISLGLLMLAVFGSMYVSTVDIAWHGFQVPNWLPYR YSYTFSFIMIVMAFRAFENLEGVSFKELCLTAFAWVCVLALVSREEYEHMYTFETVWYN ILAIAVIAAVLYLYKKTPDKVMSIILVGLVSVDIFVNAIYTIYAIDYDVVYSKYSSYQD YFIDGREVVSQVEELDEGKFRMEKTFHRTVNDPIGMGFAGISHSSSTMNTPVLKMLKTL GYGMQGHYTKYTGQTLVTDALFGIKYLMYKPDKITPSVDPRELTRQEIQNEIKKPYKAY TEFLTPEDTGVADITVYQNPYALSIGYMADYDILECELDSNDPIKNQQQLLKSLTGEGA VRVFKRIYQSATHTANCTTSTTGDHIMYTTTVDGKDSYVEFTIDIDNDNPVYAFFPTIY QRKCNIWAKSSEWDIVNYAFVDYFFTGEHYSVLNLGSFHEGETVKVRMTLANGEAIFSD VLFYYLDMEEFEEIHAQISDEQWNITEHTDTYLYGTVDAKQDGILFTTIPYEPGWTVKV DGNEVETLTCLDSLIGIELSAGEHTVEMSFWPTYLTLAIIVELIGLSFIAIIAIIEVKD GAILKKIIAKTK" /locus_tag="LOCUS_3620" /note="WP_011674564.1 YfhO family protein (Lacticaseibacillus paracasei) [pid:25.0%, q_cov:91.6%, s_cov:96.2%, Eval:3.1e-77]" /note="MGA_446" ORIGIN 1 agaataaggg cagagcagtg gtataaagaa aacgaataac ggagaaaatc tatgctttca 61 ataattcttc cctcattcaa tgaggaggac aacattttaa acaccgcctc ggtgctcgag 121 gaacttttgt gcggtcaaaa catagcttat gagcttttgt tcgttgatga cggctcacgc 181 gatgcaactt ggcaaagaat ttgcgaggca agcgagaagg ataaaaacgt ccgtggactt 241 cgcttttccc gcaatttcgg caaggagagc gcaattttcg cagggcttga agcatcaaaa 301 ggcgatgcct gccttgtgat ggactgtgat cttcagcatc cgcccaagac gataatcgag 361 atgtataagc tctggcagga cggtgcccag gtcatcgagg gcaaaaaatc ctcccgcggg 421 aaggaaaatg ccctatatgg cggattttcc aagctgtttt ataagctgat caaaaaggct 481 tcgggaattg atatgcttga tgcttccgac ttcaagcttt tggatcgcaa ggcagttgat 541 gcgcttttgt cgatgcctga gcgtgtcaca tttttccgcg caatgtccgc ttgggtgggc 601 tttgagtcta aaaatgtata tttcgatgtg gacgagcgtg catacggcac ccgcaagtgg 661 tcgacccgtg ggctgattaa atatgcaatc aacaatcttt catcatatac aaacttggcg 721 ctcctgctcc ccgttttcct cggaggcttt gtttcgcttt gtgcgctgat tttaataatt 781 cttaacatta tcggcctgcc tctcggctcg ctgaccttgg gaattaatct tttaatgctc 841 atcggcggaa tgattcttgt ttccgtcggc gtggtgggat attatctttg gcgtgtgttt 901 gacgaaacaa gaaaccgccc gcgctatata atcgcaaaaa ccgttggagg aaaaaatgac 961 agataacatt gatggtatca acgaaaatat caacactccc gagcaggcga gcgatcctgc 1021 gcccgagagt gttaaaaaag agaaccgatt tacggctttc tgtgaaaagc tgggcaacac 1081 ccgcttcggc aagtggtgct ataaaaaccg cctatacctg ggcgcgtttt tcctgcccgt 1141 attcataatg tatgtggtat attccgtttt cggcgttcac ccatacggcg acctgtccgt 1201 tttggtcttg gacctcaacg gccagtatgt atcatattat gaaatgctcc gcgatgcaat 1261 ttggggcgac ggaagcctga tttacaactg gtcacgtaac ctcagcggcg aaacaatggg 1321 tatgttcgga tattatcttg ccagcccctt tatgtggata atcgtcctgc ttcccagaac 1381 aatgatgtgc ggctcaattg aaataatgga gcttgcaaag gtcggctgct gtggccttgc 1441 aatggcatat tatttgactg accgcaagaa tgcaaaaaag ctttcggcac ttttgttctc 1501 ggtctgctat gcgctgatga catatatcgt tgtcgagctg atgaacccaa tgtggatcga 1561 cggtatgata tggctgccga tgattctttt gggtatcgag cgacttgtgg atgagggcaa 1621 aatgctccct gtcatacttc cgatgacgat aatgttcatt tctcatttct atatcggata 1681 tatgaccgca ttcttcagca tcatatattt catctattac gtattctccc gacccaatca 1741 catcatcgcg cctcattggt ttaaaggcgg gctgaagttt gcaatttccg gaatcgtttc 1801 ggcgctttca agctgtatcg tgataatccc cgtatattgc tcccttcgtt tgggcaagct 1861 cagcttctcc gagcccgatt tctcacccga aactcagttc aatatctttg aattcctctc 1921 aaagctcttc cagaacagct atgacaccgt ccgtcccgaa ggcttgccga tgattgcctg 1981 cggaaccgtt gttatgcttt tggtgccgct gttcttcctc aacaataaaa tatctcccaa 2041 ggagaaaata tctttgggac ttttaatgct ggctgttttc ggcagtatgt atgtttcaac 2101 tgtcgatata gcgtggcacg gcttccaggt tccaaactgg ctcccttacc gctattcata 2161 caccttctcc ttcataatga tagttatggc gttcagagcc tttgaaaacc ttgagggtgt 2221 atcgtttaaa gagctgtgct taacggcatt cgcttgggta tgcgttttgg cgctcgtttc 2281 aagagaagaa tatgagcata tgtatacctt tgaaacggta tggtataaca ttttggcgat 2341 cgctgtcatc gccgcggtgc tgtatctgta taaaaagacc cccgacaagg tgatgagcat 2401 aattttggtg ggacttgtca gtgtggacat ctttgtcaac gcgatttata ccatctatgc 2461 catcgactat gacgttgtat atagcaaata ttcctcatat caggattatt tcatcgacgg 2521 cagggaagtt gtgtctcagg ttgaagagct tgacgagggc aaattccgaa tggaaaagac 2581 cttccaccgc acagttaatg accccatcgg tatgggcttt gcgggaataa gccactcaag 2641 ctcaacaatg aacacccctg ttctcaagat gctcaaaacc cttggctacg gtatgcaggg 2701 acactatacc aaatataccg gtcagactct tgtcaccgat gcgctctttg gcatcaaata 2761 tctgatgtat aagccggaca agatcactcc ttctgttgac ccccgcgagc ttacaagaca 2821 ggagattcaa aacgagatca agaagccata taaggcatat accgaattct taacgcccga 2881 ggatacaggc gttgcggata tcaccgttta tcagaacccc tatgctttgt ccatcggata 2941 tatggctgat tacgacattt tggaatgtga gctcgactcc aacgacccca tcaagaatca 3001 gcagcagctt ttaaagtcgc tgacaggtga gggcgctgtc agagtgttca agcggatcta 3061 tcagtcggcc acccacaccg caaactgcac cacatcgaca accggcgacc acattatgta 3121 taccaccacc gttgacggca aggattctta tgttgaattc actatcgaca ttgacaacga 3181 caaccctgta tatgccttct tccccacgat ttatcagcgc aagtgcaaca tctgggcaaa 3241 gtcaagcgaa tgggatattg tcaactatgc ctttgttgac tatttcttca caggtgagca 3301 ttacagtgtt ctcaacctcg gttcattcca tgagggagag accgtcaagg tgagaatgac 3361 gcttgccaac ggcgaagcaa ttttcagcga cgttttgttc tattatctcg atatggaaga 3421 gtttgaagaa attcacgctc aaatctccga cgagcagtgg aatatcaccg agcacaccga 3481 cacctacctc tatggtacgg ttgatgccaa gcaggacgga attttgttca caaccattcc 3541 ttatgagccg ggctggactg taaaggtcga cggcaatgag gttgaaactc tcacttgcct 3601 cgattcactt atcggcattg agctttcagc gggcgagcac accgttgaaa tgagcttctg 3661 gcccacatat ctgacgcttg cgataatcgt tgagctgatt ggcttgtcct tcatcgcaat 3721 aattgcgata attgaggtta aggacggcgc aatcctcaaa aaaataatcg ccaagacaaa 3781 gtgaaatcat attgaccaat ggcaaaaatt gtagtaaact aatctgtgga ataaaaacat 3841 aaatattgga ggcatatttc cccctgtaat aattgttgtt atgtagttcg cagaaacaaa 3901 tgtcaatatt gaaaaaatag aagtgtgaaa tgatttttga ttaactgcaa ttccatcgat 3961 aatttgtctt ctctgttcca ataaaacatt gtattttttc tgttcaacat tcagtccttt 4021 agcataatat tgattattaa cctctacttt aggagat // LOCUS sequence073 4026 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence073 VERSION sequence073 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4026 /mol_type="genomic DNA" /organism="" /note="sequence073" CDS 764..2209 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKIIALAMVVLMIFALVGCGSNKRVIVEVTLSTEDSEAILAAAG ISLPDVAEVAAAGSTVQLFSWYDDFHNYSEDEIVNTGFFTFKEKYGCEVEWVETTWAKR FDDLANLILGGTPADFYTMETDIFPTYCIKGMFQPVNDYIDYDDPLWQGTKTVAENYFS LGDNTYIMAIDIGATQVVGYNRRVIDEWGFEDPAQLYYNDEWTWDVFYDMCLEFSDPDE DRFALDGWYYDTALMDSSGTTIVKYNTETGLFESNLDDPRLERSADLVYNLKKNECIFP VWNRGWQLRGGAEVQGTGIKDGLCLFFIVGTWGFTGTVEEISAVWGDVTEGEVMFCPLP RDAAGDGNYYCSVKPTGYCIISGASNPEGVALLAACERFKVLDPTVVSIDEKQLRETYL WTEEMLEMYDICHAAANSEYVSVEYNDGLGIKLADSAGECKRIGRKATAQTWAQLKEKY SEQVIYYIEELNMEIAEYVANLG" /locus_tag="LOCUS_3630" /note="MGA_448" CDS 2502..2807 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTKKILALGLVLLMIFALVGCGSNKRQIVEVTLSTEDAEAILAAA GITLPAAETVASAGSTIKWFAWYDSFHNYDEDEVVNTGYFTFKEKYGCDIEWVETT" /locus_tag="LOCUS_3640" /note="MGA_449" CDS 2841..3959 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGGTPPDFYPSSNETFPTYAIKGMFQPVDDYIDYNDPLWADMKDF VDKYFSLGGRRYIIATDNGFESVVPYNRRVIEEWGFDDPAELYYNDEWTWDVFYDMCLD FTDPDDDRYAIDGWAYSGAIMDSCGTQIVSLDLETNQYVSHIDDPRLERAAELLYNLSK NECIYPLWNNGWATRNGTDNEGSGVKEGLTLFYIRGTWAFTGTVEEISNNWGDVSQGEL MFVPMPRDPQGDGNYYIQANAAGYCIISGASNPEGVALFASCERFKVLDPTVVSIDRRQ LEEKYLWTQEMLEMYDECKALAQKGENTLVEYGEGLGNRLYSVSDGMKTIARTAAANAT TWAQSKESNGEKLQYYIDELNAQVAEYISTLG" /locus_tag="LOCUS_3650" /note="MGA_450" ORIGIN 1 cccagagatc ccaacggcga tggaacttac tatacagaat ccactcctac cggatactgc 61 ttggtttccg gcgcatctaa ccccgaaggc gttgcacttt tggctgcttg cgacagattc 121 aaggttttgg atcccaccgt tatctctatc gacagacgtc agcttgaaga aatctacctc 181 tggacagatg aaatgctcga aatgtatgac acctgtgttg atattgctaa ctcgggcagc 241 gtaatcgttg tttatgatgc aggttacggt tccaagcttg acaacgttgt taacacactt 301 gaaggcaacg gtgcaaatca ggaagcttcc acttgggcac agctcaagga gaaatatact 361 gaacagctcg tctactatgt agatgctctt aacgctgaca ttgacaagta tattaacggc 421 taagctacat aatttaaata ttcaatcagc cctttccttg cgagagggct gattttttgt 481 gcaagcgacc gcgtgggtat gcatcacagt agttattgaa cgagctcaaa aagcaaaaaa 541 agtcggttca ttttgtcata tccgaaaaat ttaatctata taagaaaatt agcttttttg 601 ccaaattcaa ggaatatttt tacaatttta acaaaaagcc atctgaactt gtgggtatat 661 tgccaaaaag gtgaagccaa ttttatggaa tttgagcatt gatttttact ttcaattatt 721 ctaaaattaa actataacat ttagttagag gtgacttatt attatgaaga aaattattgc 781 tttggcaatg gttgttttaa tgatatttgc tcttgtgggc tgtggctcaa acaagcgagt 841 tatcgttgaa gtaactcttt ccacagaaga ttcggaagcg atcctcgccg ctgcaggcat 901 cagcctgccc gacgttgccg aggttgcggc tgccggctcg accgttcagc tcttctcctg 961 gtatgatgac ttccacaact attccgagga tgagatcgtt aacaccggat tcttcacctt 1021 caaggaaaag tatggctgtg aggttgaatg ggttgaaacc acatgggcta agcgttttga 1081 cgacttggca aacctgatct tgggcggaac ccctgccgat ttctatacaa tggagaccga 1141 catcttcccc acatattgta tcaagggtat gttccagcct gtaaacgatt acatagacta 1201 tgacgatccc ctttggcagg gcacaaagac tgtagctgaa aactacttct ccttgggcga 1261 caacacctac attatggcga tcgacatcgg cgccacacag gtagttggat ataaccgcag 1321 agttattgac gaatggggct ttgaagatcc cgctcagctt tactataatg acgagtggac 1381 ttgggatgta ttctatgata tgtgtcttga attctccgac cccgatgagg acagatttgc 1441 ccttgacggc tggtattatg acaccgcttt gatggattcc tccggaacaa cgatcgtcaa 1501 gtataatacc gaaacgggat tgttcgagtc taatcttgat gaccccaggc ttgaaagatc 1561 agctgatctt gtttataacc tcaagaaaaa tgaatgtatc ttccctgttt ggaaccgcgg 1621 ctggcagctc agaggcggtg cagaagttca aggtacaggt attaaggacg gcttgtgctt 1681 gttcttcatc gtcggcacat ggggcttcac aggaacagtt gaagaaattt ccgctgtttg 1741 gggcgatgtc accgaaggtg aagtaatgtt ctgcccgttg cccagagacg ctgcaggcga 1801 cggcaactat tattgctccg ttaagcctac cggctactgc attatcagcg gtgcatcaaa 1861 ccccgaaggc gttgcgcttt tggcagcctg cgagagattc aaggttttgg accccacagt 1921 tgtatccatc gacgaaaagc agttgagaga aacctacctt tggaccgaag agatgctcga 1981 gatgtatgac atctgccacg ctgcagcaaa cagcgagtat gtttctgttg aatataacga 2041 cggtttgggc atcaagcttg ccgactccgc cggcgaatgc aagagaatcg gcagaaaggc 2101 aaccgctcag acatgggcac agcttaaaga aaaatattcc gagcaggtca tttattatat 2161 tgaagagctc aatatggaga ttgcagaata cgttgcaaac ttgggataat taaaaattaa 2221 cactgaaacg ggtgggcaaa aatgcctgcc cgtttttatg ctttcggtta atgcgacaat 2281 ttgaaacaaa ccattggggt ttttgctttg agaataaaac ttcatggtcg attttaacaa 2341 aaacagttgt taaatttaat acattacgcg aatttacggc agattataaa atgtgctaaa 2401 atatatacgt aaatgtgtac ggtttgcgga gccgaaaaaa gagggctccg cctttcgcat 2461 ttatgcatta tggtgaaaca tcatgaaagg aaatttgagc tatgacaaag aaaattctcg 2521 ctttgggtct tgttttgttg atgatctttg ccctcgtcgg ctgtggatca aacaagagac 2581 agatcgttga agtaaccctc tcgaccgagg acgctgaagc aattttggct gctgcaggta 2641 tcactctgcc cgccgctgaa actgttgcat ctgccggctc caccatcaag tggtttgctt 2701 ggtatgacag cttccacaac tatgatgagg acgaagttgt taacaccggt tacttcacct 2761 ttaaagaaaa gtacggctgt gatattgagt gggttgaaac tacctaggca gcaagatttg 2821 atgagcttgc aaacctgatt ttgggcggaa ctcctccgga tttctatcct tcatccaacg 2881 aaaccttccc cacatatgca attaagggaa tgttccagcc tgttgatgat tacatcgact 2941 ataacgatcc cctttgggca gatatgaagg actttgttga taagtacttc tctttgggcg 3001 gacgtcgcta cattattgca accgacaacg gctttgaaag cgttgttcct tataacagaa 3061 gagttattga ggaatggggc ttcgacgatc ccgctgagct ttattataac gacgaatgga 3121 cttgggacgt attctatgat atgtgcctcg acttcaccga tcccgatgat gacagatacg 3181 ctatcgacgg ctgggcatac tccggcgcta tcatggactc ctgcggtact cagatagtat 3241 ctttggacct tgagaccaac cagtatgtat cccacatcga cgaccccaga ctcgaaagag 3301 ctgctgagct tctttataac ctttccaaga acgagtgcat ctatccgctt tggaataacg 3361 gctgggcaac cagaaacggc accgacaacg aaggctccgg cgtcaaggaa ggcctcaccc 3421 tcttctatat cagaggtact tgggcattca ccggtacagt tgaagaaatc tccaacaact 3481 ggggcgacgt ttcccagggt gaattgatgt tcgttcctat gcccagagat cctcagggcg 3541 acggcaacta ttacattcag gctaacgctg caggttattg catcatctcc ggcgcttcta 3601 accccgaagg cgtagcgttg ttcgcatctt gtgaaagatt taaggtactc gaccccactg 3661 ttgtatccat cgacagacgt cagcttgaag aaaagtatct ctggactcag gaaatgcttg 3721 aaatgtatga cgaatgcaag gctttggctc agaagggcga aaacaccttg gttgaatatg 3781 gcgaaggctt gggcaacaga ctttactctg tttccgacgg tatgaagacc atcgctcgta 3841 cagctgctgc aaacgcaacc acttgggcac agtccaagga aagcaacggc gaaaagcttc 3901 agtattacat cgacgagctc aacgctcagg ttgctgaata tatttcaact ctcggataat 3961 attgtttaaa aaatcccgct ctcaaaacga gggcgggatt ttttggctat aaaatcaaat 4021 ttttcg // LOCUS sequence074 4025 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence074 VERSION sequence074 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4025 /mol_type="genomic DNA" /organism="" /note="sequence074" misc_feature <1..519 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003426355.1:phosphoribosylaminoimidazolesuccinocarboxami de synthase" /note="WP_003426355.1 phosphoribosylaminoimidazolesuccinocarboxamide synthase (Clostridioides difficile) [pid:62.2%, q_cov:100.0%, s_cov:75.7%, Eval:3.3e-55]" /note="MGA_451" /locus_tag="LOCUS_3660" CDS 766..1419 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKNLIANIITLIAIRFLVYVLGTVSIAPLSLFGVMVDISAVLGY LLGLLFNFALIHAMYKNKSLLSKPLFDENEKIFRRYYINKLLILEAFEFVYYFAVSLLM FLPFRYVTMAISDLLLYVLWYVIITKGSRNMIKQRKFFLPTIIISVAIVATNRFAEYVI YSTSYGVLDGSTNIFSYLQILSAGEFLSKLSVISSTAVWIVFLISHSLSVKTEE" /locus_tag="LOCUS_3670" /note="MGA_452" CDS 1520..2248 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFFEHYISSDAPYVEIFSLPHILYILFCGLTIFLLVKFRKPLTEK RDTVCKIVLWITIFQQVVLQYGWYIFATDIFWKDGLPLHLCRISSIFVMVFLITENPKA MDIVFCFGTFAIASFFYPKNCYHLLHINGFSYMINHLVTVAMPVFAALAYGWRPTWAGF RRSVKLFTLYFPVMLLANRLFDGNYLYMTDRPFAFLDAMPVWIYNPFIYLFSVGVFALI TVIVRTAIAKFSKKPKEVNV" /locus_tag="LOCUS_3680" /note="WP_012258597.1 TIGR02206 family membrane protein (Chloroflexus aurantiacus) [pid:24.9%, q_cov:71.5%, s_cov:72.0%, Eval:5.2e-09, partial hit]" /note="MGA_453" CDS complement(2383..2859) /product="flavin reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002681169.1" /transl_table=11 /codon_start=1 /translation="MRKNFGPKTLMYPEPVLIIGTYAADGTPNAMNAAWGGLSEENEIS ICISANHATTKNLLERKAFSVSFADAENVAAADYVGIVSGNNEPNKLEKCGWHTEKAEF VDAPIICELPVAIECKLKSYDENTCRLVGEIVNVCAEEHVLGEDGLIDLENSAL" /locus_tag="LOCUS_3690" /note="WP_002681169.1 flavin reductase (Treponema denticola) [pid:45.8%, q_cov:96.8%, s_cov:82.4%, Eval:6.3e-33]" /note="frameshifted, insertion/deletion at around 2397" /note="MGA_454" ORIGIN 1 acttctattt attactttga gcttcttaaa aaagaaggca tcaaaaacca ttatgtaagc 61 gctgatatcg aaatcgcaac tatggaggtt ctccccggca aggttttcgg ccacgggtta 121 gaggttattt gcagacttgt tgcaaccggt agcttcatcc gcagatacgg cgaatatatt 181 gcagacggca caccccttga aggcggctat gttgaatgta ccttcaagaa cgatgaaaag 241 ggcgacccgc tcgtaacagg cgaaggcttg gcagcgctcg gcgttatgag ccccgcaatg 301 tttgaaagca tgaaggagca gaccctcaag atcaccaaga tcgttgctga cgacctcaag 361 accatcggat tggacctttg ggatatcaag tttgagttcg gctataacaa cgacgaagtt 421 atcctcatcg acgagatcgc ttcgggcaat atgagagttt ataagggcga caagatcgtt 481 gaccccgttg aactcaccaa gcttattctt gacagataat ttttgtgaaa ataaagaaac 541 cgctgtccct gatggacggc ggttttgttt tgatgcctcc ctctgaggag ggagagattg 601 ctatttttct ctcccccagt caccttctgt gacagccccc tcgtcagagg ttttttactt 661 cacttatata ggtgcaaagc gttggaattg caaaataagc ggctttatct tgcaaaaacc 721 acgaatatgt ggtatactga agaaaatcat gacgggggcg ttaaaatgaa aaagaacctt 781 attgccaata tcatcacatt gattgcaatt agatttcttg tttatgttct cggcaccgta 841 agcattgctc cgctttctct atttggagtt atggtggaca tttccgcggt tttgggttat 901 ctgttgggtc tgctgtttaa ttttgcattg attcacgcaa tgtataaaaa caagagcttg 961 ctctcaaagc ccttgttcga cgagaatgag aagatattta gacgttatta cataaacaag 1021 ttgctgattc ttgaagcttt cgaattcgtg tattattttg cagtgtcctt acttatgttc 1081 ctcccgttcc gctatgttac gatggcgatt tctgatcttt tgttatatgt tttgtggtat 1141 gtaatcatca ccaagggaag ccgtaatatg attaaacagc gcaagttctt tttgccgaca 1201 attattatca gcgtagcgat cgtcgcgact aacagatttg ctgagtatgt gatttattcg 1261 acatcatatg gcgtgctgga tggctcgaca aatatattca gctatctcca aatattgagc 1321 gccggtgaat ttctgtcaaa attgagcgtg atttcctcga cagcagtttg gattgttttc 1381 cttatttccc atagcttaag cgttaaaact gaagaatagt tttttgcccc atcctgcaaa 1441 agggtggggc acttatattg catatttcga cagcctctgc tataattaaa taagctaatt 1501 aactgtttgg agggatagga tgttctttga acactacatt tcaagtgatg caccatatgt 1561 cgagatattc tcgttacccc atattcttta catactcttc tgcgggctga cgatcttcct 1621 gctcgtcaag ttcagaaaac cgctgaccga aaagcgcgac accgtctgca agatcgtgct 1681 gtggataaca attttccagc aagttgtttt gcaatacggc tggtatatct ttgcgaccga 1741 tatcttctgg aaggacggcc tgcccttgca cctttgccga atttcgagca tctttgtaat 1801 ggtctttctc ataaccgaaa acccgaaggc gatggatatt gttttctgct tcggcacctt 1861 tgcaatagca tccttcttct atccgaaaaa ctgctatcac ctgttacata taaacggatt 1921 ttcatatatg atcaaccacc tggtgacagt tgcaatgcct gtttttgccg cgcttgcata 1981 tggctggcga ccgacctggg cgggcttcag acgaagtgtc aagcttttca cgctatattt 2041 ccctgtgatg cttctggcaa atcgcctgtt cgatggcaat tatctttata tgaccgaccg 2101 cccctttgca tttttggatg ccatgcctgt gtggatatac aacccgttta tatatctgtt 2161 ctcggtcggc gttttcgcgc tgataacggt aattgtgcgc acagcaattg cgaagttttc 2221 aaagaaacca aaagaagtga atgtataaaa aaacaaaacc atcggttcga ccgatggttt 2281 tgtttatgtg tactcattat ttgcctatct tttttccctc gctgaatgct tttccgacaa 2341 tatcgccaag tctgcgatag tcatggtgca tcccgtcata gattataggg ctgaattttc 2401 caggtcaata aggccatcct cgcccaaaac atgctcctcg gcacagacat tgacgatttc 2461 gccaaccagt ctgcaggtgt tttcgtcata gcttttgagc ttacactcaa ttgcaacggg 2521 caattcacag attatcggag catcgacaaa ttccgccttt tcggtatgcc agccgcactt 2581 ttcaagcttg tttggctcat tatttcccga aacgattccc acatagtctg ccgcggcaac 2641 gttttcggca tccgcgaagc tgacagagaa agcttttctt tcaagcaggt ttttggtggt 2701 tgcgtggttt gcgctgatgc aaattgaaat ctcgttttcc tcgctcagtc ctccccatgc 2761 cgcattcatc gcgtttggtg tgccgtcggc ggcatatgtg ccgataataa gcaccggctc 2821 gggatacata agggtcttgg ggccgaaatt ctttctcata tttaattgcc tccttcaaaa 2881 gtgttcgggg tgatttatgg gtatagtata acacattcga gggaaaatgt taatagccaa 2941 ggatattatt attttaagca cattgcaaaa aataacttct atgggcgaaa tgtataaatt 3001 tgattgccaa atggctgaaa atccgtcata tttattgaca gcacccattg ttttgttata 3061 tattatttaa tggttattta taatctgtat tgtgggttaa agtgcccgaa agaggctttc 3121 cgcgatacgg cgtaaatatt aaaaaatgga aactaagaaa ggtagggtcc caatatggct 3181 ttttctctta acggcgtcaa ggtgcctcac aaaaagaaca ccgctgatat gcctgccgta 3241 aggatcaaca caccctcatc ggtcacaatt ccaatggtta tgcacatcgg taagcctgcg 3301 attcctgcag tcaaggtggg cgaccatgtg gatgtcggca cacttattgc aactcaggat 3361 ggccccatca gcgcgcccat tcattccagc atctcgggca ctgtcaagaa gatcgacgat 3421 atgttgctct cgagcggctc tcttgccaag gcaatcacaa ttgaatcgga cggcgagatg 3481 accgttgatg caaacatcgc tgtacctgta attaattcga aggacgactt gatcgaagct 3541 ctcaaggcaa gcggtattgt cggcttgggc ggtgcaggat tccccacaca tttcaagttt 3601 aatgtcgacc ccgaaagaat tgaagagctc ataatcaacg gcgcagaatg tgagccatat 3661 attaccagcg acaactgcac aatgatcgac cgtgccgacg atatggcata tgccctttgg 3721 ctcttgaaaa agcatctggg catcaagaag gtcatcatcg gcgttgaaaa gaacaagccc 3781 aacgctatcg catcaatgaa ggctttggcc gaaaaggttg agggcgtaag cgtcaaggag 3841 cttccttccg tatatcccca gggcggcgaa aaggttttgg tatatcacac aacaggcaag 3901 aagatagccg caggaaaact cccgattgat gtcggctgca ttgtatgcaa ctgtacaacc 3961 cttgccgaga tcggcagatt tgcccttaca ggtatgcctt tggttgaaaa gtgtgtgact 4021 gttga // LOCUS sequence075 3942 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence075 VERSION sequence075 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3942 /mol_type="genomic DNA" /organism="" /note="sequence075" CDS complement(1295..2131) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNIVEGPYVCEAPYFFEASEMNKIGDKYVYTFNGDWSAKEYPVEG YTKSPTCAMEYMVADDPMGPYTYVGWYLRNPGESNLLWGNNHTHLQEFKGNWYIISHSR LLEKHMGMDKSYRSVMIDKIDITIDEEGNVNIPHTYITATGVEQVEYLDPYVHNEAETI CNQSGIMTQMIGNVGDVIVTDIKDGDWIRVKGVDFGSKGAAQFVANVKGTGVIDIRLDD VNSETVGSVDFSVNEFTNIINNIDNITGVHDVYFVFGGKNWEFDAWQFVETAPSAE" /locus_tag="LOCUS_3700" /note="WP_010890799.1 glycoside hydrolase family 43 protein (Clostridium acetobutylicum) [pid:32.3%, q_cov:79.1%, s_cov:48.5%, Eval:1.5e-21, partial hit]" /note="MGA_457" CDS complement(2144..2893) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNLKKIICILLASLMLMTLLVSCSNQSTVDGGKNTNQTPVSEKED LNMNAIVSLSEKVRVEAEPGASIKPNDEMNPLVSTRFSADPTSVEYNGRVYVFSTNDDQ QYLATPYAVNGFGDIHSLNVFSSADLVNWTDHGYIDVKAASPRINTSWAPSIVKRVEDD GLTHFYLFYAENGWSTGVLTATDPLGPWTDPLGRPVIVPTMPEVNGILSNCFDPGALCD DDGTIYVACGAHKDSDVPGVSKGSGIF" /locus_tag="LOCUS_3710" /note="WP_003245027.1 alpha-L-arabinofuranosidase (Bacillus) [pid:40.8%, q_cov:76.3%, s_cov:37.8%, Eval:1.7e-34, partial hit]" /note="internal stop codon at [2144:2146](-)" /note="MGA_458" CDS 3104..3877 /product="DNA repair protein RadC" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_014328269.1" /transl_table=11 /codon_start=1 /translation="MSNNHAGHRGRLKKKFIDGGLENFYEHQILELILFYSIPQGDTNP TAHRLISRFGSLMGVLNADHEELMTVKGVGNATATWLKALQYITSTDLFDPCDVVCATS VGGMLEFFKYEFAECNEQTARLICADDCMNMVEVIEFVGYTLDRKLDRRILEEVLRANC SQVIMAIYRPTKPAFPTDEDKACGRALRDIFAAFNIDFSELAIIDREYVSYIFRQMRLP ILWHIKNGELLRDGIKRRKVSFDKPKSAAKKHNCT" /locus_tag="LOCUS_3720" /gene="radC" /note="WP_014328269.1 DNA repair protein RadC (Sinorhizobium fredii) [pid:26.2%, q_cov:80.5%, s_cov:79.8%, Eval:7.3e-12]" /note="MGA_459" ORIGIN 1 gtgggtatag aggagcggga acgccgtttc gataccgacg atgccgaagg cgcttttctc 61 aagcccccgt cccttctctt ctgcgctgtg gggggcgtgg tcggtggcga tcatatcgat 121 cgtgccgtcg cagatgccct caaccaaggc ttctttatca gccttcgagc gaaggggagg 181 gttcatttta aatctgccga gctccataag gtcgctgtcg tccagcacca agtagtgcgg 241 tcctgtttca caggtgatgt ccacgccgtc ccgtttggcc tgacgtatga gtgatacgct 301 ttcttttgtc gaaatgtggc agacgtggta acggcagccc gtttcctttg caagctcaat 361 atcacgctcg atctgcttcc attcgctttc cgagcagatg cctctgtgac cgtgagcggc 421 cgcatattca cccttgtgga tatatccgcc gaagagcagg tcgttaacct cgcaatgggc 481 aacgatcatc ttgttaagcg cttttgctct ttccatcgct tcgcgcatca ttcccccgtc 541 ctgaacgccc ttgccgtcgt ccgaaaatgc aatgcattta tccgcaagcg attcaagatc 601 aacaaggctt tcgccctttt gcccaacggt tatcgaagca tatggatata ccgcaatttt 661 agcgtcgcga tcgattatat cctgctgcag cttgatgctt gcaacgttgt cgggcacagg 721 gttaaggtta ggcattgtgc atactgcggt gtatccgccg cgggcggcgc tcatcgaacc 781 ggaaagaatg gtttctttat aagaaaaacc cggctcacga aaatgcacat gcacatcgca 841 aagaccggga aaaacagtat atctgtccaa atcaataccg ccaaaagcgt cagagaacaa 901 aaatgcctta acataggaag aaaagccgtg catatcatcg ggaacgatta ttttcgtgtt 961 attcaatcct gacatggtaa gctcctttca ttggttgaga ggcgggataa aaaaattagc 1021 cctgcatcat atcggcaagg cacacaaaaa ccgatgaagc cccgcttcac cgaaattcca 1081 tataaaacaa tctgccgatc tctctgtatc gtctgttaag atttatctta aaatagaata 1141 ccaccgaatg ggggttttgt caatgaaaaa atgcctcttt cgacaaattt tccatattta 1201 acaaagggca attaaaggtt gagggatttg ttgtaccttt gcgtaacaag ccaaacaaaa 1261 aagcaccctt gcgggtgcct tttgtcggtc aatattattc tgctgaggga gcagtttcaa 1321 caaactgcca agcatcaaat tcccaattct ttccgccgaa tacgaagtaa acatcgtgta 1381 cgccggtgat gttgtcaata ttgttgatga tgttggtgaa ttcgttaacg ctgaaatcga 1441 cgcttccgac ggtttcggag ttaacatcat cgagtctgat atcgatgaca ccggtgccct 1501 tgacatttgc aacgaactga gccgcaccct tggagccaaa gtcaacgccc ttaactctga 1561 tccagtcacc gtctttaatg tcggtaacga taacatcgcc gacattgccg atcatttggg 1621 tcataattcc tgactgattg cagattgttt cagcttcgtt gtgaacataa ggatcaagat 1681 attcaacctg ttcaacgccc gttgcggtta tgtaggtatg aggaatgttg acgtttcctt 1741 cttcgtcaat ggtaatgtcg atcttgtcga tcattaccga gcgatagctc ttatccattc 1801 ccatatgctt ttcaagaagt cttgagtggg aaataatata ccaattgccc ttgaattcct 1861 gcaaatgtgt atggttgttg ccccaaagaa gatttgattc gccggggttt ctcaaatacc 1921 agcccacgta ggtgtaggga cccatcggat cgtctgcaac catgtattcc atagcgcagg 1981 taggagactt tgtatatcct tcaacgggat attcctttgc gctccagtcg ccgttgaatg 2041 tataaacata cttgtcgccg atcttgttca tctcgcttgc ttcgaagaag taaggtgcct 2101 cgcaaacata aggtccttca acaatattca aatcatcgtc aagctagaat ataccgcttc 2161 ccttggatac gccgggaacg tcgctgtcct tgtgggcacc gcaagcaacg tagatagtgc 2221 cgtcatcatc acacaaagca ccggggtcga agcagtttga caaaatcccg tttacttcgg 2281 gcatagtggg aacgatcacg ggtctgccca aaggatctgt ccaggggcca aggggatcgg 2341 tggctgtcag aacgccggtt gaccagccgt tttcggcata gaagaggtag aagtgtgtaa 2401 gtccgtcatc ttcaactctc ttaacaatgg aaggtgccca agaggtgttg attctgggag 2461 aagcagcctt aacgtcgata tatccgtgat cggtccagtt tacaaggtcg gcagaagaga 2521 aaacattcaa cgagtggatg tcgccgaagc cgttcaccgc atacggagtt gccagatact 2581 gctgatcgtc gttggttgag aaaacgtaaa ctctgccgtt atattcaaca gaggtcggat 2641 ctgcggaaaa tcttgtggat acaagaggat tcatctcgtc atttggtttg atagaagctc 2701 cgggctctgc ctcgacgcga actttttccg acaaagaaac aattgcattc atattaaggt 2761 cctccttttc gctaacaggt gtctgattag tattcttgcc tccgtcaaca gttgactgat 2821 tgctacagga cacaagcaag gtcataagca tcagagatgc caacaggata catatgatct 2881 ttttcaaatt cataaacaaa cctccttgat agtttagcgc aattatacca ccatataggc 2941 gtaaaagtca atgagatatt ctgcacgcaa aatactacaa tgtgcaagct tttgcaaaag 3001 aacacttttg ccgttaggta tcagcgggtt ttagtgcttt acatttttgc aaaagtcggt 3061 ataatggata acatacattc aaacaagcaa gaggttaagc caaatgagca acaatcacgc 3121 tggccacaga ggccgactga aaaagaaatt cattgacggc ggattggaaa atttctatga 3181 gcaccagatt cttgagctga ttttgtttta ttccattccg caaggggaca ccaaccccac 3241 tgcccacaga ctcatcagcc gtttcggttc gctgatgggt gttttgaatg cagatcatga 3301 agagcttatg acagttaaag gtgtcggaaa tgccactgca acatggctga aagctctgca 3361 atatataacc tccaccgact tgtttgaccc ttgcgacgtt gtttgcgcca cctctgtcgg 3421 cggaatgctc gaattcttca aatatgaatt tgcagaatgc aacgaacaaa cagcaagact 3481 catttgcgct gatgattgta tgaatatggt cgaggtcatt gagtttgtcg gatatactct 3541 cgacagaaag cttgacagga gaattttgga agaggtgctc agagcaaatt gctcccaggt 3601 cataatggcg atataccgcc cgacaaagcc agcgtttccc accgatgaag acaaagcctg 3661 tggcagagca cttcgcgata tattcgcagc gtttaacatt gatttttctg agcttgccat 3721 aattgatcgg gaatatgtca gctatatttt ccgtcagatg cgtctgccga tactctggca 3781 cattaaaaac ggcgagcttt tgcgtgatgg catcaaaaga agaaaagtca gcttcgacaa 3841 gccgaaatct gcggctaaaa agcataactg cacataataa gagaatgcgg tcacctgccg 3901 cggtgggctt tgcgccccga aactcatttt gcttttcgcc ga // LOCUS sequence076 3912 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence076 VERSION sequence076 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3912 /mol_type="genomic DNA" /organism="" /note="sequence076" CDS 779..2689 /product="1,4-alpha-glucan branching protein GlgB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010880434.1" /transl_table=11 /codon_start=1 /translation="MPLNNKTPIAEQIKLFLEGRNYDCFDLFGAHTLDDGNTAFRVWAP NARSVSVVGDFNDWNENANRCERIEGGIWQCIVGGLKEFDVYKYRVEGYDGSIRLKADP YGCHMETKPATGTKLFDISGYTWNDSAWLKKRARTSPYNSPMNIYEVNLGSWRKYPDGN FFSYDKLADELIAYVKDMNYTHVEFMPLTEYPFDGSWGYQVIGYYAPTSRFGTPEDFMK MVDKFHQAGIGVILDWVPAHFPKDEAGLYEFDGTPCYEYYDELKREHKGWGTRVFDFGR REVRSFLISSALYWLEKYHIDGLRVDAVASMLYLNYDRPDGQWRPNINGGCENLEAVEL LQMLNTAVFARNPDVLMIAEESTIWPGVSKPVYTGGLGFNFKWNMGWMNDITKYMSLDP IYRSHHHNQLTFSLMYAFSENFILPISHDEVVHGKCSLVNKMPGDTDMKLRGSKAFLAY MMAHPGKKLLFMGSEFAQFREWDYENGLEWFMVEDYENHRNFQTYSKNLNGFYLKNSPM WDDDCSWEGFKWISADDYTQSIIVFRRIDRKGNEIFAVCNFAPVDRKDYRFGVPYMGKY TEVFNSSSVDGSPYANAPVSAERIPMHGLDQSIAVDIPGLSVMFFKVRKTPGRKPKLRT E" /locus_tag="LOCUS_3730" /gene="glgB" /note="WP_010880434.1 1,4-alpha-glucan branching protein GlgB (Aquifex aeolicus) [pid:51.7%, q_cov:95.9%, s_cov:97.8%, Eval:2.1e-183]" /note="MGA_461" ORIGIN 1 aagcccaact atgttgctga tgtatataca acctgccgtt ctgcatctgc gggcgatgtt 61 tccggcgatg ttttctgcag gttccaaagc ggaagattta gctattttat actctgcgac 121 ggcatgggca caggtaagcc ggcatacaat gctgcccgca agctttctga gtgtataaaa 181 gacttgattc tcggcggaat acctatcgaa gctgcgcttt cattagcttc gcctgttttg 241 cgaacatccg gtattgacga atgcttcgca actcttgacc ttgtgcggct cgatactttt 301 aacggcacag tagtgttcca taaagcaggt gccgccgaca gctatatcct cggagagaac 361 ttccaaactg tcccgtcggg aggatatcca atcggaatct tcgaccgatg ctatacaaca 421 cagactgaat ttgacctttc cgagggaggt gagatagtca tctgttctga cggcgcagat 481 cttgataaat caaagattca acgatctata gcacttgccg atacctctga tgaattggcg 541 gaatcgctcc tcgattcaga gggaaattcc aacgattttg ctcattgtga cgatgctttt 601 gtggcagtaa taagaattag caaggcgaag taaaaatttc ccgtacattc tgcacaaaac 661 tacgtgttgg aaaatgtgta aattctaaga atttgtcaaa ttttgttgca tatttcattc 721 gattttgata caatataaat gttattatcc gatactatgt ttgaaaggag tgcataaagt 781 gcctttaaat aataaaacgc ctatcgcaga gcagatcaag ctgtttttgg aaggcagaaa 841 ttatgactgt ttcgaccttt tcggtgcaca tactcttgac gacggcaaca ccgctttcag 901 agtctgggct ccaaatgcgc gaagcgtttc cgtagtcggc gacttcaacg attggaatga 961 aaacgccaac cgttgtgaac gcattgaagg cggaatctgg caatgcattg tcggcggtct 1021 gaaagagttc gatgtataca aatatcgcgt cgaaggttat gacggctcaa ttcgcctcaa 1081 agctgaccca tacggctgtc atatggaaac caagcctgca acaggcacca agcttttcga 1141 catttctgga tatacttgga atgactcagc gtggctaaaa aagcgtgcaa ggacttcgcc 1201 gtataacagc ccaatgaata tctatgaagt caacctcggc tcgtggagaa aatatcccga 1261 cggcaacttc ttcagctatg acaagcttgc cgatgagctc atcgcatatg taaaggatat 1321 gaactataca cacgttgagt ttatgccttt gaccgaatat cctttcgatg gttcttgggg 1381 ctatcaggta attggatatt atgctccgac atcccgcttc ggcactcccg aagactttat 1441 gaagatggtg gacaaattcc atcaagcggg aatcggtgtg atccttgact gggtacctgc 1501 ccatttcccg aaggatgaag cgggtctata tgaatttgac ggaacacctt gctatgagta 1561 ttatgatgaa ctcaagcgcg agcataaagg gtggggaaca agagtgtttg acttcggcag 1621 acgtgaagtt cgctcattct tgatttccag tgcgctctat tggctcgaaa aatatcacat 1681 tgacggcttg cgtgtggatg ctgtcgcttc gatgctatat cttaattatg accgtcccga 1741 cggtcagtgg cgccccaata tcaacggcgg atgcgaaaac cttgaagctg ttgaactgtt 1801 gcagatgctc aataccgctg tgtttgcaag aaaccctgat gtgctgatga ttgccgaaga 1861 atcgaccatc tggccgggcg tttcaaagcc tgtatataca ggcggcctcg gcttcaactt 1921 caagtggaat atgggctgga tgaacgacat aaccaaatat atgtctctcg acccaatata 1981 ccgctcgcat catcacaatc agcttacttt ctcgctgatg tatgctttca gcgaaaactt 2041 catcctgcct atctctcacg atgaggtcgt tcacggcaaa tgctcgcttg tcaacaagat 2101 gcccggcgat accgatatga agcttcgcgg ctccaaagca tttttggcat atatgatggc 2161 gcaccccggc aaaaagctcc tgtttatggg ttctgagttt gcccagttca gagaatggga 2221 ttatgaaaac ggtcttgaat ggtttatggt tgaagattat gagaaccacc gcaacttcca 2281 gacctattca aagaatctca acggcttcta tctcaagaat tctcccatgt gggatgatga 2341 ctgctcttgg gaaggcttca agtggatatc tgctgatgat tacacccagt cgataatcgt 2401 tttcagacga attgatcgca agggtaacga gattttcgca gtttgcaact ttgcacccgt 2461 tgaccgcaag gactatcgct tcggtgtgcc ctatatgggt aaatacactg aggtgttcaa 2521 ctcctcttct gtcgatggct cgccttatgc aaacgctccc gttagcgccg agagaattcc 2581 gatgcacggc cttgaccaat caatcgctgt tgatattccc ggccttagcg taatgttctt 2641 caaggtcaga aagacccccg gcagaaaacc caaactccgt acagaataac ccgatttttg 2701 ggatattgta atataattga aaggaagacg taaaatgtac aacaagaaag aatgtgtggc 2761 aatgcttctt gcaggcggac agggttcccg tctttatgct ctgaccaaga atgttgccaa 2821 gcccgctgtt ccttacggcg gaaagtaccg catcatcgat ttccctctct ctaactgtgt 2881 caactccggt atcgacacag tcggcgtcct cacccagtat cagcccctcg agctcaacga 2941 ctatatcggc aacggccagg cttgggatct cgaccgcatc aacggcggcg ttcacattct 3001 gcctccttac cagtccaact cgggcgcaca gtggtatgaa ggcaccgcta acgctatcta 3061 tcagaacctt tccttcatcg acagatacga tcctgaatat gttgtgatcc tctccggtga 3121 ccatatctat aagatggact actccgatat gctcaagttc cacaaggaaa agggaagtgc 3181 ctgcaccatc gcagtcatcg acgttgagct tcacgaagca agccgtttcg gtattatgtt 3241 tgccgacaat gaagacagag tttatgactt cgttgaaaag ccaaaggagc ccaagtccac 3301 tttggcatct atgggtatct acatattcga ttatcccgtc ctcaagaaat acctcattga 3361 aaatgagatg gatgaaaccg caaccaagga ctttggtaaa aacatcatcc ccgcacttct 3421 tgagaatgat gaaaagatat atgcttaccg ctttgaaggc tattggaagg acgttggtac 3481 catcgactcc ctttgggaag caaatatgga ccttctcagc cctactgtaa ccctcgatct 3541 ctatgatacc aactggaaga tattctccag caacatctcc cgcgcacctc atatcatcgg 3601 caagaatgcc aagattcaga actcaatggt aaccaacggc tgcgttatcg acggcagcgt 3661 tgaattctca atgatctccg gcggcgtaac aattgaagac ggtgcagttg tcaccagctc 3721 gattcttatg cccggtgcaa ccgttaagtc gggcgctgtt gttgaatacg ctattgttgg 3781 cgaaaacagc gttgtcgaat caggtgcaca catcggcgca agccctgaat ccatcgaaaa 3841 caaggacgag tggggcgttg cagttgtcgg tcatggagtg actgtcagcg gcgaagcagt 3901 tgttttgcct aa // LOCUS sequence077 3904 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence077 VERSION sequence077 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3904 /mol_type="genomic DNA" /organism="" /note="sequence077" CDS complement(633..1430) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MELFKYETHLHTAQGSGCATWRGSLIVERLKELGYSGAFVTDHFF NGNTAVDRRLPWDIKVHLFCQGYEEAKKRGDEIGFDVWFGWEFAMHGTEFLTYGLDKQF LLEHPEIMEMPLERYADFIHQHGGFVVHAHPFREAGYIPSIRLYPRCVDGAEAINCGNS PDANERASWYCDSYGIPKTGGTDGHHLWNYNSGGIALDEKLTCAHDYLERLRAGRITKI LEPSNVAHLPWPENAWESCFRNSVDLLPDDLKERAKKFYEEIG" /locus_tag="LOCUS_3740" /note="MGA_464" CDS 1625..2902 /product="SGNH/GDSL hydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011035375.1" /transl_table=11 /codon_start=1 /translation="MRIFKRIVCASLGALLLTSCLCSCAKEEEVIIPDEAGWFATWAAA SMAPVGDEFPLQGLRNNTVRQQVKVSIGGNKLKLTFSNEYGIIPLVIDSVHVAKLLYAG SPNIDTSTDTVVTFNGGSESVTIPEGQTVTSDEIDFNFEALDLLAVTSCFGDYTGGEIT CHSDGGCTAWVTEGNHVGDETFSVMSFKASYYYLCRMDTYAEAGTKTVVCIGDSITDGA CCTFNGFDGWVEVLSQSMQSDPRTQNISVVGTGIGGNCLLHDGWGVSVKNRFERDALNV PGVRYVCVMIGINDIGGAQADISDELIAGYKELIAAAHAKGIKVYACTLTPVKGNFYYS ELHEKIRKTVNEFVFSSNSGFDGVIDMSNAICREDDPEQMKDEYTCGDYLHPGSKGYEA MGKEAYYTLTEIWEAAAKAAEEENKR" /locus_tag="LOCUS_3750" /note="WP_011035375.1 SGNH/GDSL hydrolase family protein (Xanthomonas campestris) [pid:32.7%, q_cov:94.8%, s_cov:99.0%, Eval:3.8e-47]" /note="MGA_465" CDS 2994..3848 /product="sulfide/dihydroorotate dehydrogenase-like FAD/NAD-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393027.1" /transl_table=11 /codon_start=1 /translation="MYKIVNKKVLNPTVVMMDILAPLVAKKAQAGQFIILRVDDEGERI PLTVAGYDRDAGTVKIIFQVVGATTEKLSHKNEGEYIEDFCGPLGVATKLDGLKKVCIV GGGVGCAIALPIAKALKEMGASVTSIIGFRSKDLLILEDEFKACSQKLYVMTDDGSYGE KGNVCVPLNRMFENGERFDEVIAIGPIIMMKFVVEATRPTGIPCTVSMNPIMIDGTGMC GGCRLTLIRDGKRVIKFACVDGPDFNGYEVDFDEAMSRGSMYRDHERHAYEKTCNLFNK EDK" /locus_tag="LOCUS_3760" /note="WP_011393027.1 sulfide/dihydroorotate dehydrogenase-like FAD/NAD-binding protein (Moorella thermoacetica) [pid:52.4%, q_cov:94.7%, s_cov:95.0%, Eval:2.7e-74]" /note="MGA_466" ORIGIN 1 aaagcttttc ttcaagcaca attccgcctg ctttatacca ccacaaatga tgagcatcgc 61 ttccgcctgt tttgggaagc ccgcaggaat cggcaaacca gattgctctc tcgttggcaa 121 tcgggtcgtt tccgcaattt attgcttcaa ttccgtcgac gtgcttgaaa tatatatgca 181 agccggaaat atatccccta tccctgaatg ggtgcgcctg caccacaaac cagccgcatt 241 tatgaaccag gtcgatgtat tcatcgggtg ccatatgaat cacattcggg tgatttaaaa 301 ggaactgctt gtctaatcca tatgtcaaaa agtcagcaca attccaggaa aattcccaac 361 cgaaccaaac gtcaaagcca agctcgtcgc cgatcttttt tgctttttca tatccctgac 421 agaaaagacc cacctgaata tcccaaggca gacgtgtatc aacagatgta ttgctgttta 481 agaaatggtc tgttacaaag catccgctat agccgagctc gtgcaatctt cttacagcaa 541 cttctgcatt ccagttgccg caggcagagc cttcgcttgt gtgcaaatgc gtttcatatt 601 tgaataatgc catatattat attcagctcc gatcaaccga tttcctcata aaatttcttt 661 gctctttcct ttaaatcatc cggcaggaga tcaacgctgt tgcggaagca gctttcccat 721 gcgttttccg gccaaggtaa atgagcaaca tttgacggtt ccaatatctt tgtgattcgt 781 ccggctctga ggcgctcgag atagtcatgc gcgcaggtga gcttttcatc caaagctatt 841 cctcccgagt tgtagttcca gaggtggtgg ccatcggtgc cgccagtctt tggaattccg 901 taagagtcgc aataccagct tgcgcgctcg ttggcatcgg gtgaatttcc gcagttgata 961 gcctctgcgc cgtcaacaca tcggggataa agtcttattg aaggaatata tcccgcttcg 1021 cggaagggat gagcatgaac gacaaagccg ccgtgctgat gaataaagtc agcatatctt 1081 tcaaggggca tttccataat ttcggggtgc tccaaaagga actgcttgtc aagaccgtag 1141 gtcaggaact cggtgccgtg cattgcaaat tcccagccga accaaacgtc aaagccgatt 1201 tcatcaccgc gcttttttgc ctcctcatat ccctggcaga aaaggtgcac cttaatgtcc 1261 cagggaaggc gtctgtcaac agcggtattg ccgttgaaga agtggtcggt aacaaatgca 1321 cccgaatagc caagctcctt gaggcgttcg acaatcaggc ttccacgcca ggttgcacag 1381 ccggagccct gagcagtatg taagtgggtt tcatatttga acagttccat ttgtttaact 1441 ctccttttaa agaaaaatgc tatcagaagc tattatttac caaataccca gatataatca 1501 ttatactatt tgaaattata agtgtcaaca aaaacagatt ttataaaggc tgtactttac 1561 atactctgtc ggaaatgcta taataattgc atattatgtc atatttgaaa ggaactcccg 1621 taatatgaga attttcaaga gaattgtttg cgcttctttg ggcgcgcttt tgcttacatc 1681 ttgcctttgc tcctgcgcta aagaggaaga ggtcatcatt cccgacgagg caggctggtt 1741 tgccacatgg gcagcggcat caatggcacc cgttggcgat gaatttccct tgcagggact 1801 cagaaacaac accgtccgcc agcaggttaa ggtttctatc ggcggcaaca agcttaaact 1861 gacattttca aacgaatacg gcatcattcc ccttgtgatt gattccgttc acgttgcaaa 1921 gcttttatat gcaggaagcc ccaatattga cacctcgacc gacacagttg tgaccttcaa 1981 cggtggcagc gaatcggtga cgattcccga gggccaaact gttacatcgg acgaaattga 2041 tttcaacttt gaagcgcttg atcttttggc tgtaacctcc tgcttcggag attatacggg 2101 cggagagatc acctgccaca gtgacggcgg atgcacagct tgggttacag aaggcaacca 2161 tgtcggcgat gaaacatttt cagtaatgag ttttaaagca agctattact acctctgccg 2221 aatggataca tatgccgagg cgggaacaaa gacagttgtc tgcattggtg actcgattac 2281 cgacggcgct tgctgtacct ttaacggctt tgacggttgg gttgaagttc ttagccagtc 2341 gatgcaatct gacccgagaa cgcaaaatat ctccgttgtc ggaacgggta ttggcggcaa 2401 ctgcctcttg cacgatggct ggggagtttc tgttaagaac agatttgaac gcgacgcttt 2461 gaatgtcccc ggtgttcgct atgtctgtgt gatgatcggc atcaacgaca tcggcggagc 2521 acaggcagat atttccgatg agttaattgc aggctataag gagcttattg cggcggcaca 2581 cgcaaagggt attaaggtat atgcttgcac gctgacccct gttaagggca atttctatta 2641 ttctgagctt cacgaaaaga taagaaagac tgttaacgag ttcgtgttca gctctaattc 2701 cggatttgac ggcgtaattg atatgtccaa cgccatctgc cgagaggatg accccgagca 2761 gatgaaggat gaatacacat gcggcgacta tctgcacccg ggttcaaagg gatatgaagc 2821 aatgggcaag gaagcatatt ataccctgac cgaaatttgg gaagcagcgg caaaagctgc 2881 cgaagaagaa aataagcgtt gacttattgt aacctgaaga gtataattta gttgaaaagg 2941 gggctgtgca gataatcaca gtcccctaaa taacttgtcg aaggtgcggc actatgtata 3001 aaatagttaa caaaaaggtt ttaaacccca ccgttgttat gatggatatt ttggctccgc 3061 tggttgcaaa aaaagcacag gcgggacagt ttataattct tcgtgtagat gatgagggcg 3121 agcggatacc cttgaccgtt gcgggatatg accgcgacgc aggaacggtt aaaataatct 3181 ttcaggtcgt cggcgccacc accgaaaagc tttcgcataa gaacgaggga gaatatattg 3241 aagatttttg cggccctttg ggcgttgcaa caaagctgga cggactcaag aaggtctgca 3301 ttgtgggcgg cggtgtcggc tgtgcaatcg ctttgccgat cgccaaggcg cttaaagaaa 3361 tgggcgcttc ggttacaagc ataatcggtt tccgctcgaa ggacctgctt attttggagg 3421 atgaattcaa ggcctgctcg caaaagcttt atgttatgac cgacgacggc tcatatggcg 3481 aaaagggcaa tgtctgcgtg cctttaaaca gaatgtttga aaacggcgag cgatttgacg 3541 aggtcatcgc catcggtccg atcataatga tgaaatttgt tgttgaagca acaagaccca 3601 caggtatccc ctgcaccgtt tcaatgaacc cgatcatgat cgacggcacg ggaatgtgcg 3661 gcggatgccg attgacactt attcgggacg gcaagcgggt aattaaattt gcctgtgttg 3721 acggtcccga tttcaacggc tatgaggtgg attttgacga ggcgatgtca agaggctcga 3781 tgtatcgcga tcatgagcgc cacgcatatg aaaaaacctg caaccttttt aacaaggagg 3841 ataagtaatt atggcaaata tgtcccctgt taaaaatccg atgccgacac tggatgccaa 3901 tgca // LOCUS sequence078 3881 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence078 VERSION sequence078 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3881 /mol_type="genomic DNA" /organism="" /note="sequence078" CDS complement(882..1766) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MADYKKRWGDRKDARLIRKLDSMHVIMPYTGPQRTANEAVCVEEI DCTALEAYVEKLNANNPEFKYTFFHVICAAIAKTMVLRPKMNYFYSGHRLYEKDDIVLS FVVKRQFTDDSHEAMAIIKCEKEGVSPLDDIYGKIKKFVTSVRKEGNNGGTADIMDILQ YLPRWLLKAFFGTLRWLEYHGWYPKGLMKEDPYYSSCFISNLGSIKMHADYHHLADWGT NSFFVIIGEKKPTAVFNADGTYEMKNVLKLGITVDERIADGVYFAKTIKIVKKLLANPE LLELPVETPVELD" /locus_tag="LOCUS_3770" /note="MGA_468" CDS 1995..3251 /product="glycoside hydrolase family 27 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_015776921.1" /transl_table=11 /codon_start=1 /translation="MVAKNPPLGWNSWDCYGASVDEATVKANADYMAKHLKQYGWEYIV VDIQWYQPTATSHSYEPFADLVMDEYSRLLPAPNRFPSSADGKGFAPLAEYVHSLGLKF GIHIMRGIPRQAVFMNAKIKDSKYTARQVAQYNNICYWNPDMYGTDTNCPGAADYYNSI FELYASWGVDFVKVDDICRNHNNEGEIKLIRNAIDNCGRDMVLSLSPGPARIEQAEFLK ENANMWRITDDFWDRWELLYDMFTRAETWCNHAGAGHWPDCDMLPIGPINQDYSKDNYS KFTHDEQQTMMSLWCMVRSPLIIGGEMNGFDDFTMSLLTNEELLNIERDTHCAHMVTRR VVDGNEQIIWLAPAKDASVNYVALFNAGESVCDITVDIARLGIKPTNAYDIWNFTTEAV GDKLTATVNPHGVRLFKLL" /locus_tag="LOCUS_3780" /note="WP_015776921.1 glycoside hydrolase family 27 protein (Brachybacterium faecium) [pid:46.5%, q_cov:90.4%, s_cov:83.3%, Eval:5.3e-94]" /note="MGA_469" ORIGIN 1 atatgtggca ggagtgaact tgggcaccaa aatacatctg ccgccgttgg caagcatcga 61 atgcacggtt acacccaatc caaagccgtg gaacatcggc attacagcca gcatcttgtc 121 gccgggggtg aaaatggggt tggttgcaat gatctgcgct gccaaaacgt tgaaattata 181 gcttgaaagc ataattccct tggtggtgcc tgttgtgccg cccgaataaa gcaaaaccgc 241 catttcgtct ttcgacttct ttgcaatata ttcgcccgtg tgggtctttg cgcccttaat 301 gaaatcgttc cacttaacaa tgggtgcatt ttccggcaag ggagcaatct ttcttccctg 361 ggttaaagca tatcccagct tcattatggg agaaagggcg tccttgatgg atgcgatgat 421 aaggtggggc aggttaacgt tttctctgat cgcttcaaac ttgccataga actggtcaag 481 tgtcagcgcg caggtcgatt ttgaaacctt gagataaaac tcgatctcct tttcactcga 541 aagggggtgg atcatatttg caacagcgcc cacaaccacg caagcataga acataataac 601 ggtctgggga cagtttggca tacagatggt aactctgtca tcctgcttga ttcccaaagc 661 cttcaaagcc ttggcgcatt cgtgtacctg tgcgcggaag tccttatact ttgtggtctt 721 gcccataaag tcaaatgcaa tataatcggg atatttcttt gcaatgtcct caacagagtc 781 ccacattgag ccctcgtgat attcaagagt gtggggcaca tcgccgtagt tattaaacca 841 gggcgtttta acttcattcg ccatagtgat cagttccttt ctcagtcgag ctcgacggga 901 gtttcaacgg gaagctcgag cagctctggg tttgcaagaa gcttcttgac aatctttatc 961 gtctttgcaa aatatacgcc gtcggcaatt cgctcgtcga cggttatgcc gagcttgagc 1021 acatttttca tctcatatgt gccgtccgca ttgaaaacag cggtgggctt tttctcgccg 1081 atgattacaa agaaggagtt tgttccccag tcggcaaggt gatgataatc ggcgtgcatt 1141 ttaattgagc cgaggtttga aatgaagcag ctggaataat atgggtcttc cttcattagc 1201 cccttgggat accagccgtg atattcaagc cagcgaaggg tgccgaaaaa ggctttcaaa 1261 agccagcggg gcagatactg caaaatatcc ataatatctg ctgtgccgcc gttattgcct 1321 tcttttctta cgctggtgac aaactttttg atcttgccgt aaatgtcatc caaaggcgaa 1381 acgccctctt tttcgcattt gataattgcc attgcttcgt gggaatcgtc ggtaaactgc 1441 cttttaacaa cgaagctcaa aacaatatcg tccttttcat aaagtctgtg acccgaatag 1501 aaatagttca tcttgggtcg caagaccatt gtctttgcga ttgccgcgca gataacgtgg 1561 aaaaatgtat acttaaattc gggattattt gcgtttaact tttcaacata tgcttccaaa 1621 gcggtgcagt cgatctcctc aacacagaca gcctcgtttg cggttctctg cggtcctgta 1681 tagggcataa tgacgtgcat cgaatcgagc ttacgtatta aacgggcatc cttgcggtcg 1741 ccccatcttt tcttataatc agccatatta aactcccctc atttcccctg ctcggcaaat 1801 ttgcgacagg tttaccttaa cagtatactc aaaatatgtt gagctgtcaa caaatttcga 1861 caaaattgtt agttgtcatc ctataggtaa aatataaaac cttcaggaaa aataagagca 1921 cattttaata ttgactgagc acggaattat gatataatca aattaacaaa cttattgatt 1981 ggagttgttg atatatggta gcaaaaaatc cccctttggg ttggaacagc tgggactgct 2041 atggtgcttc ggttgatgaa gcaaccgtca aagcaaatgc cgactatatg gcaaagcact 2101 taaagcaata cggctgggaa tatattgttg tggatatcca gtggtatcag ccgacagcta 2161 catctcattc atatgagccg tttgcagatc tggtgatgga tgaatattca cgccttctgc 2221 ccgcacccaa ccgtttcccc tcatcggcag acggaaaagg ctttgctcca ttggctgaat 2281 acgttcactc actgggactt aaattcggca ttcatatcat gagaggtatc ccccgtcaag 2341 cggtatttat gaacgctaaa atcaaggaca gcaaatatac tgcacgtcag gttgctcaat 2401 ataacaatat ttgctactgg aaccccgata tgtatggaac cgatacaaat tgccccggcg 2461 cggctgatta ttataactcc atcttcgagt tgtatgcttc ttggggtgtt gactttgtta 2521 aggttgacga tatctgccga aaccataata acgagggcga aattaagctg atccgtaacg 2581 ccattgacaa ttgcggaaga gatatggttt tgtccctttc tcccggacct gcaagaattg 2641 aacaggcgga attcttgaag gaaaacgcga acatgtggcg catcaccgac gacttctggg 2701 atagatggga gcttttgtac gatatgttca caagagctga aacctggtgc aaccatgcag 2761 gtgcgggaca ttggcccgac tgcgatatgc ttcccatcgg tcctatcaat caggattatt 2821 cgaaggacaa ctattcaaag tttacccacg acgaacagca aacaatgatg agcctttggt 2881 gcatggtgcg ttctcccctc attatcggcg gcgaaatgaa cggctttgat gatttcacaa 2941 tgagcctttt gaccaacgaa gagcttttga atattgaacg cgacacccac tgcgcacaca 3001 tggtcacacg cagagtcgtt gacggcaacg agcagatcat ctggctggca cccgccaagg 3061 atgcaagcgt aaactatgtt gcactgttca atgcaggtga atcggtttgc gacattaccg 3121 ttgatattgc gcgtctcggc atcaagccca ccaacgctta tgacatctgg aactttacaa 3181 ccgaagcggt tggcgataag ctcaccgcaa cagttaaccc ccacggcgta agacttttca 3241 aacttctttg aaaataaaac aaaaaaggaa gcatgcgagg ctgcttcctt ttttgcctta 3301 aattataatg ttccaaacaa atgaacttca tatttatatt ataaacattt tatgcattgg 3361 ccacaatgat gaattgaaag ggaaatattg atttttcctc attagccaag gagaatttat 3421 gatcaagccg acatattttg accgtttcaa gtgccttgca ggcgcttgcc ccgattcctg 3481 ctgtaaagct ggctgggaga taaccgttga tgaaaacgct tttgagatat attccgcatt 3541 agaaggagat atcgggcgaa agttccgcga aaaagtatgc gagggtgcgg acggcgacag 3601 aattttcaag ctgaatgagc ataaagtctg cccgttttat aactgcgacg gactttgcga 3661 tctgtatatc gccacaggcg gaaagatgac tgaaatatgc caaaactatc ccagatttta 3721 cgaggaattt gacggattca gcgaggcagg gatttccgtt tcctgtcccg aggcaataag 3781 attggttttg gacgccgagg agagcgcata tgacctgccc tatgaatatt cagaggacga 3841 gatgcttgat gtgctgataa acgagcgcag gttggcattt g // LOCUS sequence079 3875 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence079 VERSION sequence079 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3875 /mol_type="genomic DNA" /organism="" /note="sequence079" CDS 1144..1914 /product="type III pantothenate kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005809761.1" /transl_table=11 /codon_start=1 /translation="MVFTVDVGNTNIVLGAFDEQDNLLFTSRITTDHSKTADQYAITFK DILLLYDIDKSGFKGAIISSVVPSLIPVLKEAILRLMGIHALVVGPGIKTGLNIRLENP AILGADLVCGAVGALAKYQPPMIIFDFGTATTISAIDKNGAFLGGSIIPGVNVSLKALS NSAALLQDISAGGNVSVIGTNTPDSMRSGSILGNASMMDGMIARYREILGENAICIATG GLAPTIVKYCKTDGIILDNGLLMDGLYTIYQKNR" /locus_tag="LOCUS_3790" /EC_number="2.7.1.33" /note="WP_005809761.1 type III pantothenate kinase (Desulfitobacterium hafniense) [pid:40.4%, q_cov:99.6%, s_cov:98.1%, Eval:2.4e-47]" /note="MGA_472" CDS complement(1956..2249) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRKFLLIMISLICLSLLVGCGGKNNNDNNNVTPGTSATLGTSSAV NDGVNSVVTDNTNIIQGGVSMVESGMDNVMDGVESGISDAEDAMEPKGRNMR" /locus_tag="LOCUS_3800" /note="MGA_473" CDS complement(2340..2741) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIRVKSIQRDGNDINETEIITKGTFEKIDSGYLLKYKETDETGYD GANTSLKILDGSKIELLRTGSVSSELIIEEGKKNHCHYGTPYGDMVVGVQGKRVETSLT DIGGQVKASYVMDINAMFMGDYDLTIDVK" /locus_tag="LOCUS_3810" /note="MGA_474" CDS complement(2775..3584) /product="glutamate racemase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012545640.1" /transl_table=11 /codon_start=1 /translation="MNKFDAIGVFDSGIGGLTAVKELAKLLPNENIVYLGDTARVPYGT KGRETIIKYAKQDAEFLARHNVKMIIAACGTVSSVASSEMSEMGHLYTGVIEPAVKAAV NVTKNGKIGVLGTNATVRSGSYEALIHKLSPESEVYSKACPMFVPLVENGYVNIDCEPT LAIAKEYLEPLKEKGIDTLILGCTHYPLLSGIIAKIMGDDVKLISSGGEAGKYAKELLA ENGLLNDSTEKGKISLYCTDSAELFLENAKHFLEGLDDFEVKSASLD" /locus_tag="LOCUS_3820" /gene="murI" /EC_number="5.1.1.3" /note="WP_012545640.1 glutamate racemase (Thermodesulfovibrio) [pid:49.4%, q_cov:92.9%, s_cov:91.9%, Eval:5.2e-64]" /note="MGA_475" ORIGIN 1 tatatagctt ataatcggga cgaattgaat gaatcagcag cggcagggcg aaaatatccc 61 caaccctatg atatagcgcg atattgagct ttggcgcttg ttcgcttatt gtcttcttcg 121 cgccgtcaat cgtttcaagc tctgcgccct caacatccat tttaatatat gtgcacttat 181 catctttaag aagcgaatcg acacaaacgg caggagtttc aattccctgc tcgctcaaat 241 gtggcattct gccgccgccc tttgagaaga taagagtagt atcgctcgac cagcttgccg 301 cgttgatgag cgaaatgttt tccatcccct cggcatattc ggaaagcttg cggaaattgc 361 gtttgttcgg ctcaacggcg taaattcggc ggtatttgcc tttggtgtgc gccaaaagct 421 cccgcacggt atcgcctgta tatgcaccga ggtcaacata aatttcatcg tcgttggggc 481 gcaaaatagt ttcatatgct tcgtcgggtg tggtctcgca ggcttttaaa actgcgatat 541 cgcccgttat tttaaactcg attacagatt tgaacacctc gcgggattta tcatccgcca 601 aaagcgaata aaccctttca agctcgtcaa agtgcgaaag catatactcc ttggtgaaaa 661 gcccctcgcc gattacgggc atatcgggaa caataagctc gtggcgggca gcgattgtat 721 caatcttttc aatcagctca tgatagcccg cgccgaaagc aagaacgatg atgaagtcat 781 ccaccgcttc ttcaatttcc gagagcttat gtattttatg cccgcagaag actttatcgc 841 ggacaaattc atcgcttgca aaaattcccg cacagggtat gcggtaatct tcaaatattt 901 tcagcacctt taagcatccg tcgcccatac cgtaaatgaa gataggcttt ttggcatgca 961 taaggctgta tagatatgag gtcaagtcga caaaatagtt tttgttaagc attattttct 1021 ctcccgagtg tttgttaaac atattataac ccaaaaaccg attataggca accgcccttg 1081 acttaatggg cacaaagcta taaaataata attgacaaat aaccaattga aaggaacttc 1141 gctatggttt ttacagttga cgttggaaac acgaacattg ttttgggcgc gtttgacgag 1201 caggataacc tgcttttcac ctcacgcatt acgaccgacc attccaagac cgccgaccaa 1261 tatgcaatta cgtttaagga tattcttctg ctttatgata tcgacaaatc gggctttaag 1321 ggcgcaatta tttcaagcgt tgtcccctcg ctgatacctg tgcttaaaga agccatcttg 1381 cgccttatgg gcatccacgc attggttgta ggccccggca ttaagacagg acttaacatc 1441 cgtcttgaaa accccgcaat tttgggcgca gaccttgttt gcggagcggt tggagcactg 1501 gcaaaatatc agcccccgat gataatattt gactttggta ctgccaccac catttccgcc 1561 atcgacaaaa acggcgcatt tttgggcggt tcgataattc ccggcgtgaa cgtttcgctg 1621 aaggcgcttt caaattctgc ggcgctcttg caggacattt ccgcaggcgg aaacgtttcg 1681 gtcatcggca caaacacccc cgattccatg cgctccggct cgattttggg aaacgcatca 1741 atgatggacg gaatgattgc acgctaccgc gaaattttgg gtgaaaacgc aatttgtatt 1801 gcaacgggcg ggttagctcc cactattgtc aagtattgca aaactgatgg catcattctt 1861 gacaacggtc ttttaatgga tggactttat acgatatatc aaaagaacag ataaattaaa 1921 gagggcgttc caaaaacgga gcgccctttt ttgttttatc tcatatttct gcccttcggc 1981 tccattgcat cttcagcatc gctgattccg ctttcaacgc cgtccataac attatccata 2041 ccgctttcga ccattgaaac gccgccctgg atgatgttgg tgttatcggt tacaacagag 2101 ttaacgccgt cattaactgc gcttgatgtt cccaaagttg cacttgtgcc gggagtgaca 2161 ttgttgttat cattgttgtt ctttccgccg cagcccacaa gaagcgacag acaaattaaa 2221 gatatcataa tcaataaaaa ttttctcata tactatcctt tcaagattaa agaagctcga 2281 gcttttgctc gggattagta tatgagaaat attttttcat attcgcacag caaaatttgt 2341 tatttgacat caatcgtcaa atcgtagtca cccataaaca tcgcgttgat gtccataaca 2401 tatgaggctt taacctgacc gccgatgtcg gttaaactgg tttcaacgcg cttgccctgc 2461 actcccacga ccatatcgcc gtaaggtgtg ccatagtggc aatggttttt cttgccctct 2521 tcaattatca gctcggagct tacgctgccc gttcttaaaa gctcgatttt tgaaccgtca 2581 agaattttca gcgaggtgtt ggcgccatca tatcccgttt cgtccgtttc cttatattta 2641 agcaaatatc ccgagtcgat cttttcaaag gttcctttgg ttataatctc ggtttcattg 2701 atgtcgttgc cgtcccgctg aatgcttttg acgcgaatca ttacgttttt aatttcaatc 2761 cactccgttt cctctcagtc aaggcttgcc gacttaacct cgaaatcgtc aagtccctca 2821 agaaaatgct tggcattttc caaaaacagc tcagcagagt cggtgcaata taggcttatt 2881 ttgccctttt cggtgctgtc gttcaaaaga ccgttttcag ccaacagttc ctttgcatat 2941 tttcctgctt cgccgcccga tgagatcagt ttaacatcat cgcccataat tttggcaatg 3001 atgccgctta aaagcggata atgggtgcag cccaaaatta aagtgtcaat acctttttct 3061 ttgagcggct ccaaatattc ctttgcaatt gcaagcgtag gctcgcagtc gatattcaca 3121 tagccgtttt caaccagcgg cacaaacatc gggcaggctt tggaatatac ctcagattcg 3181 ggcgaaagct tatgtataag cgcttcatag ctaccgctcc ttacggttgc attggtgccc 3241 aaaacgccta tcttgccgtt tttggtgacg ttcacagccg ctttgaccgc aggctcgatt 3301 acgcctgtat aaagatgacc catttcggac atttcgcttg aagcgacact tgaaacggtg 3361 ccgcaggcgg caattatcat tttgacgttg tggcgagcca aaaactcggc atcctgcttg 3421 gcatatttaa ttattgtttc cctgcccttt gtgccgtatg gcacgcgggc ggtatcgccc 3481 agatatacga tgttttcgtt tggcaaaagc tttgcaagct ctttaactgc ggtaagtccg 3541 ccgatacccg aatcgaaaac tccgatggca tcaaatttat tcatcagcta ttctccgttc 3601 atatttaatg ttgggaatat tatatgtgtc agtcgtccaa aatactcttt gcggggctgt 3661 tgttgaattc atcctgcaaa cgcttgcgct cgtcgatctt cttcagcaga gtcacaacaa 3721 aaaggcaaag cgcaattatg caatataaaa caatcggtag atatcgccac tcgaagctgg 3781 gtttaaaaac aacttccgtc tgttcggcaa catcaatcat ctccgcagcg gcaacgcaaa 3841 acagcactgt gcctgtggct gtgaatggca ttgaa // LOCUS sequence080 3863 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence080 VERSION sequence080 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3863 /mol_type="genomic DNA" /organism="" /note="sequence080" CDS 378..896 /product="spore maturation protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963792.1" /transl_table=11 /codon_start=1 /translation="MNIASVIIPVFVLGVFLYGLYKKVDVFGEFVSGARENIKVGFNIL PSLCALMLAVGMLRGSNALDGLVSLIAPLTEYLGFPPECAPLALLRPVSGSGALSLLEG IFKDYGPDSFIGKVASVMMGSTETTFYTLVVYFEATRVKNTRHALPCALAGDLTAAIMS CVMVRLMLG" /locus_tag="LOCUS_3830" /note="WP_010963792.1 spore maturation protein (Clostridium) [pid:43.5%, q_cov:97.7%, s_cov:97.1%, Eval:1.1e-39]" /note="MGA_478" CDS complement(1177..1944) /product="2',3'-cyclic-nucleotide 2'-phosphodiesterase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003245138.1" /transl_table=11 /codon_start=1 /translation="MKLMFIGDVVGASGCEFLGSRIRGLKQKYNVDITVINGENSATGN GITAVSCEYLTRIGADVITTGNHAFKRRESLSIFDEVEHLVRPCNYPDGVMGRGYYVLD LGRTQVAVVNLMGVVYMEPLGNPYEAMDRVLSEIGTKNIFVDIHAEATAEKKALGYYLD GRVTAVLGTHTHVQTADETVLSNGTAYITDVGMTGPEESVLGVDKVPAIEKQRLNVPVR FVEADTPCMINGVVVEFDEKTGKALKIERFIER" /locus_tag="LOCUS_3840" /gene="ymdB" /EC_number="3.1.4.16" /note="WP_003245138.1 2',3'-cyclic-nucleotide 2'-phosphodiesterase (Bacillus) [pid:46.7%, q_cov:99.2%, s_cov:96.6%, Eval:1.2e-64]" /note="MGA_479" CDS complement(1951..2697) /product="tRNA 2-thiocytidine(32) synthetase TtcA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435803.1" /transl_table=11 /codon_start=1 /translation="MQKMLGYMRKAITEFDMIQNGDKIAVGVSGGKDSLVLLKGLILLR RFIGIDYNIVAITLDPQFGGIEGDYSAVQRLCDEHGIQYILERTHIGEIVFDIRKEPNP CSLCARMRRGALHDAAKAAGCNKIALGHHFDDAVETFLMNLFVEGRIGCFAPKSYLSRK DLWMIRPMVFAPEAEVRRAANRANLEVVKSKCPADGHTKREEMKEFIKERERQDKGFAD RIFGAMRRANVDGWGFPTIPEDEETE" /locus_tag="LOCUS_3850" /note="WP_003435803.1 tRNA 2-thiocytidine(32) synthetase TtcA (Clostridioides difficile) [pid:48.5%, q_cov:93.1%, s_cov:93.0%, Eval:1.3e-58]" /note="MGA_480" misc_feature complement(3167..>3863) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003357375.1:NCS2 family permease" /note="WP_003357375.1 NCS2 family permease (Clostridium botulinum) [pid:43.4%, q_cov:88.7%, s_cov:47.0%, Eval:8.7e-43, partial hit]" /note="MGA_481" /locus_tag="LOCUS_3860" ORIGIN 1 atatcacggc ttatgatgcc gattcttgta agactgttca aggggcttga taagaactcc 61 cgagctatgc aggcgattgc aatgaatata acggcaaact tattcgggct gggaaatgcc 121 gctactccct tgggtattga agcaatgaag cgacttgagc aagaagagaa aacaggtgaa 181 gttgccagca aaaatatgat tttatttgcg gtgctgaata cttcttccgt tgaacttata 241 cccgcgacag ttgcaacgct tagattggca tatggaagcc gcgaaccgat ggtaattttg 301 ccatgcgtgc tgttggtgtc gctgatgtcg gtggcggtat gtattacact ggtcaacatt 361 ttcaacagga gcgaaaaatg aatatcgcaa gcgtaattat acccgttttt gttttagggg 421 tattcttata tggactatac aaaaaagttg acgttttcgg cgaatttgtt tcgggtgcaa 481 gagaaaacat taaggttggg tttaacattc tcccctcttt gtgcgcgctg atgctggcgg 541 ttggtatgtt aagagggagc aacgcccttg atgggttggt gagcctgatt gcaccgctga 601 cagagtattt gggctttccg cccgagtgcg caccactagc acttttgcga cccgtttcgg 661 ggagcggagc tttgagtctt ttggagggga ttttcaagga ctatggccct gacagcttta 721 tcggtaaagt tgcaagtgtg atgatggggt cgacggagac cactttttac acgctggttg 781 tatattttga ggcaacgagg gtcaaaaata cgcggcacgc tctgccttgt gcgctggcag 841 gagatctgac tgcggcgata atgagctgtg tgatggtgag gttgatgctg ggatgagcgg 901 tggcgtgcag ccaaaaacgt tgctcgctac gtggcttttt gagaataacg gggagcctca 961 ccgtggtgcg acgacgcggc agccctgcgg tgctcagcac cgcagccccg tggcgaagcc 1021 acggggaagg cgtttgcaaa gcaaacgcct tggctgccgc agatggagcg aggggtgtct 1081 gcgagcgcgt tccgacagga acagtgccgc aggtaccccg agcggtttgc tggcacaaaa 1141 gtaaaaaatc cccgacaaaa gctgtcgggg aataaatcat ctctctatga atctttcaat 1201 tttcagcgcc ttaccggttt tttcgtcgaa ttcgaccaca acaccgttta tcatacaagg 1261 tgtgtccgct tcaacaaatc gcacaggcac attaagcctt tgcttctcga ttgcagggac 1321 cttatcaacg cccaagaccg attcctcggg acctgtcatc ccgacatctg tgatatatgc 1381 cgtaccgttc gaaagaaccg tttcgtcggc agtctgaacg tgggtatgtg tacccaaaac 1441 ggcggtaact ctaccgtcga ggtaatatcc cagcgctttc ttttcggcag tagcttcggc 1501 gtgaatatca acaaagatat tcttggttcc gatttcgctc aataccctat ccatcgcttc 1561 ataaggattg ccaagaggtt ccatatatac cacgcccatg agattgacaa cagcgacctg 1621 agttctgccc agatcgagga cataatagcc tctgcccatt actccgtcgg ggtagttaca 1681 tggacggaca agatgctcca cctcgtcaaa aatggaaaga gattcgcggc gtttgaaggc 1741 gtggttacct gttgttatca catctgcccc gatgcgggtc agatattcgc aggaaacagc 1801 ggtaatgccg ttgcctgttg cggaattctc gccgttgatg acggtgatat ccacattata 1861 tttttgtttc agaccgcgga tcctcgagcc gaggaattcg catcccgaag ctccgaccac 1921 atcgccgata aacatcagtt tcatatatat ttactccgtt tcttcatctt cgggtatagt 1981 cgggaatccc caaccgtcca catttgctcg gcgcattgcg ccgaaaattc tgtcagcaaa 2041 tcccttatcc tgtctctcac gctctttaat aaattccttc atttcctcgc gttttgtgtg 2101 accgtccgcg gggcattttg attttacgac ctcaaggttt gctctgtttg ccgcacgtct 2161 gacctcggct tcgggtgcaa agaccatcgg gcgaatcatc cacaagtcct tgcgggaaag 2221 atagctcttc ggcgcgaagc aaccgattct gccttcaaca aaaagattca tcaaaaatgt 2281 ttcaacagcg tcgtcaaagt ggtgacccag agcgattttg ttgcatcctg ccgccttggc 2341 agcatcgtgc aatgcacctc ttctcatacg cgcgcagagc gagcaagggt ttggctcttt 2401 tctgatatcg aaaacgatct cgccgatatg ggtgcgctcg aggatatact gaatgccgtg 2461 ttcatcgcaa agcctttgaa ctgccgagta gtcaccttcg attccgccga actgagggtc 2521 aagagtgata gcgacaatgt tataatcaat gccgataaat ctgcgcaaaa gaataagccc 2581 tttcaaaagc acaaggctgt cctttccgcc cgaaacgccg acagcaattt tgtcgccgtt 2641 ttgaatcata tcgaattctg ttattgcttt acgcatatat cccagcattt tctgcataaa 2701 catttctccc caaggtcagg tttaagatta ctatatcaca tcttgcgaaa aaagaaaaga 2761 ttaaaacgcc aaaaaagtga aataagagaa taccctgcag cactctctta cttcaccatt 2821 tacttggaac attataattt gaagatgtca ataatttaag ggtagccttt tgagctacaa 2881 ttatattata cacatttttg ggcgtttgta aactgtaaaa ttatacgaaa aaccccatat 2941 tttataaata atttatatta aatatgaagc ccgcattaaa atatgaaata tgtgatttgc 3001 taaattagtt aatattatat aagtgtaatg cttttgaaac aaggcgcctt cggagccatc 3061 tgattaacta cgtcgctgat ggtggctgta tcggtcaggt gacggtcaga ggaaaaaagc 3121 ccgcctcttg cgaagcgggc ttttaaaagt ttaattacaa accaaatcag gcagttacaa 3181 agaacttaac gatgaagata agggagataa cagcggtgag ccaagaaact tccttaacct 3241 tgcctgtgca gagcttgata acagtgtagg aaataagtgc caagccgata gcatgaccga 3301 tagagcctgt aacaggcata ccgatgagca taactgcagc aggaaccaat tctgccatat 3361 catcaaagtg aaggttcttg aggccggaga gcataagaac accaacatag atgagagctg 3421 cagaggttgc agcagcagga atgattgcag cgataggagc gatgaacatg caagcgagga 3481 acaagatacc ggtagtcaaa gcagtaagac cggttctgcc gccagcttca acgccggatg 3541 cagattcgat gaaggtggta acggtagaag taccggttgc agcaccgata gaagtaccga 3601 tagcgtcaga aagcaaagct tccttcatgt taggcatatt gccttcttcg tccatcatac 3661 cagctctgga agcggtacca acgagagtac cgattgtatc gaacatatcg atcatgcaga 3721 aggtgataac gagagttaca gcggagaacc aaccgatttc aaagagagtt ccgaagtcga 3781 acttgaagaa ggtaagagca gccatatcgc caaatgcagg aacgaaggat gcagttgcca 3841 aagaagcgaa aggattgttg ccc // LOCUS sequence081 3860 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence081 VERSION sequence081 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3860 /mol_type="genomic DNA" /organism="" /note="sequence081" misc_feature <1..1591 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_004080135.1:beta-galactosidase LacZ" /note="WP_004080135.1 beta-galactosidase LacZ (Thermotoga maritima) [pid:29.1%, q_cov:99.8%, s_cov:48.4%, Eval:9.1e-65, partial hit]" /note="MGA_482" /locus_tag="LOCUS_3870" CDS complement(1775..2227) /product="RbsD/FucU domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009993892.1" /transl_table=11 /codon_start=1 /translation="MLKGIPTIISPELLKILCEMGHSDRIVLADANFPVESVGKNAKVV RCDGHGICELLEAILKLMPLDDYVKQPVGLMAVMAGDNVATPIWEDYKRIIREQTGMDD SVVGEIERFKFYDEAEKAYCIVATGEGAQYANIMLQKGVIRQGDAV" /locus_tag="LOCUS_3880" /note="WP_009993892.1 RbsD/FucU domain-containing protein (Gardnerella vaginalis) [pid:65.5%, q_cov:98.7%, s_cov:100.0%, Eval:3.8e-50]" /note="MGA_483" CDS complement(2233..2667) /product="GAF domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011706144.1" /transl_table=11 /codon_start=1 /translation="MHQRLLREMQALISGHKIADLSNAAALIYNALDDLNWAGFYLKEG DILVLGPFQGKPACIEIPMGRGVCGTAAIMNETLVVENVHEFAGHIACDGASNSEIVIP LRVNGEVMGVLDIDSPIFSRFNDKDKAGLEELAKIIEKVL" /locus_tag="LOCUS_3890" /note="WP_011706144.1 GAF domain-containing protein (Aeromonas) [pid:58.6%, q_cov:99.3%, s_cov:95.4%, Eval:8.6e-46]" /note="MGA_484" misc_feature complement(2838..>3860) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011836871.1:SHIRT domain-containing protein" /note="WP_011836871.1 SHIRT domain-containing protein (Streptococcus sanguinis) [pid:32.6%, q_cov:62.9%, s_cov:23.4%, Eval:3.0e-17, partial hit]" /note="MGA_485" /locus_tag="LOCUS_3900" ORIGIN 1 cccatccaga attttgcact atgagagcac ccaccgtctg gacgataccc ctacagacat 61 tttggatgtg gattcttgta tgtatcccgg actcgagttg tttgaccatt accacaagga 121 tgaaaacaag aaaaagccct tgttcctctg tgaatattcc cacgcgatgg gcaacggccc 181 cggtgacctt gaggattatc acaacgcatt ctattcaagc gatcgctatg tcggcggatg 241 catctgggaa tttacagatc actcctgctc gcttggaaag accgaggacg gcaaggataa 301 gtatggctat ggcggtgact ttggcgaacg ccacaacgac ggcaacttct gcgttgacgg 361 actgatctat cccaaccgca agccacacac cggatttatg gaagctaagc aggtatatcg 421 ccctgtaaga atgtataagg gcgaaaccga agacgaattc gttgcaaaaa gtttgctttt 481 gttcgatgat ccgatgagct atctcgactg cgaatatgag atcacagtta acggcgtggt 541 tgccgaaaca ggagcttgcg agcttaactt cattagcggc gaggcaaagc tcacggttga 601 cgcagttaag aattacgcca acggcgacct tgcaataaga ttcatcttca aggcaaagca 661 taataccaag tggtgcgaaa agggctttgt tgtttgcttc aaccagatca tcctccgcga 721 tgctgttaag gcagaaaatg tccctgcatc cggcgttgaa attgttgatg aattgatgtc 781 cgccaccctt gaagcaaacg gtgtcaaggt gatcatcggc aagcgcacag ctaaaattga 841 gcagataatc gcacatggca ctgaaatgct ggctaagccg attgaattta acctcttccg 901 tgcacccacc gacaacgacg gctcgagagg cgattggtat cgcgcacacc tccacgattt 961 cgacaccaag gtatacaata caaaaattga agacggctgc tttgttgccg acctttcctt 1021 cggctggaat attcatcagc ccattgcaaa gggcacagtt aagtatgccc ttgacggcaa 1081 cggaaagctc acaatcagcg cagatatgac aatgagcgag aaggtcagat tcctgccgcg 1141 attcggcata agactgcata tgcccgaaga gtttaaggat gttggatact atggctacgg 1201 cccgattgaa agctatattg ataagcatca ggcaagctgg cttgctaaat ttgaggcaaa 1261 catcaacgat atgcacgagg actacgttaa gcctcaggag aattcatccc actgggattg 1321 ccgcgaagca agcgtttcaa acggcgaaat taagcttttg gcaactgcac cctcaaactt 1381 ctccttcaat gcgtcgaagt atactcagga agagctttca accaaacgtc accactttga 1441 gcttgaaaag agcccataca gcatcatctg cctcgactcg ggcatggcag gcgtcggttc 1501 aaactcctgc ggacctgcac tcccgcagaa atatcgcctt gcgattcccg aacagaagct 1561 tgaatttgtg cttgagtttg agaaagagta atgtgaacat attaaaactg cccctgcatt 1621 taagaatgca ggggcagttt tgcggttgcc aaaagcggag cgaggcgtgg cagacacggc 1681 gacgcgccga aggtgcggcg gcttgtggcg tgccgtgccg agcgtagcag aaaaaagacc 1741 tcttcacacg gaagaggtct ttaaaattgc tgatttaaac cgcgtcgccc tgacggatga 1801 cgcccttttg aagcatgata tttgcatact gagcgccctc gcccgttgca acaatgcaat 1861 atgccttttc agcttcgtca taaaacttaa atctctcaat ttcgccaaca acgctgtcgt 1921 ccatacccgt ctgctcgcgg ataatgcgct tataatcttc ccagattggg gttgcaacat 1981 tgtcgcccgc cataactgcc attagtccaa caggctgttt aacatagtca tcgagtggca 2041 taagctttaa aattgcttcc aaaagctcac agatgccgtg accgtcgcag cggacgacct 2101 ttgcgttttt gccgacgctt tcaacaggga agtttgcatc cgccagaacg attctgtcgc 2161 tatggcccat ctcgcagaga atttttaaca gttcgggaga aattattgtc ggaattcctt 2221 ttaacatagt tttcacaaca ccttttcaat tatttttgca agctcttcaa gtcccgcttt 2281 gtccttatca ttaaatcggc tgaaaatcgg gctgtcgata tcaagtacgc ccataacctc 2341 gccgttaact cttaacggaa tgacaatttc cgagtttgaa gcgccgtcgc aagcgatatg 2401 cccagcaaac tcgtggacat tttcaacgac aagggtctcg ttcattattg cggcagttcc 2461 gcacactccc ctgcccatgg gaatttcgat gcaggcaggc ttgccttgaa acgggccgag 2521 aacgagaatg tcgccctctt tcaaataaaa tcctgcccag ttaaggtcgt caagggcgtt 2581 atatatcagc gccgcggcgt ttgaaagatc ggcgatcttg tgtccgctga tgagagcctg 2641 catttcacgt aaaagtcttt gatgcatttc caacgctgtc cccttccgtt ttttatctaa 2701 tatgatttta gcagaaatgc atacgcatcg caatagcata ttctcaatat ttgatatctt 2761 tttaaaataa acaagaggta accgccgaaa agcgattgcc tcttttgatg tttattcggt 2821 tatgctaagc cttcgaatca gtcgagaata atcgcttcga tttcttcttc gattgcttca 2881 acgggatctt caaccaccag gttgtagatg tttacaaact tagccgcttc ggctcttacg 2941 accttgccgt ccttggtcac atatgtgctg accttgccga cgggaggaat gaagccgatc 3001 tttacaacaa ctgtgtgaac gctttcgtca tataccatgc ctgcgattcc ggtgttttcc 3061 tcggtgatct catatacata ggtcttgccg atatcggatg ctacgtattc gatctcgaag 3121 gttgcgtcgc cgttcgcatc ggatactgcc ttgatctcct tgccggaaga agtgtccttg 3181 agggtgaaga taaagccgtc aagcttgttg taacctgttt cgctcaagtc aacaagttcc 3241 ttcttaatct tgagacggag tctttcgccg atgatcgcgc cggggatggt ggacctatag 3301 gtgttcttaa atactactct ttgaagctct gcgccgtttg catcggtata ggtgatgtca 3361 tagccaagct tgccatcggt gcccttggtg atcacgatcg tgatgcggta ctcgctgtta 3421 tcatacttaa cgcctgcgag tgcgccctta acttcgctta caacatagtt gaatgttccc 3481 tcttcggtga aggtgagggt gccgaaatca accattccgt cagctctgtt ggatgctccc 3541 ttgacgggga tatccgactt cttgacaaag cttgcatcgg tttcatagat ttcgaagcta 3601 aactctcctg caaccaaatc tctgccctca agctgcttaa atgcacttac gggaacatat 3661 gcgttggtgt cgatcttctc gaacaggcct gcctggttgc cggtttcggc aaagctcttg 3721 gtcagcaggg cgatgtcagc ggtggggttg gccttttcag ccatcagctt gttcagacgg 3781 tcaccgttgc cgctggtggg gtcaacgatg atggtgcagc cgtacttgtc cataaagccc 3841 tgagcggcct tcatcagacc // LOCUS sequence082 3854 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence082 VERSION sequence082 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3854 /mol_type="genomic DNA" /organism="" /note="sequence082" CDS complement(2420..2689) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MVNQFLRSGTSIGANIHEANYASSKADFINKFQIALKECYESDYW LSLFKETNMITDGEYNEMYSKCCKIRRVLIASINTAKGNNLPSA" /locus_tag="LOCUS_3910" /note="WP_011107654.1 four helix bundle protein (Bacteroides) [pid:50.6%, q_cov:94.4%, s_cov:70.8%, Eval:3.3e-17, partial hit]" /note="MGA_487" ORIGIN 1 atagcaatct tgattatatc cgcagcggca ccctgaatcg gcgcattcat tgcagcgcgc 61 ttgccgaatg cctgcaggtt tttgttggat gccttaagtt cgggaatata tcttcgtctg 121 ccgaaaaggg tggtgacata tccgttttcc atgccgaaat cgacagtatc cttcatatat 181 ttatcaacac cggggaagtt tgcaaggtag tccttaatat atttatccgc ctcggcaacc 241 gaaacgccga tatcctttga taaactaaat gcgccgatgc cgtaaattat tccgaagttg 301 accgcttttg ccgttcttct catgtctgca tcaacaaaat cttcgggcag tccaaacacc 361 tgcgaagcgg tgcgtgtgtg aatatccgca cccgaaagga acgcctcctg catatttgca 421 tctctgcaga cggatgccaa aaccctcagt tcaatctggc tatagtcggc atcgagcaaa 481 attttgccct cgtccgcgac aaagaacttg cgcatatttc tgcccagctc ttttcttacg 541 ggtatgtttt gcatattcgg gttggcagat gaaattctgc cggttcttgt ttctgtttgc 601 ttaaattccg agcgaactct gccgtcgtcg tgaacgacct ccaacaatcc gtcaacataa 661 gttgatgcaa gctttgttag ggtgcgatat tccaaaatca gcgggattat gggatgacgg 721 ctcgcaagcc cctcaagaat ttcggcattt gtcgaatatc ccgtcttggt ctttttgccg 781 cagggaagcc ccagatcatc aaacagcaca actccaagct gtttcgggct ggaaatgttg 841 aactgcttgc ctgcaagctc gtaaatctgt ccctcgagca gggcaatgtc gcggctgatt 901 gcaattccaa attcctcgat gcctttggta tctacacgca cgcccagagt ttccattgat 961 gccaacacct cgcaaagagg ttgctcaatt tcatacaaca gcttgtccat ttcaagggcg 1021 tgaatttcgc tcttcagctt ttctgacagc gcaggcaagg agagaatctc tccataagcc 1081 tcgtcgcggt tatattgcac accgcaggaa gcacacagac ttttaacact gtagtcgctc 1141 gactgagagt ttaaaagata acccgccaag tcgcagatga agctgacgtt ttcaaggctt 1201 gctccgcgct cgaagcagaa tttatatgcc gattttgcct catatgcggt cttttcgcca 1261 cgtgatgtga aataagccaa aatcagcttt tcgtcatctg tttcatacac cttgccgtca 1321 gcaaaaacgg tcagcctgcc gttaaagata aagtaacttt cacttaattt ccccaaatcg 1381 gtgttgtcgc cttttgccaa gacgatctcc ttggcagggc tctcatcgag cagggaaagc 1441 tgttcttcgg aatccgatgg gtcgagttta aggcgttcca tcagcttgaa catttcaagc 1501 tcggtcaaaa gtcttgccaa ttcgccgtcg cggcgctcat gcatttcata gtccgactta 1561 ttttgcgaaa tgggggaggc gcagtttatt gttgccaacc attttgaatt gaacgccgat 1621 tcacgtccgt ttataagctt gtttttaacg cctgcggaaa ggggagcgtc attgaggttg 1681 tcatatagat tttcaatggt ggtatatgtg ccaataagcg agagcgcggt tttttcgccg 1741 atgcccgcaa cgccgggaat gttgtcggaa gagtcaccca tcagcgcctt gatgtcgatc 1801 aagtttatcg gctcggtgcc gtatacctca taaaacttgt cgcggtcata tttgatcgtt 1861 tccttggtgg tgacaaggcg caccgacacg ccgtccttga tcagctggag agtgtcgcgg 1921 tcgcccgaaa ggacaactgt ttcatcgccg tttgaatcga acaagcggga aacggagccg 1981 agaatgtcat ctgcttcata tccttcgagg gtcaaaacag gcacgcccaa atcggccaaa 2041 atttctttga ttatcggcaa ctgctgggca agctcgtcgg gcatgccctt gcggttggct 2101 ttatagtaat caaacttctc gtggcggaag gtctttttct tcatatcaaa cgccacacag 2161 accgagtcgg gcttgacaat gtcgagctcc ttgagatata tgttcataaa tccggtcaaa 2221 gcgtttgtga atacgccctt ggagtttgaa agcattttaa tgccgtaaaa agcgcggttt 2281 aaaattgagt ttccgtcgat tatcagtaaa cgcataaaca ttctcctatt atataatgca 2341 cgcagtgcaa ttcatgccga tacttgtttc ggctattcat gaacgcagtt ctattcatgc 2401 cggcacttgt tgcggctatt catgccgaag gcaaattatt tccctttgcg gtgtttattg 2461 atgcgataag tacacgccga atcttgcagc attttgaata catttcatta tattcgccgt 2521 cggttatcat gttcgtttct ttgaaaagcg acagccagta atcgctttca tagcattctt 2581 tcaaagcaat ttgaaattta tttataaaat ctgctttgct ggaggcataa tttgcttcgt 2641 gaatgtttgc gccgatactt gtaccgcttc ttagaaattg atttaccaac gcatttgact 2701 ttcctcgccc tttaattgat gaacatagat ttacggtagc tacagcaaac ttcctggata 2761 aattgacaag agcgttttct ttcatggtgt catccccgtt aatgaattga cagctaacgc 2821 cgtcatgaat tggtaaaaca acttcgttgt cttgccatga attgttgcaa gcaacatgaa 2881 ttggctacgc cattaataat ttccattata tattatacca gatattttcc aaaacctcta 2941 cacaaattga aaaaaatatg ttacaattat aatgtatttt tatgtagatt cggagaagca 3001 atggattttt tggacattaa cggagtgaaa attgaaaaaa cagcgggatt gtcgccgatg 3061 gcttccgttg cagacagggc atatcggctg atgtgcaaaa aatacggtgc atcatacttg 3121 gtcagcgaga tggtttccgc aaagggtctt tgctattcgg gcaagaagac cgaaaacctc 3181 tgcgttgtca ccgagcccga acgcccttat gccattcagc ttttcggcga agaggcgcag 3241 tttatgggca gggccaccga gcttttaaac aattatcacc ccgacattat tgatataaat 3301 atgggctgtc ccgtgccgaa ggtcgtcaat cccggcggcg gttcggctct gatgaaggcc 3361 cccgaagtgg catatgacat tgttaaggcg tgtgttggtg cggcaaattg ccccgtgact 3421 gttaaaattc gcgcaggatg ggatgatgag cacattaacg cagtcgaatt tgcaaaactt 3481 atggagcaag cgggcgcatc agctatcgct gttcacccga gaacaagaaa acagatgtat 3541 tcgggtatat gcaattggtc ggtcatcaaa gcggtcaagc aggcggtaag cgtgcctgtc 3601 atcggcaacg gcgacgttaa agacgccctt gattgcaaaa gaatgtatga cgaaacggga 3661 tgcgactatg tgacccttgc gcgcggcaca tacggcagac catgggtatt cagacagatt 3721 aaaacttacc ttgaaacggg aatattgctc cccgagccgt caatagatga gcgcgtttct 3781 gtgatgcttg agcacgcaag gctgatcatt tccgacaagg gcgaaaaaca gggaatcaga 3841 gaagctcgaa aaaa // LOCUS sequence083 3852 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence083 VERSION sequence083 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3852 /mol_type="genomic DNA" /organism="" /note="sequence083" CDS complement(20..1039) /product="zinc-binding alcohol dehydrogenase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012804346.1" /transl_table=11 /codon_start=1 /translation="MKAVLITEPHKIEVGQVEMPVLKEGEALLKIRYCGICGADVASYT GNQPFTTYPRIPGHEFSAEIVSIPENDKGLKAGDIVTANPYFNCTHCYSCERGYVNCCT DNQTMGVQRDGSFCEYVAMPIERIYHGKGLSAQQLALIEPFSISYHACQRAEIKPGDKV LVIGAGPIGLFALISAKLKGAEVYIADILDGRLQMAKEYGADGVINSKTQNLAEETKRI TSGNGFDVCIEACGQAQTFLDCIDCAAFAANIILIGNGKKETTFLHSILLKKELNVHGS RNALAKDFTDLIDIVASGKVDVMKMVSGIYPMDHADDAFKALANNDGSLAKILVEVSK" /locus_tag="LOCUS_3920" /note="WP_012804346.1 zinc-binding alcohol dehydrogenase family protein (Brachybacterium faecium) [pid:45.8%, q_cov:99.1%, s_cov:98.5%, Eval:1.7e-84]" /note="MGA_489" CDS complement(1075..2280) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIVKGTYFQNDSERPLVYGDVEIINPKRQRLRGEPLKDGILCEPV ICGFCGTDNELMHMGQNHNLSHKFPAGQNLLINGHEGVVWVPSQNRFAIVLIRGGDSYD PTRFTEDETYFEYGCDQADGLFCDCNYFNPDMLLDIPEGYVKDGKLALSFAKKMVFPDP YGCMVFQLERMEDLGVAQNFRVEMAKHKCSEEEARAIAKKNLFDSVVIFGLGTTGMFIG DLIRQNYPDANIVFVGRSDAESPKIKFALDLVGGKYVQSNFETNEELADAICEALGGKA KMFIGVSGSNIEHEIAFKYGVLGCNGIYNSFSLGPQVSYDTMPFGFKNNLIFGSINFRQ DHMEKAIQILAKSKYDEIVQLIDKDEFTADPIGAYKNKIYSKSAPMKTAVIWNEKYIDR NA" /locus_tag="LOCUS_3930" /note="MGA_490" tRNA complement(2455..2530) /product="tRNA-Ala" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0060" /note="Aragorn_6" ORIGIN 1 acagtttctt taacagccat tattttgaaa cctccacaag aattttagca agcgatccgt 61 cgttgttcgc aagagcctta aaagcatcat cagcgtgatc cataggatag attccgctta 121 ccatcttcat aacgtcaacc ttgccggatg caacaatgtc gataaggtcg gtgaagtctt 181 ttgccaaagc gttgcggcta ccgtgaacgt taagctcttt tttgagaaga attgagtgca 241 agaatgtagt ttccttcttg ccgttgccga tcaagatgat atttgcagca aatgcggcac 301 agtcgataca atcaaggaag gtctgtgcct gaccgcaggc ttcgatacaa acgtcaaatc 361 catttccgct tgtaattctc tttgtttctt ctgcaaggtt ctgggtcttg gaattgatga 421 caccgtctgc tccgtattcc ttcgccattt gaagacgtcc atccaagata tctgcgatat 481 atacctcagc acccttgagt tttgcggaga tgagagcaaa aagaccgata ggacctgcac 541 cgattaccaa taccttgtca ccgggcttga tttcagcgcg ctgacaagcg tgatagctga 601 ttgagaaagg ctcgatgagg gcaagctgct gagcactcaa gcccttgccg tgataaattc 661 tttcgatagg cattgcaacg tattcgcaga agctgccgtc gcgctgtacg cccattgtct 721 ggttatcggt acagcagttg acatagccac gctcgcagga gtagcaatga gtgcagttaa 781 aatatggatt tgcggtgaca atatcgcccg ccttgagtcc cttgtcgttt tcgggaatag 841 atacgatttc agcgctgaat tcatgcccgg gaattctggg gtatgtcgtg aaaggctgat 901 tgcccgtata gcttgcaacg tcagcgccac aaataccgca gtagcgaatc tttaaaagcg 961 cttcgccttc cttcaaaaca ggcatttcaa cctgtccgac ttcaatttta tgtggttctg 1021 taataagtac tgccttcata aagaaaaacc tcttttcaaa aattaatata catgtcaagc 1081 atttctgtcg atgtattttt cgttccagat tactgcagtt ttcataggtg cagatttgct 1141 gtagatcttg ttcttatatg ctccaattgg atctgcggtg aattcatctt tgtcaatcaa 1201 ctgaacgatt tcatcatact tgctctttgc aagaatctga atggccttct ccatatggtc 1261 ctgacggaag ttgattgaac caaagatgag gttgttctta aagccaaatg gcattgtatc 1321 ataagatacc tgtgggccga gagaaaagct gttataaatg ccattgcatc ccaaaacgcc 1381 atatttgaaa gcaatttcat gttctatatt tgagccactc acaccgatga acatttttgc 1441 tttgccgcca agtgcttcac aaattgcatc agcaagctct tcgttggttt cgaagttact 1501 ttgaacatat tttcctccga caaggtcaag cgcaaacttg atcttggggc tttcagcgtc 1561 acttctgcca acaaatacaa tgtttgcatc aggatagttc tgtctgataa ggtcgccgat 1621 gaacatacct gttgtgccaa gtccgaagat tacaacacta tcgaaaagat tcttctttgc 1681 gattgctctg gcttcttctt cgctgcactt atgcttagcc atttcaacgc ggaagttctg 1741 tgcaacacca agatcctcca tacgctcaag ctggaatacc atacatccgt atgggtccgg 1801 aaataccatc ttctttgcaa aggacagagc aagctttcca tcctttacgt atccctcggg 1861 gatatcaaga agcatatcgg ggttgaaata gttgcaatcg cagaaaagac cgtcagcctg 1921 atcgcaaccg tattcaaaat atgtttcatc ttctgtgaaa cgggtggggt catagctgtc 1981 gccaccgcga attaaaacaa ttgcaaaacg gttctgtgat ggcacccaaa caacgccctc 2041 gtgtccattg ataagcaggt tctgccctgc agggaattta tgggaaagat tgtggttttg 2101 tcccatatgc atcaactcgt tgtcagttcc gcagaatccg caaattacag gttcgcaaag 2161 gattccatcc ttgagaggct cccctcttaa acgttggcgc ttggggttaa ttatctcaac 2221 atcgccatat acaagcggac gctcgctgtc attctgaaaa taagtacctt taactatcat 2281 cttggtcttc ctttcattta aatttctaaa acaatatgct ttttctcgcc atacaagcca 2341 tatagcagaa ttatttcatc tgatatgata gtttgctaaa gcaaactcgg ggttcaaatc 2401 gaaagtcaac ttataaaaac aaaagagacc ccgacggggt ctcttttgtt tttatggtgg 2461 agcatacggg attcgaaccc gtgacctcca cactgccagt gtggcgcgct tccaactgcg 2521 ctaatacccc gctcggttag aataacacaa attttacaaa taatcaagtg gttttgaaaa 2581 aattgtccct tattttttct gtcattaagt ttgtgtgcat attgtaacag tttttacata 2641 tcaatattac gtcaaaaaat cgcatatgtc aaaatacagc aaaaattgcg ctctgcttat 2701 gctagaccat atatgtacta atgcgctata cattagcgcg aaacataagg aggttcaaca 2761 tgaagagaat tatttcatta cttattatca catcattggt gttatgcctg tttacaggtt 2821 gcggaaagaa agatacgcaa ggcgaggtgt attatctcaa tttcaagcca gaagccgatg 2881 ctgcatggca ggcattagcc gaggaataca ccaggctgac cggagttaag gttacagtta 2941 acaccgcggc gtccgggtca tattcagaga cgcttattgc ggaaatggac aagtcgagaa 3001 tgccaacact gttccaatgc ggaaatcagg caggacttga cacatgggag gattattgct 3061 tagacctgcg aaacacggca gtatacggtg agatgacaac ggatgacttc aacctgatcg 3121 acaaaaacgg tgaggtcaag gcaattggat attgctatga atgcttcgga atcattatta 3181 acaaagagtt attaggacag gccggttata cgattgaaga cattaaaaac tttgacgacc 3241 ttaaaactat tgccgaagac attactgcaa gaaaagatga gctgggattt tctgcatttt 3301 cttctgccgg gcttgatggg tcatcctctt ggagattttc aggacatttg gcaaacatgc 3361 cgctgttttg tgaatttcgc gataacggta tcacctcgca gcctgagcag ataagcggaa 3421 aatatcttga taacttcaag aacatctggg atctttatat caacaatgca acttgcgaca 3481 gaacggagct taccacaaaa acaggtgatg aatcgctggc agaattcgga agcggaaaag 3541 ctgtgtttta tcagaacggt tcgtgggaat ttgcaaatct ggttgacaaa ttcggaatga 3601 aggcagaaaa ccttgcaatg attccgatat atatcggtgt tgagggtgaa gaaaatgcag 3661 gtcttgcatc gggcacggag agctgttggg cggtgaattc acaagcgagc gaatcagata 3721 ttcaagcaac acttgatttc ctatattggg tcgtaacctc agaggaaggc acaaagatga 3781 tggcggaaga gcttggtcct atccccttca agaacgcaaa gacaacggtc aatgtgttct 3841 tcaatgatgc aa // LOCUS sequence084 3842 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence084 VERSION sequence084 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3842 /mol_type="genomic DNA" /organism="" /note="sequence084" misc_feature <1..1831 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011460393.1:translation initiation factor IF-2" /note="WP_011460393.1 translation initiation factor IF-2 (Desulfitobacterium hafniense) [pid:62.5%, q_cov:95.1%, s_cov:59.4%, Eval:1.9e-210, partial hit]" /note="MGA_492" /locus_tag="LOCUS_3940" CDS 1879..2259 /product="30S ribosome-binding factor RbfA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002670660.1" /transl_table=11 /codon_start=1 /translation="MADFKVGRLSSDIQRIISGKLRDLKDPRVNGSMLTVVKVDVSCDK SVARVYISSFEGIAKAKEAVKGLESASGFLKREIANVLHIRKCPELRFVADDSTEYSAH IAKVIKDLNLKYDDDETEGEEE" /locus_tag="LOCUS_3950" /gene="rbfA" /note="WP_002670660.1 30S ribosome-binding factor RbfA (Treponema) [pid:40.8%, q_cov:97.6%, s_cov:93.9%, Eval:4.6e-19]" /note="MGA_493" CDS 2262..3146 /product="tRNA pseudouridine(55) synthase TruB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000399352.1" /transl_table=11 /codon_start=1 /translation="MKQGVILINKPEGFTSFDVIAKCRGILKERRLGHSGTLDPMATGV LPIFIGKATKACDMLPDNEKSYRAGFKLGYSTDTQDTTGETLATSGKKATEGELISALE HFKGEINQLPPMYSAVKVDGKRLYDLARQGVTVERKSRVITVYDITLCGFDEENQEGIL EISCSKGTYIRTIVNDLGEMLGTLGCMSSLVRTSSSGFVLDKCISLEDLQTLADKGEVE SIITPVDECFKCYEMIKLSDKQASMYKNGIKLDLGRLGIKDAGTYRVYADEFLGLARAD ISAGELKIVKNFW" /locus_tag="LOCUS_3960" /gene="truB" /EC_number="5.4.99.25" /note="WP_000399352.1 tRNA pseudouridine(55) synthase TruB (Bacillus cereus) [pid:44.2%, q_cov:85.7%, s_cov:84.0%, Eval:1.0e-55]" /note="MGA_494" ORIGIN 1 gaagaaggaa aagctttcaa acaagcgtga gaccgaggct gaaaagctca agagacttga 61 gcttgagcgc gcaagaaagc agcagctcaa ggttatgatc cccgatgaga tcgttgtaag 121 cgagcttgca tcccgcttaa aggttaccgc aaccgaagtc attaagaagt tgatgggatt 181 gggcgtgttt gcatcgctca atcagactgt tgactttgac accgccgcac ttgttgcaga 241 agagctgggc gcaaaggttg aaaaggaagt tgttgttacc attgaggagc gtcttatcgt 301 tgatgaagag gataaggcgg aggatctggt tgaaagaagc cctgttgttg tcgttatggg 361 tcacgttgac cacggcaaga cctcgctttt ggacagaatc agaaatgcaa acgtaaccgc 421 aaccgaagct ggcggtatca cccagcacat cggtgcttac agagttaacg tttcgggcaa 481 ggacatcacc ttcctcgaca cccccggaca cgaagcattt acatcaatgc gtttgcgcgg 541 cgcaatggta accgatattg caattttggt cgttgcggct gatgacggta tcatgcccca 601 gaccattgaa gcaattaacc acgccaaggc agcagatgta tccatcatcg ttgcgatcaa 661 caagatggat aaggaaaccg caaaccccga aagaatcaag cagcagttaa ccgagcacaa 721 tcttgttgtt gaagactggg gcggcgatgt tatagcagtt cccgtttccg caaagaccgg 781 tatgggcttt gacgagcttt tggaaaacat actcctcgtt gccgaagtta aggagcttaa 841 agccaacccc aaccgtttgg caaagggctc tgtaattgaa gcaagacttg ataagggccg 901 tggccctgtt gcaacaattc tcgtacagaa cggaaccctt agaaccggcg acgttatcat 961 cgcaggtacc gctgtcggac gtgtaagaac aatgaccgac gacaagggca gacttgttaa 1021 ggaagcagga cccagtgttc ctgttgaaat tacaggtctt gcggaagtcc cctctgtagg 1081 tgatatattc aacgcagttg ctgacgaaaa gcttgcaaga gaactcgttg agcagagaaa 1141 gcacgaagcc aaggaagaga tcttcaagca gtatcagaag gtaacccttg ataacctctt 1201 cagccagatc tccgagggtg aaatgaagga gcttcccatc atcgtcaagg ctgatgttca 1261 gggctccgtt gaagctgtta agcagtccct tgaaaagatc tccaacgatg aagtcagggt 1321 taaggttatt cacggcggtg taggcgctgt caacgaatcg gacgttatgc ttgcaaatgc 1381 atcaaacgct atcatcgttg gctttaacgt tcgccccgac cccgttgcaa aggcaagtgc 1441 cgagcgtgac ggcgttgata tgagaatgta ccgcgttatt tacgatgcga tcgaagagat 1501 cgaaaccgct atgaagggta tgctcgctcc caagtttaaa gaggttgaaa ctgcacgcgt 1561 tgagatccgc caggtatata agatcacagg tgtcggcgca gttgccggat gctatgttgt 1621 tgacggtaag atctcaagaa acgacaatgt tagaatcgta cgcgacggta tcatcatcgc 1681 tgatgacaag atgtcctctc tcaagagatt taaggataat gtcaaggatg ttgccgcagg 1741 ctatgagtgc ggtattacgt tagaaaagtt caacgacttc aaggaaggcg acatctttga 1801 agcatacgta atgagcgaaa tagaacagta agcgcgagcg cgttctgttc tgcacaatat 1861 aacaataagg agaaacaaat ggctgatttt aaagtcggac gtttatcaag cgatattcaa 1921 agaataatct cgggcaagct ccgcgacctt aaagaccccc gagttaacgg ctcgatgctg 1981 accgttgtta aggttgacgt ttcgtgtgac aagagcgtgg caagagtata tatctccagc 2041 tttgagggca ttgcaaaggc aaaagaagcc gttaagggat tggagagtgc atcgggcttt 2101 ttgaaacgcg aaattgcaaa tgttttgcat ataagaaaat gccctgagct tagatttgtt 2161 gcagatgatt caaccgaata ttctgcacat attgccaagg tcatcaagga tctgaatctt 2221 aaatatgatg acgacgagac cgagggcgaa gaggaataaa tatgaagcag ggcgtgatct 2281 taatcaacaa gcccgagggg tttacctcct ttgatgtcat tgcaaaatgc cgcggaattt 2341 taaaggagcg gcgtttgggt cactcgggaa cccttgaccc gatggcaacg ggagtcttac 2401 cgatattcat cggcaaggcg acaaaggcct gcgatatgct acccgataac gaaaagtcat 2461 accgcgcggg atttaagctg ggatattcca ccgatactca ggacaccacc ggcgagaccc 2521 ttgcaacaag cggcaaaaaa gccaccgaag gggagctgat ttcggcactt gagcacttca 2581 aaggtgaaat taaccagctt ccgccgatgt attccgccgt caaggtggat ggcaaaaggc 2641 tttacgacct tgcaaggcag ggcgtgacgg ttgagcgcaa atcgagagtt atcacggtct 2701 atgacatcac tctttgcggg tttgatgaag aaaaccaaga gggtatcctc gaaatatcct 2761 gctcgaaggg cacatatatc cgcaccatcg tcaacgatct gggcgagatg ctcggaactc 2821 tgggctgtat gtcaagcctt gtgcgaacat cgtcaagcgg gtttgtgctt gataaatgca 2881 taagcctcga agatttgcaa actcttgccg acaaaggcga ggttgaaagc attatcaccc 2941 ctgtggatga gtgctttaag tgctatgaaa tgattaagct gagcgataag caggcaagta 3001 tgtataaaaa cggcatcaag cttgatcttg gtcgcttagg aattaaagat gcagggactt 3061 acagagtcta tgcggatgag tttttaggct tggcgagggc tgatatatcg gcaggcgagc 3121 ttaaaatagt caaaaatttt tggtaggaaa aaggagttgt caaaatgctc gatagataca 3181 atacagccgt acttttaggg ctttttgaca gcgtacattt gggccatctt aaaaccctcg 3241 acgccctgaa agatacgggc gcgaaaagaa aaatcgtaga tacctttaag ctttcgggcg 3301 ttgacaccaa gggcaagcgg gttccgctga taagcgatgg gcaaaaggaa gctttgctgc 3361 ttgctgcagg cgcggacgag gtcagatcgg agaacttttc cgatgttagg aacctctcac 3421 ctgaggagtt tgtggatgat atactcattc ataagctcgg cgcggatacg gttctgtgcg 3481 gcgaaaactt ccgcttcggc agatacgctg cgggcgatac tcacactctt gagtggctct 3541 gcaaagagcg gggagttgca ttaaaggtaa tacctcttga aagacttgac ggcgaggtga 3601 tatctaccac ccgaataagg gcacttttgg aagttgggga tattgaaaat gcaaatcgct 3661 tgcttgcaag aagatattcg gtcagcggcg agataatcca cggcaacgcc ctcggcagag 3721 agatgggtat aagaacgata aacctttatt atgagggatg tcttaaagac ggcgtgtacg 3781 caacgattac aaatatcgac ggaaaaagct ataaaagtgt gactgacatt ggcttcaagc 3841 cc // LOCUS sequence085 3841 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence085 VERSION sequence085 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3841 /mol_type="genomic DNA" /organism="" /note="sequence085" CDS complement(293..598) /product="MGMT family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003813638.1" /transl_table=11 /codon_start=1 /translation="MSTFELIYEQVRLIPKGKVASYGQIASYAGNPRWSRVVGYALHVN PEPGAIPCHRVVTKDGGLSSAFAFGGKQAQRALLEAEGIEFDEDGRVIIEKFRWNR" /locus_tag="LOCUS_3970" /EC_number="2.1.1.63" /note="WP_003813638.1 MGMT family protein (Bifidobacterium bifidum) [pid:62.5%, q_cov:79.2%, s_cov:75.5%, Eval:9.5e-25]" /note="MGA_497" CDS complement(666..3005) /product="alpha-xylosidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964400.1" /transl_table=11 /codon_start=1 /translation="MKISDGYWLNQRGYTVSYANQAYEVSYDANSIYVLATPSHIWNRG QTLGGPNLELKFTSTMADVIKVSVVHYKGTFDCGPNFELHDEQGYTPVINDTDKYIEMI SGKTSVKISKENWSVEYYYDGKHLTGGSYRALTYIEEAKSKAKRRLDTQIDDTFWSYPQ DANTSYLREQLTLDVGEYIYGFGEKFTTFTKNGQNVQIWNADGGTCCDQSYKSIPFYVS SRGYGVFVNSSDNVSYEVASDTVSKVSFTVPGEELEYFIIGGENLREVLSNYTTITGKP ALPPAFTFGLWLTTSFTTKYDEETINSFIDGMAQRDIPLQVFHFDCFWMKEFEWCNFEW DTRQFPEPEKMLERLHKDKGLKTCVWINPYIGQRSKLFDEGMENDYFILNKDGSVFQCD MWQPGMAIVDFTNPEACEWYASKLRALCEMGVDCFKTDFGERIPTDVVYHNGADPIKMH NYYTQLYNQTVFNVLKEYYGENKACLFARSATAGGQQFPVHWGGDCSAEYSSMAETIRG GLSLCISGFGFFSHDISGFEATATPDIYKRWCAFGLLSTHSRLHGNSSYRVPWLFDEEA CDVLRFFTKLKGKLMPYMFAQAKYTHDSGVPMMRAMVIDFADDPAALTLDRQYMLGDNL LCAPILNSEGRAEFYVPAGRWTDIITGKVYEGEKWYRETCNYFEMPILARPNSIVTYGD FVRDFEYDYLENAEAVIYELSDGCEASAVIYDKEAEKLCDIKATRDGNKITVSYTKTDK TFKVKVSGTDICAVANAGTTELVIEL" /locus_tag="LOCUS_3980" /gene="yicI" /EC_number="3.2.1.177" /note="WP_010964400.1 alpha-xylosidase (Clostridium) [pid:53.7%, q_cov:95.9%, s_cov:94.0%, Eval:4.5e-244]" /note="MGA_498" misc_feature complement(3048..>3841) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011074555.1:CapA family protein" /note="WP_011074555.1 CapA family protein (Streptococcus mutans) [pid:31.1%, q_cov:93.9%, s_cov:65.9%, Eval:1.3e-24, partial hit]" /note="MGA_499" /locus_tag="LOCUS_3990" ORIGIN 1 atacattctt cggtgacagt ttaaatatac gtttgtcgat atatcccgtc agctctgcgt 61 cgcttgattt caccaaccgc tcgatgtcat caacgagcac tgtgcgctcg tgtgcacaaa 121 ctgtgacgac ctcctcgcgc tccttgtcaa taatgatctc gcatcgcatc aaacctcctc 181 ctttcgattg caattttagc ataccgcaaa aataaatcaa tgcttttgaa atattcggtc 241 ggtttcgtgg catattcggc aaacaagccc tcacatttgt gagggcttgt tttcatctat 301 tccacctaaa cttctcaata atcaccctgc cgtcctcgtc aaactcaatg ccttccgctt 361 caagcagcgc gcgctgagcc tgctttccgc caaatgcaaa tgcgcttgaa agtccgccgt 421 ccttggtaac aactctgtgg caggggattg ctcccggctc ggggttaacg tgcaacgcat 481 accccacaac gcgcgaccac ctcgggttcc ctgcatacga tgcaatctgc ccatatgaag 541 caaccttacc tttgggtatg agcctaacct gctcataaat cagttcaaat gtagacatag 601 tgtttttcat ccttttattg aaatcggcat agactgcgcg tctatgccga tttagtgttt 661 acaaattaaa gctcaataac caactctgtg gtgcctgcat ttgcaacagc acaaatgtca 721 gttcccgaaa ccttaacctt aaaggtcttg tcggtcttgg tatagctaac tgtgatcttg 781 ttgccatctc ttgttgcctt aatatcgcaa agcttttcag cttccttatc atagataact 841 gcgcttgctt cgcaaccgtc agaaagctca tagattacag cctctgcgtt ttcaagataa 901 tcatactcga aatctcttac aaagtcgccg tatgtaacaa ttgagttggg acgagcaaga 961 ataggcattt cgaagtagtt gcaggtttct ctataccact tttcgccttc atataccttg 1021 ccggtgatga tgtctgtcca tcttcctgca ggaacataga actctgctct gccttcgctg 1081 ttaagaatag gagcacaaag caagttatca cccagcatat actgtctgtc aagggtcaat 1141 gctgcagggt catctgcaaa gtcaattacc attgctctca tcatcggtac gccagaatcg 1201 tgggtatact tagcctgtgc gaacatataa ggcataagct tgcccttgag cttggtgaag 1261 aatctcaaaa cgtcgcaagc ttcctcgtca aagagccacg gtacacggta agaggagttg 1321 ccgtgaagtc ttgaatgtgt tgacaaaaga ccgaacgcac accatctctt atagatatcg 1381 ggagtagcag tagcttcaaa tccggaaata tcgtgggaga agaaaccgaa gcccgaaatg 1441 caaagggaaa gtccaccacg aattgtttca gccatagagg aatattcagc cgagcagtcg 1501 ccgccccaat gaacagggaa ctgctgaccg cctgctgttg cgcttcttgc aaacagacaa 1561 gccttgtttt caccgtaata ttccttcaaa acattgaata cggtctggtt gtaaagctga 1621 gtatagtagt tgtgcatctt aatggggtct gcgccattat gatatacaac atctgtagga 1681 attctttcgc cgaagtcggt cttgaagcag tcaacgccca tttcgcaaag cgcgcgaagc 1741 ttagaagcat accactcgca agcctcgggg ttggtaaagt caacgatggc catacccggc 1801 tgccacatat cgcactggaa taccgagcca tccttattga gaatgaagta atcgttttcc 1861 attccttcgt caaagagctt agatctctgt ccaatgtaag ggttgatcca tacacaggtc 1921 ttaagaccct tgtctttatg aagtctttca agcatctttt cgggttcggg gaactgacgg 1981 gtatcccatt cgaagttgca ccactcaaat tccttcatcc agaagcagtc aaagtggaat 2041 acctgcaaag gaatatcgcg ctgagccatt ccgtcgataa acgaattgat tgtttcctcg 2101 tcatacttgg ttgtgaacga tgttgtcagc cacagaccga aggtgaatgc aggaggcaaa 2161 gcaggcttgc ctgtaattgt tgtatagttg gaaagaactt ctctgaggtt ttctccgcca 2221 atgatgaagt attcaagctc ttcaccggga actgtgaagc tgacctttga aacggtgtca 2281 gaagcaactt cataggatac attgtcggag gagtttacaa atacaccgta tccgcgtgaa 2341 gaaacataga aggggataga cttgtaagat tgatcgcagc aggttccgcc gtcagcattc 2401 cagatctgaa cattctgacc gtttttggtg aaagttgtga atttttcgcc gaaaccgtag 2461 atatattctc cgacatcaag agtgagctgt tctctcaggt aagaggtgtt tgcatcctga 2521 ggatatgacc agaaggtgtc atcaatttgg gtatcaagac gtctttttgc cttggactta 2581 gcttcttcaa tgtatgtgag cgcacggtag cttccgcctg taaggtgctt gccgtcatag 2641 taatactcaa ccgaccaatt ttccttgctg atcttaacgc ttgtcttgcc ggagatcatt 2701 tcaatatact tgtcggtgtc gttgatgacg ggagtgtagc cctgctcgtc atgaagctca 2761 aaattaggtc cacaatcaaa tgtgccctta tagtgaacaa cgctgacctt aattacatct 2821 gccattgtgg aggtgaactt aagctcaagg ttaggtccgc caagggtctg tccgcggttc 2881 cagatgtgtg agggtgttgc gagcacgtaa attgagttag catcatatga tacttcatat 2941 gcctggtttg cataacttac cgtgtagcct cgctgattaa gccagtagcc gtctgaaatt 3001 ttcataaaaa acagttcctt tcttgtttgg aattattatt tacttattta ttcaatcgaa 3061 agaaattctt tcggtatgaa acttaaaacg tggtcaattg tcttctgagt gaaattctca 3121 ccgccgtgag tcaaaagaag ctcatcggta taattgacat atggaacaat gtgaatgtct 3181 gaatagttgt atccgtattg cgtgattatg ggaattgcct tcacattttc aatggttatt 3241 tcgccgctga gaagctcctt tgtgactgtt aactgtccaa gcattccaac caaagtcaga 3301 ttatagcttt gagcagaaac gaagtttcca aggcagtaga aaacgaatgc cttaccgccg 3361 tccggcttgt cgatgtattc cattgtctgc acagtgtgcg gctgtgtgcc gatgatgata 3421 tcagcacccc attcaacaaa catttttgtt aagttgattt ggttatccgt cagcctgttg 3481 gtggtctctt tgccgaagtg aggtgaaaca acgacaacat ctgcaatttc atcagccttt 3541 ttaatttgct gttcaataag ttccagctct ttaagatatg taatctcata tacagagcct 3601 tccggcagct tcaaaccgtt tgtgtgctcc atatatccta aaaaagcgaa ggtaattccg 3661 ttgacttctg ctgtgcggat gttgttcata tcctccgcgt cgcggtatgc accgtatctt 3721 atgacctcgg gatgagaatc ccagaaatcg agagttgctt caagcccgat ttcatcccta 3781 tcgagaatgt gattgtttga aatggagaaa gcatcaaacc caatttcaat catatattca 3841 c // LOCUS sequence086 3829 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence086 VERSION sequence086 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3829 /mol_type="genomic DNA" /organism="" /note="sequence086" CDS 472..2715 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNDMNKEVKLSVNNLKISFRTDAGKVQAVRNISFDLYKGETLAIV GESGSGKSVTSKAIMGISAVNSIHEAGEILYDGQDLARIPEEEMHKLRGDKIAMIFQDP LSSLNPIMRIGNQITEAMLLKNKANRREGREAFNSLLKELSETMNEAIVAGNHKEFSAS KVSEYIKTFDNFNIQAIKLENSYNDARTAAEEMIAIIDDFLFLTEKKQKTDVLATLRLV ERKLADIDDKYLTAGYADVLNGYRAPLANAKRAEKAKVSLFDTIKKVVTMSIVKREASS ETAEILSEIRKTAADMLAQPQYNFFRIGYYVYKHHNEDLSVMPAEEANAMAIKFLMDDF LTSFIELEKIAVEYSYNRALENKKKAVAALEDAVKFFKKGDFTEKAANDLCKNVSASVM ASIDRLAVIKDNVAYTFGSALEREIEKYFFYIKNNPLEEARFERQTAKRNALIAKGKTV DWEVIPKSIIEPEVQIETIVSVINRVIAKFKADIESASSFDSLKRCDELIDYLKGKASQ VVYTLTKRIAKEKAIKLMEEVGIPEPRIRFRQYPFEFSGGMRQRIVIAIALSANPDILI CDEPTTALDVTIQAQILELINNLKRERNLSIIFITHDLGVVANMADRIAVMYAGKIVEY GTANEVFYNPQHPYTWALLSSMPDLDTNEKLDAIPGTPPNMIYPPVGDAFAERNKYALA IDYEMEPPMYEVSPTHFAATWLLHPDAPKVEIPRIITERIKHMKERGDKNGEE" /locus_tag="LOCUS_4000" /note="WP_000854337.1 ABC transporter ATP-binding protein (Bacillus cereus) [pid:62.4%, q_cov:29.0%, s_cov:62.8%, Eval:8.3e-78, partial hit]" /note="MGA_501" CDS 2702..3802 /product="ATP-binding cassette domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000166348.1" /transl_table=11 /codon_start=1 /translation="MEKNNEVLLKVDHLCQYFRMGRKDLKAVDNVSFDIKKGEVFGLVG ESGCGKTTTGRSIIKIYDITSGNVYFNGQRICAGTRSYKDEIKAAKKRISAEIAELKKN GEKELIAEKKAELASIIAENKKKIDEARADEKYSRKKKISTKIQMIFQDPIASLDPRMT VRDIIAEGLIINGVTDKEYINEKVYEILETVGLVREHADRYPHEFSGGQRQRIGIARAI IMQPEMIIADEPISALDVSIQAQVINLLNDLREQLGLTILFIAHDLSVVKYFSDRIGVM YFGKMVELADSDELFKNPMHPYTRSLLSAIPLPDPIYEKQRIRMTYNPLAEHDYSVDAP SFREISPGHFVHCNDAEEKKYKEMLK" /locus_tag="LOCUS_4010" /note="WP_000166348.1 ATP-binding cassette domain-containing protein (Bacillus cereus) [pid:13.9%, q_cov:99.5%, s_cov:99.4%, Eval:1.1e-95]" /note="MGA_502" ORIGIN 1 aaatatcata tgggtagtac aagccaggca cttgtactgt ttatctcgtt ctttgtaacg 61 ggatggatcg gtatggccgg cagaactcgt atgcagttct atcgcttcaa gaatcaggaa 121 tatgttcttg ctgcaagaac tctcggcgca agcgacttta gaattatgtt caagcatatc 181 ttcccgaacg gacttggtac catcgtaacg agcttcgcac tcgtaatccc ctcgatgatc 241 tattctgaaa ccagcctttc ttatcttggt atcatcaatc tcgaggcagg aaacaccacc 301 tctgtcggta cattgatcgc tgcaggacag aagtcgatca tggcaaatgc cggatttgtt 361 gctctcttcc cctgcctatt ccttgtactt ttgatgctca gcttcaacct gttcggtaat 421 ggtctgcgtg atgcgttcaa cccgtcgctc agaggatcgg aggattaaga catgaatgat 481 atgaataaag aagttaaatt atcagttaac aatttaaaaa tatccttccg tacagacgcc 541 ggtaaggttc aggctgttcg caacatctcc ttcgaccttt ataagggtga gacccttgca 601 atcgttggtg agtccggctc gggaaaatcc gttacctcca aggcaattat gggtatttcc 661 gcagttaact cgatccacga agcgggcgaa atcctctatg acggtcagga tcttgcacgc 721 attcccgaag aagaaatgca caagcttcgc ggtgacaaga tcgcaatgat cttccaggat 781 ccgctttctt cccttaaccc cataatgcgt atcggtaatc agattaccga agcaatgctt 841 cttaaaaaca aggcaaaccg cagagagggc cgtgaagcat tcaactcgct gttaaaggaa 901 ctttccgaaa caatgaacga agctattgtt gccggaaatc acaaagaatt ctctgcttca 961 aaggtttctg aatacatcaa gacctttgat aacttcaaca tccaggctat caagcttgaa 1021 aacagctata acgatgcccg tacagcagca gaagaaatga tcgctatcat cgacgacttc 1081 ctcttcctca cagaaaagaa gcagaagaca gacgttttgg caaccttgcg acttgttgag 1141 cgcaagctcg ccgatattga tgacaagtat ctcactgcag gctatgctga tgttcttaac 1201 ggctaccgtg ctcctttggc aaacgcaaag cgtgctgaaa aggcaaaggt ttccttgttt 1261 gacaccatta aaaaggttgt cacaatgagc atcgttaaaa gggaagcgtc gtcggaaact 1321 gctgagatct tgagcgagat ccgtaagact gccgctgata tgcttgctca gcctcagtat 1381 aacttcttcc gtataggtta ttacgtatat aagcatcaca acgaggatct tagcgttatg 1441 cctgctgaag aagcaaacgc aatggcaatc aagttcctta tggacgactt cttgacctcc 1501 tttattgagc ttgagaagat tgctgttgag tattcttaca acagagctct tgaaaacaag 1561 aagaaggctg ttgcagctct cgaagatgct gttaagttct tcaaaaaggg cgatttcacc 1621 gaaaaggctg caaacgacct ctgcaagaat gtcagtgcgt cggttatggc gtctatcgac 1681 cgccttgccg ttatcaagga taacgttgct tataccttcg gcagtgctct tgaaagagaa 1741 atcgagaaat acttcttcta tatcaagaac aatcctttgg aagaagccag atttgagcgt 1801 cagaccgcaa agagaaacgc tttgatcgca aagggcaaga ctgtagactg ggaagttatt 1861 cctaagtcga tcattgagcc cgaggttcag atcgaaacta tcgtatcggt tatcaaccgc 1921 gtaatcgcta agttcaaggc tgatatcgaa agcgcttcca gcttcgattc gctcaagcgt 1981 tgcgacgagc ttatcgacta tctcaagggc aaggcttctc aggttgtata tacccttaca 2041 aagagaatcg caaaggaaaa ggcaatcaag ctgatggagg aagttggtat tcccgaaccc 2101 agaattcgtt tcagacagta tcccttcgaa ttctccggcg gtatgcgcca gcgtattgta 2161 atcgctattg ctctttctgc taaccctgat atcttgattt gtgacgagcc tacaaccgct 2221 ttggacgtta caattcaggc tcagattctt gaacttatca ataatcttaa gagagaaaga 2281 aatctttcaa tcatcttcat cactcacgac ctcggtgttg ttgcaaatat ggcagacaga 2341 atcgctgtta tgtatgcagg caagatcgtt gagtacggca cagcaaacga agtattctat 2401 aatcctcagc atccttacac ctgggcactg ctctcgtcga tgcctgacct tgataccaac 2461 gaaaagctgg atgcaattcc cggtacaccc ccgaatatga tctatcctcc cgttggcgat 2521 gcgtttgctg aaagaaacaa gtatgcactt gctatcgact atgagatgga gcctccgatg 2581 tatgaggttt ctcccacaca ctttgcggca acttggttgc tccaccccga cgctcccaag 2641 gttgagatcc ccaggatcat caccgagcgt attaagcata tgaaggaaag aggtgacaaa 2701 aatggagaag aataacgaag ttttgttaaa ggtcgaccat ctttgtcaat atttccgaat 2761 gggccgcaag gatcttaaag ctgttgacaa tgtaagtttt gacattaaaa agggcgaagt 2821 attcggactt gtaggtgagt cgggatgcgg aaagaccact accggccgtt ccatcatcaa 2881 gatctatgac atcacctccg gaaatgtata cttcaacggt cagcgtattt gcgccggcac 2941 cagatcctat aaggatgaga tcaaggctgc gaagaagaga atttctgctg agatcgctga 3001 acttaaaaag aacggcgaaa aggaacttat tgctgaaaag aaagctgagc ttgcttcaat 3061 catcgctgaa aacaaaaaga agattgatga agctcgtgct gacgaaaagt atagccgcaa 3121 gaagaagatc tcaacaaaga tccagatgat cttccaggac cctatcgctt ctttggaccc 3181 cagaatgact gtacgtgata ttatcgctga aggtcttatc atcaacggtg ttaccgacaa 3241 ggaatacatc aacgaaaagg tatatgagat tcttgaaacg gttggtcttg taagagagca 3301 cgcagaccgt tatcctcacg aattctccgg tggtcagcgt cagcgtatcg gtattgcaag 3361 agcaattatc atgcagcccg aaatgatcat cgctgacgag cctatttccg cgctggacgt 3421 atccattcag gcacaggtaa tcaatttgct taatgatctt cgtgaacagc ttggacttac 3481 catcctcttc atcgcgcacg acctgtctgt tgttaaatac ttctctgaca gaatcggtgt 3541 aatgtatttt ggtaagatgg ttgagcttgc cgattctgac gaattgttca agaaccccat 3601 gcatccttac acaagatcgc tgttgtctgc aattccgttg cccgacccga tatatgaaaa 3661 gcagcgcatc cgtatgactt acaatccttt ggctgagcac gattattccg ttgatgctcc 3721 ctcattcaga gagatctctc ccggacattt cgtacattgc aatgatgccg aggaaaagaa 3781 gtataaggaa atgttaaaat aatgaaacgg acggttaaaa tacagtgac // LOCUS sequence087 3797 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence087 VERSION sequence087 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3797 /mol_type="genomic DNA" /organism="" /note="sequence087" CDS 1145..1579 /product="MarR family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003725020.1" /transl_table=11 /codon_start=1 /translation="MATIMRKMNVISRCEGIYRTQQSKDNLPGIYHSYIFAITGNPGLS QDKLAKHMCINKSSVTRHLACLEKEGYVERKVSETDKRETLVYPTQKMLDVLPEVTDIT KTWNEMVAQDISREELELFHRILDKMLDKSMEIVYSGDVQ" /locus_tag="LOCUS_4020" /note="WP_003725020.1 MarR family transcriptional regulator (Listeria) [pid:21.3%, q_cov:97.2%, s_cov:94.6%, Eval:5.8e-10]" /note="MGA_504" CDS 1576..3297 /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965689.1" /transl_table=11 /codon_start=1 /translation="MRTVIKYLKKHINRMTVGFCIKTLGTLSELMLPYILSHILENVIG KDVKEVVLWGGVMMLCSGLACLLNIVANRMAARVSRNFAEEMRKDLFIRTLRLSAAQTD KFTIPSLESRITTDTYNIHGFINMMQRLGVRAPIMLIGGIAITLFMDYKLSLVMIALLP LIFITVYFISRNGVPLYTKVQHSVDNMVRVVRENAQGIRVIKALSKTDYEHRRYDEVNK ALVKDETRAGVIMGTVNPIMTVLMNMGSVAVIALGANLITGGNSKPETVIAFMQYFTLI AMAMMSVTRMFVMYTKSAASAKRIAEVLNAPEEITVKEKSEYPDKATDAHIKFDNVSFS YNGKRNNLENISFEIPKGGSLGIIGATGSGKSTLVKLLLRFYDTNQGSIYINGEDIKTI DKARLYAMFGSALQHDFLYAETVEENIKFGRDISFDDVKRATDIAQATDFIEGFADGYG HMLSPHGTNISGGQKQRILISRALAAKPDILILDDSSSALDYKTDANLRKALAENMADT TLVAVAQRVSSVKDCGLIIVLDDGKIIGIGNHEHLLENCPEYKEISDSQMGGAFVE" /locus_tag="LOCUS_4030" /note="WP_010965689.1 ABC transporter ATP-binding protein (Clostridium) [pid:39.3%, q_cov:99.0%, s_cov:99.1%, Eval:1.9e-111]" /note="MGA_505" ORIGIN 1 gccggcgaag ttgcgcccgc agaagtgacc gaagagcctg tgaatggtgc caccgaggaa 61 accaaggctg aagcgactga agtttttaac gaagaagcaa agtcagagga agctgacgaa 121 gaggttaaga ccgaagaagc aactgcagcc gaagatatgc ccgaagagaa acctgaggag 181 aaaaaggcga ctaagaaaaa gcgcaaaaac gactcgctta ttgagattac aaagataaag 241 gtaatcagcg aggaaaccaa gagcgaaatt aagaaggcga ttgacgaggc tcttgacgaa 301 gaggttgaag atatcacacc gcttgagaat gcccctattc agaacgcggg aaaaatcagc 361 ctgcgccaga tttcaagcgc gattttcgga ttctttgtgt tggtattcgc ggtattcgga 421 attatttcaa ccgtttcgag ggtcacaaac tatgttcagt cgctggatga cgacagcgcg 481 ctggttgaag cctttacaaa gcttgccgct ccccttgcgg caacagacgc ttctgttttt 541 gaaaatgtca ccgctgtcag cgaggatgta cttataaccg ccgcttgctg ggacgttatt 601 ttcaatccga gcgaaaacta tacagcagtt gacggaaact ataccgtatc tttccttgat 661 attgacaacc gaattgcggg tcttttcggt gcaggactga cctattccca caagactgtc 721 ggcgacgaag aattggcctt tgaatatgac gaggagtcgg gaatgtatac cattcctgca 781 tatccccaag cgcctgcata tattcccaag ctggtggaat atgctcagac tgctgacgga 841 tataagctca gagtcgaata tgttttgcct atcaccgagc ttatcagttc ggatgtgatt 901 gccgacaagg taatgataat tacccttaaa acaagcggaa cggaatatgt gatctcatcg 961 cttgagctgg gcgagctgta taccggtcag gagctgtaaa ttaaatagca ttataatgac 1021 tcaccttgct ttggcagggt gagttttttg ccaaagaccc acccgttgac aggcaatttg 1081 agatgtggta aaatagttgc aaatgcaaca gttttgtttg caactaattt ttggaggcgt 1141 ttgaatggca accataatga gaaaaatgaa tgtcatcagc cgttgcgagg gaatctatcg 1201 cacacagcaa tcaaaggaca atctgcccgg gatatatcat agctatatct ttgcaattac 1261 aggcaatccg gggctttcgc aggataagct ggcaaagcat atgtgcataa acaaaagcag 1321 tgtgaccaga catcttgcct gccttgaaaa agagggctat gttgagagaa aagtcagcga 1381 aacagacaag cgggaaactt tggtatatcc aacgcaaaag atgcttgatg ttttgccgga 1441 agtgacggac attacaaaaa catggaatga gatggtggcg caggatataa gccgcgagga 1501 gcttgagctt ttccacagaa ttcttgataa gatgcttgat aagtcgatgg agatagtata 1561 ttcgggagat gtgcagtgag aacagtaatt aaatatttga aaaaacatat caatcggatg 1621 accgtcggct tttgcattaa gaccctcggc accctttcgg agcttatgct tccatatatt 1681 ttaagccata ttttggaaaa cgtaatcggt aaagatgtta aagaagtcgt gctttggggc 1741 ggagtgatga tgctttgctc gggattggct tgccttttaa atattgttgc aaaccgaatg 1801 gcagcaaggg tttcaagaaa ctttgctgaa gagatgagaa aagacctgtt catcagaact 1861 cttcggcttt ccgccgccca gacggataaa ttcaccattc cctctttgga atcgagaatt 1921 acgacagaca cttataatat tcacggattt atcaatatga tgcagcgatt gggtgtccgt 1981 gcgccgatta tgctcatcgg cggaattgca ataacattgt ttatggacta taagctgtcg 2041 ctggtaatga ttgctctttt gccgctgata ttcataactg tatacttcat ctcgcgaaac 2101 ggcgtaccgc tttacacaaa ggttcagcac tcggtggata atatggtgcg cgttgtgcgc 2161 gagaatgcac agggtataag agttattaaa gcgctctcaa agaccgacta tgaacaccgc 2221 agatatgacg aggtcaacaa ggcgttggtt aaggatgaga ctcgcgcagg tgtaattatg 2281 ggcacagtta acccgataat gacagttttg atgaatatgg gaagcgttgc ggtaatcgcg 2341 ttgggtgcaa acttgatcac cggtggaaat tcgaagcctg aaactgttat cgcatttatg 2401 caatatttca cgctgatagc aatggcgatg atgtcggtta cgagaatgtt tgttatgtat 2461 acaaaaagtg cggcttcggc aaagcgaatt gccgaggttc tcaatgcccc cgaggagata 2521 accgtcaaag aaaagtcgga atatcccgac aaggcaacgg acgcccacat taagtttgat 2581 aatgtcagct tttcatataa cggaaagcgc aacaaccttg aaaacatcag ttttgaaatt 2641 cccaagggcg gttctttggg aattatcggg gcgacaggct caggaaaatc gacacttgtt 2701 aaactgcttt taaggtttta tgatacaaac caaggaagca tatacataaa cggcgaagac 2761 attaaaacaa ttgacaaagc aagactttat gctatgttcg ggtcggcact tcagcacgat 2821 ttcctttatg ccgaaacggt tgaggaaaac attaagttcg gacgggatat ttcgttcgat 2881 gacgttaaac gtgcaacgga tattgcgcag gcaaccgact ttattgaggg ctttgccgac 2941 ggttacggac atatgctttc gccccacggc accaatattt cgggcggaca aaagcaaaga 3001 attttaatat cacgcgcact tgccgcaaag cctgatattc tcattttgga cgactcgtcg 3061 tcagcacttg actataagac cgacgcaaat ttaagaaaag cactggcgga gaatatggca 3121 gacaccactc tcgttgcagt tgcacaaaga gtcagctcgg tcaaggattg cggacttatt 3181 attgtcttgg acgacggaaa gataatcgga attggcaacc acgagcacct gcttgaaaat 3241 tgcccggaat ataaagagat aagcgattca cagatgggag gtgcttttgt tgagtaaacc 3301 ggaagacaaa aaacttgacc gcaaaacggc aaaaagcatc tttttaaggc tttgcacata 3361 tgtgcttcat tattggtatc tgtttttgcc tgcagttgtt ttaactctgt tttcaaatca 3421 gctttcgcta ttgggtccta agtattcggg cgaagcgatt gacgcgcttg cgactgtcgg 3481 cggagtggat tttgacacag tttcggaaaa tgtcatcaaa atgatcatct gctatatcgc 3541 atcggcagca atgtcatatg ctttggcggc actgatgata catatcagcc aaaagattgt 3601 ttatacaatg cgccgtcagc tttttgaaaa gctcacttcc ctgcccgtcg gatattttga 3661 cactcatcca acgggagata ttatcagcca tatttcatat gatatcgaca ccattaacag 3721 caccctttca cacgaccttg tgcagataat gacaagtgtt tatactgttg tcggctcgct 3781 ggtatttatg tggaata // LOCUS sequence088 3788 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence088 VERSION sequence088 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3788 /mol_type="genomic DNA" /organism="" /note="sequence088" CDS complement(300..647) /product="YbaB/EbfC family nucleoid-associated protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009887752.1" /transl_table=11 /codon_start=1 /translation="MKARLPQGMGGGPQNMNQMIRQAQKMQEDMAAFQAELEEKEFKAS VGGGAVEITMNGKREVLGVNIKPEVVDPDDIEMLEDLIASAVNEVLLNIETESSEGMNK ITGGISLPGAF" /locus_tag="LOCUS_4040" /note="WP_009887752.1 YbaB/EbfC family nucleoid-associated protein (Clostridioides difficile) [pid:60.4%, q_cov:92.2%, s_cov:89.7%, Eval:4.0e-31]" /note="MGA_508" CDS complement(675..2288) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MYTALYRKWRPLTFDDVVSQPHITTTLSRQIAEGKTAHAYLFTGS RGTGKTTCARIFAKAINCLDPHDGKPCLECDICRAADAGTLSDIIEIDAASNTGVDDIR DLRDSTVYTPELCRYKVYIIDEVHMLSNQAFNALLKIMEEPPAHVKFILATTEVHKVPA TIISRCQRFDFRRIRPRDISDRLLYIASHEGFTLESDAADLIARIADGAMRDALSLLDQ CVAYSSNVDISVVTDAAGIAGRDYLFDILEAVAERDISVAISKTDELYAKSKDMARLCD ELIFQTRNLMLIKTVPDRDELLSCSPNEVERLRKICEKLTLDEIIARLEILQDLSEAMP RATSKRTEIEMALVKLCTVNTTKPTSSGGKANADLSELIARIARLESELAAIKKNGVVP AVATVKEEPKQEMPKAEPKAEPAKEANNEPMVACAQWDEILERLTELNPGCAGALRGSM GYVKGTTLSIIVKNEFFLGLFKKPENAASLKQAALDITGITYSLRAKCEKQDAPKNGDD DPIAQLIARAKKADIPVDIN" /locus_tag="LOCUS_4050" /note="WP_000121588.1 DNA polymerase III subunit gamma/tau (Bacillus cereus) [pid:43.1%, q_cov:74.5%, s_cov:70.3%, Eval:8.6e-87, partial hit]" /note="MGA_509" CDS complement(2527..2730) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIVYDKLWATLKERGISQYKLINEYHISTGQLDRLRKNANVNTYT LDQLCRILDCELCDIAEYIKEE" /locus_tag="LOCUS_4060" /note="MGA_510" ORIGIN 1 acgggtgcgc tcaaaagcgg aaacatcctt cggtccttca acaacgcaaa taaccgagtg 61 gtcgcgcgtt tcgtttgagc atatgggaca taccgccttg tcggtcagat tctgacatac 121 cgagcaggtg tgaacggtct ttcttgcata tataattgct tttgcgaagg cctctgcgtc 181 ctcatcggac atggacataa cgaagtatgc caatctctgc gctgttttca ttcctattcc 241 cgggagcttt gcaaactgct ccgccaaaag ggtcaagggc aatacattag cgtcagccat 301 cagaatgcac cgggaaggct gatgccgcct gtaatcttgt tcattccttc gctggactcg 361 gtttcaatgt ttaaaagaac ctcgtttaca gcacttgcga tcaaatcttc aagcatttca 421 atatcgtcgg ggtcaacgac ctcgggctta atgttaacgc ccaaaacctc acgcttgccg 481 ttcattgtaa tttcaacagc gccgccgccg acagaagcct taaattcctt ttcttcaagc 541 tctgcctgga atgccgccat atcctcctgc atcttctgtg cctgacggat catctggttc 601 atattctggg ggccgccgcc cataccctgg ggaagtcttg ctttcatagt tatatatctc 661 cttaaaatta aagtttaatt aatatcaacg ggaatgtccg ctttctttgc ccgagcgatc 721 agctgggcaa tagggtcgtc gtcgccgttt ttcggtgcat cctgtttttc gcattttgca 781 cgcaaggaat aggttatgcc tgtaatatcc agcgccgctt gtttaagcga tgctgcattc 841 tccggcttct tgaaaagacc caagaagaac tcatttttaa cgattattga tagggtagtg 901 cctttaacat atcccatcga accgcgcaaa gctcctgcac atccggggtt aagctcggtc 961 aaacgttcca aaatctcgtc ccattgcgca caggcgacca tcggctcgtt gtttgcttcc 1021 tttgccggct ctgcctttgg ttcagccttc ggcatttcct gcttaggttc ttcctttacc 1081 gtggcaactg caggcacaac gccgtttttc ttgattgccg ccagctccga ttcaagccga 1141 gcaattcttg caataagctc gctcaggtcg gcatttgctt ttccgcccga tgatgtaggc 1201 ttcgttgtgt taaccgtaca tagcttaaca agcgccattt caatctccgt gcgcttcgag 1261 gttgctcttg gcattgcttc gctaagatcc tgcaaaatct caagccgtgc gataatctca 1321 tccagcgtca gcttttcgca aattttgcga agacgctcaa cctcattggg tgaacagctc 1381 aaaagctcgt ccctgtcggg aactgtctta atgagcatta agtttctcgt ctggaaaata 1441 agctcgtcgc aaagccttgc catatccttg ctctttgcat aaagctcgtc ggtctttgaa 1501 atcgcaaccg aaatgtcccg ctcggcaact gcctccaaaa tatcaaacag atagtcgcgt 1561 cccgcaattc ctgcggcatc ggtgacaacc gagatgtcaa cattgctcga atatgccacg 1621 cactggtcca aaagcgacag cgcatcgcgc atagctccgt cggcaatacg cgcaatcaaa 1681 tctgcggcgt cgctctcaag ggtgaatccc tcgtgggatg caatatagag cagtctgtcc 1741 gaaatatcgc gaggtcggat tcgtctgaaa tcgaaccgct gacagcggga aataattgtc 1801 gcaggtacct tatgtacctc tgttgttgcc aaaataaact tgacgtgtgc gggcggctct 1861 tccataattt tcaaaagcgc gttgaatgcc tgattggaga gcatatgaac ctcgtcgatg 1921 atatatacct tatatctgca aagctcgggg gtgtaaacag tcgagtcgcg caggtcacgt 1981 atatcatcaa cgcctgtgtt tgaagccgcg tcgatctcaa taatgtccga aagggtgccc 2041 gcgtctgccg cacggcagat atcgcactca aggcagggct tgccgtcgtg gggatcaaga 2101 cagttgatcg cttttgcaaa tattctcgcg caggttgtct tacccgtacc gcgtgagccg 2161 gtaaacaaat aagcgtgagc ggtcttgccc tcggcgatct gtcgggagag ggtggtggta 2221 atgtggggct gcgaaacaac gtcgtcaaag gtcagcggcc gccattttct atataatgct 2281 gtatacataa taccctcccg aaaataaaag tccaatccga caggtgggcg tgcaggcgag 2341 actgcgtcac acaaagcaaa ctgcttaatg ctgctcggtt ccccgcctga catggttcac 2401 agcgcctcgt tgcacaggac ccgcacaccc gcctctcgga ttggctctat aatcatatca 2461 cattcccaca gattttgcaa ggggttagcc aaaacaaaat gacctgattt gctcgttgcg 2521 gtcaggtcat tcttctttta tatattcggc gatgtcgcaa agctcgcaat ccaaaatccg 2581 gcagagctga tcgagggtat atgtgttgac atttgcgttc ttgcgcaggc ggtcaagctg 2641 accggtgctg atgtgatatt catttatcaa tttatattgt gagatgccgc gctctttcag 2701 cgttgcccac agtttgtcat atacgatcat cttaccaccc ccgaatgatt gactgtttct 2761 aatattatga tattttctta tccgccactt gacaatagcc cgtaaatggg ctataatcat 2821 tatagcccga atatgggcaa taaaaaattg gaggaaataa tatgaaaaga gcagtgagaa 2881 ttctatctac tttgttggca atgttaatgc taatatcagt agtgactaca agcgtgtgtg 2941 cgactacttt gaaaaaaggg tcatctggaa aacaagttaa atatcttcaa atgaatctga 3001 atggattggg ttattcctgc ggttctactg acggtaaata cggtgcaaag actgttcaag 3061 ctgttaaggc ttttcaaaag gcgtatgatt tagacgttga tggtatagca ggagataaga 3121 cacaaggcga gatttgttca attatcaaag atttacagca aaaattgtat gatttgggtt 3181 atgcagttgg cgacatagat ggtgtttttg gcagcaagac gattgctgct gtaaagaaat 3241 ttcaaaaaga taattcaatt tcagctaatg gaatagccaa tagtaagact ataaaggcta 3301 taaatgagaa gcataatgct ataaatcaat gcccgctcaa cggatcttac attcctttca 3361 tagatgtgcc ttcatatgaa acttcaatta agacagaaat tgtgagtgta gaatacatta 3421 aagatgttta ttcggattgg aaggccttaa actcagcgtt ttatgcaaga agaaatggac 3481 agtctagtga atttgaaaaa tcggaaaaaa ttaccgtaac gtcatctttg aatctaacgg 3541 cagatttgaa attagttgaa gcaaaacttg gtgtaacagt tgaaaaatct gttacttcta 3601 caattttagg aacgaactct ggtccgctag ctaaaggtga gtattgcaga ttctactatc 3661 gagaacattg gaaacgctat gaagttgtgg aagaaactac cattacacag tttggacggt 3721 catatagtta tacatctact aaaataatcg atgtagcgca agaattgacc gctgatgact 3781 atgggtgg // LOCUS sequence089 3772 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence089 VERSION sequence089 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3772 /mol_type="genomic DNA" /organism="" /note="sequence089" CDS 60..902 /product="AraC family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583944.1" /transl_table=11 /codon_start=1 /translation="MQEFYFALLGDEVKLPIYVTGVGSTDPEWHCTRPGGHVYNQIIYS VKGEGVLVIDGTEHRIPKGSGFFLPAKYPHEYYSVGNISWETHWISFAGTCIDSVLPAL DLDKPLVFKLSETSSIESLWGKMLKNIRTNDINCGYTNSSLLYSFLVELNRVITCPAGT KENHRMEQLQPIIDYIDKNYSLNITLKDLARIVDLSPQYICRIFKECMNMRPFEHLAKK RIFESKKLLIETDLSITDVAKAVGYNDCSYFCVVFKRQESVSPADYRAAYSERRSQMK" /locus_tag="LOCUS_4070" /note="WP_012583944.1 AraC family transcriptional regulator (Dictyoglomus turgidum) [pid:25.7%, q_cov:90.4%, s_cov:89.2%, Eval:2.9e-20]" /note="MGA_511" CDS 1521..2564 /product="PRK06851 family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048278.1" /transl_table=11 /codon_start=1 /translation="MVREYFLGRPTPDGFKTHITDEIKSGKYFTYILKGGPGTGKSSLM RTIAKESGLEHELYYCSSDPDSLDAIVFTEKKTIIVDGTSPHVVEPQYPGVKEKLVDLG AYWDGNKLLEKADEIVSLSQENTKYHQRAKRCLKAACAMYQDVETVSDGGLLRAKLDGF CERLGNHIFKKTKEPKGNIRFKQITSITPKGVITLRSAFDGYKVYYIDDRNLAATDHML KRLSILAIEKGYDCIVSENPFLEGCRYQHLIIPRLGLAFTSGQADMAYETKINGARFYD KYYLREKRERIRFGHAAADELINETVLTLKQAKRNHDELEKPYIDAMDFKGVQKLTDDM IKAIKER" /locus_tag="LOCUS_4080" /note="WP_012048278.1 PRK06851 family protein (Clostridium botulinum) [pid:31.3%, q_cov:98.0%, s_cov:96.4%, Eval:3.8e-39]" /note="MGA_512" misc_feature complement(2604..>3772) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_021373798.1:ATP-dependent zinc metalloprotease FtsH" /note="WP_021373798.1 ATP-dependent zinc metalloprotease FtsH (Clostridioides difficile) [pid:54.7%, q_cov:95.6%, s_cov:56.2%, Eval:4.8e-110, partial hit]" /note="MGA_513" /locus_tag="LOCUS_4090" ORIGIN 1 aatattgtaa tatattgttg aaccagcggt aagaaaatat taacgtggag atgatataaa 61 tgcaggaatt ctattttgca cttttaggcg acgaggtaaa gctcccaata tacgtgacag 121 gtgttggctc tactgacccg gaatggcatt gcacaagacc cggaggacat gtttacaatc 181 agatcatata ttccgttaag ggagagggcg ttctggtcat tgacggaaca gagcacagaa 241 ttccaaaagg ctccggattt ttcctgcctg ccaagtatcc gcacgaatat tacagcgttg 301 gaaatatttc ctgggaaacc cactggatat cctttgcagg tacctgtata gattccgttt 361 tgccggcctt agacttggac aagcctttgg tatttaagct cagcgaaact tcaagcattg 421 aatccctttg gggaaagatg ttgaaaaaca tacgcaccaa cgacatcaac tgcggatata 481 ccaattcatc tttgctttat tccttcctgg ttgaactgaa cagggtcatt acctgccctg 541 caggcaccaa ggaaaaccac cgaatggaac agcttcagcc gattattgat tatattgaca 601 agaactattc tttgaatatc acattaaaag acttggcgag aatagtcgat ctttcgcccc 661 agtatatttg caggatcttt aaagaatgca tgaatatgcg tccctttgag catctggcca 721 aaaagcgcat ttttgaatcg aaaaagcttt tgattgaaac cgatctttcg atcaccgatg 781 ttgcgaaagc agttggatat aatgattgca gttatttctg tgttgtattc aagcggcagg 841 agagcgtttc ccctgctgat taccgagcag cttattcgga aagaagaagt caaatgaaat 901 aatttgatat atgaagcccc ctgcctgttg gcggggggtt attttatatg tctccctctg 961 acgagggagg tggaaaaaat cgaagatttt tgacagagaa agatggtgct tattcgcaaa 1021 ctgatacgag gttcggggaa gaagcgaggc gtgccggaca cggcgccgcg tctaagatgc 1081 ggcggtttgt ggcgcggcgt gccgagcgtg agcggtgagt ttcacaaact ttgggaattc 1141 atcggtttcc gcaggaaatc cgaaacttta gtttcggaag atgaattcat tgcggccaga 1201 cgccaaagtt gcttgttttc tctcactttg accgcagact tgagcaaact ttgggaattc 1261 atcggtttcc gacaggaaat ccgaaacttt agtttcggaa gatgatttca ttgcggccag 1321 acaggaaaga ttctcgcttc cactcacttt gaccgccgac ttgagcaaac tttgggaatt 1381 catcggtttc cgcgggaaat ccgaaacttt agtttcggaa gatgaattca ttgcggccga 1441 caccaaagct tcctgcttcc actcacttta acggccgcat ttccatatta tgaaacataa 1501 tgatttttgg gaggcttttt atggtaagag aatacttttt gggaagaccg acgcccgacg 1561 gctttaaaac gcacataact gacgagatca aatcagggaa atactttact tatattctca 1621 aaggcgggcc gggcacaggt aaatcctcgc tgatgagaac aattgcaaaa gaatcgggac 1681 ttgaacacga attatactat tgttcatccg acccagactc gctggatgcg attgttttca 1741 ccgagaagaa gactattatt gtcgacggaa catcgccgca cgttgttgag ccgcaatatc 1801 ccggagttaa ggaaaagctt gtggatctgg gtgcatattg ggacggtaac aagcttttag 1861 agaaagcgga tgaaattgtg tcccttagtc aagaaaacac gaagtatcac cagagagcga 1921 aaagatgcct taaagcggcg tgtgcgatgt atcaggatgt tgaaacggtg agtgacggag 1981 gactcctcag ggcgaagctg gatggcttct gcgaacgttt ggggaatcat atttttaaaa 2041 agaccaagga accaaaagga aatatccgtt tcaaacagat tacatcaatt acgccgaaag 2101 gggttatcac gcttcggtcg gcatttgatg ggtataaggt ctactatatt gatgacagaa 2161 accttgccgc aactgaccat atgctcaaac ggctgtcgat tttggcaatc gagaagggat 2221 atgactgcat tgtttcggaa aatccgttcc ttgagggatg ccgttatcag catttgatta 2281 ttccgcgact cggtttggcg tttacatcgg ggcaggcgga tatggcatat gaaaccaaaa 2341 tcaatggcgc gaggttttat gataaatatt accttagaga gaagcgggag cgaatcagat 2401 ttggccatgc ggcagcagac gagctgatta atgaaacggt tttaacgctt aagcaagcaa 2461 agcgaaacca cgacgagctt gaaaaaccgt atattgatgc aatggatttt aaaggagttc 2521 aaaagctgac tgacgatatg ataaaggcaa ttaaagaacg ataataaaaa agggaaagca 2581 ctgcgctttc ccttttgttg ctcttattcg tttgtttcgg gcaattcctt gatttcgttt 2641 tctgccacgg tgataatgat gtcatcagag ctgtcggtgt ttgcagttgg catttcaagc 2701 tcggtggttt ccaagctctc gcccttcatg atcttatcaa actcttcgcc tgtgagcttc 2761 tctcttacca aaagctgtcc cgcaactgcg tggagctgat cagcgtgagc ctcaagaatt 2821 gaaagagcat cctgatatgc gccgtgaacg atttcgcgaa cttcggagtc gatctcgctg 2881 gcgatctttt cggaatagga cttctgcgaa ttataatctc tgccgaggaa tacctcatcc 2941 tcgtcggtgc cgtaaacgat cggaccgatc ttgtcggaga agccgtactt ggtgaccaga 3001 tttcttgcaa tctttgttgc acgctgaagg tcatttgatg caccggtgga tacatcgtca 3061 agaatgatct gctctgcagc acggccgccc aagagagtga caatatcttc cttcattctt 3121 gttttggtca catatgactt atcggtttcg ggaaggctga gggtatatcc gcctgcaaat 3181 ccgcgaggaa tgatggatat ctcctgcacc ttatcctgtg tttcacaata gtaatggcag 3241 attgcgtggc ctgcttcgtg gtatgaagtg aggcgttttt cttcttccag aactaccttt 3301 gatttctttt cgggaccgac cattaccttc attgcggcat caccgaagtc ctgcgcggta 3361 attgccttgc ggccgttttt aaccgcaagc agagctgctt cgttgacaag gtttgcaata 3421 tccgcacctg tgaagccaac ggaggatgcg gcgacctttt taaggtcgac atcgggagcg 3481 agaggtttgt ttctggtgtg aaccttgagt atctcttccc tgcccttgat gtcgggatag 3541 ttaacatata cctgtctgtc aaagcgtccc gggcgcaaaa gtgcggggtc cagaacatca 3601 cggcggttag ttgccgccat tacgattaca gattcgtttt gcgcaaagcc gtccatctca 3661 acaagaagct ggttaagggt ctgttctctt tcgtcgtgtc cgccgcccaa gcctgcaccg 3721 cggcgacggc cgacagcgtc aatttcgtca atgaaaatga ttgagggggc ag // LOCUS sequence090 3762 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence090 VERSION sequence090 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3762 /mol_type="genomic DNA" /organism="" /note="sequence090" CDS 976..1434 /product="C-GCAxxG-C-C family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008765511.1" /transl_table=11 /codon_start=1 /translation="MDHSQAAYDNFYKGYNCAQSVFSAFCDVTGLDLETSLLLSSSFGG GMGRLREVCGAFSAIIMVAGCIYGYITPKDYDAKSKHYALVQELAARFKAENSSIICRE ILGLTASSDPNVPPRTDEYYKKRPCAEICRNAAKILDDYIREHGECCD" /locus_tag="LOCUS_4100" /note="WP_008765511.1 C-GCAxxG-C-C family protein (Bacteroides) [pid:43.9%, q_cov:96.1%, s_cov:97.4%, Eval:3.5e-30]" /note="MGA_515" CDS 1454..2173 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLALPPDSFHMSAGVGTLSEKYLHALLKHFFEPDSDYHEVAIGTY TADICRDNKIIEIQTRAFNRLRDKLEYYLLEGYDVTVVLPLPRVKYLIWIDNQTGDVTN RRRSPKKGRFVDAIFELYKIKYFLDWKNLHIKLLLCELEEYRNLDGYGKNRKYRSTRLE RVPLELADTLSLDSVDDYRAFIPDTLPQFFTISDFAKASNIDYGHASTTLNILTYLSLV QKVGKDGKKNLYQVTPK" /locus_tag="LOCUS_4110" /note="MGA_516" CDS 2190..3461 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKIKVKDLSYDEVLALKPEKHHKPMRPHFIFRLILRIASWFLLLK NRYTYNCIGMEKLNKNEPAFYLMNHSAFVDLLIAVYTLFPRPVNIVASTDAFVGKNLLM RLIGCIPARKFVSDIRLVKDMLHAVRKNKTSVLMYPEAGYSFDGTSTTIADSIGKCIKM LGIPVVMITTRGAFHHDPLYNGLQLRKVKVTADVKYLLSPDKIKEMSEAEINEIVYKEF AFDNFRWQQENGIKIIEKFRADYLNRVLYKCPHCLSEGSTVGDGIHLTCTACGKVYELT EDGFIKALDGNTEFNHIPDWYAWERECVRREIENGTYNLDVPVDILMAVNSKCIYRVGE GNLKHSLNGFELSGCDGKLDFKLRPSATYCINSDFLWYELGDMISIGDTKAFYYCFPKT KGDIVAKTRLATEELYKFGKALKN" /locus_tag="LOCUS_4120" /note="MGA_517" ORIGIN 1 caccgattac ataactatta acattgaatc cggctcatcc atcgaccttg aatattccat 61 cacctgcgat aaggactggc tcatctttga gaatactgaa ggcgttgtaa cccccgttga 121 cggtatgaca agtgtaaacg tcacctgcga cagagcgaag ctttcgggtg aagaaactgc 181 ctgtgtaacc gtaatttgca aatttaaagg ctccgatacc gcacgcgcca agctgtttgt 241 cagtgcttat ggcggaaatt atgactatgc tcctatgacc tttgttgata ccgagggcta 301 tgtgaccatg gatgccgacc acttcagcgc tgttcacgcc ggtgataact gcgcttggac 361 acttatcgac catctctccc gtgttgatag acccgctatt aaggtattgc cctcaactgc 421 tcatcttttg gatgataacg gaaacttcac tatcgaaaat gttccctctg ttgattacac 481 ctttactacg aacaacggcg gcgagtggga tatggaactg tatttatcca accgcaaccc 541 tgttgcaatt gatgcaaaga tgcgcatcgg ttacagcatc aacggctccg atgtgaccat 601 tcactccact attcccgagc attacaaggc aagaaattgt cgcgagtgga ataaggaagt 661 tttggatgtt ttgcgaatca gcaagtcaag tcttgctgtt caaaacggcg ttaacactct 721 taaactctat ggcggtgacc ccaacattat tgttgagcgc atcgtgcttt atcccaaggg 781 aaaagccccc ggcaagacct atatgggtcc tcgcgagagc tattttgtaa agtaaactta 841 gtttattaat attaccgctc cgaattatcc ttcggggcgg taaattttat ggatattcag 901 accgattaat cttgaattat agtgtaaaat atgatactat ttatttaaca atgtgttatt 961 tcaacggagg cgtttatgga tcattctcag gcggcatatg acaatttcta taaaggctat 1021 aattgcgccc aatcggtgtt ttccgcattt tgcgatgtta caggtcttga ccttgaaacc 1081 tcgcttttgc tttcttcgtc attcggcggg ggaatgggca gactgcgcga ggtgtgcggc 1141 gcattcagcg caataattat ggtcgcggga tgcatatacg gttacatcac acccaaggat 1201 tacgatgcta aaagcaagca ctatgctttg gtgcaggagc tcgccgcccg ttttaaggct 1261 gaaaattcat ccataatctg ccgcgagatc ttgggactta ccgcatccag cgacccgaat 1321 gttcccccaa gaacggacga gtattacaaa aagcgtccct gtgcggaaat ttgccgcaat 1381 gctgcaaaaa ttctggatga ctacattcgc gagcacggtg aatgctgtga ctgataagga 1441 aaggtttgca tctttgctgg ctcttccgcc ggacagcttc catatgagtg caggtgtggg 1501 aacattaagc gaaaaatatc tccacgcgct tttaaagcat ttttttgaac ccgattctga 1561 ctatcacgag gttgcaatcg gaacatatac cgcagatatc tgtcgcgata ataaaattat 1621 tgaaattcag actcgtgcat ttaaccgtct tcgcgataag ctggaatatt atctcctcga 1681 gggatatgac gttacggttg ttttgccctt gccgcgagta aaatatctta tttggattga 1741 caaccaaaca ggggatgtga caaaccgccg gcgctctccc aaaaagggca ggtttgtcga 1801 tgcaatattt gagctataca aaatcaaata ctttctcgat tggaaaaacc tgcatatcaa 1861 gcttcttctt tgcgaattgg aagaatatcg caaccttgac ggctacggca aaaaccgcaa 1921 atatcgttct acccgtttgg aacgtgtacc gttggaactt gccgatactc tatctctcga 1981 ctcggtcgat gattaccgcg cctttattcc cgacactttg ccgcaatttt tcactatttc 2041 cgatttcgcc aaagcgtcaa atatcgacta tggccacgct tcgacaacgc tcaacatatt 2101 aacatatctc agccttgtcc aaaaagtcgg caaggacgga aaaaagaatt tatatcaagt 2161 aaccccaaaa tgatttatga ggtgattgtt tgaaaattaa agttaaagat ttaagctatg 2221 atgaggtctt ggcattaaaa cctgaaaagc accataagcc gatgcgtcct catttcattt 2281 tcagacttat tttaagaatt gcatcctggt tcctgctctt aaaaaaccga tacacataca 2341 actgcatcgg aatggaaaag ctgaataaga acgagcctgc gttctatttg atgaaccact 2401 ccgcctttgt cgatcttttg atagctgtat atactctttt cccgcgccct gttaacattg 2461 ttgcatctac cgatgctttt gtcggcaaga atcttctgat gcgtttaatc ggctgcattc 2521 ctgcgagaaa gtttgtttcc gatatccgtc ttgttaaaga tatgcttcac gctgtcagaa 2581 aaaacaaaac ctctgtttta atgtatcccg aagcaggtta ttccttcgac ggcacatcaa 2641 ccaccattgc cgactccatc ggaaagtgca tcaaaatgct cggcattccc gttgtaatga 2701 taaccacccg cggcgcattt caccacgacc cgttgtataa cggacttcag ttaagaaaag 2761 tcaaagtcac cgcagatgtt aagtatcttc tctctcctga caaaataaaa gaaatgtcgg 2821 aagctgagat aaacgaaatc gtatataaag aattcgcgtt tgacaatttc cgctggcaac 2881 aggaaaacgg aatcaaaatc atagaaaaat tccgtgccga ctatcttaac cgtgttctgt 2941 ataaatgtcc tcattgcctc agcgaaggat cgacagttgg cgacggaatt catttgacct 3001 gcaccgcctg cggaaaggta tatgagctga ccgaggacgg tttcattaaa gctcttgacg 3061 gcaacaccga atttaaccac attcccgatt ggtacgcatg ggaacgcgag tgcgtaagga 3121 gagagattga aaacggcaca tataatcttg atgttcctgt tgatatcttg atggctgtca 3181 actcaaaatg tatctatcgc gtaggtgagg gcaatctcaa gcattcattg aacggctttg 3241 agctttcggg atgtgacgga aagctcgatt tcaagcttcg cccctctgca acatattgca 3301 ttaactcgga ctttttgtgg tatgagcttg gcgatatgat ctcaatcggc gataccaagg 3361 cgttttatta ttgcttcccc aaaaccaagg gagatattgt tgcaaagacc cgactcgcaa 3421 ctgaagagtt atataaattc ggtaaagcac ttaaaaatta acgcattaac ggagatgagt 3481 aaatgagcaa acaaaagcgc aaggcgattg gcaagccctt gcgaatagta tattttcttg 3541 cttatcacat ttgcaaggta ttgttctttt ttaagggcgt aaaggttaaa tatgataaaa 3601 ctgctatttc ggacattcaa ggtcctgcat tggtactttg cccacatacc tgtgcttatg 3661 accccgtatt tgtcggctca agcgtatatc ccaagcgtat gacatttgtt gtcagcgagc 3721 attttatggc aaaacctctt ttgcgctttg ctttgaccaa ac // LOCUS sequence091 3759 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence091 VERSION sequence091 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3759 /mol_type="genomic DNA" /organism="" /note="sequence091" CDS complement(1125..1787) /product="DUF4956 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861070.1" /transl_table=11 /codon_start=1 /translation="MSNIRNILKESIEQLGLVERLSVEYILVSLLCAFVCSLVIYFVYK IFHRGAVYSENFAVLLVMTTCVTAFVVLTIGSNLVLSLGMVGALSIVRFRAAVKEPLDV GFMFWGIAAGITSGAGLYPFAVIATGIIAVIYILFTVLGRGKTTYVLVVKYADEAEEAV NKALEGEKTKLRGKAKYKGGNELTVDIKVSKGNTEFLKKLLETEGVESAVMVEYNGD" /locus_tag="LOCUS_4130" /note="WP_011861070.1 DUF4956 domain-containing protein (Clostridioides difficile) [pid:42.1%, q_cov:87.7%, s_cov:86.4%, Eval:3.2e-36]" /note="MGA_520" CDS complement(2082..2759) /product="polyphosphate polymerase domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001006715.1" /transl_table=11 /codon_start=1 /translation="MLTYPDYLAMRALLKPLMERDKYALADGDYFIRSLYFDDFSDSSY WEKLAGTADRKKYRVRIYNCSDSIIKLECKEKKGDRIHKRSISISRECADKMALGDFSL LEQYDSDLAREVLALAKTKGLKPSVVIDYDREAYVHPVSNVRLTFDKALHAGIESADIF DSKLATVPIYPDGSVIFEVKYDDVMPKFISSLVSVNHGQKLALSKFCLCRDELRRFKPR YIK" /locus_tag="LOCUS_4140" /note="WP_001006715.1 polyphosphate polymerase domain-containing protein (Streptococcus) [pid:30.9%, q_cov:97.8%, s_cov:94.8%, Eval:1.9e-23]" /note="MGA_521" ORIGIN 1 agcatcgcgg atctcaaccg agtcgatcat aatgttttcg ggaagacctg ttaaaaggtt 61 acggccttta atttcaagtt cgcgctcctc ttccatggga tatgcggagc cgattgcaat 121 tttgatctgc tcggcggtgc gctcaccgat gagcagatta tactttttct tgatgaagtt 181 gatgatgctg aagtcaaatt cgtcgcccgc tactcgtaca gaacggctgg ttacaacacc 241 gcaaagggag attacggcaa cttcagaggt gccgccgccg atatcgacga tcatcgagcc 301 ggtaggctcc tcaacaggca agcctgcacc gattgcggca gccataggct cttcaacaat 361 agatactctc tttgcgcctg cgccttctgc ggcttcctta acggcacgtc tttcaactgc 421 ggtaacgccc gaggggatgc agatgattac tcttgtcttg gtgaaggggt ttttgccgat 481 cgccttgcgg ataaattcct ggagcatagc ggtggtcata tcaaagtctg cgataacgcc 541 gtccttgagg gggcgcactg cgcggatgga gccgggggta cggccgatga tgtttttagc 601 atcctgacct acatagcgca cttcgtcggt cttggtgtca accgcaacaa cgctgggctc 661 acgaatgatt attcccttgc ctttgagaaa aacgagggtg tttgcggtac cgaggtcgat 721 accgatatct tttttgaaca tatatttcat ctccgattat atagtcttgc ggcatatgcc 781 gtttattggc ttaattatac catattttta aatatagtac aaggggaaat tttgtaaaag 841 atgggtaaat ttgttgagga gtgtcgggcg gacacatagg tccgccacat acttatcgat 901 aaaggcgtaa gaaaaggggg cgggcctgtg tgcccgcccc cctgcaagga atcagacaaa 961 tgaattgcgc ttcgcacatg aatagacaag caagctgtca tgaatagtcg ctttcgcgac 1021 atgaattgtc cctgcgggac attaaagggc aggcacacag gcctgccccc tatatcatca 1081 caaaaagagg gcgaccctat gtggtcgccc cgtatcaaca aatatcaatc tccgttatac 1141 tcaaccataa ctgcgctttc aacaccttcg gtctcaagga gcttcttaag gaattcggtg 1201 ttgcccttgc tcaccttgat gtcaacggta agctcgttgc cgcccttata tttagccttg 1261 ccgcgaagct tggtcttttc gccttcaagt gccttattaa cggcttcttc tgcctcatcg 1321 gcatacttaa cgaccagcac ataagtggtt ttgcctctgc ccaaaacggt gaagagaatg 1381 tatataacag cgataatgcc ggttgcaatt acagcgaagg gataaagtcc cgcaccagag 1441 gtgatacctg cggcaatgcc ccagaacata aatccgacat cgaggggttc tttaaccgct 1501 gcacggaaac gaacgatcga gagcgcaccc accataccga gggacaaaac gaggttggaa 1561 ccgatggtta aaacaacgaa tgctgtgacg caggtggtca taaccaacaa aactgcaaag 1621 ttttcgctat atacagcgcc gcggtggaag atcttatata caaaatagat gaccagcgag 1681 caaacaaaag cgcagagcaa ggatacaaga atatattcga cggacaagcg ctcaacaagg 1741 ccgagctgtt caatgctttc tttcaaaatg tttctgatgt ttgacatgat gttacctcca 1801 aggtgttaga gttgtcaggc ggcttcgcct taatgaataa tgaagattga ataatgaata 1861 attgcggaat cgccttcggc gatgatttta tagggggtgg agccatatgg ccctcccttt 1921 gaggggcaac gcctgcgacc gccgccggtg gcggaaacag ggagcagggg ttggagcagc 1981 ggtcgacaag ccggaacatt agtgaacggc gagtcgggaa ccgcaaacgg gattggtgtc 2041 ggcgaatgcc gacggatgag gtgggccctc attagggctg tttactttat gtatcttggc 2101 ttgaatcttc tcagttcatc tcggcaaaga cagaactttg aaagtgccag cttctgaccg 2161 tgattaacag aaacaaggct cgatataaac tttggcatca catcgtcata cttaacttca 2221 aatatgacac tgccgtcggg atatatcgga acagttgcaa gcttggaatc aaatatatct 2281 gccgattcaa tgcctgcgtg aagcgcttta tcaaatgtta aacgaacatt tgaaacggga 2341 tggacatatg cctcacggtc gtagtcaata actaccgagg gcttgagccc ctttgttttt 2401 gcaagggcta aaacttctct tgccaggtcc gaatcatatt gctctaaaag tgagaagtcg 2461 ccaagtgcca ttttgtcggc acactcgcgg gagatgctaa tgcttcgctt gtggatccga 2521 tcgccctttt tttctttaca ttcaagttta atgatactgt ccgagcagtt gtaaatacgc 2581 acgcgatatt tctttctgtc ggcggttcct gccagctttt cccaataaga agaatcggaa 2641 aagtcgtcga aatataagct tctgatgaaa taatcgccgt cagcgagcgc atatttgtcg 2701 cgctccataa ggggtttcag caaagcgcgc attgcaaggt aatcgggata tgtcagcaaa 2761 agtttgattt catggcgata tttttttacg ggagtcggta tatgccatca cctctaaaat 2821 cgtaatatga aaatattata tatgattttt caaaacattg caagccatta tttacttttc 2881 acaaagaatt ttgttaagga tttttgttta ctttttacaa tggcaatggt ataataacta 2941 taattggatg attgtacccg tatggggaca aagcacatag gggcagccct atgtggctgc 3001 ccgttatgga aaaagtcttg tcgcatcaaa aggagtcccg caaatgaaca acacctcaat 3061 gagcaaaaag atcataaccc tggcgatcgt tgcagtaatg ctgctttcaa caattgccgt 3121 cgccctatgg ggagaggatt atgtcacata taaccccacc gtttccgagc ctatcgtgga 3181 cgaaacgggt gcggaaatag tcgcccccaa agccgtcggc gacacttctg atgagcctgt 3241 aatcttcagc cttgaatgcg gtttttattc aagcaacgaa actctttatc tgagcgcgcc 3301 taacgctgtt gaaattcgct ataccaagga cggaagcgag cccggcgaat cgggcagaaa 3361 atataaggac ggcatcaact tcaaatcgac aagcgacgaa acaagaatgt acaccattaa 3421 agcctgcgcg gtatatgagg acggcaccta ttcggagcct gttgtccgct catatatcac 3481 aggtgacaat atctccgagc gttttgactg tctggtattt tccatcaccg tcgatcccga 3541 tgtgctttat gactatgaaa cgggaatctt cgtttcaggc aagctccgcg acgattggct 3601 taaagaaacc ggaaccaact cccgcgatgc cgttccgacc gaccccgcga actggaactg 3661 gcgaggacgg gaaagcgaac gcgaatgcta tgttgaggtc tatgaatacg acggtgagtg 3721 tgtaatttcc cagccggcgg gaatgagaat cttcggcgg // LOCUS sequence092 3747 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence092 VERSION sequence092 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3747 /mol_type="genomic DNA" /organism="" /note="sequence092" CDS complement(756..1163) /product="methylglyoxal synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000684755.1" /transl_table=11 /codon_start=1 /translation="MNIALIAHDSKKALMIQFCMAYSGILSKHSLCATGTTGKQVSEAT GLKIQQHLIGIQGGCQQIGAKIACNEIDLLLFFRDPLNRKSNEPNEQDLLRLCDVHNIP VGTNMATADALILALERGDLDWRANSTDLFY" /locus_tag="LOCUS_4150" /gene="mgsA" /EC_number="4.2.3.3" /note="WP_000684755.1 methylglyoxal synthase (Bacillus) [pid:53.5%, q_cov:94.1%, s_cov:96.9%, Eval:1.4e-31]" /note="MGA_523" CDS complement(1322..3400) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTLKKIFDLARVIFIAAILIVLLCFTGVRLMKMQVVDGELYLAMS KSSATATQTVSAVRGEIVDRNGAALVENRASYNVIIEYSFFPRDKQEQNRIILEIAKIL EADGLEWIDETPITFTEPYEYTAEPDSSAITRILSKLRLNSYATASNCIDKLIENYSIS DEYTAREKRIIAGVRYQMILSDFSSKTDYVFIKDVPIETVSKIRELAHSLPGADIAEDA IRVYSSGDIFPHGIGYVGPIYAEEYDELKGSGYLISDTIGKSGIEKALESSLRGDNGEK TITVTSDGDVSEAITAEAIPGDTVMLTIDAEFQAKVQDILEEHIEALATEKLTKAEYDF TDCKAGAIVVMDVDTGAVLAMATAPSYDINDLFSSYSEVLNREGNPLYNRATDGLYRPG SVMKTITSIAALSEGIITEDSTYSCHKQYNFLDIIVNCTGSHGAINVVKAVEKSCNIFF YQVIQELGLDKFMEYETAFGLGEAPEFEIRTAGGYLASPDTFFNFGLEWTVGQVLQAAI GQSEVGVTPLQMCSIAQTIATKGTRYSPYLVDSVWNYGMTQIINKTEPTVAGTIPADED VFDTVIEGMIKAGQNTTANVYYDTNPNAAYLAQFSTKPLPYDVAIKTGTPQAYNKATQN STVVGFYPAHDPEIAFAVVIENGEYAKYTVRKIIDAYYGYESVINDLGDGKFESVIN" /locus_tag="LOCUS_4160" /note="WP_012545126.1 penicillin-binding protein 2 (Thermodesulfovibrio) [pid:27.3%, q_cov:70.1%, s_cov:79.8%, Eval:9.7e-49, partial hit]" /note="MGA_524" ORIGIN 1 aaaccgcaga aagacaagaa aggcgctcaa aaggaggaag ggcgcaaccg ccgccctctc 61 ttttctttct gaggtttccc cctttggaac cctcttcctg actatctttt ctctcccggc 121 tgcgctatgc tcttcgatat cctatgcgct tacagtcaaa atcactataa ccatagtccg 181 caacgttcaa ggatgccttt tcaaaaagag attattccgc atcaccagca gacttaatct 241 tgcaaccaca gcgtaaagat aaattcgccc agtaggtcgc gcatgggatt caagtgtgat 301 aacggttact tttgcgcgtt gcaatagcgg tgtcgcctac ggcgaatatc cccacccctc 361 cgtcgcgctc tgcgcgccac ctcccaattg cggtgcccga ctcgccattc gcttacgctt 421 tggcttgtcg accgctgctc caaccccttc tccctttttc cgccactggc ggaggtcgac 481 ccctcacggg gagggtctgt ttataacaaa aaacacgcta tcctccctga aagggacgac 541 aacgtgtcgc ggtaccaccc ttgttgccga tctctcggcc actcgttaac tgcccttaac 601 gggggcaaac gtctgcgctt gatcacgcag aggctctaag ggtgtccttc tcccaaactt 661 gttttaagcg ctcgcaccat atgcgccctc tcttgaataa aacaactgtc ggggatactc 721 tccctttcat agcctttgaa tatttaaata ttgaatcaat agaacagatc ggttgaattt 781 gcgcgccagt caaggtcgcc tctttcaagg gccaaaataa gcgcatcggc tgttgccata 841 tttgtgccaa caggaatatt gtgaacgtcg cagagtctta aaagatcctg ctcgttgggt 901 tcgttggatt tgcggttcaa ggggtcgcgg aagaacaaca aaaggtcaat ttcgttgcag 961 gcgatctttg cgccgatctg ctggcagccg ccctgaatac ctatcaggtg ctgctggatt 1021 ttaagacctg tcgcttcgct tacctgtttg ccggtggttc ctgttgcgca gaggctgtgt 1081 ttactcaaaa ttccgctgta tgccatgcag aactgaatca ttagcgcttt ctttgaatcg 1141 tgtgcaataa gagcaatgtt caagtttgaa aacctcctcg taaaattcac atcggtgttt 1201 aagttgaatg ttgtctgtaa aaagaaccat atgtattatc ataacatctc gcacgaattt 1261 tgtcaaaggt tttttgacaa aaaaccgatt cgatttgaca acttttgtca aaattccacc 1321 gttagttgat tacgctttca aactttccgt cgccgagatc gtttataacc gattcatagc 1381 cgtaatatgc gtcaataatt tttctcacgg tatattttgc atattcgccg ttttcaatta 1441 cgaccgcaaa agcaatctcg gggtcgtgtg cgggataaaa tcccacaacg gttgagtttt 1501 gggtcgcctt gttatatgcc tggggtgtgc ccgttttaat cgcaacatca tatggcaaag 1561 gttttgttga aaattgcgcc aaatatgcgg cgttggggtt tgtgtcataa tatacattcg 1621 cggtggtgtt ctgtcccgct tttatcatac cctcgatgac ggtgtcgaaa acgtcctcat 1681 cggcaggaat tgttcctgca acggtgggtt cggttttgtt gattatttgg gtcataccgt 1741 aattccagac ggaatcgacc agatagggcg aatatcttgt gcctttggtt gcaattgtct 1801 gtgcaattga gcacatctgc aagggtgtga cacccacctc cgactgtccg attgcagcct 1861 gcaaaacctg accgactgtc cactcgagtc cgaagttgaa gaatgtatcg gggcttgcaa 1921 gataaccgcc tgcggttcga atttcaaact cgggagcctc gcccaagcca aacgcggttt 1981 catattccat aaacttgtca agtccaagct cttgaatcac ctgatagaag aagatattac 2041 aggatttttc aacagcttta acaacattta tggcaccgtg ggaacctgtg cagtttacaa 2101 taatatccaa aaagttatat tgcttgtggc aggaataggt ggaatcctcg gtaataatgc 2161 cttcgctgag tgcggcaata cttgtaattg tcttcattac cgagccgggg cggtaaagtc 2221 cgtcggtcgc gcggttataa agcgggttgc cctcgcggtt taagacttcg gaatagcttg 2281 aaaacaggtc gttaatgtca tagctgggtg cggttgccat tgcaagcact gcgcctgtat 2341 ccacatccat aacaacaatt gctcccgcct tgcaatcggt gaagtcatat tctgccttgg 2401 tcagcttctc tgttgcaagg gcttcaatat gctcttccag aatgtcctga accttcgctt 2461 gaaactccgc gtcgatggtg agcataaccg tatctcccgg aatcgcttcg gcggtaattg 2521 cttcgcttac gtcgccgtcg gatgtaacgg ttatggtctt ttcgccgttg tcgccgcgta 2581 aagaagattc aagggctttt tcaattccgc ttttgccgat ggtgtcggaa attaagtatc 2641 ccgagccttt aagctcgtca tattcctcgg cataaatcgg tcccacatat ccgatgccgt 2701 gggggaagat gtcgcccgag gagtaaactc gaatggcgtc ctctgcaata tccgcaccgg 2761 gcagagaatg cgccagctcg cggatctttg aaacggtttc aatgggtacg tctttaataa 2821 acacatagtc ggtcttcgat gagaagtcgg ataatatcat ctgatatctc acacctgcga 2881 ttatgcgctt ttcgcgggct gtatattcat ctgaaatgga ataattttca atcagcttgt 2941 caatacagtt ggacgctgtg gcataggaat taagcctcag ctttgaaaga attcttgtaa 3001 tcgcgctcga gtcgggctcg gcggtatatt cataaggctc ggtgaaggtg atcggcgttt 3061 cgtctatcca ttcaaggccg tcagcctcta aaatcttggc aatttcaagg atgatccggt 3121 tttgctcctg cttatctctc gggaaaaagc tatattcgat gataacgttg tatgatgcgc 3181 ggttttcaac caaagcggca ccgttgcggt cgacaatttc gcctctgacg gcggaaacgg 3241 tctgggtcgc ggttgcactc gattttgaca ttgcgagata caactcgccg tcaacgacct 3301 gcattttcat taagcgcacg cctgtgaagc agagcaaaac aatgagtatt gcggcgataa 3361 agataacgcg cgcaaggtcg aatatttttt tcagtgtcat ctttatcagc tccttttggt 3421 tggtataggg gcgggcctgc gtgcccgccc gagcggaaag attgctttgc gggcacccac 3481 ataggggtgc cttttgcttt ttctcattaa aatcttgcaa aagtcttgcc tgtataatag 3541 ggagaatgtt aaaatcttcg atttaatcgg atgtcaaaaa tgtgacaagc gggcgaccac 3601 atagggtcgc ccctatagct atgatgaaac ttgtatgggc gggcctgcgt gcccgcctgc 3661 aggagaaccg ttctcctaag tcctatcgac cattccgttc tgttcctcaa tcacaagtcg 3721 tctggtgatt ccgaacagct tggtcaa // LOCUS sequence093 3743 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence093 VERSION sequence093 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3743 /mol_type="genomic DNA" /organism="" /note="sequence093" CDS complement(148..1980) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEFYIELKLAGDEFPGSFSNGLTLCGTHAANSLEKFEETENAVRY NDDRDHVLVLNKETKGDALVLSTEFINNSSCDATLEMIASVAIRKIKADRIHRMQSFWS AEGKLKTDSVLDLHLEPSWNGFGSRIEKFGNCGSMPVRKYFPFVVLEDSENSDFLAIEL YSPTSWQFEISLNSDKTLNVVGGLADYDFGHWCKTVASGESFTTPRAIIAQGKTLIEAC DKLVKAQALNISPVDNNMDIMFNDYCTTWGNPNLESIKSIADTLKGKGIKYLIIDAGWY GKQNWWQSMGEWEVNDDKFPNGLKEAADYIRECGMIPGLWFELEVVGPFPKYYNCTEHL LKRNGSVLTTGERRFWDMEDPWVIEHLTERVIKQLRDNGFGYIKIDYNETIGIGCDGYE SLGEGLRKKIKASQEFIKKLGREVPDIVIENCSSGGHRLEPSMMEIVSQASFSDAHETR SIPIIAANLHRVIHPCQSQIWAVLRRYDDKHRIHYSMVNSFLGRMCLSGDIYDLNDEQW ALVDEGIEFYRKAADIIKNGSTVYSESDPKSYQNPQGEQLLIRKLGNRELVIAHRFENS KDIDLSFIDGKKIIAEYGDVSCDFSAKAWIVEAI" /locus_tag="LOCUS_4170" /note="WP_003548136.1 alpha-galactosidase (Lactobacillus acidophilus) [pid:27.0%, q_cov:53.6%, s_cov:46.2%, Eval:9.9e-26, partial hit]" /note="MGA_525" CDS 2202..3128 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEQKRKFCPNPIITSIYTADPAPMVYGDTLYLYTTHDEDELIGDF YTMFNWHCYSTKDMVNWTDHGQVFSIDDIDWALDRAWAPQAIERNGKFYLHCPVHKTNG GVCIAVGVSDKPEGPFKDLGHPLVDEGDWNDIDPTVYIDDDGQAYLYFGNPELRYVLLN EDMISYDEAVGVKKIPMTEEAFGKGGHMTGTTYAEGPWFYKRNGLYYMVYAAFAKGVHQ EHLAYSTSTSPTGPWTYGGVIMTEEGGTFTNHPGICDFKGHSFLFYHTAQLPGGSLFHR SVCVAEFEYNDDGSISTISKCDGVYEI" /locus_tag="LOCUS_4180" /note="WP_010890799.1 glycoside hydrolase family 43 protein (Clostridium acetobutylicum) [pid:57.5%, q_cov:94.5%, s_cov:62.4%, Eval:1.2e-94, partial hit]" /note="MGA_526" ORIGIN 1 acatacttac caactcattt caacattttt cgccattata tcatacctcg tgtgtagaaa 61 tttgtcgaat accgtcgagg atgtaaaaat cttttattat tttaccactt cgccgttatt 121 tgtgcatagt atgactgcaa aatgtgttta aatagcttcc acaatccatg ccttcgcgct 181 gaaatcacag gacacgtcgc catattccgc aataattttc ttgccgtcaa tgaagctaag 241 gtcgatatcc ttggagtttt cgaatctgtg tgcaataaca agctcacggt tgccgagctt 301 tcttatgagc aactgctcgc cctgaggatt ttgatagctc ttgggatcgc tttcgctata 361 tactgtcgaa ccgttcttga tgatatcggc cgcttttcta tagaattcga ttccctcgtc 421 aacaagggcc cactgttcat cgttcaaatc ataaatatcg ccgcttaagc acattcttcc 481 caaaaatgag ttaaccatcg aatagtgaat tcggtgtttg tcgtcatatc ttctcaaaac 541 tgcccagatc tgtgactgac aggggtgaat aactctgtga agatttgctg caataatcgg 601 aatggatctt gtttcgtgag catcggagaa gcttgcctgc gaaacaattt ccatcatgga 661 aggttcaagt ctgtggccac cgctcgagca gttttcaata acgatatcgg ggacttctct 721 tccgagcttt ttaatgaatt cctgagatgc cttgatcttt tttctaagtc cttcgcccag 781 actttcataa ccgtcacagc cgattccgat tgtttcatta tagtcgatct ttatgtatcc 841 gaatccatta tcgcggagct gtttaataac tctttctgta agatgctcga ttacccacgg 901 atcttccata tcccagaagc gtctttcacc tgtggtcaga accgagccgt tacgcttcaa 961 aagatgctct gtgcagttgt aatattttgg gaatgggcca accacctcaa gctcgaacca 1021 aaggccggga atcattccgc attcacggat gtagtcggca gcctctttaa gtccgttcgg 1081 gaacttatcg tcgttaactt cccattcacc catagactgc caccagttct gctttccata 1141 ccagccggca tcaataatca aatatttaat tcccttaccc ttaagagtgt ctgcaataga 1201 cttaatgctt tcaaggttcg ggttgcccca ggtggtgcag tagtcgttga acataatgtc 1261 catattatta tcaacaggtg agatgttgag ggcctgagct tttacaagct tgtcacaagc 1321 ttcaataagt gtttttccct gtgcaataat cgcgcggggg gttgtgaagc tttcgccgct 1381 tgcaacggtt ttacaccagt ggccgaagtc atagtccgca agaccgccca caacgttaag 1441 agtcttgtcg ctattgagcg aaatctcgaa ctgccatgag gtaggggaat agagttcaat 1501 cgccaagaaa tcgctgtttt cgctatcctc aagaactaca aaggggaaat attttcttac 1561 gggcatagag ccacagtttc cgaatttctc aattctcgaa ccgaatccgt tccaggaagg 1621 ttctaaatga agatccaaaa cagaatcggt tttaagcttt ccttctgcgc tccagaagct 1681 ttgcatacgg tggatcctat cggccttgat ttttctgatg gcaacagatg cgatcatttc 1741 aagtgtggca tcacagctgc tattattaat aaattcagtt gaaagcacca aagcgtcacc 1801 ttttgtttct ttattcaaaa caagaacgtg atctctgtca tcattatatc tgacggcatt 1861 ttcggtttct tcgaattttt ccagcgaatt ggctgcatga gttccacaaa gcgtgagtcc 1921 gtttgagaat gaaccgggga attcgtctcc tgcaagctta agttcaatgt agaattccat 1981 gttttacctc caaatcaatt attaacttca ttatatatcc ttgttgtaag aaaatctact 2041 gttttgtaaa ttttttcaag aaataaagca aaaaaattaa agattttcct catccttgac 2101 ttatccttat gactatattg acagtttcca ttttcaaatt gccatttaat tcgccgtatg 2161 ttatactgat tatactaaaa ttgcctaagg agggcacaaa tatggaacag aaaagaaagt 2221 tttgccccaa ccccataatc acatccatct atacagcaga ccctgcacct atggtatacg 2281 gtgatacttt atatctgtat accacccacg atgaggacga acttatcggc gatttctaca 2341 caatgttcaa ctggcattgc tattccacca aggatatggt caactggacc gaccacggcc 2401 aggtgttctc tatcgatgac atcgactggg cgctcgacag agcttgggct ccccaggcaa 2461 tcgagagaaa cggaaagttc tatcttcact gccctgtaca taaaacaaac ggcggagttt 2521 gcattgctgt cggcgtgtcc gataagccgg aagggccctt caaggatctg gggcatcccc 2581 ttgttgatga aggcgactgg aacgacattg acccaaccgt atatatcgac gatgacgggc 2641 aggcttatct ttacttcggc aaccccgagt tgagatatgt tcttttgaac gaagatatga 2701 tctcatatga tgaagctgtc ggagttaaga agatacccat gaccgaagaa gctttcggca 2761 agggcggaca tatgaccggc acaacatatg ccgagggtcc ttggttctat aagagaaatg 2821 gactttatta tatggtttat gccgcattcg caaagggagt tcatcaggag caccttgcat 2881 attcaacctc gacctcgccc acaggccctt ggacctacgg cggagttatc atgaccgaag 2941 aaggcggaac cttcaccaac caccccggaa tttgtgactt taaaggtcat tcgttcttgt 3001 tctatcacac cgcacagcta cccggcggaa gcttgttcca ccgcagtgtt tgtgttgctg 3061 agtttgaata taacgacgac ggctcaatca gcaccatttc caagtgtgac ggagtttatg 3121 aaatttaagc atcaatcaga gttttcgaca acggtcaaaa ataacctttg cgcaagcctt 3181 ccccttgagg ggaaggtgtc agcgaatgct gacggatgag gtgaccgcaa accgcgaaat 3241 ttcaacgctt gcgctaaccg ccgctccgct cggcacctgc ggcactgttt gccttgcaaa 3301 cgcatccgca gacgcctcgc tccaatcatc ctcaaaaaac caaaagccat acagacattg 3361 tcgtctgtat ggctttttca tatgtataca cattactttg cgctgtaaat tccgacaaag 3421 gaaattacag gctcgcctct tgtttcaaca aacttgatct taattgcatc ggtgacaacg 3481 ttttcaagct tgacgatctt cttatgtccg atcaccgtgc cctttgcaat ttccttgaac 3541 tgtccgtcaa gcttcgcttc aataacatag ttttcaactc tctggctgaa cttaatgttt 3601 tccttaatga caatgtggcc gatattttta gcttcttgcc agccaaacaa aaactctgcg 3661 gtccggttct gtgcgtgata gcttgtgtca tagcaatcaa ccaacagctt gtcggtgccc 3721 atgccttcct tggcggaatc cgc // LOCUS sequence094 3703 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence094 VERSION sequence094 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3703 /mol_type="genomic DNA" /organism="" /note="sequence094" misc_feature <1..1676 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003243128.1:arabinogalactan endo-beta-1,4-galactanase" /note="WP_003243128.1 arabinogalactan endo-beta-1,4-galactanase (Bacillus) [pid:59.4%, q_cov:56.9%, s_cov:74.4%, Eval:1.5e-105, partial hit]" /note="MGA_528" /locus_tag="LOCUS_4190" CDS 1869..3395 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKILSIILALSLCLCLFAGCGNTANNGGNDNTDLALAGTYDIKV WVAEAAVELTTAQIKKFNETNTDGIVINATIEAVGEGDAATSMTTDIEAGADLYCFAQD QAARLIQSGALAKLGVAAAETVSAANDAGVVSAAMSGEDLYAYPLTADNGYFMYYDKSV ISEDIVGSLEDIIAACEAAGRLFSFEIEGSAWYTASFFFATGCVSDWTTDNDGAFTAVN DTFNSQAGLVAAKGMKKLLSSTAYNNSSACTDFAAATPSAVVVSGTGDYVTASDILGEN LGIAELPSFTVDGNTYHLGSFNGCKLMGVKPQVDAKKAAAIHKLAQYLTSEEAQTERFN TLAWGPANLNAQQSDAVKASPALVALLAQSPYSVPQGQIHGSWWDIGKAVATNIKNATD DAGIQGALDTYTTAINGLFSMSEEVLNAYTVIGSINGDGWTVDLPMTEQADGTWKSNEA YTMDAGVEFKCRQGLNWDVAYPAANFVVETAGTYYVVLDPVSGEVTLSVD" /locus_tag="LOCUS_4200" /note="WP_013399406.1 extracellular solute-binding protein (Gardnerella vaginalis) [pid:27.4%, q_cov:72.8%, s_cov:87.3%, Eval:1.5e-21, partial hit]" /note="MGA_529" ORIGIN 1 acgatcctta tgatgaaaac ggcaacggat atggcggcgg aaactgcgac attgacacgg 61 cagttgaaat tggaaagcgc gccaccaaat acggaatgaa gcttttggtc aacttccatt 121 attccgactt ctgggctgac cctgcaaagc agatggtgcc caaggcttgg gcgggaatgc 181 ccattgaaga aaagaccgaa gcactttatc aatataccct tgagagcctc aaaaagctga 241 aaaaagccgg cgtcgatgtt ggaatggtgc agattggcaa cgaaaccaac ggcgcaatgt 301 gcggagagaa gatctggttc aatatgcagt atctcttcca ggcgggcgca aaggctgtcc 361 gcgaggtatt ccccgaggcg ttggttgcat tgcactttgc caaccccgaa aaggtcactc 421 attatgatga ctacgcaaag aagctcgctt attataatgt ggactacgat gtgttcgcat 481 cctcatacta tcccttctgg cacggtactt tggaaaacct tgcaacggtt ttgacaggaa 541 ttcaggaaaa ctacggcaag aaggttatgg ttatggaaac atcctatgcc tatacccccg 601 acgataccga ctttaacggc aacacaatct ctgacggcag cgttgttaca aaaaactatc 661 cctataccgt acagggacag gcaagagcac tttatgatgt aattgacacc atggcatcaa 721 tcggcggcat cggcgttgta tattgggaag gcacatggat aagcgtcggt cagaactcct 781 gggaagaaaa cagcgcaaag tgggaaaaat acggctccgg ctgggcaagt tcctattctg 841 cgaagtatga ccccaatgac gctggaaaat actatggcgg atgcgcttgg gataaccaag 901 caatgtttga tgcaaacggc aagcctctcc agtcattgag agtgtttaac cttgtgcgct 961 atggcaacga tgtttcgctt aaggcagatg ctttggaaga agtcatcatc acatcggata 1021 tcggaagcag gatagttttg ccagaaaccg tcaacgcaat tatgagcgac ggcagcctgc 1081 aggctgtgcc tgttgagtgg aatacgaccg aggcagagct ggataatatg gcaaactcgg 1141 gcgttgcgaa gtatgaaatt acaggacttg cagacggcga aatcgcgaaa gcatatatct 1201 cggtggttga ctataactat ctgaccaact atagcttcga ggacggcggc cttaacggct 1261 ggacactcac cgatttggca ggatctgacg agctttacgt tgaagataag ctgaccgatt 1321 ccctttcggg cagttggcat atgcacttct ggagcgcagc ccagaacact gttgagttca 1381 cccttgagca agcggttgct gatcttgaat cgggaaaata taaattcacc atttcaatta 1441 tgggcggcga tgcaggcgaa acggacattt atgcgtatgt taaaatcaac ggcgagaccg 1501 ttaagaccgc acctttgggc attacatctt atggcaactg ggagaccgca accgttgcgg 1561 gtattgatta ttccgcaggt gatgaaattg ttgtgggaat atatgtaaaa tgtcagggcg 1621 caggcaacgg agcatgggga aaaatcgacg atgcgttgct aaataaggat ttttgattta 1681 acctgttaaa ccacgtcagc gcaaatatga taataaaatg tgcaagcttt tgtgaggttt 1741 gcacattttt gtttgacaag cattgacttt ttagtcaatt tgctgtatag tatttatgct 1801 gatttcccct cgtttggagg aagtcaaaga aaagccgttt attaacggca aattttttgg 1861 aggcgaatat gaagaagatc ctatccatca tcttggcact ttccttgtgc ctttgcttgt 1921 ttgccggctg cggcaacaca gcaaacaacg gtggcaacga caacactgac cttgcattgg 1981 caggcactta tgacatcaag gtttgggttg cagaagctgc tgttgaactc accaccgcac 2041 agatcaagaa gttcaacgaa accaacactg acggcatcgt aatcaatgct acaatcgaag 2101 ctgtcggcga aggcgacgct gcaacctcta tgaccactga cattgaagcc ggcgcagacc 2161 tttactgctt cgctcaggac caggctgcaa gacttatcca gtcgggcgct ttggctaagc 2221 tcggcgttgc tgctgctgaa accgtttctg ctgctaacga cgcaggtgtt gtttccgctg 2281 ctatgtccgg cgaggacctc tatgcttacc ccttgaccgc tgacaacggc tacttcatgt 2341 actacgacaa gagcgttatc tctgaagaca tcgttggaag tcttgaagac atcatcgctg 2401 cttgtgaagc tgcaggcaga ctcttctcct tcgaaatcga aggttctgct tggtacactg 2461 catcattctt ctttgcaacc ggatgcgttt ccgattggac caccgataac gacggtgctt 2521 tcaccgctgt taacgacacc ttcaactctc aggcaggtct tgtagctgct aagggtatga 2581 agaagctcct ctcctctacc gcttacaaca actcctctgc ttgcaccgac tttgctgctg 2641 caactccttc cgcagtagta gtttccggta ctggggacta tgtaaccgct tctgacattt 2701 tgggcgagaa cctcggcatt gctgaacttc cttccttcac tgttgacggc aatacatatc 2761 acctcggttc cttcaacggc tgcaagctca tgggcgttaa gcctcaggta gacgctaaga 2821 aggctgctgc aatccacaag cttgctcagt acctcaccag cgaagaagct cagaccgaaa 2881 gattcaacac ccttgcttgg ggccctgcta acctcaacgc tcagcagtct gacgctgtta 2941 aggccagccc tgctctcgta gcacttttgg ctcagtctcc ttactctgtt cctcagggcc 3001 agatccacgg ttcttggtgg gatatcggca aggctgtagc aaccaacatc aagaatgcaa 3061 ctgacgacgc tggcattcag ggtgctttgg atacctacac tactgcaatc aacggcttgt 3121 tcagcatgtc tgaagaagtt ttgaacgctt acactgttat cggttctatc aacggcgacg 3181 gctggactgt tgaccttcct atgaccgagc aggctgacgg aacatggaag tctaacgagg 3241 cttacaccat ggatgcaggc gttgagttca agtgccgtca gggccttaac tgggacgttg 3301 cttatcccgc agcaaacttt gttgttgaaa ccgctggcac ctactatgta gttcttgacc 3361 ccgtttccgg cgaagttacc ctttctgttg actaattcga ccgcgaaaac aacagtatag 3421 cataatcatc aagggtcgga gcctgtttga ctccgaccct ttttgaaatt tgcaactaat 3481 ttttgaaaga tttgactttc ccatttcacg aaaggtatgg tcatcaatat gaaaagatac 3541 agtgacctcg aatatttgaa gctgcctaag tggaaaagat ttttatacac cctggtttgc 3601 ttcattgtcg ccattcccgg cggcattctc ggcttcttta aaaagctggg actcggcatt 3661 gcaaacttct tcgtcaaaat taaagacgag tttgtagata tat // LOCUS sequence095 3700 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence095 VERSION sequence095 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3700 /mol_type="genomic DNA" /organism="" /note="sequence095" tRNA complement(104..179) /product="tRNA-Lys" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0070" /note="Aragorn_7" CDS complement(277..825) /product="phosphoribosyltransferase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011016017.1" /transl_table=11 /codon_start=1 /translation="MDKKYYKLHVAGLERDLPICPVNDKLDIAAFIMFSDVELTVACAE ELIKKIPECDVLVTAESKGIPLAYEMARQMGNGMKYIVARKMAKLYMHDPVSVDVKSIT TAVEQKLWLDKDEADYLKGKRVLIVDDVISTGESLEALRKLVEYAGGNIIAQAAVLAEG DAADREDIIYLEELPLFFK" /locus_tag="LOCUS_4210" /note="WP_011016017.1 phosphoribosyltransferase family protein (Fusobacterium nucleatum) [pid:54.8%, q_cov:97.3%, s_cov:99.4%, Eval:2.0e-48]" /note="MGA_532" CDS complement(850..1218) /product="HIT domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964599.1" /transl_table=11 /codon_start=1 /translation="MSDYSHLNDDCLFCKIIKGEIPSKKVYEDESVYAFADINPTAPIH YLFIPKCHIESLDYIKRDLNGYLVGDVYAAIAKVAHLEGFDESGYRVVSNCGHDAGQTV PHIHFHVLAGRELTWPAG" /locus_tag="LOCUS_4220" /note="WP_010964599.1 HIT domain-containing protein (Clostridium) [pid:58.8%, q_cov:93.4%, s_cov:99.1%, Eval:1.8e-34]" /note="MGA_533" misc_feature complement(1255..>3700) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_009889064.1:alanine--tRNA ligase" /note="WP_009889064.1 alanine--tRNA ligase (Clostridioides difficile) [pid:51.0%, q_cov:99.9%, s_cov:92.7%, Eval:9.6e-237]" /note="MGA_534" /locus_tag="LOCUS_4230" ORIGIN 1 cgtgaagcgc gaaatcagag tttgctaacg caaactcggg gctcaaatcg aataatcttg 61 ccataaaccc aataggcacc ctgttgggtg ccttttgggt ttatggtgag ctactgggga 121 ttcgaacccc agaccctttg attaaaagtc aaatgctctg ccaactgagc tagtagctcg 181 ctgtttagac agctttaata ttatatcaaa tggaaactgc tttgtcaaca caaattttac 241 gggacggaaa atttcttttc cgccccgatt ctttgtttac ttaaagaaca acggcaattc 301 ctcgagatag atgatatctt ctctgtctgc ggcatcgcct tcggccaaaa ctgccgcctg 361 ggcaataatg ttgccaccgg catattcaac aagctttctt aaagcttcaa gcgactcacc 421 tgttgaaata acgtcgtcaa cgatgaggac acgcttgccc ttgagataat cagcctcgtc 481 tttatcaagc cagagcttct gctctaccgc agtggtgatc gactttacat caaccgacac 541 agggtcgtgc atatagagct ttgccatttt tcttgcaaca atatacttca taccgttacc 601 catctggcga gccatttcgt atgccagcgg gatgcccttt gattcagcag ttaccaaaac 661 atcgcactcg ggaatcttct tgatcagttc ctcggcgcag gcaacggtca actcaacatc 721 gctaaacatt ataaatgcgg cgatatcaag cttatcatta acggggcaga taggcaggtc 781 tctttcaagt cctgcaacat gaagcttata atatttctta tccatttttt ctgtcttcct 841 ttctgtcatt tatcctgcgg gccaagttaa ttctctgccg gcgagaacgt ggaagtgaat 901 gtggggaacg gtctgacctg catcgtgacc gcagttggaa acaactctgt agcccgattc 961 gtcaaagcct tcaaggtgtg caaccttggc aatcgcagca tatacatcgc caaccaaata 1021 gccgttcaaa tcgcgcttga tatagtcaag cgactcgata tggcatttgg gaatgaagag 1081 ataatggata ggtgcggtgg ggttgatgtc cgcaaaagcg tatacgcttt catcttcata 1141 taccttcttt gagggaatct cgcccttgat tatcttgcag aacaagcagt cgtcattgag 1201 atgggaataa tcgctcattt tgtttcctcc ttgaatattt ttgattgact taatttactt 1261 tacgaattcg gcaacgattg cttcggcacc gttaagtgca tcgttaacaa ggttcttatc 1321 gccgacacct gccattgcag agtcgggtct gccgccgccc ttgccgtttg taagtgcggc 1381 aatcttgcca acgatcttgc ctgccaacgc gccctttgca acagcctgct tgccacaagc 1441 aacagcgata tttgtgttgc tgatgaggac acagacgttg agttcatcct tatctctgag 1501 gctttcagcc atctggcgaa gctcgccgcc gttggcatcg cccataacag cgcagatgag 1561 cttaacaccg ttaacatcct tagcgttatc agccaaagaa gcggagcgca tctttgcaat 1621 ttcgcccgaa agctcagcgt ttgccttctc caaggtctta acttcgtcca taacgccctt 1681 gcaacgtaca accaatcccg aaggatttgc aagcttgagg gttgcggccg cgttgttgat 1741 ggtgtcaata tgctgggtca taagctcaag cacgccctta cctgttacag cttcgattct 1801 tcttacacct gcagcaacgc tggattcgga gattatcttg aacaaaccga tcttcgaggt 1861 gttgtccata tgggtaccgc cgcagaattc gatcgaagcg tcgcccattg ttacaactct 1921 gacagtttcg ccgtactttt caccgaagag agccattgcg ccgagcttct gagcttcggc 1981 aatgggcatt tccttcatgg tgatgttaag tgcagaaagg atatattcgt ttacaagagc 2041 ctcaaccttg acgatctctt cgggggtcat acccgagaag tggctgaagt cgaatctcaa 2101 gcggttagca tcaacaagct gacctgcctg gtgaacgtgg tcgcccaaaa ctgctctgag 2161 tgctgcctgc aaaaggtgag cacaagagtg gtttctcata acagaaaggc ggttgtcagc 2221 atcaactgag agaactgcgg gctgtccaac ttcaacagca cccgaaacga cctttgcctt 2281 atgaacgatc tttccgccga cagccttctg ggtgtcaaag atctcgcact tgcccgaagc 2341 ggtggtgatg atacccttgt cgccgacctg tccgcccgat tcagcataga agcaggtttc 2401 cttggtgatg atgtatactt catcacctgc gcctgcggca ttgatgattt catcgtcggt 2461 tgcaatccag tcgatggtgg attcgttggt catcttatcg tagccgacaa agtcggagga 2521 atattccttg ggcatcttgt ggaagatggt ttcgtcagca cccatatact tggagtcgcc 2581 tcttgcggca cgggcagttt ccttctggac ctgcaatgcc tgcttatagc cttcttcgtc 2641 gcatccgagt cccttttcct cgagaatttc gcaggtcagg tcgatcggga agccgtaggt 2701 atcggacaaa gtgaagcact tcttgccatc gagaacagtt tcaccgttag cctgcatctc 2761 gtcaatatag gtgttgagaa tggtaagacc gcggtcgatg gtttcgttga agttcttttc 2821 ttcgtttgtg agaagcttta caatgtagtc atacttttct tcaagctcat tatattcgcc 2881 cttgttgcaa tcaacaactg tctttaccag atccttgagg aagaggccgt tgatgcccaa 2941 aagcttgccg tggcgaacag ctctgcgcaa aagtcttctc ataacatagc ctctgccttc 3001 gttggagggc agaacaccgt cggatgccat aaaggttacg cttctgatat ggtcggtgat 3061 gacgcggatg gaaacgtcct tcttatattc cttgccgtat tcggcatttg caagagcgca 3121 gatatggtcg cggattgcct ttacggtgtc aacatcgaag atggagtcaa cgccctgcat 3181 aagtgcagca agtcgctcaa gacccatacc ggtgtctata ttcttctgtg caagaggggt 3241 ataagtgccg tcctcgtgac gctcaaactg ggtgaaaacg aggttccaga attccatata 3301 tctgtcgcag tcgcatccga tcttgcaatc gggcttgccg cagccgtgtt cgggtccgcg 3361 gtcaaagtgg atctccgagc aggggccgca aggaccgtcg atgcctgctt cccagaagtt 3421 gtcttccttg cccatacgga ctattttttc cataggaagg ccgatgtgct cgtgccagat 3481 cttttcagct tcgtcgtcat cctgatatac ggttacgaag agcttttctt cgggaatttc 3541 aagaaccttg gtgatgtatt cccaagccca ttcgattgct tctttcttga aatagtcgcc 3601 gaaggagaag ttgccgagca tttcaaagaa tgttccgtga cgggcggtct tgccgacgtt 3661 ttcaatgtcg tttgttctga cacacttctg gcaagtggtc // LOCUS sequence096 3683 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence096 VERSION sequence096 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3683 /mol_type="genomic DNA" /organism="" /note="sequence096" CDS complement(95..853) /product="imidazole glycerol phosphate synthase subunit HisF" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002263180.1" /transl_table=11 /codon_start=1 /translation="MITKRIIPCLDVKDGRVVKGVNFTGLGDVNDPVTLGRYYSEAGAD ELVFYDITASNENRKLFADILRKVASEIFIPLTVGGGISTVDDFARVLDCGADKVSVNS GAIANPDIICKASRLYGSQCVVLSVDAKRVDGKFHVFSRGGRVDTGIELLEWIKRGVGD GAGEIVLNSIDTDGVKKGFDLAMLEAVCNIADVPVIASGGAGSVQDFITLFKSVPTVDA GLAASIFHFGEVKIDDLKRTLRESGVNVRI" /locus_tag="LOCUS_4240" /gene="hisF" /EC_number="4.3.2.10" /note="WP_002263180.1 imidazole glycerol phosphate synthase subunit HisF (Streptococcus mutans) [pid:58.3%, q_cov:99.6%, s_cov:100.0%, Eval:1.0e-79]" /note="MGA_535" CDS complement(850..1560) /product="1-(5-phosphoribosyl)-5-[(5-phosphoribosylamino)me thylideneamino]imidazole-4-carboxamide isomerase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011949114.1" /transl_table=11 /codon_start=1 /translation="MIIFPAIDIIDGEAVRLYKGDYNQKTVYGTPYDISLEFKAKGASH VHIVDLDGAKTGGTPNIETIKRIAADCKMFVEVGGGIRSLGVIEKYLHAGVSRAILGTA AIKNEELVRLGVREFGEGIAVGADILDGKIRINGWLEAADISADEFFKRMGDLGVTNII CTDISKDGAMVGTNLELYRELSAKYRMNITASGGVSSLEDIKALKDMGMYGAIVGKAYY TGAVDLEKAIEVAR" /locus_tag="LOCUS_4250" /gene="hisA" /EC_number="5.3.1.16" /note="WP_011949114.1 1-(5-phosphoribosyl)-5-[(5-phosphoribosylamino)methylidenea mino]imidazole-4-carboxamide isomerase (Clostridium botulinum) [pid:46.8%, q_cov:99.2%, s_cov:97.1%, Eval:3.8e-57]" /note="MGA_536" CDS complement(1574..2185) /product="imidazole glycerol phosphate synthase subunit HisH" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003436678.1" /transl_table=11 /codon_start=1 /translation="MIAIINYGAGNLFSLESSLKAIGAQTVVSGDPDVIKSADKLILPG VGAFEDAAKKLKNSGLDEIIKEETLKGKPLLGICLGMQMLFERSYEFGCFEGLGLIKGE IRPISERISKGLKIPHIGWNGLRFTKNDCPIFKYIKDGDYVYFVHSYSAVKCTENTVAM TEYGAELTAAVAKGNVYGCQFHPEKSSDVGLSILKAFNEL" /locus_tag="LOCUS_4260" /gene="hisH" /EC_number="4.3.2.10" /note="WP_003436678.1 imidazole glycerol phosphate synthase subunit HisH (Clostridioides difficile) [pid:53.2%, q_cov:100.0%, s_cov:99.0%, Eval:8.3e-57]" /note="MGA_537" CDS complement(2191..2778) /product="imidazoleglycerol-phosphate dehydratase HisB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011083477.1" /transl_table=11 /codon_start=1 /translation="MRKAEIIRTTKETDIYLSLDLDGKGVSDINSGCGFLDHMLTLFAK HGAFDLTVKCKGDTEVDYHHTTEDIGIALGQALKKALGDMRGITRYGFMILPMDEMLIL SAVDISGRAQLNFGLNIPTQKVGDFDCELVEEFMLGLVRNADITLHLKQLDGKNSHHII EGTFKSLARSLRAAVKIDEAARDEIPSTKGVL" /locus_tag="LOCUS_4270" /gene="hisB" /EC_number="4.2.1.19" /note="WP_011083477.1 imidazoleglycerol-phosphate dehydratase HisB (Bradyrhizobium diazoefficiens) [pid:58.5%, q_cov:100.0%, s_cov:99.0%, Eval:1.6e-57]" /note="MGA_538" misc_feature complement(2765..>3683) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_014208421.1:histidinol-phosphate transaminase" /note="WP_014208421.1 histidinol-phosphate transaminase (Acinetobacter pittii) [pid:47.0%, q_cov:97.7%, s_cov:83.1%, Eval:2.1e-75]" /note="MGA_539" /locus_tag="LOCUS_4280" ORIGIN 1 acgaggcgga tgaggtgaaa agcaccgctc gccacggcag gccacttgcg atgcaattgc 61 atcgcatcgc cgtgtcagcc acggctcgct actcctatat cctcacatta accccgctct 121 cgcgaagtgt cctcttcaaa tcatcgatct taacttcgcc gaagtggaat attgatgctg 181 caagcccagc atccaccgtt gggacacttt tgaaaagcgt gataaaatcc tgaacgcttc 241 ctgcgccgcc cgatgcaatg accggcacat ctgcaatgtt gcaaaccgcc tcgagcattg 301 caaggtcaaa tcctttttta acgccgtctg tatcgatcga attgagaacg atctcgcctg 361 cgccgtcgcc gacaccgcgt ttaatccatt ccaaaagctc aattcccgtg tcaacacgtc 421 ctccgcgcga aaaaacgtgg aacttcccat caacccgctt tgcatcgacg cttaaaacaa 481 cgcattgcga tccgtaaagg cggcttgctt tacaaattat gtccgggttc gcaatcgcgc 541 ccgaattaac actgaccttg tcagcaccgc aatcgagcac ccttgcgaag tcatcaactg 601 ttgaaattcc gccgccaacg gtcaagggta tgaatatttc cgaggcaact tttctcaata 661 tatccgcaaa aagcttcctg ttttcgtttg atgccgtaat atcatagaac accagctcgt 721 ctgcgcccgc ttccgagtaa tatcttccca aggtcacggg atcgttcaca tctcccagcc 781 ctgtgaagtt aactcccttt acaactctgc cgtccttgac atccagacaa gggataattc 841 tctttgtaat catcttgcca cctcgatcgc tttttcaagg tcaactgcac ccgtatagta 901 tgctttgccg actatcgcgc cgtacattcc catgtctttg agtgctttaa tgtcctcaag 961 gctggaaaca ccgcccgatg cggtaatgtt cattctatac ttcgcagata actcacggta 1021 aagctccaaa ttggtgccaa ccatcgctcc gtcctttgaa atatcagtgc atatgatgtt 1081 tgtaacgccc aaatcgccca tacgcttaaa gaactcatct gcggaaatat ccgccgcttc 1141 aagccagccg ttaattcgaa tcttaccgtc taaaatatcc gctccaacag caattccttc 1201 gccgaattct cttacgccca agcgcaccag ctcttcgttc ttaattgctg cagtgcccaa 1261 aatagccctt gaaacacctg cgtgaagata cttttcaatc acgcccaggc ttctgattcc 1321 tccgccgact tcaacaaaca tcttgcagtc agcggcaatt cgcttaatgg tttcaatgtt 1381 gggtgtaccg cccgttttcg ctccgtcaag gtcaacaatg tgaacgtgcg aggctccctt 1441 tgccttaaat tcaagggaaa tatcataagg cgttccgtaa acagtttttt ggttataatc 1501 gcccttgtaa aggcgaacag cttcaccgtc aataatatca attgcaggga aaataatcat 1561 tatttttcct ccgttaaagt tcgttaaatg cttttaaaat actcagcccc acgtccgagc 1621 tcttctcggg gtggaattgg catccgtaaa catttccttt tgccaccgcc gctgtcagct 1681 cagcgccgta ttccgtcata gcaacggtgt tctcggtgca cttaaccgca gaataggagt 1741 gtacaaaata tacataatcg ccgtctttaa tatacttaaa aatcgggcag tcatttttag 1801 tgaatctcaa cccattccaa ccgatatggg gaatcttcag tccctttgat attctctcgc 1861 tgataggtct tatttcgcct ttaatcagcc ccagcccctc aaaacaaccg aattcatagc 1921 ttctttcaaa aagcatctgc attcccaagc atattcccaa aagaggcttg ccctttaatg 1981 tttcttcttt gattatttca tcgagtcctg agtttttaag cttttttgcg gcatcctcaa 2041 atgctccgac acccggcaag atcagcttat ctgccgactt gataacatcg gggtcgccgc 2101 tgacaaccgt ctgtgcgccg attgctttaa ggctcgattc aagggaaaac aaatttccag 2161 caccatagtt aattatcgct atcattttgt ttaaagcact ccctttgtgg aaggaatttc 2221 gtcacgagcc gcttcgtcaa ttttaaccgc cgctctcaag cttcttgcca gcgatttaaa 2281 tgttccttca ataatatggt ggctgttttt gccgtcaagc tgtttaaggt gcagggtgat 2341 gtccgcattt cgcacaagcc ccagcataaa ttcctcaacc agctcacagt caaaatctcc 2401 caccttttgt gtgggaatat tcagcccgaa gttaagctgc gctctgcccg aaatatccac 2461 cgccgagagt atcagcattt catccatcgg caaaatcata aacccatatc ttgtaatgcc 2521 tctcatatct cccaacgcct ttttaagcgc ctgaccgagc gcaataccga tatcctcggt 2581 tgtgtgatga taatcaacct ctgtgtcgcc cttgcattta actgtcagat caaatgcacc 2641 atgctttgca aaaagggtaa gcatatggtc caaaaaaccg catcccgagt taatatcgga 2701 aacgcccttt ccgtcaaggt caagactcaa atatatgtcc gtttctttgg ttgtacgaat 2761 aatttcagct tttctcattt aaaatctcct taaccgcccc gacgaatttc tccatatcgc 2821 tgagtgttcc aattgacact cttatatatt cgcagattct ctcgtcatta aagtgcctaa 2881 ctaaaattcc tttgtccttg agcttcaaat ataactcttc gccgccgata tctggtgact 2941 ttgcaaaaat gaagttcgcc ttcgagtcgg tataatcaaa accgagagct ttaagctctc 3001 gctttgtata ttctcttgca tcaataatct ttcggcagtt ggttttatag taatcgcttt 3061 cctcaatcgc tttaattcct gcaatctgcg tcaagcgatt gacattatat gggtttgtcg 3121 agtttctgat tctgtctaaa tctgcgataa gctcgctgtt tgctatcgca aagccaagtc 3181 ttgctcctgc caacgagcgc gattttgaat aggtcatcac aaccaaaagg tttgaatact 3241 tttctgtgag ctttgccgca ctttctccgc cgaaatcgac atatgcttca tcaatcacaa 3301 ccacattatc gggatttgtt tttgcaatct cctcaatttc ctcaaggctt atgcaaagcc 3361 cggtgggtgc attgggattt gcaatgacga taagcttgtt ttttccaatg tatttcttcg 3421 catcaagtgt taaatcatcc tcaagtggaa taatctcaga ttcaactccg tgaagcttcg 3481 caaagacctt ataaaaaccg taggtgatgt cggcatatgc tgcgccctct tgcgaaaaag 3541 ccataaacga aatgttcaaa atatcgtccg agccgttggc aacaaaaata ttttgcggct 3601 taacgctgta ttcccttgaa agggcttctt taagctcact cgcgtccggg tcgggataaa 3661 gccgaaggga cttaacctgc gcg // LOCUS sequence097 3679 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence097 VERSION sequence097 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3679 /mol_type="genomic DNA" /organism="" /note="sequence097" CDS complement(1624..3612) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKMAASTDLGYLASCVMAARGYDDTESLVDFFNREELSDPFLLR DLDKAVDIINEAIENDELICIYGDYDCDGVTATAILYGYLTGMGARVICYIPEREEGYG LNCSALDSIAAEGVSLVVTVDNGISAIQEAEYAKSLGLKLVITDHHQPLDELTDALAIV DPHRRDCPSPFKALCGAGVALKLCAALDGGSYDLALEMYSDLAALGTIADIVPLKGENR TIVSTGLELMKNTENLGLIELLADSHPDMNTLSATGLAFSVCPRINAAGRFGSPITALD ALISEDESASAYAHELSRLNDNRKRCESEILAEVLAQIDSNPSLLNERVLIAVGHGWHH GVIGIVASKLLERFERPVVVISVDESGEARGSARSMPGFNIFKCFDYCKEIMIKYGGHE CAGGLTLREENLPRLRELISEYAKDNHREMPRLTINADKLLKGRDLSPDEVMQLRRLEP YGCENAEPVFALSGAEIKAVIPLKNGDHTKLELWYDNAHVSALLFGVKTAELPYAVGDK LDLMANLIVNEYKGTNHVSIRALDYRLHGLRQDRFFAAKDAYFAFKRGEPLSREILTKG NPTREELVSVYKYLSSLGRSVTEQALYERLQSESINAFKLSVILDAFCETGLASLNPSS GKIMLLAPSVRVDIESSQTLKALRQSL" /locus_tag="LOCUS_4290" /note="WP_011861665.1 single-stranded-DNA-specific exonuclease RecJ (Clostridioides difficile) [pid:37.9%, q_cov:76.6%, s_cov:62.5%, Eval:4.6e-93, partial hit]" /note="MGA_541" ORIGIN 1 ccgattgcgg catagaaatc atcaatggta tcaaggttat ggcgcttgat gtccattgca 61 agaaattctt gaatttcgct ttcctcaagg cggatatagt tgcgcttgaa ttcgcgctca 121 agttccgctt taccctcagc gatgttttca tcgcggcgtt cttttttgaa ccaagagcga 181 atttttgact ttgcttcgtt ggtgtggcag atattcagcc aagcacggtt ggggccgtgg 241 ccggggtctt tcgaggtgat gatttcaatg atctcgcctg ttttgatctg atattcaagg 301 ggaaccatct tcttatctac cttagcacct gtcattcggt ggccgacttg ggtgtggatg 361 gcatatgcaa agtcgattac ggttgagccc agcggcaggg agatcacatc acccttaggg 421 gtgagagcaa aaacatcatc cggagcgagg tcttctttaa tagctctgac gatatcttca 481 acatcgccag attcctgctg ggtttcaaga atctggcgaa cccagttaag acggttatca 541 agcttatatt tgccccttac gccctcttta tatttccagt gggcggcgat gccgtattcg 601 gcggtgtggt gcatatccca agttctgatc tgcacttcaa atggaatacc ctcgcggcag 661 gtgacggtcg tatggagcga ctgatacata ttgtgcttgg gggtggaaat ataatctttg 721 aagcgattag gaatgggtga gaacatatcg tggatgatgc ccaaaacgaa gtagcattcg 781 gtcatatcat cgacaattac gcgcactgcg tatttatcat atatttcttc aaaggtcttg 841 ccctgttcat aaaccttttt atagattcca taagcactct tgactcgacc ctcaatggtg 901 ggtacagggt caaaatcgtg ggaaagacgc tcggagattc gggatttaat cagcttaatg 961 aaatcctcac gctcagcctt gctcttttca atcatctgtt cgatctcatt ataagcatat 1021 gggtcgaggt acatgaaaga gatatcttca agttcttcct ttaatgccat aattcccaga 1081 cggttggcaa gcgggacata tacattcatt gtttcaaggg aaacagtgcg tctttttgct 1141 tcagagcgaa aaccgagtgt tcgcatattg tgaaggcggt cgcccagctt gatgatgatt 1201 actcttatat cctttgccat cgagaggaaa attttgcgga cgttttcagc ctgctgttcc 1261 tctttggaga agatcgcaat ttgatcgagc ttggtaacac cgtcaacaag agttgcaacg 1321 tcggctccga acatcttttt aatgtcgtcc aaagaggttt cggtgtcctc aacaacgtcg 1381 tgaagcaaag ctccgcaaat tgtgtcggta tccataccaa ggtccacaag aattcccgca 1441 acgcaaagag gatgggtgat atacggctcg ccggattcgc gtaattgtcc accatgcttt 1501 aggtcggcaa attcatcggc gcgcttgatc ttatccacct ggtcgttttt gtcggtggcg 1561 gttatttttt caattaaggc ttcaatggaa ttgatgtttt tagacatata tgattgctcc 1621 tgtttatagg ctttgacgca aagccttgag agtttgagat gattctatat caacgcggac 1681 agagggcgct aatagcataa tctttccgct tgatgggttt aaacttgcaa gccccgtttc 1741 gcagaaggca tccaaaatta cgctgagctt aaaagcgttg atgctttccg attgcaagcg 1801 ttcatataaa gcttgctctg ttacagacct gcccaaagag gaaagatatt tgtatacgct 1861 taccaattcc tcgcgggtgg ggttgccttt ggtgagtatc tcgcgggaaa gtggttctcc 1921 cctcttgaac gcgaaatatg catcctttgc ggcaaaaaat cggtcttggc gcaagccgtg 1981 caagcggtaa tcaagtgcac ggatgctgac atgatttgtt cctttatatt cattgacgat 2041 taagtttgcc ataaggtcga gcttgtcacc aactgcataa ggcaactcgg cagttttaac 2101 gccaaacaaa agcgcggaaa cgtgagcatt atcataccaa agctcaagct tggtatggtc 2161 gccgtttttg agggggatga ccgctttgat ttcggcaccc gaaagagcaa agacaggctc 2221 ggcgttttca cagccgtaag gctccaaacg gcgaagctgc ataacttcat cgggtgaaag 2281 gtcgcgacct ttcaacagct tgtcagcatt tattgtcaag cgaggcattt cgcggtggtt 2341 atccttagca tattcggaga taagttcacg caggcggggc aaattttcct cacgcagggt 2401 caatcctcct gcacattcgt gtccgccgta tttgatcatt atttccttgc aataatcgaa 2461 acatttaaaa atattgaagc ccggcatact gcgggcagaa ccgcgggctt cgcccgattc 2521 atcaactgag atgacaacaa cgggacgttc gaagcgctcg agaagctttg aggcaacgat 2581 gccgattaca ccgtgatgcc aaccgtggcc tacggcaatt aatacgcgct cgtttaaaag 2641 tgaggggttg gaatcaattt gtgcaagaac ttcggcaaga atttccgatt cacaacgctt 2701 gcggttatcg tttaagcggg aaagctcatg tgcgtatgcc gatgcagatt cgtcctctga 2761 aattaaggca tcaagcgcgg tgattggtga gccaaatcgg cctgcggcgt taattcgcgg 2821 acaaacactg aatgcaagac cggttgcact aagggtgttc atatcgggat ggctgtcagc 2881 caaaagttct attagtccga gattttcggt atttttcata agctcaaggc cggttgaaac 2941 aatggtgcgg ttttcgcctt taagagggac aatgtcggca atggtgccca aagctgcaag 3001 gtcggaatac atttcaaggg cgagatcgta tgagccgccg tcaagtgcgg cgcagagttt 3061 taaggcaact cccgctccgc agagagcctt gaagggtgat gggcaatcgc ggcgatgggg 3121 gtcaacgatc gctaaagcat cggtgagttc atcaagaggc tggtggtggt cggtgatgac 3181 caatttcaga ccgagagatt tagcatactc tgcctcctga attgcagaaa tgccgttatc 3241 gacagttaca acaagggaaa cgccttcggc agcgatggaa tcgagagcag agcagttaag 3301 accgtagccc tcttcccttt cgggaatata gcaaatcaca cgggcaccca tgcctgtgag 3361 atatccatac aaaatcgcgg tggcggtaac gccgtcgcaa tcgtagtcgc catagatgca 3421 gatcagttcg tcgttttcaa tggcttcatt gatgatgtca acagccttgt ccagatcgcg 3481 gagcaaaaat gggtcactta attcctcgcg gttgaagaag tccacaaggg attcagtgtc 3541 atcatatccg cgggcagcca taacgcagga agctaagtag ccaaggtcgg ttgatgccgc 3601 cattttattc actttttggg catccgccgc agatactgtc catcttttca taaagtaccc 3661 ctattttata aaatacata // LOCUS sequence098 3662 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence098 VERSION sequence098 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3662 /mol_type="genomic DNA" /organism="" /note="sequence098" CDS complement(150..3602) /product="DNA polymerase III subunit alpha" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003436251.1" /transl_table=11 /codon_start=1 /translation="MSKFVHLHVHSEYSLLDGACRIKRLVSRAKELGMDTVAITDHGNV YGAVEFYNECKRQDIKPIIGCEVYVAPRTRFDKEGRLDSSPYHLILLCKNEQGYRNLCK LVSIASIEGFYGKPRIDISLLEMYHEGLICLSGCLAGEIARRLSENDYDSARKVALRYK NLFGDDYYIEVQNQNFSEQQAILPYQYKLARELGIPLVATNDAHYISRADAPAQKILMC ISTNTTIKDPDAMDLPNDEFYFKSEEEMRAAFIGHNDAIENTCIIADKCNFDFEFGVTK LPFFSLEGVTDNEKFLRDMSYEGLKRLYVNPTQEAIDRLEYELSVIAKMGYVNYYLIVW DFINYAKTHGVPVGPGRGSGAGSLVAYCIGITGIDPLKYNLLFERFLNPERVSMPDFDI DFCIEGRQSVIDYVKDRYGHDHVAQIITFGTMAAKNAIRDTARAMALPYSLADKVAKAI PFGMSITEAKEKNEDFKAMYLGDAQIHELCDMAIQVEGMPRHSSTHAAGVVITEGPVSD YVPLTTNDGQPVTQYTMTVLESLGLLKIDFLGLRNLTVIRDCVREIHKTDPSFDIDKIP LDDKGVFKMLAKGDTCGVFQFESGGMTSTIMRLVPENIEDLIAVISLYRPGPMDSIPTY IKNRHNPKLVKYATPKLKPILDVTYGCIVYQEQVMQIFRELAGYTFGRADIVRRAMAKK KHSVLEAERKAFIWGDEKPDGTGCCGCVANGISEEVASKLFDDMMSFASYAFNKSHAAA YATVSYQTAYLKLHYFKEYMSALLTSVLDSTSKIIEYSEECEAKGVKILIPDVHESYDS FVACDGGIRFGLLAVKSLGRGVINGIIDERQKNGKFVSLYDFISRMYGREMNSRAVEAL IMSGAFDSFPTNRKQMLTNYDLVMNAVSDRERGNIDGQLDLFGFADDTGSTAEIEIPYA EEYPFAELLEMEKETVGIYVSGHPLSEYAGWLTASGGTTARRVIEGVISDPPIYKDGET VTIVALFRTKKMFTTRSNKQMCFAEVEDTSGNIEVLVFPNVYDRVRGLLNAGTKLAITG KISIKDEEDPKILADSIVTVDDFIKELKRKALCVQIDSSDRDAVEALKQVAEKYKGESK LMVYLRDLKKLTAVKGAGELRLCYESLSELKKLFGAENVKFKK" /locus_tag="LOCUS_4300" /EC_number="2.7.7.7" /note="WP_003436251.1 DNA polymerase III subunit alpha (Clostridioides difficile) [pid:47.3%, q_cov:99.7%, s_cov:99.6%, Eval:6.4e-314]" /note="MGA_543" ORIGIN 1 atgcggcgcc gaaggcgccg cagagtccgc cccattgggg cggacggctg ccgcgaagca 61 cgcgaatgtg tggcgatgat caagtggagc ccatccgatg aaatacgttg ccgaatgtca 121 cgtttcggcg ggtgggcggt gagagcagct cactttttga attttacatt ttcagcgcca 181 aagagctttt taagctcgga aagagattca tagcaaagcc tcaactctcc tgcgccttta 241 acggcagtga gttttttaag gtcacgcaga tagaccatca gtttgctttc gcctttatat 301 ttttcggcaa cctgcttgag tgcctcaacc gcatctctgt cggatgagtc gatttgaacg 361 cacagcgcct ttcgctttag ctctttgatg aaatcatcaa ccgtgacaat cgaatctgcc 421 agaattttcg gatcttcttc atctttaatt gaaatcttac ccgtgattgc aagcttggtt 481 cctgcattca aaagtccgcg aacgcggtca tatacattcg ggaaaacgag gacttcgata 541 ttacccgaag tgtcttcaac ctcggcgaag cacatttgct tgttgcttcg ggttgtgaac 601 atcttcttgg tgcggaagag tgcaacgatt gtaacagttt cgccgtcttt atatatcggt 661 ggatcgctga ttacgccttc aatgacacgc cttgcggtgg tgccgcccga ggcggtcagc 721 cagcctgcat attccgacag aggatgaccc gaaacataaa ttccgacagt ttctttctcc 781 atttccaaaa gctctgcaaa tggatattcc tcggcatatg gaatctcaat ttcggcggtg 841 gagcctgtgt catcggcaaa gccgaacaaa tcaagctgtc cgtcgatatt tccgcgctca 901 cggtcggaaa ccgcattcat gacgaggtca tagttagtca gcatttgctt acggttggtg 961 gggaatgaat cgaatgcgcc gctcataatt aacgcttcaa ctgcacggga gttcatctct 1021 cgaccgtaca tacgggagat gaaatcatag agcgaaacaa atttgccgtt cttttggcgt 1081 tcgtcaatta ttccgttgat tactcccctg ccaagactct tgactgcaag caaaccaaat 1141 ctgattccac catcgcaggc aacaaagcta tcatagcttt cgtggacatc ggggatgaga 1201 atttttacac ccttggcttc gcattcttcg gaatactcga ttatcttcga ggtggagtcg 1261 agcacgcttg tcaaaagcgc agacatatac tccttgaaat agtggagctt taaatatgcc 1321 gtttgatatg atacggtggc atatgcggcg gcatgggatt tgttgaatgc ataggatgca 1381 aagctcatca tatcatcaaa gagcttggat gcaacttcct cggaaattcc gttggcgaca 1441 catccgcagc agcccgtacc gtcgggcttt tcatcgcccc agatgaatgc ctttcgttcg 1501 gcttcaagca ccgaatgctt tttctttgcc attgctcggc ggacaatatc cgccctgccg 1561 aaggtatagc ccgcaagctc gcggaagatc tgcattacct gttcctgata aacgatacag 1621 ccgtaggtta catccaaaat cggtttcagc ttgggtgttg catatttgac aagcttggga 1681 ttatgacggt ttttgatata tgtgggaatg gaatccatcg gaccgggacg gtaaagagag 1741 attaccgcga taaggtcttc gatgttttca gggacaagtc gcataatggt cgaggtcatt 1801 ccgcccgatt caaactggaa cacaccgcag gtgtcaccct ttgcgagcat tttgaatacg 1861 cccttatcat cgaggggtat tttgtcgata tcaaagctcg ggtcggtctt atggatctca 1921 cggacacagt cgcggataac ggtcaagttt cgcaagccca aaaagtcgat cttcaaaaga 1981 ccgaggcttt cgagcacagt catcgtatat tgggttacag gctgtccgtc gttggtcgta 2041 agcgggacat agtcggaaac agggccttcg gtgatcacaa cgcctgccgc atgggtcgaa 2101 gaatggcggg gcatgccctc aacctgaata gccatatcgc aaagctcgtg aatttgagca 2161 tcgccgagat acatcgcttt gaaatcttcg tttttctcct tggcttcggt tatgctcata 2221 ccgaaaggaa tcgcttttgc aaccttgtcc gcaaggctat atggcagagc cattgctcgg 2281 gcggtgtcgc gaatggcgtt ttttgccgcc attgtgccga aggtgatgat ttgcgccacg 2341 tggtcgtggc cgtatctatc cttaacatag tcgatgaccg actgtctacc ttcgatacag 2401 aagtcgatat cgaagtcggg cattgacaca cgctcggggt ttaaaaatcg ctcgaagagc 2461 agattatatt taagcgggtc aattcccgta atgccgatgc aatatgcaac aaggcttcct 2521 gcacccgagc ctctgccggg gccgacggga acaccgtggg ttttggcgta atttatgaaa 2581 tcccagacaa tgagataata gttgacatag cccatttttg caataaccga cagttcatat 2641 tcaaggcggt ctattgcttc ctgcgttggg ttgacgtaaa gacgttttaa tccctcatag 2701 ctcatatccc gcaggaattt ttcgttatcc gttacaccct caagagagaa gaacggcagt 2761 tttgtcacgc cgaattcaaa gtcgaagttg catttatcgg cgatgataca ggtgttttcg 2821 atagcatcgt tatggccgat gaaggcggcg cgcatttcct cttccgactt gaaatagaac 2881 tcgtcattgg gcaagtccat cgcatcgggg tctttgatgg tggtgttggt ggagatgcac 2941 attaatatct tctgggcggg ggcatccgca cgggagatat agtgggcatc gttggtggca 3001 acaaggggta tgccgagttc ccgcgccagc ttatattgat aaggcagaat tgcctgttgt 3061 tcgctgaagt tttggttttg aacttcgata tagtaatcat cgccgaagag gtttttataa 3121 cgaagcgcca ctttgcgggc ggaatcgtaa tcattttcgc tgaggcgcct tgcaatctcg 3181 cctgccaagc atcccgaaag gcagattaag ccttcgtgat acatctcaag aagcgagatg 3241 tcgatacggg gtttgccgta aaatccttcg attgatgcga ttgaaacgag cttgcaaaga 3301 tttcggtagc cctgctcgtt tttgcaaagc aaaataaggt gatagggcga ggagtcaagt 3361 ctgccctctt tgtcaaatcg ggtgcgaggt gcaacatata cctcacagcc gattatcggc 3421 ttgatatcct gacgtttgca ttcgttataa aactccacag cgccgtatac atttccgtgg 3481 tcggtgattg caacggtgtc cattcccaat tcctttgcac gcgaaacaag ccgcttgatt 3541 cggcaggcgc cgtcaagcag cgaatattcg ctgtgaacat ggagatggac aaatttggac 3601 atgggtttgg ctcctttgcg ggggatactg ggtgtagggg cggacctatg tgtccgcccg 3661 cg // LOCUS sequence099 3657 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence099 VERSION sequence099 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3657 /mol_type="genomic DNA" /organism="" /note="sequence099" misc_feature <1..1572 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000003348.1:oligoendopeptidase F" /note="WP_000003348.1 oligoendopeptidase F (Bacillus cereus) [pid:49.1%, q_cov:94.5%, s_cov:81.4%, Eval:1.2e-146]" /note="frameshifted, insertion/deletion at around 1485" /note="MGA_545" /locus_tag="LOCUS_4310" CDS 1777..2637 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRLLVSLLIMSMMLCSCTNASNEIDNGTDNGTGESTPAVTEESL LSDSEPTQTDEIVSAQDESTEVNIETTASESKKSPFPDVNDLRARPDGKEVSIFKDNTF DCDYSGYKEIGYDFGDLHRSVMAPAGWHGFRFYRKDDPSFENMLTGLPIYDGELPVQID QFDDSTMFKNEPLTKSTFFFAESPWIHAEDFINADGLINKYDYETYIDKKGRSMKVYFI DGLPKYAVYDDFFNLCIWFNLDSEEQIPVVVNMINSIEVSLSREAELTLKTAERLGYTI IPPEE" /locus_tag="LOCUS_4320" /note="MGA_546" ORIGIN 1 cttgaattcc tcaagtataa cgaagagctt gaccttgttt tctctcgcct tgctaactat 61 gcaatgagaa agaacgatca ggactccacc aaccccacct atcaggatta cagaaaccgc 121 cttatgatgg cattcaccca ggtaagtgct gcttctgcat ttatgactcc tgagcttatt 181 tcaatggata acgaaaccgt tgaaagcttc ttcaaggcac agcccgatct tgaactttac 241 agactccaga tcgaaagaat cagaaaggat aaggaccata tcctctctga aaaggaagaa 301 gcaatcatgg ctgctgcagg ccagctcaag agaagcccct caaacatcta ttcaatgttt 361 gagagtgccg acattaagtt cccctcaatc aaggatgctc agggcaacga acttcccctt 421 accagcggca cattcattcc ttatatgatg tcacctgaca gagagatccg taagcaggca 481 tttgaaaatc tttatcacac atatgagcag ttcaaaaaca ctcttgcttc ctgctatgat 541 gctgaggtaa agtcgagaat gttctctgca aaggcaagaa actacggctc tactcttgaa 601 gctgctcttt ccaataacga ggttcccact tctgtatatc ataacctcat tgatgccgta 661 cacgagaata tgcactatat gcataagtat atcaagctcc gcaagaagct gatgggcgtt 721 gatgagcttc atatgtatga cctttatact tcaatcattc ccgatgctga tgttaaggtt 781 acatttgaac aggccaaggc tgacaccctt gccgcaactg cagttttggg cgctgattat 841 accgcaatgc tcgaagaagg ctttgcaaac cgttggatcg acgtttgcga gaatgtgggt 901 aagcgctcgg gcgcatattc cgcaggcgca agacctcacc cttatgttct tttgaaccac 961 aaggaagacc tcgaccacga attcactctc gctcacgaaa tgggtcacgc tttgcattct 1021 tatctttcca tgaagaatca gcctatttgc tatagcgact atgtaatctt tgttgccgaa 1081 gttgcatcca cctgcaacga agcactcttg atgcagtatc tcttgggcaa gaccaccgat 1141 aagaaggaaa gagcatatct tatcaatcac ttccttgagc agttcagaac aactctctat 1201 cgccagacaa tgttcgctga gtttgaaatg ctcactaacg caatggctga aagaggagag 1261 tccctcaccg ctgaatctct ttgcgcactt tatcacaagc tcaatgttga gtattacggc 1321 gacggtatca ctgttgaccg tgagatcagc ttcgagtggg aaagaattcc tcacttctat 1381 tacaacttct atgtattcca gtatgcaacc ggcttatccg ccgcaatcgc actttctcag 1441 agaatcttaa aggaaggcga gcctgcagtt aaggattata ttaaggtcct tttccggcgg 1501 ttgctcaacc gatcctatct cccttctcaa gatcgcaggc gtagatatga actctcccga 1561 gcctgttgct aacgctctta aactcttcgg cgaactcatc gacgaaatgg aagagctcat 1621 ggctgaataa ataaaatcaa actccgtcct tcgtgggcgg agtttttcat atttacaaaa 1681 ctacataaat gtggtataat gactttggaa gcgttagagg cgatactata ctcgtcttat 1741 aaccacgtat attagctttg gagggatctg aatattatga aacgtttatt ggtgtctttg 1801 ctcatcatgt cgatgatgct ttgcagctgt accaatgctt ctaacgaaat cgataatggt 1861 acggataacg gaacaggcga aagtacacct gcagttacag aagaatctct gctttccgat 1921 tccgaaccca ctcagacgga tgagatagtt tctgctcaag acgaaagtac cgaagtcaac 1981 attgaaacta ccgcttctga aagtaaaaag tccccgtttc ccgatgtgaa cgacttacgt 2041 gcacgtcccg acggcaagga agtttctatt ttcaaggaca atacctttga ttgcgactac 2101 tcaggctaca aggaaatcgg atatgatttt ggagatttac accgctctgt tatggcgcct 2161 gcgggttggc acggtttccg tttctaccgt aaagatgatc cgagttttga aaatatgctt 2221 acaggcttac cgatttacga tggagaactt cctgttcaaa tagatcagtt tgatgattct 2281 acgatgttta aaaatgaacc gctgacaaaa tctaccttct tctttgcaga gtcaccgtgg 2341 atacatgctg aggattttat caatgcagac gggttaatta ataagtacga ctatgaaacc 2401 tatatcgaca aaaagggcag aagcatgaaa gtttatttca ttgacggctt gcctaaatat 2461 gctgtgtatg atgatttctt caatctttgc atttggttta acttagacag tgaagagcag 2521 atacccgtcg ttgtgaatat gataaacagc attgaagtgt cgttgagccg tgaagcagag 2581 ctcactttga aaactgccga gaggcttggc tatacaatca ttccgcctga ggaataatgt 2641 gatgatgatc caatcaaact ctccgccctt tatgggcgga gttttttatg ccacacactc 2701 tacccaacct gccccaagaa tccattatgc ggattcttgt taaaactttg tgaccaaagg 2761 gagcaacgtt tttacccctt ttgcccgttg acaattttcc ctacgaatga tagaatatat 2821 gaggatttta aacataaaat ctaaatgtat cctgcggctc gtccgtaaaa gaaaggaaac 2881 tcactatgaa gtattatatt ggtatagatt tgggcggcac caacattgtt gcaggtgttg 2941 tcaacgaaaa atatgaaatt atcgcaaagg caaagacacc gacaaaccgt ccccgtcctg 3001 ttgaggatat ttgcgcggat atggcgcgcg ttgcgcttga ggctgtcgct ttggcaggac 3061 ttacaattga tgacatccag tcggtaggcg ttggctctcc cggaactgtc aacagcgaca 3121 ccggagtaat tgaatacgcc aacaatctcg atttcaacga tgctcccgtg gcttcgctca 3181 ttcgcaaggt cattgacaag cccgtttatt gcgaaaacga tgcaaacgct gcggcctacg 3241 gcgaatttgt tgcaggttct gcaaagggcg caaataacgc tgtttgcatc accctcggca 3301 caggtgtcgg cggcggtatc atcattgacg gcaagatcta ttccggtttc aacttcgcag 3361 gtgctgagct tggacatatg gtagtcgagg tggacggtcc caagtgtacc tgtggcagac 3421 acggctgttt tgaggtatat tcttccgcca caggtcttat ccgtatgacc aaggaagcaa 3481 tggatgctaa ccccgattcc aagatgcacg aaatgatggg cgaccatgtt tcaggcagac 3541 tcgccttcaa tgcaatgagg gcaggggacg atgctgccaa gggcgttgtc gataaatata 3601 tcaagtatct tgcggcgggt attgctaaca ctatcaacat cttccagcct gaaattc // LOCUS sequence100 3651 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence100 VERSION sequence100 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3651 /mol_type="genomic DNA" /organism="" /note="sequence100" CDS complement(220..1098) /product="FMN-dependent dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011254509.1" /transl_table=11 /codon_start=1 /translation="MTHDSNQITRDYFDSLLLESRYIDSDQPSLDFELFGEKFKTPIMT AALSHLHKICDNAMVEIAKGACNAGAVHWVGMGEPEEMEEIFAAAKTVRIIKPHADNSD VLWRIEHAIKHGAFAVGMDIDHAFSWDGKYDNVLGLAMKPKSLDEIKMFVKAAGDTPFI VKGVLSVSDAEKCAEAGVAGIVVSHHHGIMNYAIPPLQILPDIKKAVGDKMKIFIDCGF ESGMDTYKALALGADAVCVGRNLMGPLSEGASGVERRINELNRELRATMARTGVKNLSE FDASVIHPRKV" /locus_tag="LOCUS_4330" /EC_number="1.1.3.15" /note="WP_011254509.1 FMN-dependent dehydrogenase (Lactobacillus acidophilus) [pid:45.8%, q_cov:98.6%, s_cov:86.5%, Eval:2.2e-63]" /note="MGA_549" CDS 1232..3241 /product="tetracycline resistance ribosomal protection protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964757.1" /transl_table=11 /codon_start=1 /translation="MFKNLGILAHVDAGKTTLTEQLLYVSGVIRDLGSVDDGTAKTDSL SIERKRGISVRSSTASLKWKGADINIIDTPGHVDFAGEVERCLEALDFAILVISAPDGI KAHTENLLNALVTLKMPRLIFINKLDRAGSDYEGIISELNRLGGAKTVYMPLSIAQNEG GDDVSITSRDFARAATEALAEFDEVAADAFLSDQNLSDTGINHMLPQAILDTRITPVLC GCAKKGLGVEELLDFIASYMPDATHKATEDTSGIIFKIEHDKTMGKIAHVRMFGGKIQN RDALAVIMPESATAFSDDDAIPADSEDDSKDKVSQIRKAIGGRFSDAGVVESGDIAALC GLTKAKVGRFVGSVAPSNHYTLAHPLLRVRATPLDDHPEALPKLAHALKELSDEEPYID AKWENGQSEIVISLTGSIQSEIIKSLLEERYSLRANFSDPTVIYRETPTKKGCGIGVYT MPKPCWAIVNFMFEPMPRGYGVSYHGRLPNNQCFYKYQSHIHRSFENCLEQGLHGWEVT DFKCTLIGGEHHTIHTHPLDFFVATPMAFMNALTDCGSTLLEPLMKLRIIAPAELSGKL ITEIMRGDGEYNAPYVRGDTVTLDAIVPFKNFMDFPTRLASMSSGRGVCSTSFYGYREC PEGQGEDCPRRGVSPLDRSKWILWARGALSESQI" /locus_tag="LOCUS_4340" /gene="tet" /note="WP_010964757.1 tetracycline resistance ribosomal protection protein (Clostridium) [pid:35.8%, q_cov:99.1%, s_cov:99.2%, Eval:4.1e-113]" /note="MGA_550" ORIGIN 1 ccgagctgcg caaaccgatg gggtgtgcgt tgctcttcgc gcaacaagaa atcatccatc 61 tggaaaacat tgcagtcata ctgctttgcc aaggcgagcg caagggtggt cttgcctgag 121 gtgcaatatc cgtcaatcgc aattatgacc tgttcttttt ccgccataag gcgatcaatt 181 tgctcaatta tcaaattaag tttttgcttc atattaaggt catacctttc ttgggtgaat 241 aacgctcgca tcaaattccg agagattttt aacgcctgtt cttgccattg tcgcccgaag 301 ctcgcggtta agctcgttaa ttctgcgctc aactccgctt gcaccctcac tgaggggacc 361 catcaggttt ctgccgacgc atacggcatc tgcacccaaa gccagcgctt tatatgtatc 421 cataccgctt tcaaaaccgc agtcgatgaa aattttcatc ttatctccga cggctttttt 481 aatgtcgggc aaaatttgaa gcggagggat agcatagttc ataatcccgt gatgatggga 541 aacaacaatt cccgcaacgc ctgcttcggc gcatttttcg gcatcagata cactcaaaac 601 acccttgacg ataaagggag tatcgcctgc ggctttcaca aacattttaa tttcgtccag 661 cgatttcggc ttcattgcaa gtcccaaaac gttgtcatat tttccgtccc aggagaatgc 721 gtggtcaata tccataccga cggcaaaagc gccgtgttta attgcgtgct caattcgcca 781 aagaacatcg ctgttgtcgg cgtggggctt aatgatgcga acggtttttg ccgcagcaaa 841 aatttcctcc atctcctccg gctcgcccat tccgacccaa tggacagcgc ccgcgttgca 901 agcgcccttt gcaatttcaa ccattgcgtt gtcgcagatc ttatgcagat gggaaagcgc 961 cgcagtcatg atcggtgttt taaacttttc tccgaaaagc tcaaagtcaa ggctcggctg 1021 gtcggagtct atgtatctcg attctaaaag caatgaatca aaataatctc ttgtaatttg 1081 gtttgagtcg tgggtcataa ttatgcctcc cgtcgttttg ttgattctat tgtacaatat 1141 gaaacaaata attgcaaccg tcttgccata atatgtgtcc gtatggtata atttattgaa 1201 ctttgattta taagatatgg agacgccgac agtgtttaaa aatttgggaa tactcgctca 1261 cgttgacgcg ggcaaaacga ccttaactga acagcttttg tatgtttcgg gtgtaattcg 1321 tgaccttggc tcagttgatg atggcaccgc caagaccgac tcactttcaa tcgagcgcaa 1381 aaggggaatc tccgtgcgct cgtcaacagc atcgctgaag tggaagggtg cggatataaa 1441 tataatcgac acccccggtc acgttgattt tgcaggtgag gttgaaagat gtcttgaagc 1501 gttggacttt gcaattttgg tcatctctgc gcccgacggc attaaagccc acaccgaaaa 1561 ccttttaaat gcccttgtga cccttaaaat gccgcgactt atatttatca acaagcttga 1621 ccgcgcaggg tcggactatg agggaataat ttccgagctt aatcgactcg gtggtgccaa 1681 aacggtatat atgcctttaa gcattgccca aaacgaaggc ggggatgatg ttagcatcac 1741 ctcgcgcgac tttgcacgcg ccgcaaccga agctttggcg gaatttgacg aagttgctgc 1801 ggatgcattt ttgagtgacc agaacctttc ggacacaggc atcaatcata tgctccccca 1861 agcgatcttg gatacgcgga tcactcctgt tctttgcggt tgcgcaaaaa agggattggg 1921 agttgaagag ctgcttgatt tcatcgcgtc ttatatgccc gatgccactc acaaggcgac 1981 cgaggacacc tcgggaataa tctttaaaat cgagcacgat aaaacaatgg gcaagatcgc 2041 acacgttaga atgttcggcg gaaaaattca aaaccgcgat gctttggcgg tcattatgcc 2101 cgaaagtgca actgcctttt cggacgacga tgcaattcct gccgattccg aagacgactc 2161 aaaggacaag gtttcccaga taagaaaggc aatcggcggc agattttccg atgcaggcgt 2221 cgttgaatcg ggggatattg cggcactttg cggtttgacc aaggccaagg tcggccgatt 2281 tgtcggctct gttgccccgt caaatcatta taccttggcg catccgcttt tgcgcgtgcg 2341 cgcaacacct ttggacgatc accccgaggc tttgcccaag cttgctcacg cgctcaaaga 2401 gctttccgac gaagaaccgt atatcgacgc caagtgggaa aacggccaat cggaaatcgt 2461 catcagtctg acgggcagta tccagtcgga gataatcaag tcgcttcttg aggaaagata 2521 ttccttgcgt gcaaactttt ccgacccgac ggtcatttat cgcgaaacgc cgaccaaaaa 2581 gggctgcgga ataggtgtat atacaatgcc gaagccctgc tgggcaattg tcaactttat 2641 gtttgagccg atgccccgag gttatggcgt gagctatcac ggacgactgc caaacaacca 2701 atgtttttat aaatatcaga gccatattca tcgctccttt gaaaactgcc ttgagcaggg 2761 acttcacggt tgggaagtca ccgacttcaa atgtaccctc atcggcggtg agcaccacac 2821 gatacatacc catccccttg atttcttcgt tgcaacgccg atggcgttta tgaatgcgct 2881 gaccgattgc ggatcgaccc ttttggaacc gcttatgaag ctcagaatca tcgctcctgc 2941 ggagctttcc ggcaagctga taaccgaaat tatgcgcggt gacggcgaat ataacgcacc 3001 gtatgtcaga ggtgatacgg ttactcttga tgcaattgtg ccctttaaaa actttatgga 3061 cttccccacg cgcttggctt caatgtcatc gggcagggga gtgtgctcaa caagctttta 3121 cggctaccgc gaatgccccg agggtcaggg tgaggattgc cccagacggg gtgtcagccc 3181 cctcgaccgc tcaaagtgga tactttgggc aagaggagct ttaagcgaat cacagatata 3241 gtactttcgg gggcgaccac acagggtcgc ccctatggca ttataagggg caggcctgtg 3301 tgcctgcccg ataaccgaat atattagcgt cggcgtgtag cttcccttgc atggcggttt 3361 ttgcgggcgg acacataggt ccgcccctat tgtacatatt ctgggtaaaa ggagcctttt 3421 ttatccatca tacctctccc aaaaatctct aaaggcttgt tcatatctat ccttgttgat 3481 aaaatagctc agcccatgct ctgcaccggg caccacaaga agatgtttcg gcgcgcggca 3541 tgccttgaag ttttcatatg tcatctcaat tggcacaaag tggtcgtcgg tgccgtgaac 3601 aaacaaaaca ggaacagggc ataccttcat ggcatccaag gttgaatatt c // LOCUS sequence101 3639 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence101 VERSION sequence101 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3639 /mol_type="genomic DNA" /organism="" /note="sequence101" misc_feature <1..1019 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_013222767.1:glycoside hydrolase family 97 protein" /note="WP_013222767.1 glycoside hydrolase family 97 protein (Amycolatopsis mediterranei) [pid:37.4%, q_cov:76.6%, s_cov:41.1%, Eval:9.6e-40, partial hit]" /note="internal stop codon at [1018:1020](+)" /note="frameshifted, insertion/deletion at around 168" /note="MGA_552" /locus_tag="LOCUS_4350" CDS 1122..1739 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTVKKRSISVPLNFLDSGEYNAYIYLDDKDGNLILEEKKVSATDT LSFDLIDKGGVAVMITKAKVDTEVEESPFFNLAGYTYYECEDGKLTGSAVVSSSMLCSG GEKVGYVGNATNTCDITVTVPEAGEYELVVYYCTAEQRNLLIKIGDEKYEIKGLIGTSY DSPEMAKTTVKLEKGENTVTLTSALLWAPDLDRIAISDEPMK" /locus_tag="LOCUS_4360" /note="WP_086845818.1 glycoside hydrolase family 127 protein (Amycolatopsis kentuckyensis) [pid:34.7%, q_cov:58.0%, s_cov:16.4%, Eval:8.3e-12, partial hit]" /note="MGA_553" CDS complement(1868..2359) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MERKRDPLSIVGMIILALIIITIGIILIDNSGLVGGRNDLTYVTF VCEHNNGTVDTAIIGYKNDIVCEYTLETKYPTDVWSEDEIDGILEWYRETDKELKSEKC YKVKIKKSDKYVIASEIFTGLDKEENREALIDAGFNLTAEPLPYSVLESELLSNGFVKQ " /locus_tag="LOCUS_4370" /note="MGA_554" tRNA complement(2619..2694) /product="tRNA-Val" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0080" /note="Aragorn_8" CDS 2846..3616 /product="polysaccharide deacetylase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004082686.1" /transl_table=11 /codon_start=1 /translation="MKRLIALLLAFMLLLCGCAGAPANSDDVKQNSDADIDAAVDENAR PDFGPDDKLIALSFDDGPSLGSTNALLDYFEEMDIVGTFFVIGNNINDETAEVMKRAIE LNCEIGNHSQSHQQMGNMTPETLEQEIGYVQDKVFEYTGVTPVLFRPPFLNVSKTMHDT IPLTFIFGRDSLDWTDISAEERAENIMNHADDGVIILMHDGWDNYKTVEAVKIVVPQLI EQGYRFVTISELFEAKGTTPEANSGVIYSTATGK" /locus_tag="LOCUS_4380" /note="WP_004082686.1 polysaccharide deacetylase family protein (Thermotoga) [pid:40.3%, q_cov:78.5%, s_cov:86.2%, Eval:1.1e-39]" /note="MGA_555" ORIGIN 1 taactgcata tacaggcaag acatggatgc tcttctccga gtcggatgct tttgccgacg 61 atattacata tattaagagc gttcttgaaa ccaagaacgg aagcgacacc cttttgtggc 121 aatttggctt tgagcgtgac cccgcaaacg aggttacaga cgagcttgca agccccggac 181 atataagaat cggcgaggtt aaaacacagt gcggttttac aactccttgg agagctacga 241 ttatttccga ggatctgaac gaccttgtat cgagctgtct tattgatgct ctttgcccca 301 aaatggatga gaagctcttt aaggatacaa gctggataaa gccgggtaag gtttcctgga 361 gctggtggtc gggcgaaaat cagcacagct atgacgcaca gatcccatat atcgattttg 421 ccgcagaaaa cggctgggaa tactgctgtt tggatgcagg ctggccaaca tttggcgacc 481 gacttaaaga gatctgcgac tatgcaaaga aaaaaggcgt cggaataatc gtctgggtca 541 actatctcga gctcaagact cccgaggata ttgaagaacg cttctcaaag tggagcaaag 601 cgggtgttgt cggcgttaag accgactact tcgaaagtga cgctattgag gttttggaat 661 caatgcgcaa ttgcgccgag atcggtgcaa aatatgagct gatgatgtat tatcacggct 721 gtattcatcc ctgcggcgaa acaagaacat accccaacgt tatgacgatg gaagctgttt 781 tgggtgagga attcagaaag tggagcgagg tgcccacagt tgaaaactgc ctgatgtatc 841 ccttcacaag aaacatcgtc ggttcaatgg actatacccc cagctgtatc aaaattgata 901 aaacaggtga aagcggcggc ttcagccttg caaaggcgat cgtatatgaa tctgcgcttc 961 agcacttcgg cgcttccgca aagctctatc ccagctatgt cggtttaccc ctgatttaga 1021 gaatccccac cgattggaaa tcctctattc ttcttgacgg ctaccccgga aagtatgcaa 1081 catatgtccg ctcggacggc gaggacttct atatcggctc gatgactgtt aaaaagagaa 1141 gcatttctgt tcccctcaac ttcttggaca gcggcgaata taatgcatat atttatcttg 1201 atgacaagga cggcaacctt attctcgagg agaaaaaggt cagcgcaacc gacactctca 1261 gcttcgattt gattgataag ggcggtgtcg cagtaatgat tacaaaggct aaggttgaca 1321 ccgaggtgga ggaaagcccc ttctttaacc tcgcaggata tacttattac gaatgtgagg 1381 atggaaagct gacgggaagc gcagttgttt cctcgtcgat gctctgctcg ggcggcgaaa 1441 aggttggtta tgtcggaaat gcaaccaaca cttgtgatat aaccgtaact gttcccgaag 1501 cgggcgaata tgagctcgtt gtatattact gtactgccga acagcggaat ctcttaatca 1561 agatcggcga tgagaaatat gagatcaagg ggctcatcgg cacgagctac gattcccccg 1621 aaatggcaaa aaccaccgtt aagcttgaaa agggcgagaa tactgtcacg ctgacttcag 1681 ctctgctttg ggcacccgac cttgacagga tcgcgataag cgatgagcct atgaaataaa 1741 caaaaaagaa actcctccga aattcggggg agttttttgc ggcgcgcaca cccttgggat 1801 ataacaaagg ggaaaacggt cggtaccatc aggacggcct gtcctgtgta aggggatgtg 1861 cagggcttta ctgcttgaca aatccattgg ataagagctc gctttcaagc accgaatatg 1921 gcaaaggctc tgcggttaaa ttgaagcctg catcaataag ggcttcgcgg ttctcttcct 1981 tatccagacc ggtaaatatt tcgcttgcga tcacatattt gtcggatttc tttattttaa 2041 ctttatagca tttttctgac ttgagttcct tgtcggtttc cctataccac tctaatattc 2101 cgtcaatctc gtcttcagac caaacatctg ttgggtattt tgtttcaagc gtatattcac 2161 aaacaatatc attcttatat ccgatgatag ctgtgtcgac cgttccgtta ttatgctcgc 2221 aaacgaaagt tacgtatgtg aggtcgttcc tgccgccaac taagcctgag ttatcaataa 2281 gaattattcc gattgttata attataagtg ccaaaatgat cattccgacg attgagagag 2341 ggtcacgctt tctttccata ttaattctcc ttatgagttg atgcttcaat tatattggct 2401 agcaaattcg tttgcaacaa ttattaacga aacttaatac aaccttaaga aaaattaata 2461 tttacatggc aggggtgccc aatttgcgct ccacattttg tgacagccga aagtgtgaaa 2521 agcgcaaata agcaaatcct tgcggatttg caggctcaag tcgaaagtcc ctgataaatt 2581 aaaaaagctg cacagctaaa gctgtacagt cttttaattg gtgaggataa taggactcga 2641 acctatgacc ccttgcacgt caagcaagtg ctctaccagc tgagctatac cctcattcgc 2701 ataatgaatt ataactgatg ggtgggggtt tgtcaagggg attttgattt tttctgccgc 2761 ttgaaatctc acaggcaatg ttatataata tatgaaacag caaaaatgcg ttgtgttttt 2821 ggcttaatga aaggactgct tgattatgaa aagacttatt gctttgcttt tggcatttat 2881 gttgcttctt tgcggatgtg caggcgcacc tgcaaacagc gacgatgtga aacaaaactc 2941 cgatgccgat atagatgcgg ctgttgatga aaacgctcgt cccgatttcg gtcccgacga 3001 caagcttatc gctctttcgt ttgacgacgg accctctctt ggctcaacca atgcactttt 3061 ggactacttt gaagagatgg acattgtcgg cacattcttt gtgatcggca ataacataaa 3121 cgatgagacc gccgaggtca tgaagcgcgc aattgaactt aactgcgaga taggaaacca 3181 ttctcaatcc caccagcaga tgggcaatat gactcccgaa acactcgaac aggaaattgg 3241 ctatgttcag gacaaggtct ttgaatatac cggtgtaact cctgttttgt tccgtccgcc 3301 cttcttgaat gtcagcaaaa ctatgcacga caccattccg ctgaccttca ttttcggccg 3361 cgattccctc gactggactg atatttccgc agaggagaga gcagaaaaca ttatgaacca 3421 cgcggacgac ggagtgatca ttcttatgca cgacggttgg gacaactata agaccgttga 3481 ggctgttaaa atcgttgtac ctcagctcat tgagcagggt taccggtttg tgaccatcag 3541 cgagcttttt gaagcaaagg gcacgacccc cgaagccaac agcggagtta tatattctac 3601 cgcaacaggc aaataagagg gctaaaaata tgatgaaaa // LOCUS sequence102 3637 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence102 VERSION sequence102 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3637 /mol_type="genomic DNA" /organism="" /note="sequence102" CDS 121..756 /product="polysaccharide deacetylase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012582836.1" /transl_table=11 /codon_start=1 /translation="MESERKLIALTFDDGPNTTTMVEVLDLLEEYNAVATFFLIGNYIN DDTAPVLNRALEMGCELGNHTWSHGYTSKLDAEGIKEEIESVQRKVYEVTGIIPEYFRP PYFDMNQTMYDVIDLPFIGGFSSQDWDSSVSAEERVKLFFEGYGEDKIAVLHCFKGNSN TVEALKTILPRLVDEGYEFVTVSELFEEYGLTPEAHNGVLYASADDVK" /locus_tag="LOCUS_4390" /note="WP_012582836.1 polysaccharide deacetylase family protein (Dictyoglomus turgidum) [pid:43.8%, q_cov:91.0%, s_cov:82.6%, Eval:7.0e-41]" /note="MGA_556" CDS complement(918..1817) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRIFTFILIGVMILSLSACAKKVTVVDEIPKEDIEKLDDGGTLE LITYPSKDYFGNMEDIEKKAYVYLPAGYDESKQYNVLYILHGIGGDIWEWGMTDNNSTV KKIMDNLIADGEIEPFIVVAPNGRAAKNHGTDGDFNSFYQFGKELRYNLIPYIDNNYAT YADTENYDVTEAREHRAVAGLSMGGMQTINIGMCECLDMFSYFGAFSACPTTYNAQTIA DHLEDFPDYDIKYFYNLCGTEDGIAISHHTAATEGLCDLTDKLKDGKNFMWQTRSGGHD FNIWHLGFYNFSKIVFTR" /locus_tag="LOCUS_4400" /note="WP_001336377.1 esterase family protein (Enterobacteriaceae) [pid:27.7%, q_cov:85.6%, s_cov:63.8%, Eval:3.2e-12, partial hit]" /note="MGA_557" CDS complement(1934..2632) /product="nicotinamide riboside transporter PnuC" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002992863.1" /transl_table=11 /codon_start=1 /translation="MKYKFTNPFKTLDRFERWLLGISLILVLASYLLSADKSPLSLIAS LVGATALIFVAKGVPIGQVLVIIFSLLYGAVSLQTRYYGEMITYVGMSLPMAVASLVSW IKNPYEKGKGEVKVASLTAEKVALLSALAILVTVAFYFILGALNTPRLVVSTVSVLTSF VAAGLTFLRSPYYALAYAANDVVLIILWVAASVNDISYLPMVMCFAVFLANDIYGYISW QRMRNRQSGK" /locus_tag="LOCUS_4410" /gene="pnuC" /note="WP_002992863.1 nicotinamide riboside transporter PnuC (Streptococcus pyogenes) [pid:48.1%, q_cov:92.7%, s_cov:93.5%, Eval:5.1e-51]" /note="MGA_558" CDS complement(2771..3166) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRRGILRLILLIACGLMCSCGTDAPAEAIYKNITPEEAKEIMDT ETDYVILDARTQAEFDEGHISGAVCISHEEIAQKAEEMLPDKDKLILVYCRSGRRSKIA AETLLELGYTRIYEFGGIIDWPYDVVK" /locus_tag="LOCUS_4420" /note="WP_003356887.1 rhodanese-like domain-containing protein (Clostridium botulinum) [pid:46.9%, q_cov:73.3%, s_cov:93.2%, Eval:9.0e-23, partial hit]" /note="MGA_559" CDS complement(3196..3615) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTAIAIHNLPEGIAAGVGFGSGNDAEALIIAGGIALQNIPEGMVI IAPLLAAGVSPKKTLFLSLATGLVEIFGTMLGYFAVSIANALLPFALSFAGGTMLYVIS DEMIPETHAHGNQRASTYSLLIGFCLMLVCDVLLG" /locus_tag="LOCUS_4430" /note="WP_011144264.1 ZIP family metal transporter (Gloeobacter violaceus) [pid:47.4%, q_cov:98.6%, s_cov:52.7%, Eval:2.4e-31, partial hit]" /note="MGA_560" ORIGIN 1 atgatgaaaa agtttttgtt tattttcatg gcttgcgcta tgcttttaac cgcctgcgga 61 acaaatgcag atgcgcccat cagccgggaa gatgttttaa atgatactgc ggaggaacaa 121 atggaatctg aaagaaaact gattgccctc acctttgatg acggccccaa caccaccact 181 atggtggaag ttctcgacct tttggaggag tataacgcag ttgcgacatt cttcctcatc 241 ggcaattaca ttaacgacga caccgcgcct gttttgaacc gcgcccttga aatgggctgt 301 gagcttggca accacacatg gagccacggt tacacctcga agctggatgc tgaaggcatc 361 aaggaagaaa ttgaaagcgt tcagcgcaag gtatatgagg tcacaggcat aattcccgaa 421 tatttccgcc cgccatattt tgatatgaac cagacgatgt atgatgtcat cgacctgcct 481 tttatcggcg gcttcagctc tcaggattgg gattcatcag tttccgccga ggagcgagta 541 aagctcttct ttgagggtta cggcgaggat aagatcgcgg ttttgcactg cttcaaggga 601 aacagcaaca ccgttgaagc gctgaaaacg attttgccga gattggttga tgagggatat 661 gaatttgtga ccgtttccga acttttcgag gagtatggct taactcccga agcccacaac 721 ggcgtgcttt atgcaagtgc cgacgatgtg aagtaaacta aaaaaagcac tccgcgagga 781 gtgcttttgt tttgtcaatg tgaagtgata gcaagcggag cgccgtcatc gaaaagcgcg 841 gcagcgccga tggtggcgcg aagcggtagg taatgagcaa aaaaacgggc gactctgtgt 901 ggtcgcccgt tattttttta tcgtgtaaat acgatctttg agaagttata gaagcctaag 961 tgccaaatat tgaaatcgtg tccgcccgag cgggtctgcc acataaagtt cttgccgtcc 1021 ttgagcttgt cggtcaaatc gcaaagacct tcggttgctg cggtgtggtg ggaaattgca 1081 atgccgtcct cggtgccgca aaggttatag aaatacttga tgtcatagtc ggggaagtcc 1141 tcaaggtggt cagcgatggt ctgtgcattg taagtggtgg ggcaggcgga gaatgctccg 1201 aagtatgaga acatatcaag gcattcgcac ataccgatgt taatggtctg cataccgccc 1261 attgaaagac ctgcaacagc gcggtgctct ctggcttcgg taacgtcata gttttcggtg 1321 tctgcatatg tagcatagtt gttgtcgata taaggaataa ggttataacg aagctccttg 1381 ccaaactgat agaaggagtt gaagtcgccg tcggtgccgt gattctttgc ggctctgccg 1441 ttgggcgcaa caacaatgaa aggctcaatt tcgccatctg caatgaggtt gtccattatc 1501 ttcttaacgg tggagttgtt gtctgtcatg ccccattccc agatgtcgcc gccgatgccg 1561 tggagaatgt ataaaacatt atactgcttc gattcgtcat agcctgcggg aagatataca 1621 tatgccttct tttcaatgtc ttccatattt ccgaagtagt ccttcgaggg gtaggtgata 1681 agctcaaggg taccgccgtc atcaagcttt tcaatgtctt ccttggggat ctcatccaca 1741 acggtgactt ttttcgcaca tgccgacaaa ctcaaaatca tcactccgat caaaataaat 1801 gtaaaaattc ttttcatgtt ccaagttctc ccttcaatag atatacttat attttagagc 1861 tattgaacat aaagagcaat gaccaaaaca tagcacttca ttgatatttt cggcgcacag 1921 ccttgactca ttctcatttt cccgactggc ggtttctcat tctctgccag cttatatagc 1981 cgtaaatgtc gttggcaagg aaaactgcaa agcacatcac catcggcaga tacgatatat 2041 cgttcaccga tgccgctacc caaagaatga ttaaaacaac atcgtttgcg gcatacgcca 2101 aagcataata tgggcttcgc aggaaggtaa gccccgccgc cacaaagctg gtcagaacgc 2161 ttacggtgct gacaacaagc cggggagtgt tgagtgcgcc gagaatgaaa taaaacgcaa 2221 ctgtcaccaa tatcgcaaga gcgctcaaaa gagccacttt ttccgctgtc aggcttgcaa 2281 ccttgacctc gcccttgccc ttttcatagg ggttttttat ccacgacaca agcgaagcca 2341 ccgccatcgg taagctcata ccaacatatg ttatcatctc gccgtagtag cgcgtctgca 2401 gggacactgc gccatacaaa agcgagaaga tgatgacaag cacctgacct atcggcacac 2461 cctttgcaac aaatatcaaa gctgttgcac ccaccagcga agcaatcagc gacagcgggc 2521 ttttatccgc cgagagaagg tatgatgcaa gcaccaatat aagggaaatg cccaaaagcc 2581 aacgctcaaa tcggtcgaga gttttaaagg ggtttgtaaa tttatatttc atattgcacc 2641 tcattaaaaa tgcaccccga cacatcttca aagacctaac gacgtgtcag gatgcaaaag 2701 catccgttgc ccggtggcaa cataatattc cgataagatt atagccaaaa cgggtgatga 2761 tgtcaagcgg ctattttacc acatcatacg gccaatcaat tattccgccg aattcatata 2821 tcctggtgta gccaagctca agcaacgttt ctgcggcgat tttgcttctg cgtccgcttc 2881 ggcaatatac aaggatcagc ttgtccttat cggggagcat ttcctcggcc ttttgggcaa 2941 tttcctcgtg agaaatgcaa actgcgcccg aaatatgtcc ctcgtcaaat tccgcctgcg 3001 tgcgggcatc gaggattaca tagtcggttt cggtatccat tatctctttg gcttcttcgg 3061 gggttatgtt tttatatatc gcctctgcgg gggcatctgt gccgcaggaa cacatcagcc 3121 cgcaggcgat aagcaaaata agtctgagaa tccctcttcg tttcatttgt tttcaacttc 3181 ctttcggttt atatattatc ccagcaaaac gtcgcacacc agcatcaggc aaaagccgat 3241 gagcaaagaa tatgttgatg cccgctgatt tccgtgggca tgggtctcgg gaatcatctc 3301 gtcgctgatg acatatagca tcgtgccgcc cgcaaaggaa agcgcaaagg gcaaaagggc 3361 gtttgcaatg ctgactgcaa aatagccgag catggtgccg aaaatttcaa ccaaccctgt 3421 ggcaagcgat aggaaaagag tctttttcgg gctgactccc gcagccaaaa gcggcgcgat 3481 tataaccatt ccctcgggaa tgttctgcag tgctattcca ccggctatta tgagcgcctc 3541 ggcatcgttc cccgagccga agcccacacc tgctgctatt ccctcgggca gattgtgtat 3601 ggcaatagcc gtcacgaaca gaagaacctt gctgagc // LOCUS sequence103 3625 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence103 VERSION sequence103 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3625 /mol_type="genomic DNA" /organism="" /note="sequence103" CDS 1528..1956 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNCCDLHTHSTFSDGTLTPTQLISEAERIGLDAIALCDHNTIAGL PEFISAAEGRGVEAVAGVEFSTEYLDTELHILGLFIRPEHYSSVNEKLMEYTRRKDASN RELIEKLRCKGYHLDYDSIKAASPNGNINRAHIAAELT" /locus_tag="LOCUS_4440" /note="WP_010937958.1 PHP domain-containing protein (Desulfovibrio vulgaris) [pid:36.5%, q_cov:96.5%, s_cov:47.2%, Eval:3.1e-21, partial hit]" /note="internal stop codon at [1954:1956](+)" /note="MGA_562" CDS 2128..2367 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRVFLEKAKPCGLDGMETLYSLYSDETTLLAKQIAREFSLLESGG SDFHGDNKPDISLGVGKGNLIISTEYLKKLRQAL" /locus_tag="LOCUS_4450" /note="WP_010942094.1 PHP domain-containing protein (Geobacter sulfurreducens) [pid:36.4%, q_cov:97.5%, s_cov:26.4%, Eval:4.8e-08, partial hit]" /note="internal stop codon at [1954:1956](+)" /note="MGA_563" CDS 2621..3382 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIFDLQKASMLKRISAFMFDIIMLGILAVGLGFIISSLTGYDKYS TALNDTYDKYEAEYSIEFEIAEDTYRSFTDEERANYDAAYNALINDTDAMYAYNMVINL TLLIITLAILLSYVVLEFVIPLMFDNGQTLGKKIFGIALMRTDGVKISAPLLFIRTILG KFTIETMVPVLIIIMIYFNSIGVVGILVLFLILVLEISLLISTKTNSMVHDVLAKTVAV DLASQMIFDTEADMIAYKNKVHSEKAARDTY" /locus_tag="LOCUS_4460" /note="MGA_564" ORIGIN 1 ccgccgctga taacagacac ggatttataa acattctcgc ccgtcaacaa aaccattccc 61 aaaaggctcc tgacctcgtg gtcggtcatt cgtggataac gcttgtgaat ttcttcgata 121 actgaattca tcgggtcaag ctgttcgttt ttctggtcga aatatgcgat tttaacattc 181 atcgcccagt cgatcttgcc cttcttgtgg ggattgagat tctgcacagt tttgagaatt 241 gtcgatttac cgatgccgtt tgcgccgata attgcaacct tttcgccacg ccttatgtgc 301 agatcaaagc tctcaataag ctttttttcg cccgccgtaa tgtcaacatc cttaacaacc 361 aaaacatcct ttggcggctc aatgtcatat tcaagtctta tcttcggcgg tttggtgtaa 421 gtcctcggtt tctcaacagc gttttcaacg attcgatcaa gcatatgctg cttcgatttt 481 gcctgcttcg cactggtcgc gctgactctg tttttgtcaa tgaaaaactg cagctcgccg 541 atcttctttt gctgttgctc ataaagcttt tcctgacgtt caatatccgc cttcttagtt 601 tcaaggaact tcgtatagtt gcccgtatat gaccttagtt tgccgtcctc gatctcgcag 661 atacgtgtgc agatcttgtc caaaaagtat ctgttatggg atactgtcaa aatcgcgccc 721 ttatattcct gcaaatagct ttcaagccac atcattgttt caaggtcgag gtggttggtg 781 ggctcgtcca aaatcaaaag atcaggctct tcaagcaaaa gctttgccag agcaaggcgc 841 gttctttcgc cgcccgaaag ggaatttatc tcgcgtgtgc ggtcaattcc cgcaaatccc 901 ataccgttaa gaatcgtgtt gatcttaacg tcgatcaaat atccgtcgtt agtctcaaaa 961 tatgccacca atcttgaata ttcgttctgt gctttatcaa gctccgcacc cgaaagggaa 1021 ctcatctgct cctcaagctc ggtgattcgt tcatatacct catcaagctt cgcaaaaggc 1081 aggcgcatct cgtgtgcaat agatgcatct ccttcaagcc ctgtgtgctg ttccagataa 1141 ccgattcgcg tcgaatttgt aactgcaacg cttccttttc cgtcgggagt cttatcaaag 1201 tccattctcc ccgtgagaat cgacaaaagg gtggtctttc cgcatccgtt gatgcccaca 1261 agtccgattc tgtcggtgtt ttcaattgta aggttaatgt ccttcaaaag ctcttcgcca 1321 ttaaagacct tataaacatt ttccatgctt gcaagcattc ggcagatctc ctttcgccta 1381 aaatcatcat acctattcat tttatcacat cttagtcagt ttggcaagaa atgatttaca 1441 gaatatgtac tattgactcc tgttgcaaaa ttttgttcta tgcgttaaaa tatatgcagt 1501 taatacttac aaaggagagc ggttaaaatg aattgttgcg atcttcacac tcattcaacc 1561 ttttccgacg gcaccctcac acccacgcaa ctgatatccg aagctgagcg aatcggcctt 1621 gatgctattg ctttgtgcga ccataatacc atcgcaggtc tgcctgagtt tatctctgct 1681 gccgagggca ggggagttga agcagttgcc ggagttgaat tttccaccga atatctcgat 1741 accgaactgc acatccttgg ccttttcatt cgtcccgagc attattcatc agtaaacgaa 1801 aagcttatgg aatatacacg tcgcaaagat gccagcaata gggaactgat tgaaaaactg 1861 cgctgtaaag gctatcacct tgactatgat tcaattaaag ccgcttcgcc aaacggcaac 1921 attaaccgcg cacacatcgc cgccgagcta acctaacttg gctatacatc atcgatcaaa 1981 gaagccttca aaactcttct ttctccctct tgcggatatt acaccccgcc ccaaagactc 2041 gacgcctttg aaaccatccg ctttatcaaa tcaatcggtg ctgtcgctgt catcgctcat 2101 ccctttttga acctatctgt gccgtctttg cgcgttttcc tcgaaaaagc gaagccttgc 2161 ggacttgacg gtatggaaac gctctattcc ttgtattccg atgaaaccac tctgcttgcc 2221 aaacagatcg cccgcgagtt ttcccttctt gaaagcggcg gcagcgattt ccacggcgat 2281 aacaagccgg acatctctct gggtgtcgga aaaggcaatc tcataatatc aaccgaatat 2341 ctaaaaaagc tccgtcaagc tctttagctt tacggcgttt ttgtaatatt ttttgatttt 2401 tggtcgagat taacacaatt gacaaaaaac agcagtaaaa aatgttcaag tttttttgtc 2461 tttcctgtgg aattttgccg caaggtatga tataatgctt ttataatgca attattgtgg 2521 cttggtgttt ctattcggcg gtaatatttt aaatatttaa acttttaaag cgttaaacgt 2581 caattttgca ggattttact gcaaagaagg gagtcagcaa atgatttttg atctgcaaaa 2641 agcaagtatg ctaaaaagaa tatctgcttt tatgttcgat ataattatgc tcggcatcct 2701 tgctgtcggt ttgggattca taatttcttc cttaacgggg tatgacaaat acagcaccgc 2761 ccttaacgat acttatgaca aatacgaagc cgaatattct atcgagtttg agattgctga 2821 ggacacctat agatctttta ctgacgaaga acgcgctaac tatgatgcgg catataacgc 2881 tcttatcaac gatactgatg ctatgtatgc ctacaatatg gtcatcaatc tgaccttatt 2941 aataatcacc ctcgcaattt tgctgtcata tgtggttttg gagtttgtca ttcctttaat 3001 gtttgacaac ggccagacgc tcggcaaaaa gatattcgga attgccctaa tgcgtaccga 3061 cggtgttaaa atttccgcgc cccttttgtt cattcgcaca attttgggca aattcaccat 3121 tgaaacaatg gttcccgtac tcattataat aatgatatac ttcaactcca tcggtgttgt 3181 gggaattttg gttttgttct taattcttgt tttggagatc tctttgctca tctcaaccaa 3241 gaccaactca atggtgcacg atgtccttgc aaagaccgtt gcggttgacc ttgccagcca 3301 gatgattttt gacaccgagg cagatatgat cgcctataaa aataaggtgc attcggaaaa 3361 agccgcccgc gacacatact aaagcgattt taatcttgtc gcaatgacgc tttggcgtca 3421 cgaaatataa acagtattgg aaagggaaaa gtaatgaaag ttgtattgca aaacctgaca 3481 aaaatcttcc cgagccgaaa caaaaaatcc aatgaggagg tcgttgctgt cagcgacttc 3541 acctttgaga ttcccgatgg caagcttatc ggcttgctcg gtccttccgg ctgtgtaaag 3601 agtaccacac tctacatgat cagcg // LOCUS sequence104 3584 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence104 VERSION sequence104 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3584 /mol_type="genomic DNA" /organism="" /note="sequence104" CDS 440..730 /product="30S ribosomal protein S6" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048444.1" /transl_table=11 /codon_start=1 /translation="MAKITANYESMVVFSVKAGEEAVNALVAKFKDMIEANATLTNVEE WGKRKLAYEINYETEGYYVIYTFESKPDFPAELNRVLNITEGVLRSIVITK" /locus_tag="LOCUS_4470" /gene="rpsF" /note="WP_012048444.1 30S ribosomal protein S6 (Clostridium botulinum) [pid:44.4%, q_cov:92.7%, s_cov:95.7%, Eval:1.4e-15]" /note="MGA_567" CDS 759..1229 /product="single-stranded DNA-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000934799.1" /transl_table=11 /codon_start=1 /translation="MLNRVILMGRITQDLDLRTTPTGTSVLTFNIAVDRGYVKQGEERQ ADFITCVAWRQQAEFINRYFAKGRMIAIEGNLRSRTYDDKNGTKHYVTEVFVDNVSFTG ERATQGDNSYSQSFKREAPAQAPAYREPAEKPISVGAFDDFEEILSDDGVPF" /locus_tag="LOCUS_4480" /gene="ssb" /note="WP_000934799.1 single-stranded DNA-binding protein (Bacteria) [pid:38.3%, q_cov:100.0%, s_cov:100.0%, Eval:6.5e-27]" /note="MGA_568" CDS 1268..1513 /product="30S ribosomal protein S18" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012869404.1" /transl_table=11 /codon_start=1 /translation="MERNMSNGRPAKRSHKKVCMFCVDRAQTIDYKDTAKLKKCMTERS KILPRRVTGTCAYHQRELTKAIKRARFVALLPYSAD" /locus_tag="LOCUS_4490" /gene="rpsR" /note="WP_012869404.1 30S ribosomal protein S18 (Thermanaerovibrio acidaminovorans) [pid:58.0%, q_cov:100.0%, s_cov:100.0%, Eval:1.2e-22]" /note="MGA_569" misc_feature complement(1683..>3584) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011949155.1:homocysteine S-methyltransferase family protein" /note="WP_011949155.1 homocysteine S-methyltransferase family protein (Clostridium botulinum) [pid:47.4%, q_cov:99.7%, s_cov:80.3%, Eval:1.3e-161]" /note="MGA_570" /locus_tag="LOCUS_4500" ORIGIN 1 atccccagtg tagctatcac tcttgcacag tatggctata ttactgctcc ttgggcgtta 61 tcggaaggat ttattcttct gaataatgtc tttgcaattc tttcttatgc aataagcttc 121 atctgcggaa tcttcggcaa ctggttctac tataaaaagg caaagaagga tattgaaaag 181 atcaaggcaa aatatgaagg cgttgccgaa agaaacaatg cgctgaatgt ttatggcgga 241 acttcgctgt taaacctcgg tttcggcttg cttgttgaga ttggaatcag cttaattatc 301 agctttgttc ttctcggcgg aattgtttaa ataatttatt aaaatcgctt gacaaattta 361 ggtttatttg ttatactaac tgagttatcc ttgtccatcg aatgaacggt ggatgtaatc 421 cagaaggagg tgcaatatta tggcaaagat taccgcaaac tacgagtcta tggtagtgtt 481 cagcgtaaag gcaggcgagg aagcagttaa tgctctcgtt gctaagttca aggacatgat 541 cgaggctaat gcaactttga caaatgttga agaatggggt aagagaaagc ttgcttacga 601 gatcaattac gaaaccgaag gttactacgt aatttatact ttcgaatcca agcccgattt 661 ccctgcagag ctcaatcgtg tactcaacat cactgaaggc gttcttcgtt cgatcgttat 721 caccaagtaa gtgatgacaa acgtaatgga gggtatttat gcttaacaga gtaattttga 781 tgggtagaat cacacaggat cttgaccttc gcactacgcc cacaggcacc agcgttttga 841 cattcaacat cgctgttgac cgcggatatg ttaaacaggg cgaagaaaga caggctgatt 901 tcatcacctg cgtcgcatgg cgtcagcagg ctgaattcat caacagatat tttgccaaag 961 gaagaatgat tgcaattgaa ggcaacttga gaagccgcac ttatgatgat aagaacggca 1021 ccaagcacta tgtcaccgag gttttcgttg ataacgtttc cttcaccggc gagcgtgcaa 1081 cccagggcga taattcatat tctcagtctt ttaagcgtga agctcctgct caggctcctg 1141 catatagaga gcctgctgaa aagccgatct ctgtcggcgc attcgacgat tttgaagaaa 1201 ttttaagtga tgacggcgtt ccgttctaag atttaacgga gcaaaacctt gaaaggagaa 1261 tactaacatg gaaagaaaca tgtctaacgg cagacctgca aagagatccc acaagaaggt 1321 atgcatgttc tgcgtagata gagctcagac catcgattat aaggacacag ctaagcttaa 1381 gaagtgcatg accgaaagat ccaagatcct tccccgtcgt gtaaccggca cctgtgctta 1441 tcatcagaga gagctcacca aggctatcaa gagagcaaga tttgtagctt tgcttcctta 1501 ctctgctgac taatagccga gccaattgca aaaacaaaaa atcaacaggt actcgatttc 1561 gggtacctgt tattttttat atatagcctt ccccttgagg ggaaagagtc ggcgtatgcc 1621 gacggatgag gtgccaaacg accgccaaac ctttgcttgg tattaccgct ctcgacggct 1681 cgctacgttt tataataccc cttcacaacc ttaaccgctt ccatcgcatc cttgcagtat 1741 gaatccgcgc cgatcatatc ggcatactcc tgattcagca ccgcaccgcc cacgatggtg 1801 aaaactttag ggtcgtttgc ctgtaaaagc tttatggttt cttccattgc gggcactgtt 1861 gtggtcatcc tcgcggaaag gccaacaact ttacagccac tctcattcac agcgtcaaca 1921 attttgctcg gctcaacgtc ttttcctaag tcgataattt taaaaccgta actttcaagc 1981 atcaccttga caatgttttt gccgatgtcg tgaatatctc ccttaactgt cgccaaaatc 2041 accgcattat cgctgtctgc gttcttttta ataaacggtt taacctcatc aatcgccgcg 2101 gttgccgcct cagcggcata taaaagctgt ggcaaaaatg cagtctttct ctcaaaccgg 2161 ttgccgatct cattcagcgc gggaataatg tgcccattta ttatatccag tggctcaata 2221 tcattgagca tatccttagc gcacgtaatg gcacttgcct ttacgcctga aatcaccgca 2281 tcatacagca tcgctgtgct ttcctttggt ttcacatcgg tcagcgcggc tccgtttgcg 2341 tattcaatat aatctgagca agctctgtcc tgcccgtgaa gtgaacgatg ggcataatat 2401 gcgttcatca ttccctcggc aaatgggttc atgatcgagc aatcaagccc gcgctccagc 2461 gcctgtgcaa agaacacagc atttatgata tcccgcctcg gcaatccaaa actgatgttt 2521 gaaactccaa ggcttgtatg gtatcccatt tccttgatga gccgaattgc ttcaagtgtc 2581 acctttgcgc tgtcgggatc agacgataca gtaagtgcca gcggatcaaa gatcaattcg 2641 ttttcatcaa ttccatatcc ctttgcgctc tcggcaatcc tcttagcaat ttccgctctt 2701 tcctgcgcgg acttgggaat tccgttttcg tccattgtca gagcaatgat cgcgccgccg 2761 tatttctttg ccagcgggaa aacccgctcc atcgaggatc tttcgccgtt aacggaattt 2821 atcagcgcct tgccgttata tcttcgcaaa gccttttcca aaacctcagc tcttgtggag 2881 tcgatgcaca aaggcagctc gcttaccgcc tgcacagttt caactgctcg ctccataacc 2941 atagattcat caatttcagg caatcccaca ttgacatcca aaatatgcgc acccatatca 3001 gtctgcttaa ttgcttcgtt ggcaatatag ctgtagtctg cgcttctcaa tgcttccttc 3061 agctttggtt tacctgtcgg attgatgcgc tcgccaatca aaatcggttc gttgccaatc 3121 gtaaccgcct tcgaatatga tgtcacaacc gtctttttcc ctccatttgg caagcggtag 3181 gggatatcct tggtcttctc aacggttttc tttatgtatt caggcgttgt accgcagcac 3241 cctcccaaaa tgcatcctcc ggcctttgcc agtgttgcca tcaaatcgga aaacgtatct 3301 gcatccgttt caaaaacagt cttgccgtca accgttttcg gcaaccctgc attgggattt 3361 acaatgatag gcaaacttgt ggcatcagct aactgctcaa caatcgacaa catcttgtcc 3421 ggccccaaag agcagttgat gccgagtgca tccacgccca gcccttcgag cattgccgcc 3481 ataacttcgg gcgtcgcacc tgtcaaaagc cgtccgtcgg tgccgtaaac attggtgacg 3541 aatataggta gatctgaatt ctccttcgcc gccaataccg ccgc // LOCUS sequence105 3579 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence105 VERSION sequence105 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3579 /mol_type="genomic DNA" /organism="" /note="sequence105" CDS 64..810 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTDDHFTNEKMLKSITENMYEAIALSHQFYLKLENAELYDEIKIL RHQMSCCFKVLGAVANANEMKKYESGLNEKVFDVTSLIRDIVDNCRSKLRSHCISLEFS DCEPMMVLCDPDRFTACLLNIIVNSLQNIDREEGAVRFSVKQRGEYINVTVTDNGYGVA HGEDISNYRSDSGLAVINRFCESVGTTPIFETGENSGFSVSLRLPMATDGGMDIASCRA GLDLGTFSPVNIYLAKVDYINISDIC" /locus_tag="LOCUS_4510" /note="MGA_571" CDS complement(936..3371) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSHFSHLPMIYLDMFMHGSDLRLKSLIAAEAYQSSTWSGELNPLL DELKNYIEREYCCIVLTGTEKSVSFVMGDIEKQGFRVQPLTKQTTLSPGMVYVGSGALS SGFEYPANKLAVITQMKANTSRRKTAKKKPKNTEKINSLSDITRGDLVVHALHGIGRFE GIKNITTNNVTKDYITIKYAGTDVLYVPVTQLDTVSKYIGPKDDESVKLNKLGGNEWQR TRARVKKACRDMADELIAIYAKRQLAKGYAFSADNDWQMEFEERFEYQETDDQLQSIDE IKGDMQKATPMDRLLCGDVGFGKTEVALRAAMKCILDSKQCVILVPTTVLAWQHYQTAL RRFGGFPVKIELLSRFRSPKQQKEILRQLERGEIDLVVGTHRLVSKDVKFKDLGLLIID EEQRFGVAHKEHLKSIYPEVDILTLSATPIPRTLNMAMSGIRDMSVIDEPPSDRYPVQT YVIEHQTGVLIQAIQKELRRGGQVYYIHNRIETLDMCAYKLQQSLPDARIGVAHGQMSE TQIEEIWRQLLDHEIDILVCTTIIETGVDVSNCNTLIIEDADRFGLSQLYQLRGRVGRS SRRAYAYFTFRRGKVLSEVASKRLTAIRELTQFGSGFKIAMRDLEIRGVGSILSAKQHG HMEAVGYDMYLQLLTEAIAEQKGEAAPRTAEDCLVDVTIDAFIPETYIEDLKLRIEAYR KIAGIMSKEDSEDVLDELIDRYGDPPKSVVGLVDVALLRNTASKLGIREITQRKENIVF YLREAKMGSIMALTSKYKGRVLVNGTSESYVSVKLAPKQEPVDLMKEVLMTMERAEVE" /locus_tag="LOCUS_4520" /note="WP_005814875.1 transcription-repair coupling factor (Desulfitobacterium hafniense) [pid:48.4%, q_cov:96.2%, s_cov:65.9%, Eval:1.9e-216, partial hit]" /note="MGA_572" ORIGIN 1 ctttacaaca cgcatagtta atgctaaaat ttaaacacag tttgaaaaag gagggatatt 61 tatatgacgg acgatcattt caccaacgaa aaaatgctga aatccataac cgaaaatatg 121 tatgaggcca tcgcgctttc acaccagttt tatttgaaac ttgaaaacgc cgagctatac 181 gatgaaataa aaatcttgcg tcatcaaatg tcctgctgct tcaaggtctt gggtgctgtt 241 gcaaatgcaa acgaaatgaa aaaatatgag tcgggcctga atgaaaaggt gttcgatgtc 301 acatcgctta tccgcgacat tgttgacaac tgccgttcca agctgagatc ccactgcata 361 agccttgagt tttccgattg cgaaccgatg atggttttat gtgatccgga cagattcacc 421 gcttgtctgc ttaacataat cgtcaattct ctgcaaaata tcgaccgcga ggaaggtgcc 481 gtgcgcttct ctgtcaagca aagaggggaa tatattaatg ttaccgttac cgacaacggc 541 tatggcgttg cccacggcga ggatatttca aattaccgct ccgacagcgg tcttgctgta 601 atcaatcgct tctgtgaatc ggtcggcacc acccccatat ttgaaacggg cgaaaacagc 661 ggcttttccg tcagtctgcg cttgccgatg gcaacagacg gcggaatgga tatcgcatcc 721 tgccgtgcag ggctcgacct tggcaccttc tcgcctgtga acatctatct tgccaaggtg 781 gattatatta acatcagcga tatctgctaa tatataaaaa accaaagccg tatggacttc 841 catacggctt ttttgtcggt ttgctatcgc tccgctcgcc accatcggcg ctgccgcgct 901 tttcgatgac ggctcgctcc gcttcccgat gctttttatt caacctctgc tcgctccatc 961 gtcataagaa cctctttcat caaatcaacc ggctcttgct tcggtgcaag ctttacggat 1021 acatacgact cactggtgcc gttaacaagc actctgccct tatattttga ggtgagagcc 1081 ataatgctac ccatcttagc ctcgcgcaaa tagaaaacaa tgttttcctt tcgctgtgta 1141 atttctctta ttcccagctt cgaagcggtg tttctcaaaa gtgcaacatc caccagcccc 1201 acaaccgatt tcggcgggtc gccatatctg tcgataagct cgtctaaaac gtcctccgaa 1261 tcttctttgg acattatccc cgcaatcttg cggtaagctt caattctaag cttcaagtcc 1321 tcaatatatg tttcgggaat gaacgcatca atggtaacat caaccaagca atcctcggca 1381 gttctgggcg ctgcttcgcc cttttgttcg gcaatggctt ctgtcagcag ctgtaaatac 1441 atatcatatc cgaccgcttc catatgccca tgctgttttg ccgacaaaat cgaacccaca 1501 ccgcggattt caaggtcacg catggcgatc ttaaatcccg agccaaactg tgtcagctct 1561 ctgatcgctg tcagtcgttt cgatgctact tcgctcaaaa ctttacctcg tctgaacgta 1621 aaatatgcat acgctcggcg agagcttctg cccacacgtc ctcttagctg ataaagctgt 1681 gaaagtccga atctgtctgc atcttcaata atcagcgtgt tgcagtttga aacatccaca 1741 cccgtttcaa taatggtcgt gcagaccaaa atgtctatct cgtggtccaa aagctgtcgc 1801 catatctctt cgatctgcgt ttcgctcatc tggccgtgcg ccacaccgat tctcgcatcc 1861 ggcaagcttt gttgcaattt atatgcgcac atatccagcg tttcaatgcg gttatgaatg 1921 taatatacct gaccgccacg cctcagttcc ttttgaatcg cctgaatcag cacgcccgtc 1981 tggtgctcaa tgacatatgt ctgcacagga tatctgtcgc tgggcggctc gtcaattacc 2041 gacatatccc taattcccga catcgccata ttcagcgttc tgggaatggg cgttgccgac 2101 agcgtcaaaa tatccacctc aggataaatg ctcttcaggt gctccttgtg tgccacgccg 2161 aagcgttgct cttcgtcaat tattaaaagt cccaagtcct tgaacttaac atccttagat 2221 accagcctat gtgtacccac aaccaagtcg atctcgcccc gctcaagctg tctgagtatt 2281 tccttttgct gtttgggcga gcgaaaacgc gagagcagct cgatcttaac aggaaaaccg 2341 ccgaagcgcc ttaaagctgt ctgataatgc tgccaagcaa gcaccgttgt cggcaccaat 2401 attacgcact gctttgaatc gagaatgcac ttcatcgccg cacgcaaagc aacctctgtt 2461 ttgccaaagc cgacgtctcc gcaaagcagt ctgtccatgg gtgttgcctt ttgcatatcg 2521 cccttaattt cgtctatcga ctgaagctgg tcgtccgttt cctgatattc aaacctctct 2581 tcaaactcca tctgccagtc gttgtcagct gaaaaggcat atccctttgc aagctggcgc 2641 ttggcatata tcgcaataag ctcgtctgcc atatctcggc aggctttttt aacccttgcc 2701 cttgtccttt gccattcgtt tccgccaagc ttattcagct taacgctctc gtcgtcctta 2761 gggccgatat attttgaaac tgtgtcaagc tgtgtaacag gtacatacaa aacatccgta 2821 cctgcatatt tgatggtgat atagtccttg gtcacgttgt ttgtggtgat atttttgatt 2881 ccctcaaacc gaccgattcc gtgcaaagcg tgaacaacca agtcgccccg cgtaatgtcc 2941 gaaagcgaat tgatcttctc ggtattcttc ggcttctttt tcgctgtctt ccgtcttgat 3001 gtattggctt tcatctgcgt gatgaccgca agcttatttg cgggatattc aaaaccgctc 3061 gataaagcac ctgaacccac atataccata ccggggctga gcgttgtctg cttggtcagc 3121 ggctgaaccc taaagccttg cttttcaata tcgcccataa caaagctgac acttttctct 3181 gtacccgtca aaacaataca gcaatactcc cgctcgatat aattcttcag ctcatcaagc 3241 aggggattaa gctctccgct ccaggtcgat gactgataag cttcagcggc aataagcgac 3301 ttcagcctta aatccgaccc gtgcataaac atatccagat atatcatcgg aaggtgggaa 3361 aaatgcgaca ttacctcggg aaattatgcg aaaaacccgc tcatttcttt gaaaagcagt 3421 ccgtcctcat aaaggatctt caaatcctcg gtcagctgaa ccgtaaaggc ctttgccttt 3481 tcaacacagt ttgtatattc gctgacaacg cagaccccgt cctcaaaata atcgctcaaa 3541 aaagtggggt cgccgtaaat ctgcgagtaa tatttatca // LOCUS sequence106 3552 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence106 VERSION sequence106 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3552 /mol_type="genomic DNA" /organism="" /note="sequence106" CDS 465..2144 /product="UDP-N-acetylmuramoyl-tripeptide--D-alanyl-D-alani ne ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011405061.1" /transl_table=11 /codon_start=1 /translation="MINLFLAVLVLLYITAMVFSARHFIHMFQLNSYKPKVQAKWICNS DRKYFLQSMIYLALGTVVPLILSLSYYGKDVECVMSLLHFAVIFPLVSLIYFTVTAISK HPKKTYKTPLVYTARIKRLITTLTFIFVIFIVIDACIAFATFPKDGVLDNAIGVREVVF FVTVPAIPCVFISLMPFVILLANLINRPLELMINRHYINDAKRILESCRSHLRVIGITG SFGKTSVKYFLETLLSVKYNVLKTPGNFNTPLGVVKTIRGSLRATHDIFLCEMGAKNVG DIKEICDIVHPDMGIITSVGPMHLESFKSIENVIKTKFELADAVSQKGGEVYANFDNEY IVGECKKREVIPYGIDDVSGYTVSNLHISELGSEFTVTSPEGESCEYRTRLIGKHNVLN IVGAIAVAHRLGIDLDELRPAVRKLESVPHRLQLIDKGEYTIIDDAYNSNPSGTKAALE TLSMTDGMKILVTPGMVELGGMEYALNKEFGVDAAKVCDFVALVGKKQTQPIYDGLKSV DYPEEKIYVAESLNDAMAKVYGLTSGGKRKIILLENDLPDNY" /locus_tag="LOCUS_4530" /note="WP_011405061.1 UDP-N-acetylmuramoyl-tripeptide--D-alanyl-D-alanine ligase (Salinibacter ruber) [pid:32.5%, q_cov:98.9%, s_cov:99.3%, Eval:1.2e-70]" /note="MGA_575" CDS 2268..3458 /product="D-alanine--D-alanine ligase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011404923.1" /transl_table=11 /codon_start=1 /translation="MKIKLALIFGGKSVEHEISIISALQAAQSLDREKYDVIPLYIAKS GEMYYGEKTGDIEAYKDIKKLIASSRQVTLARNGERVEIIKYPVKMFEKPFVDYIDVAF PVVHGTNVEDGTVAGYLNMLGVPYVGCDILSSALGMDKYAMKAIFKDNDIPVLDCVVLS SDEFDKDEDECARRVELEIGYPVIVKPVNLGSSVGISKADNHKKLISSLTDAFLYSKRV LVEKAITNLTEINCSVLGNDRKAEASVCERPINSDEILSYEDKYLGGSKSSKGMASTQR VIPADISNEHTLLIQELAVKAFKVLGCCGVSRIDFMIDNDANKVYLNEINTIPGSLSFY LWEPKGVKYSELLDRMIALALEAHRERAKITYAFDTNVLAGIKLGGGTKGAKGSKM" /locus_tag="LOCUS_4540" /note="WP_011404923.1 D-alanine--D-alanine ligase family protein (Salinibacter ruber) [pid:40.4%, q_cov:97.0%, s_cov:93.5%, Eval:2.4e-80]" /note="MGA_576" ORIGIN 1 ctttgaagtt aaaaaaataa ttttgattga tgcggcggga attaagccga agaagacgct 61 caaacaaaaa atcagtcttt tggcatataa aacaggcaga aaaataatgg aaacaaagcc 121 tttaaaggca atgttccccg atgctgttga gaatatgcgc aaaaagcggg gctccgccga 181 ttataactcg gcaacaccga tcatgcgcca aacgcttgtc aaggtcgtta acgaggacct 241 gaccgagctt ttgccgaaca tcaaggcatc gagcctgctt gtttggggca ccaatgacac 301 cgccactccc ctttcggacg gcgagaagat ggagaagctg attcccgatg cagggcttgt 361 caaggtgcag ggtgcagggc attactcctt ccttgaagca tccgagcttg tgtcaagggt 421 cgttaagtcg tttttgaaaa ttaattgaac ggagagattt tgagttgata aatctgtttt 481 tggcagtttt agttctgcta tatatcaccg caatggtatt ttcagcaagg cattttattc 541 atatgttcca gctaaattca tataagccga aagtgcaagc taaatggatc tgtaacagtg 601 acaggaaata tttcctgcaa tcaatgattt atttggcctt gggcaccgtt gttccgctga 661 tactgagttt atcttactac ggtaaagatg tggaatgcgt tatgtcgctt cttcacttcg 721 ccgtcatttt cccgctcgtt tcgctgattt actttaccgt cactgcaatt tcaaagcacc 781 ccaaaaagac ctacaaaacg cctttggtat atacagcaag aattaaaaga ctcatcacaa 841 cgttgacttt catctttgtg attttcatcg tcattgacgc ttgtatcgct tttgcgacct 901 tccccaaaga cggagtgctt gacaacgcca taggtgtgcg cgaggtcgtc ttcttcgtaa 961 ccgtacctgc catcccctgc gtatttattt cgctgatgcc gtttgtgatt ttgcttgcaa 1021 acctaatcaa ccgcccgctt gaactcatga tcaaccgcca ttacatcaac gatgcgaaga 1081 ggattttgga gagctgccgc tcgcatcttc gagtcatcgg cattacggga agcttcggca 1141 agaccagtgt gaagtatttc cttgaaacgc tgttgagcgt caaatataat gttcttaaaa 1201 cccccggaaa cttcaacacc cctttgggcg ttgtcaagac tattcgcggt tcgcttcgcg 1261 cgacccacga cattttcctc tgcgagatgg gtgcaaaaaa tgtcggggac atcaaggaga 1321 tttgcgacat tgttcaccct gatatgggta tcatcacctc ggtgggaccg atgcatcttg 1381 aaagctttaa gagtattgaa aacgtaatta aaacgaagtt tgagcttgcc gatgctgtca 1441 gccaaaaggg cggcgaggtt tacgcaaact ttgacaatga atacatcgtc ggtgaatgca 1501 aaaagcgcga agttatccca tatggcattg acgatgtttc gggatatacc gtttcaaatc 1561 tgcacatttc cgagcttggt tcggaattca ccgtgacctc tcccgagggc gaaagctgtg 1621 aataccgcac ccgccttatc ggaaagcaca acgttttgaa cattgtcggt gcgatagctg 1681 ttgcacacag acttggcatt gatttggatg aactaagacc tgctgtgcga aagcttgaaa 1741 gcgtccctca cagactccag ctcattgaca agggtgaata taccattatt gacgatgctt 1801 ataactccaa tccgtccggc acaaaggcgg ctttggagac cctttcgatg accgatggaa 1861 tgaagatctt agtcacaccc ggaatggtcg agctgggcgg aatggaatat gcccttaaca 1921 aggaattcgg cgttgatgcc gcaaaggtct gcgactttgt tgcgcttgtt ggcaaaaaac 1981 agacccagcc gatatatgac ggattgaagt cggttgatta tcccgaggag aagatttacg 2041 ttgcagaaag ccttaacgac gccatggcga aggtttatgg cttgacaagc gggggcaaaa 2101 ggaagataat acttcttgaa aacgatttgc cggataatta ttgagggaag tgagccgacg 2161 acgtcgcacg atgcgccccg caggggctgt gcgtgcggtg gaggaggcgg taaagcagcg 2221 cgacctcaca aaatccaaac accaatccga aaggaactga tatacacatg aaaatcaaac 2281 ttgcacttat ctttggcggc aagagcgttg agcatgagat ctcaattatc tcggcactcc 2341 aggcagctca gagtcttgac cgcgaaaaat atgatgtcat cccattgtac atagccaaaa 2401 gcggcgagat gtattacggt gaaaagaccg gcgatattga agcatataag gacattaaga 2461 agctcatcgc ttcaagccgt caggtaaccc ttgccagaaa cggcgagagg gttgagatca 2521 tcaaatatcc tgtgaagatg tttgaaaagc cttttgtcga ttatattgac gttgcattcc 2581 ctgttgttca cggcacaaat gttgaggacg gcactgttgc gggatacctc aatatgctcg 2641 gcgtgcctta tgtgggatgc gatattctct cctccgcttt gggcatggat aaatacgcga 2701 tgaaggcaat tttcaaggat aacgacattc ctgttttgga ctgtgtcgtt cttagttctg 2761 acgaatttga caaggatgag gatgaatgtg caagacgggt tgagcttgag atcgggtatc 2821 ccgtgatcgt taagcctgtt aacctgggtt caagcgttgg aatctcaaag gcggataatc 2881 acaaaaagct catcagctcc ctcaccgatg ctttccttta ctccaagcgg gttttggttg 2941 aaaaggcaat aacaaacctc accgaaatta actgctcggt tttgggcaac gaccgcaagg 3001 cggaagcctc cgtttgcgag cgtcccatca attcggacga gatcttgtcc tatgaggata 3061 agtatttggg cggttcaaaa tcctcaaaag gtatggcgag cacacagcgc gttatccctg 3121 cggacatttc aaacgagcac accctgctga ttcaggagct tgcagttaag gcatttaagg 3181 ttttgggttg ctgcggtgta tcacgtatcg actttatgat cgacaacgat gcgaacaagg 3241 tttatctcaa cgagatcaac accattcccg gttccctttc attctatctt tgggagccta 3301 agggagttaa gtattcggag cttttggaca gaatgattgc gctggcgctt gaagcgcaca 3361 gagagcgcgc aaagatcacc tatgcatttg acaccaacgt tttggcaggc attaagcttg 3421 gcggcggaac caaaggagcc aagggctcga agatgtaacc attcaaacgc aaaaaatccc 3481 gacacgtatg tgtcgggatt ttattttaat ttgtgcgact aagccgataa gccgagtttt 3541 gtcgtgtacg gc // LOCUS sequence107 3551 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence107 VERSION sequence107 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3551 /mol_type="genomic DNA" /organism="" /note="sequence107" CDS complement(115..597) /product="peptidylprolyl isomerase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966054.1" /transl_table=11 /codon_start=1 /translation="MITIEMENGKKIKLELYPEHAPITVANFTKLVNEHFYDGIIFHRV IKGFMIQGGDPTGTGTGGSKEHIKGEFLSNGVNNTLKHTRGVISMARTSDPDSASSQFF IMHQDAPHLDGQYAAFGKVVEGMDVVDEIASCKTVNNFFYRDRPADEQRIKTITID" /locus_tag="LOCUS_4550" /note="WP_010966054.1 peptidylprolyl isomerase (Clostridium) [pid:63.8%, q_cov:100.0%, s_cov:89.7%, Eval:9.7e-53]" /note="MGA_577" CDS complement(638..1420) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIRRLTALMLAVLMAVCLCACKNNENLPEQTLGTSDSMAQEVVSS VTDTSEAPATDAPALSEDAKTSDSQEEEPEESVTLGEDEEEIFEDYGYRAFEIVSLLNS DKVHAKFSEAVSYDGEYISATENEIYVDGGNRVFVVDNTKIIMSDGIAHAVDFDEMAYY TYEYDPEEYERVFGYALEEYVPISHTEENGKITEVYVIEQYGSTITSTWVFETDGTFTV SEINEQAGSFYVYTFEVVTVDVSGMDMTIPEDFEEFEE" /locus_tag="LOCUS_4560" /note="MGA_578" CDS complement(1486..1881) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTETVIKYVNEKYGVQPEFLWENDFDDGALRHSDTKKWFGIIMMN TKRSVLGLSGDGRVDVMNVKADPFLIERLIDGKGYLPAYHMNKRHWITLLLDGSVDEKA LFALIDKSYELTRKKSIVKAPQRGNKT" /locus_tag="LOCUS_4570" /note="WP_011016732.1 MmcQ/YjbR family DNA-binding protein (Fusobacterium nucleatum) [pid:40.5%, q_cov:88.5%, s_cov:51.8%, Eval:4.5e-22, partial hit]" /note="MGA_579" CDS 2024..3046 /product="stage V sporulation protein AD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003403641.1" /transl_table=11 /codon_start=1 /translation="MARREGKSTILMESDISVSAFSSAVGKKEGESLLKDCFDHIDSDD RFGQDNFELGETAMQGLALEILFQKRGLKDKDFDIIIGGDLTNQCIATGYAVREFQRPY LGIYSACSTVSESMLISALAVESGGAERVAALASSHFCTAERQYRFPLEYGAVRTPTSQ RTATACGAFAIEKGENAPFIRAVTVGKIEDKGILDANNMGAAMAYAAYSTISGFLDDTG KSPDYFDHIITGDLGEVGTNILYELFDRDGRSIRRNHLDCGKMMYENMNDVYSGGSGAG CSSAVMAGHILPQIRDGKLRNVLFAATGALLSVTSVQQNRSIPCISHLVWLSNKGGASG " /locus_tag="LOCUS_4580" /gene="spoVAD" /note="WP_003403641.1 stage V sporulation protein AD (Clostridium) [pid:42.3%, q_cov:97.1%, s_cov:98.8%, Eval:3.6e-71]" /note="MGA_580" CDS 3043..3396 /product="stage V sporulation protein AE" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003403640.1" /transl_table=11 /codon_start=1 /translation="MIYLKAFVVGGLICMVGQVLIDKTKLTPARILTAYVCAGVLLGAL GLYEPLIEFAGAGASVPLTGFGNLLAKGVREAVAEDGFIGIFTGGLKSAAGGITVALVA GLAMAVFFRPRTK" /locus_tag="LOCUS_4590" /gene="spoVAE" /note="WP_003403640.1 stage V sporulation protein AE (Clostridium) [pid:53.8%, q_cov:100.0%, s_cov:99.2%, Eval:5.2e-31]" /note="MGA_581" ORIGIN 1 ccgacccatt tcagggcttc gccctgaaat gggacccccg cgccgcaggc gcggggtgcc 61 cgcaaagcct tgcgggcagg aggcggcgtc gccaaggcac atacgtttgg tttctcagtc 121 aatggttata gtcttaattc tctgctcgtc ggcggggcgg tcacggtaga agaagttatt 181 caccgtcttg caggatgcga tctcgtcaac aacgtccata ccctcaacca ccttgccgaa 241 tgcggcatac tgtccgtcca aatggggtgc atcctgatgc ataataaaga actggctgga 301 tgctgagtcg gggtcgcttg ttctcgccat cgagataacg cctctggtgt gcttaagtgt 361 gttgttaacg ccgtttgaaa ggaattcgcc cttaatgtgc tccttcgagc cgcctgttcc 421 ggtgcctgtg gggtcaccgc cctgaatcat aaagccttta atcacgcggt ggaagatgat 481 tccgtcgtaa aaatgctcgt tgacgagctt ggtgaagttc gcaacggtaa tgggtgcgtg 541 ctcgggataa agctcaagct taattttctt tccgttttcc atttcaattg taatcataat 601 tatattttcc tttctttgct ttaaaaaggc atctgcctta ttcttcaaat tcctcaaaat 661 cctcgggtat ggtcatatcc attcccgaaa catcaacagt tacaacctca aaggtataaa 721 cataaaacga gccggcctgt tcgttgatct ccgaaacggt gaacgttccg tccgtttcaa 781 atacccaggt gctggtaatg gtgctgccat actgctcgat aacataaacc tctgttatct 841 tgccgttctc ttcggtatgg ctgataggga catattcctc gagggcatat ccgaacaccc 901 gttcatattc ctcggggtca tattcatagg tgtagtatgc catttcgtca aaatcaaccg 961 cgtgtgcaat gccgtcggac ataataatct ttgtgttatc aacaacgaag accctgtttc 1021 cgccgtcaac atatatttca ttctccgttg cggatatgta ttcgccgtca tatgacaccg 1081 cttcgctgaa ctttgcgtgg accttgtccg agttgagaag cgaaacgatt tcaaatgctc 1141 tatatccgta atcttcaaaa atctcctctt catcttcgcc gagggtgacc gattcttcag 1201 gctcctcttc ctgcgaatcg cttgtcttgg catcttcgct caaggcaggc gcgtcggttg 1261 caggtgcttc gcttgtgtcg gtaacagatg aaacaacctc ttgtgccatg ctgtccgatg 1321 tgcccaaagt ctgttcgggc agattttcat tatttttgca ggcgcaaagg caaaccgcca 1381 ttaaaaccgc cagcatcagc gccgttaatc ttctaatcac taaacatcac cttcaatgta 1441 aaagtaaaac tgttcaaaat attatactac atttgacacc gattttcaag ttttattgcc 1501 cctttgaggt gccttgacga tactcttttt gcgcgtcaat tcatagcttt tgtcgatcag 1561 cgcaaatagg gctttttcgt caacgcttcc gtcaagcaaa agggttatcc aatgccgctt 1621 gttcatatga tatgcaggaa gatatccttt tccgtcaatc agtcgttcga tcaaaaacgg 1681 gtcggcttta acgttcataa catctacccg tccgtcgccc gaaagcccca aaacgctccg 1741 cttggtgttc atcattataa ttccgaacca ctttttggtg tcactatggc gcaaagcccc 1801 gtcgtcaaaa tcgttttccc aaagaaattc gggctgaacg ccgtattttt cattgacata 1861 tttaattacg gtttcggtca ttgtgagtca cctcgatatt ggttttatct tattatacat 1921 caaacccaac acgaaaacaa gaagccgtgt gcgcctcgcg gaataaattg caaaatgcgg 1981 caaacaatat gcaaagtaaa acaaaaacgg aggcacttaa aaaatggcaa gacgagaggg 2041 caaatcaacc atacttatgg agtcggatat atcggtcagt gcgttttcct cggcggtggg 2101 caaaaaagag ggcgaaagcc ttttgaaaga ttgctttgac cacatcgact cggatgaccg 2161 tttcgggcag gataattttg agttgggcga aaccgcaatg caaggcttgg cgcttgaaat 2221 acttttccag aaaagaggcc ttaaagacaa ggattttgac attataatcg gtggggatct 2281 gacaaatcaa tgcatcgcaa cgggatatgc cgtcagggag tttcagcggc cttatttggg 2341 catttacagc gcctgctcga cagtcagcga aagtatgtta ataagcgcat tggcagttga 2401 atcgggcgga gccgaaagag tcgctgcttt ggcatcatcc cacttttgca ccgccgagag 2461 gcaatatcgc tttccgcttg aatacggcgc ggtgagaacg cccacatccc aaagaacagc 2521 caccgcctgc ggagcctttg cgattgaaaa gggcgaaaac gcgccgttca tcagagcggt 2581 aacggtgggt aagattgagg acaagggtat acttgatgcc aacaatatgg gtgcggcgat 2641 ggcatatgcg gcatattcaa ccataagcgg atttttggat gacacaggca agagccccga 2701 ttattttgac catataatca caggcgactt gggcgaggtg ggaacaaata tactgtatga 2761 gctgtttgac cgcgacggca gaagcatacg gcgaaatcac ctcgattgcg gcaaaatgat 2821 gtatgaaaat atgaacgacg tttattcggg cggctcgggt gctgggtgtt caagtgcggt 2881 aatggcgggg catattttac cacagataag agatggtaaa ctcagaaatg tgctttttgc 2941 ggcgacgggt gcgcttttaa gcgtcacaag tgttcagcaa aaccgaagca tcccctgcat 3001 ctcccatctg gtgtggctgt caaacaaagg aggggcaagc ggatgatata tttaaaagcg 3061 tttgttgtag gcgggctgat atgtatggtc gggcaggtgc tgattgataa aacaaagctg 3121 actcccgcga gaattttaac ggcatatgtc tgtgcaggtg tgcttttggg cgcattggga 3181 ctatatgagc cgctcattga atttgcgggg gcgggggcaa gtgtgccctt gacgggcttt 3241 gggaacctgc tcgccaaggg cgtgcgtgag gcggttgccg aggacggatt catcgggatt 3301 ttcacaggcg ggctgaaatc ggcggcagga ggaatcaccg ttgcacttgt ggcaggcctg 3361 gcgatggctg tattcttcag accgaggacg aagtagtggc acgggtgtgc caatgaagct 3421 tgttatgttg gcggggcgga ggccggcgta acccgaaggg ttgtgccgga ggggacccgc 3481 atatgcacgc ttcggtttta ccgctcgcca ccatcggcgc tgccgcgctt ttcgatgacg 3541 gctcgctccg c // LOCUS sequence108 3546 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence108 VERSION sequence108 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3546 /mol_type="genomic DNA" /organism="" /note="sequence108" CDS 510..1061 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKSKIYYKLMVRIAMVVVLIVAMTVVTYSYAMSVLRVDDNAFTTG LIDIDLNGGLPVVADLKDIEPGATYVREFYIRNNSTDEGGVYYKLYFEDISGIMANILD ITIADRDSGEVLLSGKMNDLTEDRVLAFDDILETGETRWFTVSFHYPIDGDNRGMGTEL LFSLSADAVQTKNNPDKLFE" /locus_tag="LOCUS_4600" /note="MGA_584" CDS 1061..1771 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEKIKKILKIAGDVITLLLVVLAVFMIIFTVISTAVLDESERNFL GYRGFVVLSDSMSATDFDAGDIVFIRSIDPAKLKEGDIISYLSPETGDFITHKIRRLTE TPSGEPGFITYGTTTDTDDKITVTYSMVAGKYQFSLPGIGKILSFVRTGPGYLLTIFTP LTIIVVLQTINTIKLYRQYKAAQLEENREVADVKQETALAESENARIREELEALRAQLR EFVHSETAQEEENQ" /locus_tag="LOCUS_4610" /note="MGA_585" CDS 1768..3546 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNRTEKSIKLNILALAIPALVCVLICSLILSGMTFSWFTDTHASS ANLIKTASFVTSKTVTDSLGVAITPDANGKYSLPAGEYLVTVDASAANTNGYTTMYLGD VPFLQTALLNDSVLNTQVTYTLNVTLTTTPSATITFADSWDYPQAGLTTVSNGLTYNIT ETSVASAAALANMPQTYSFGGVSMIIDPVYGYIYDLNGGIYYDPFNFENYYTLDPVSGN FIHAETGELFNPETGRNIDSETGYEIDPETDYLIDPVSNFLIHPITNRLVYTQTETVTE GDVITEETLLIDVLTAFETDAETGYLIEPLTGRFIHAETMYYVIEESDYLIIPATSYLY NPTLGTYHDPLTYEEVTEEVALGIPADEDLLGGEETEDDEEIDDPEVVEDGNEPIIDEP MIEDPVIDDSEITDDTVVTYSPIDGFVNVPDTLEYQVVPYLVDDMVYGACRMLYNTTDG TYINLTADALLYTDPTTGFFMIPGSAYQLIPVTGYLYDTVYENYLDPTTMLLTTYDVAL GLVVDEVPADDATEGITPVEPEAEVTTTVTEETTTDETSVSESDTTVSETEPAVTSAEV SDTTAETTAEIEAEVA" /locus_tag="LOCUS_4620" /note="MGA_586" ORIGIN 1 tgatcccata tatgacaagc ttgccgaggt attgatgctc aaagtcagtg tcaacggacg 61 ggaaatatac gacggcttga tgaaagactt tggcggccat aacacaggtc tgccctcgtt 121 ctatgaagat ggcattgttc aaagtcttga ataccacatt gaggtatacc ttgacacaag 181 cgtcggcaac gaatatatgc aaaagcccct caagtgtgac tatagctgga ctatctatga 241 gaatatgccc gatcccgttc ctccgggtgg aggcggctcc ggcaacgccg gcgacgatgg 301 cgacaccact gacaaggata atccggttga tgatgacgac aacaaggacg atgtcgaggt 361 tgtaattccc gacgaaagcc atgagaactt tgaaaccttc gtctatatcc ccgagccttg 421 ccgcttcggc atcgcttgtg taatttcctg tgcggcattt ttggtccttc tcgcttcgct 481 catccttatc cgcagaaagg agaatggcct tgaaaagtaa gatctattac aagctgatgg 541 taagaattgc aatggtcgtt gtccttattg ttgccatgac cgttgtgact tacagctacg 601 ctatgagcgt tcttcgggtt gatgataacg ccttcaccac aggtttaatt gatatcgatc 661 tcaacggcgg cttgcccgtt gttgcagatt tgaaggatat cgagccgggc gcgacctatg 721 tcagagagtt ctatatccgc aacaactcca ccgacgaggg cggcgtatac tataagctat 781 attttgaaga tatttcgggc attatggcaa atatcctcga catcacaatt gccgaccgcg 841 acagcggcga ggtgctcctt tcgggcaaga tgaacgacct gaccgaagac cgagttttgg 901 catttgacga tattcttgaa acgggcgaga cccgctggtt taccgtcagc ttccattatc 961 ccattgacgg cgacaaccgc ggaatgggaa ccgagctttt gttcagcctt tctgccgatg 1021 ccgttcagac caagaacaac cccgacaagc tttttgaata gtggaaaaga ttaagaaaat 1081 tttaaaaata gcgggcgatg ttatcaccct gcttcttgtg gtgcttgccg tgtttatgat 1141 tatatttacg gtaatatcca ccgccgtgtt ggacgaatcg gagcgcaact ttttgggata 1201 ccgcggcttt gtggtacttt ccgactcgat gtccgccacc gattttgatg caggcgatat 1261 cgtgttcatc cgctcgatcg accctgcaaa gctgaaagaa ggggacatca tctcatatct 1321 ttcacccgaa acaggcgatt tcatcaccca taaaataaga cggcttaccg aaaccccaag 1381 cggcgagccg ggctttatca cctacggcac cactaccgac accgacgaca agatcacagt 1441 cacctattcg atggttgccg gaaaatatca attcagtctg cccggcatcg gaaagattct 1501 ttcctttgta cggaccggcc cgggatatct acttacgata ttcacgccgc tcacaattat 1561 tgttgtgctg cagacgatca acacaataaa gctctaccgc caatataaag cggcacagct 1621 tgaagaaaac cgtgaggttg cagatgttaa gcaggaaact gcgcttgccg agtcggaaaa 1681 cgcacgtatc cgcgaagaac ttgaagcctt gcgcgcccaa ctaagggaat ttgtgcattc 1741 agaaaccgcc caagaggagg aaaatcagtg aatcgaactg aaaaaagcat aaaactgaat 1801 attttagcgc ttgcgattcc tgctcttgta tgcgtgctta tctgttcgct gatcctttcg 1861 ggaatgacat tcagctggtt taccgatacc cacgcttcgt cggcaaacct catcaagaca 1921 gcatcgtttg tcacctcgaa aacggtaaca gacagccttg gcgttgcgat aacgcccgat 1981 gcaaacggca aatattccct tcctgcaggc gagtaccttg tcaccgttga tgcatcagcc 2041 gccaacacca atggctatac gacgatgtat ctcggcgatg tcccgttctt gcagactgct 2101 cttttgaatg attccgtttt gaacactcaa gtgacatata ccctaaatgt caccttgacg 2161 accaccccct cggcaacgat cacctttgcc gatagttggg attaccccca agcaggttta 2221 acaaccgttt cgaacggttt gacctataat atcaccgaaa cttccgttgc atctgcagcg 2281 gctctggcaa atatgcccca gacctacagc ttcggcggtg tatcaatgat aatcgacccc 2341 gtttacggct atatctatga ccttaacggc ggaatttatt acgacccctt caacttcgaa 2401 aactactata ctcttgaccc tgtcagcggt aattttattc acgctgaaac aggcgagtta 2461 ttcaatcccg aaacaggtag aaatatcgat tcggaaaccg gatatgagat cgaccccgaa 2521 acagattacc tgatcgaccc tgtatcgaac ttcctcatcc accccatcac taaccgactg 2581 gtatataccc aaactgaaac tgtcaccgag ggcgatgtca taaccgagga aacgcttctt 2641 attgacgttc tcaccgcctt tgaaaccgat gccgaaacag gatatttgat tgagccttta 2701 actggcagat ttatccacgc cgaaacgatg tattatgtca tcgaggaaag cgattatctg 2761 atcattcccg caacctcata tctttataac ccgactttgg gaacatacca cgatccgctg 2821 acatatgaag aagtgaccga ggaagttgcg cttggaattc ccgccgatga agatcttttg 2881 ggcggcgagg aaaccgagga cgacgaggaa attgatgacc ccgaagttgt tgaagacggc 2941 aacgaaccca taattgatga acctatgatt gaagatcccg tgattgacga ttctgaaatt 3001 accgacgaca ctgttgtgac ttattctccc attgatggct tcgtcaatgt gcccgacaca 3061 ttggaatatc aggttgtgcc ttatttggtt gatgatatgg tatacggcgc ctgccgaatg 3121 ctttataaca ccaccgacgg cacatatatc aatctcaccg cggatgctct gctctatacc 3181 gatccgacca caggattctt tatgataccc ggctctgcat atcagctcat ccctgtaacg 3241 ggttaccttt acgacacggt atatgaaaac tacctcgacc cgacaacaat gcttttaacg 3301 acatatgacg ttgcgcttgg attggtggtt gacgaagttc ctgcagatga tgcaaccgaa 3361 ggcatcacac ctgttgaacc cgaagctgaa gtgaccacaa ctgtcaccga agaaaccacc 3421 acagatgaaa cttcagtttc cgaatcggac acaaccgttt ccgaaaccga acctgcggta 3481 acatcggctg aagttagcga cacaactgct gaaaccaccg ccgaaatcga agccgaagta 3541 gcataa // LOCUS sequence109 3514 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence109 VERSION sequence109 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3514 /mol_type="genomic DNA" /organism="" /note="sequence109" CDS complement(784..1692) /product="RluA family pseudouridine synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861614.1" /transl_table=11 /codon_start=1 /translation="MNRFEFIADRQDEGERIDKWLTLQDEVDLTRSAVAKLIEGENVLI NGKIAQKSAKLSIGDRVIIEIPDPVDLKVEAQDIPIEIVYEDDDVVIVNKPQGMVVHPA AGNPDGTLVNALLYKCQGKLSSINGVIRPGIVHRIDKNTSGLLIVCKNDKAHLHVSEQI KAHTFTREYEAICVGRFKEKSGTVNAPIGRDKVDRKKMCVTPTNSKEAITHYEVLEELG NYSYMRFKLETGRTHQIRVHCAYLGHPILGDDVYGKPYKGCKGQTLHARKIGFIHPSTG EYLEFTSDLPDYFTKLLNSLR" /locus_tag="LOCUS_4630" /note="WP_011861614.1 RluA family pseudouridine synthase (Clostridioides difficile) [pid:53.7%, q_cov:98.7%, s_cov:98.3%, Eval:3.2e-84]" /note="MGA_588" CDS complement(1679..2263) /product="signal peptidase II" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011475977.1" /transl_table=11 /codon_start=1 /translation="MLILCLCLIVALILEDQLIKLYIVNNIRECTGFIDRYYTFRIGNF DIFSITHIRNDGAGFSILEGKTAFLLVFTFIVMAGITAYICWKRKSLHRIEMLCLSMIV AGGIGNFIDRVRMVIEPNFNGVIDYIKLEFISFPIFNFADICVCVGAFGYCIYVIVAEI KQQKLKNAQKVSETEKSSETADNTESENEQI" /locus_tag="LOCUS_4640" /gene="lspA" /EC_number="3.4.23.36" /note="WP_011475977.1 signal peptidase II (Ligilactobacillus salivarius) [pid:37.5%, q_cov:82.5%, s_cov:94.6%, Eval:2.0e-20]" /note="MGA_589" misc_feature complement(2338..>3514) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012546193.1:isoleucine--tRNA ligase" /note="WP_012546193.1 isoleucine--tRNA ligase (Thermodesulfovibrio yellowstonii) [pid:49.7%, q_cov:100.0%, s_cov:41.1%, Eval:2.6e-103, partial hit]" /note="MGA_590" /locus_tag="LOCUS_4650" ORIGIN 1 cttcttttat cgcatcctga tcgcaggtgg cctttaaaat gacatcggct gtattaagga 61 cacattcctg tgaaacggaa ggacaaaagc ttatatcaga tgctttaagc atctcaatat 121 cgttatcata gtctcctgct gtaaaaacca tgcaggattt aagaccgtaa aggtctttaa 181 gcacctcaac ggcactgcct tttgaaacat cagcaggcaa aacctccaaa aatttggaga 241 ggcttcttac aaatctcaga cctaagctgt taaacttctt aacatattcg caaagttcgt 301 caattacagc atcttcgtca gcaaacaaaa gcttgcagat cggctcattt atatcatcaa 361 cactctcgca tttgataaat tcaaaaccca aaagcgattg atgccagcgc tcggtgtcgt 421 tcatacggag ataatgctga ccgctgacag tgtatacctc cggagcaact gtcgggaaac 481 ggtcataaat ctcgcggaca atatctttag cggtagcagg cagatatttt gcccaaataa 541 tctttctttc atatgggtca taaatcattg cgccgttgca aataatcatc ggaagatcgt 601 aatgcacctg gtcaatataa gtaccgacag tttgaatagg tctgcccgtt gcaacgcaga 661 attttccgcc caaatgctga tattcattga ttgcatcaat atttccctga gttaggcgtt 721 tgtcggttgt caatagagta ccgtcaaagt ctgaaacaaa aattgtgttg gtaagatcca 781 tttttacctc agtgaattta atagttttgt gaaataatcg ggcaaatcac tggtaaattc 841 cagatattcc cccgttgacg ggtggatgaa accgatttta cgtgcgtgaa gggtttgacc 901 tttacatcct ttgtaaggct tgccgtaaac atcatcaccc aaaatcgggt ggcctaaata 961 tgcacagtgg acacgaatct ggtgagtcct gcccgtttca agcttaaaac gcatataaga 1021 gtagttacca agctcttcaa gcacctcata gtgagtaata gcttcctttg aattggtggg 1081 tgtgacacac attttcttgc gatcaacctt atctcgtcct atcggtgcat tgacagttcc 1141 tgatttttcc ttgaatctgc cgacgcatat cgcttcatat tcacgtgtaa aggtgtgcgc 1201 ctttatttgc tcggaaacgt gaagatgggc tttgtcattc ttgcaaacga tcaaaagacc 1261 gcttgtgttc ttatcaattc ggtggacaat accgggacgg ataactccgt tgatgcttga 1321 aagcttgcct tggcacttat atagcaaagc gttaaccaat gtgccgtcgg gatttcctgc 1381 cgcgggatgg acgaccatac cttgcggctt gttgacgatt acaacatcgt catcctcata 1441 aacaatctca atcggaatat cctgtgcctc gactttcaaa tcaacagggt cgggtatctc 1501 aattatgaca cgatccccta ttgataactt ggcgctcttc tgagcgattt tgccgttaat 1561 aaggacgttt tcaccttcaa tcaactttgc aactgccgag cgtgtcagat caacctcatc 1621 ctgcaaagtc aaccatttgt caatacgttc gccctcatcc tgcctatcgg cgatgaactc 1681 aaatctgttc attttcggac tccgtattgt cagctgtttc agaagatttt tcagtttctg 1741 agactttctg tgcattcttc aacttttgct gcttaatttc tgctacgata acataaatgc 1801 aatagccgaa agcaccgaca catacgcaga tatcagcaaa gttgaaaatc gggaagctga 1861 tgaattcaag cttaatatag tcgataacgc cgttaaaatt aggctcaata accattctta 1921 cgcggtcgat aaagtttccg atcccgcccg caacgatcat tgaaagacag agcatttcaa 1981 ttctgtgcaa gctcttgcgt ttccagcaga tgtatgctgt gatacctgcc atcacaataa 2041 atgtgaagac aagcaagaat gcagtcttac cttcaagaat actaaaacct gctccgtcgt 2101 tgcgaatgtg ggtgatgctg aaaatatcaa aatttccgat tcggaaggtg taatatctgt 2161 cgataaaacc tgtgcattct cttatattgt taacaatata cagcttgatc agctgatctt 2221 caagaattaa agccactatc aagcataagc agagtatcag catttattaa cctccgaact 2281 tgaaaacaag ccgattgccg cagttaagcg gcaatcaagc aatgagtatt tataatttta 2341 cttaacggtg tgtgcgcatc ttgagcaaag tgtaggatgc tcatcatccg taccgactgt 2401 atcggaatag atccagcagc gttcgcactt ctcgccgctt gcctttgcaa catcaaagcc 2461 aaggccggtt gtttcacctg taaactcggc ttcgccgcca tttacaacct caacgcgtga 2521 tacgatgaat actgcaggca agatatcctt aacagcgcaa agtctgtcat agtcagcgcc 2581 acttgcgtgg atgaccatat cagcttcgag agaagaaccg attaccttgt cagcacgctt 2641 aagctcaagt gccttctttg catcaactct aagattatag ataaattccc acttggaaac 2701 gaactctgta tcgaaatcgt gtccagaaac cttaggcata tcgttaagga agatgcttct 2761 ggggtcatcc ttcttggaat gaggaatata tgaccaaatt tcatcagcgg taaacgacaa 2821 aataggggca acgagtcttg caattgcaga gagaatggta tacataacag tctgcgcact 2881 gcgtctgagc tcgctgtcag gtgcttcaca gtaaagtctg tccttaataa tgtcaaggta 2941 gaagttggac atatcaatta cgcagaagtt gtgaatagcg tggaatacaa tgtggaaatc 3001 aaagttgtta taagcttcgt tgaccttgtt gataaggtta tcgagcttca tgattgccca 3061 cttgtcaagc tcgggcatat tttcaaatgc aacagcatcg gtgtcaatat taaagccgcc 3121 ctggttgcag atgttaccca agatatatct tgcggtgttt ctgatctttt tatatgcttc 3181 agaaagctga gcgatgattg ccttggaaac acggatgtcg gagtgataat cgctggatgc 3241 tacccaaagt ctcaaaatgt cagcaccgtt cttatcatag atctcctttg gctcaatacc 3301 gttgcccaag gacttgtgca tggtcttgcc ttcgccgtca acgacccaac cgtgagtgca 3361 tacagcctta tagggggcct tgccgctgac aacaacgctt gtcaaaagtg aagactggaa 3421 ccagcctctg tactggtcgg caccttcaag ataaagatca gcaggtgagc aaacaccgtc 3481 acgctggtcc aaaacagctg tatgggtaac gccc // LOCUS sequence110 3504 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence110 VERSION sequence110 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3504 /mol_type="genomic DNA" /organism="" /note="sequence110" misc_feature <1..729 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011459675.1:ABC transporter ATP-binding protein" /note="WP_011459675.1 ABC transporter ATP-binding protein (Desulfitobacterium hafniense) [pid:65.4%, q_cov:99.2%, s_cov:41.0%, Eval:2.2e-84, partial hit]" /note="MGA_591" /locus_tag="LOCUS_4660" CDS complement(1035..2015) /product="diaminopimelate dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005808153.1" /transl_table=11 /codon_start=1 /translation="MKIGIYGYGNLGRGVENAISKNSDAKLMAVFTRRDPATLKIQTEG VPVVSVNDIEKWSDKIDVMIICGGSATDLPEMTPALAKHFNVIDSYDNHSSIPTHFANV DKSAKESGKLALISCGWDPGMFSIMRLYGNAVLPNGNDYTFWGRGVSQGHSDAIRRIEG VIDARQYTVPVEEVVNAVRAGSRDEYTTRQKHTRECYVVAEEGADLERIRNEIVTMPAY FEPYDTTVHFITLEELKRDHMGLPHGGSVIRTGATGVNNEHKQVVEYKLTLDSNPEFTG SVLVAFARAIDKMARRGEIGCKTVFDIAPANLLAISHEEIVAHLL" /locus_tag="LOCUS_4670" /EC_number="1.4.1.16" /note="WP_005808153.1 diaminopimelate dehydrogenase (Desulfitobacterium) [pid:57.1%, q_cov:100.0%, s_cov:99.1%, Eval:7.9e-108]" /note="MGA_592" CDS 2237..2530 /product="YerC/YecD family TrpR-related protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965963.1" /transl_table=11 /codon_start=1 /translation="MSENNDMALVKLAKAFSCIHSEEESIKFLTDILSIKEIKEISQRL EVAKMLKSGMVYTEISTKTGASTATISRVNRALNYGEGGYEIILSRLSEDKA" /locus_tag="LOCUS_4680" /note="WP_010965963.1 YerC/YecD family TrpR-related protein (Clostridium) [pid:55.4%, q_cov:85.6%, s_cov:84.7%, Eval:7.9e-19]" /note="MGA_593" CDS 2527..3258 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNYILKNGEQEMLLLRELYEAWGYSHFKMSKFEEYDLYAKNKDFL LSGNILTFTDPNGKLMALKPDVTISIIKNSSDESENLEKVYYNENVYRAESGSFKEIMQ TGLECIGKIDLFSICEVITLAAKSLERFSENYVLDISHMGILGEILDDIDADEETRQEI IGCIEKKSLHELDAVCKDMGEDAKKKLSNLILLDSDPEKGLDELKAICENSKAIKELER IIKVLENENTKLKEDNQYGFM" /locus_tag="LOCUS_4690" /note="MGA_594" ORIGIN 1 gatattgaat ttgaaaacgt cagcttccac tatggcaacg aagaggagaa ggaagtttta 61 acaaacctct cgatgaagat cgagcaaggc aagaccgttg cacttgtcgg cccatcgggc 121 ggcggaaaga ccaccatttg caatctcatc ccccgattct atgaaattga cgagggaaaa 181 atctccatcg acggagtgga catccgcgat gttaaaagac tcagtttgcg ccgacatatc 241 ggtattgttt cgcaggatgt attcctgttt aacggcacaa ttcgcgaaaa cattgcctac 301 ggcaagagag atgcaaccga cgaggaaatt gccgaagccg caaagaaggc aaacatttat 361 gactatgtga tgacccttga aaagggcttt gacacacagg tcggcgagcg cggtgttacc 421 ctttcgggag gacagaagca gcgaatctcc attgcacgag tattccttaa aaacccgtcc 481 attctcattt tggacgaagc gaccagtgcc ctcgacaatg caaccgaagt tcagattcag 541 gcggctcttg aggagctttc aaagggcaga actgttttgg ttgttgctca cagactttca 601 accgttaaga acgccgatga gatcatcgta attacacaaa acggaattga agaacgcggc 661 acccatgacc agcttttggc gatggacgag ggcatttata aggaattgta tcagtatcag 721 ctcagatgat ggagcgagcc gtggctgaca cgccgatgcg atgaaattgc atcggaagtg 781 gcctgccgtg acgagcggta caatgcccac tcagtcagct tcgctgacag ctctcccgta 841 ggaagatcct tcgaaaattg cacatttaaa aaaggaacag acaaagagtc tgttccttgt 901 gtttttatgg gcggggcgga ggccgacgtt cgccgcaggc ggaagacgga ggggacccgc 961 gattagcgag cgacgtctgg cggattgcgt tgccgtcaag caacagtatc cggcaggtga 1021 agcgagcggt aggatcacag caaatgtgcc acgatctcct catgggaaat tgccaacaga 1081 ttggcagggg cgatgtcaaa tacggttttg cagccgattt cgccgcgacg cgccatcttg 1141 tcgatggctc ttgcgaatgc aacaagcacc gagcctgtga attcggggtt tgaatcaaga 1201 gtcagtttat attcaacaac ctgtttatgt tcgttgttga cgcctgttgc gcctgtgcga 1261 atgacacttc cgccgtgagg aagtcccata tggtcacgtt tgagttcttc aagtgtgata 1321 aaatgaacgg tggtatcgta aggctcgaaa tatgcaggca ttgtaacgat ctcgttacgg 1381 atacgctcaa ggtcggcacc ttcttcagcg acgacgtagc actctcttgt atgcttctgg 1441 cgggtggtat attcatcgcg ggagcctgca cggacagcgt ttacaacttc ctcgacaggg 1501 acagtatact gtcttgcatc gataacacct tcaattcggc gaatagcgtc cgagtggcct 1561 tggcttactc ccctgcccca gaaggtatag tcgttgccat tgggaagaac tgcattgcca 1621 tatagacgca taatcgagaa cattccggga tcccatccgc aagagataag ggcaagcttg 1681 cccgattctt tggcggattt atccacattg gcaaagtgtg tgggaatgct tgagtggtta 1741 tcatatgagt cgataacgtt gaagtgcttg gcaagtgcag gggtcatctc gggcaggtcg 1801 gttgcagagc cgccgcaaat tatcataaca tctattttat cggaccattt ttcaatatcg 1861 ttaacagata caacgggcac tccctcagtt tgaattttga gggttgcggg atcacgtctt 1921 gtgaataccg ccataagttt agcatcagaa ttctttgaga tcgcgttttc aacgcctctg 1981 ccaaggtttc cgtagccgta aataccaatt ttcatataca gtacctcctt gtggatctat 2041 agcatatatt atcacacttt tttgaaaatt tcaatttaca ttttagttac atttatgctt 2101 ttattcatta ttacaataag tcacttagat taacagtggg atttatacag tattacttct 2161 tgactttagc acgataacgt gctaatatgt tattgtgata aagatttaca ttgtcaaacc 2221 actcggaggt gcaaaaatgt ctgaaaacaa cgatatggca ttagttaagc ttgccaaggc 2281 attctcgtgt attcattcgg aagaagagag cataaaattt ttaactgata tactttctat 2341 taaagagatt aaagaaattt cccagcgtct tgaggttgca aagatgctta aatcgggaat 2401 ggtatataca gaaatatcta ccaaaacggg agcttcaact gcaaccataa gccgagttaa 2461 ccgtgcctta aactatggcg agggcggata tgagataatt ctttcaagac tttcggagga 2521 taaggcgtga attatatttt aaaaaacggc gagcaggaaa tgcttttgct ccgcgagctt 2581 tatgaggctt ggggatattc tcattttaag atgagcaaat ttgaagagta tgacctgtat 2641 gccaaaaaca aagacttcct tttaagcgga aatattttga cctttaccga cccaaacggc 2701 aaactgatgg ctttgaagcc tgacgtcact atatctatta tcaagaattc gtcggatgaa 2761 tcggagaatc ttgaaaaggt ctattataat gaaaatgttt acagagctga atcgggcagc 2821 tttaaggaga ttatgcagac aggacttgag tgcatcggca aaattgacct tttcagcatt 2881 tgcgaggtta taacccttgc ggcgaagagc cttgagcgat tcagcgagaa ttatgttctt 2941 gatatatccc atatgggaat tttgggcgag atacttgatg atattgatgc agacgaggaa 3001 acccgtcagg agataatcgg atgcattgag aaaaagagcc tgcacgagct ggatgctgtc 3061 tgcaaggata tgggcgaaga tgcaaagaaa aagctctcta atctcatctt gcttgacagc 3121 gacccggaaa aagggcttga tgaactcaag gcgatctgcg aaaacagcaa ggcaattaag 3181 gagcttgaga gaataatcaa ggtgcttgaa aatgagaata caaagctaaa agaggataat 3241 caatacggat ttatgtagta attattgcct ggagatgtat gatcttttcc acatgctgat 3301 atgtcgcggt atttgtgacg cttgccgcaa aacaagccgt agcaacggct gccgctatac 3361 agtaacaaca ttttgctacc actccgccaa tatttggggt ggtagaggcc gcaagttcaa 3421 gtcttgtcac tcagaccaaa atcggaggtt caaccgaacc tccgattttc ttttattttc 3481 tcgctaaatc tcttgaaatc ttgc // LOCUS sequence111 3491 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence111 VERSION sequence111 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3491 /mol_type="genomic DNA" /organism="" /note="sequence111" CDS 108..965 /product="energy-coupling factor transporter ATPase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435660.1" /transl_table=11 /codon_start=1 /translation="MEKFIELKNVSFSYTNEYDEKPIKTEVIKNLSMTVNKGEFVAVLG HNGSGKSTLAKLMNAINLPESGEVLINGMDTRKEENLYNIRRTVGMVFQNPDNQIVATV VEEDVAFALENIGVEPEKIRESVDDALKTVGMYNYREHAPHKLSGGQKQRVAIAGVIAM QPDCIVLDEPTAMLDPIGRREIMKTIKKLNDMGVTIVLITHYMDEAAQAKRVVVMDYGK IILDDEPKKVFSQVEKLKSVGLDVPQVTELTHMLIDSGLSLPRDIITEEECVDELYKLL RKAD" /locus_tag="LOCUS_4700" /note="WP_003435660.1 energy-coupling factor transporter ATPase (Clostridioides difficile) [pid:57.3%, q_cov:98.2%, s_cov:100.0%, Eval:2.1e-90]" /note="MGA_596" CDS 968..1822 /product="energy-coupling factor transporter ATPase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966382.1" /transl_table=11 /codon_start=1 /translation="MAIIKTENLSYVYGEGTPFRKVAIDNINLEIEEGELVGIIGHTGS GKSTLIQHFNGLLKPTSGKVYIDGEELFADKSHLRDIRFKVGLVFQYPEYQLFEETVYK DIAFGPKNMGLDEAEIDRRVRETAALVGLKPEVLDKSPFDLSGGQKRRVAIAGVMAMEP KVLILDEPTAGLDPHGRDRILGLIKEYHREKGNTVMLVSHSMEDVAKTVSKILVMNDSS VFMYDTPERVFAHSEELRKMGLTVPQITRVFDRLKEMGIDVSDEVYSVKYAKELILKML GKK" /locus_tag="LOCUS_4710" /EC_number="3.6.3.-" /note="WP_010966382.1 energy-coupling factor transporter ATPase (Clostridium) [pid:57.7%, q_cov:97.9%, s_cov:97.6%, Eval:1.1e-83]" /note="MGA_597" CDS 1833..2666 /product="energy-coupling factor transporter transmembrane protein EcfT" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357319.1" /transl_table=11 /codon_start=1 /translation="MIKDITIGQYFPGKSVIHRLDPRIKILLTALYIVMLFLPNGFLGL GLGAIYLIIAFLLSGIPVKMMLKSIKPILPIIIFTGLLNLFFLDGGTVLLSLGFIKVTS EGIHTMLFMAIRIIFLICGTSLLTYTTSPITLTDAIERILSPLQKIKIPAHEIAMMMTI ALRFIPTLIEETDKIMSAQKARGADLESGSFLQRAKALVPILIPLFVSAFRRAEELALA MECRCYHGGEGRTRMRQLKTTRLDYISIAFTALFIASIIALNIANLSLFNGLIRL" /locus_tag="LOCUS_4720" /note="WP_003357319.1 energy-coupling factor transporter transmembrane protein EcfT (Clostridium botulinum) [pid:56.1%, q_cov:92.1%, s_cov:95.5%, Eval:1.2e-79]" /note="MGA_598" CDS 2663..3397 /product="tRNA pseudouridine(38-40) synthase TruA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435654.1" /transl_table=11 /codon_start=1 /translation="MTNYKVTIAYRGTAYHGFQIQEDVQTVQGVVEDAIYKLIGERVTI NGCSRTDAGVHANEFVFNVSLDSTINERGIIYGLNGVLPPDIAVLSCEIANDGFHARYD CRGKEYVYIIHNSEIKSPFYADTAYRSWYPIDAEKLNTACKDFIGTHDFKSFCATACDK EITVRTIYDFKVEREGDLVKFTVSGDGFLYNMVRIMVGTLLFINDGKLAADSIPEIISS LDRTRAGKTVPPQGLYLNKVYY" /locus_tag="LOCUS_4730" /gene="truA" /EC_number="5.4.99.12" /note="WP_003435654.1 tRNA pseudouridine(38-40) synthase TruA (Clostridioides difficile) [pid:42.9%, q_cov:100.0%, s_cov:100.0%, Eval:3.5e-53]" /note="MGA_599" ORIGIN 1 tcaaaataaa ttcggcggaa ctgtcagtgc cgatgaaatc ggtttacctg tggaggaaag 61 taaaatgcct ttacccgcag gcagcaccgc tatgtggatt ggataaaatg gaaaaattca 121 ttgaacttaa aaatgtcagc ttttcatata ccaacgagta tgacgaaaag ccaatcaaaa 181 ccgaggtcat caaaaacctc tcaatgaccg taaataaagg cgaattcgtt gctgttttgg 241 gtcacaacgg ctcaggcaaa tcaacccttg caaaactgat gaatgcaatc aatctgcccg 301 aatcgggcga agtgctgata aacggtatgg atacccgtaa agaagaaaac ctttacaaca 361 tccgccgcac tgtcggtatg gttttccaga atcccgacaa ccagatcgtt gccaccgttg 421 tcgaagagga tgttgcattt gctcttgaaa acatcggtgt tgagcctgaa aagattcgag 481 aatctgttga tgatgccctc aaaactgtcg gaatgtataa ctatcgcgag cacgcaccgc 541 ataagctctc gggcggacag aaacagcgtg tcgctatcgc cggcgtaatt gcaatgcaac 601 ccgattgtat tgttctggac gagcccactg cgatgcttga ccctatcggc aggcgtgaga 661 taatgaaaac cattaaaaag ctcaacgata tgggtgtcac aattgtttta atcactcact 721 atatggatga ggcggcgcag gctaagcgtg ttgttgtaat ggattatggc aagataatcc 781 ttgatgacga accgaaaaag gtattctctc aagttgaaaa gctcaaatcg gtggggcttg 841 acgttccgca ggtcaccgag cttacccata tgcttattga ttctgggctt tcgctccctc 901 gtgacatcat tacagaggaa gaatgtgtcg atgagctata taagctttta agaaaggctg 961 actgactttg gcaataatta aaacggaaaa tttaagctat gtttacggag agggcacgcc 1021 tttccgcaaa gtagcaattg ataatatcaa ccttgaaatc gaagaagggg agcttgttgg 1081 cattatcggt catacaggct cgggaaaatc cacccttatt cagcatttta acggtttgct 1141 caagcccaca tcgggcaagg tatatatcga cggcgaggag ctttttgccg ataaatccca 1201 cttgcgcgat atccgcttca aggtgggtct tgtgttccaa tatcccgaat atcagctatt 1261 cgaggaaact gtatataaag acatcgcctt cggccctaaa aacatgggac ttgacgaagc 1321 cgagatcgac cgccgcgtgc gtgaaaccgc cgcacttgtc ggcttaaagc cggaagtgct 1381 cgataaatct cccttcgatt tgtccggcgg acagaaacgc cgtgttgcaa ttgcgggtgt 1441 aatggcaatg gagcctaagg ttctcatatt ggacgagccc accgctgggc ttgaccccca 1501 cggcagagat cgaattttgg gacttataaa ggaatatcac cgcgaaaagg gcaacaccgt 1561 aatgctcgtt tcccattcga tggaagatgt cgccaagacc gtttcaaaga ttctcgttat 1621 gaacgactca agcgtgttta tgtatgacac ccctgagcgg gtctttgccc attcggaaga 1681 gcttcgcaag atgggcttaa ctgtccctca aatcacccgt gtctttgacc gtctcaagga 1741 aatgggaatt gatgtaagcg atgaggttta ttctgttaag tatgcaaaag agcttatttt 1801 aaagatgcta ggcaaaaagt gaggttaaaa tcttgattaa agatatcacc atcggtcagt 1861 atttcccggg aaaatcggtt attcaccgcc ttgacccccg cataaaaata cttctgaccg 1921 ctttatatat agtaatgctc ttccttccca acggcttttt gggcttgggt ctgggagcaa 1981 tatatcttat catcgcgttt ttgctttcgg gcatccctgt taaaatgatg ctcaaaagca 2041 ttaagccgat tctgcccatc ataatcttta cgggactatt aaatctgttt ttcctcgatg 2101 gaggaacagt gctcctgagc ctcggtttta tcaaagtgac ctctgaaggt atacacacga 2161 tgctgtttat ggcaataaga atcatttttc tcatctgtgg aacatccttg ttgacctata 2221 ccacctcgcc gattaccctt accgatgcca tcgagcgaat tctttctcct ttgcaaaaga 2281 ttaagattcc cgctcatgaa attgcaatga tgatgaccat tgctctgcga tttattccca 2341 cccttattga ggaaacggat aaaataatgt ctgcccaaaa ggctcgcggt gccgaccttg 2401 aatcgggttc tttcttacaa cgcgcaaagg cactcgtccc aattttgatt cctttgtttg 2461 tttctgcatt tcgacgcgcc gaggagcttg ctcttgcaat ggaatgtcgc tgttatcatg 2521 gcggagaggg cagaacacgt atgcgccagc ttaaaaccac aagacttgat tacatttcta 2581 ttgcttttac cgctttgttc attgcgtcga tcattgcttt gaacattgca aacttatcac 2641 tatttaacgg actgatcaga ttatgaccaa ctataaagtg actattgcct atcgcggaac 2701 tgcatatcac ggcttccaga tacaggagga tgtccaaact gtacaaggcg ttgttgagga 2761 tgcgatatat aaacttatcg gtgaacgtgt gacaattaac ggctgttcac gcaccgatgc 2821 gggcgttcac gcaaatgagt ttgtgttcaa tgtttcactt gattccacca tcaacgagcg 2881 cggaataatt tatggcttaa acggtgtttt gccgcctgat atcgcggttt tatcatgtga 2941 gatcgcaaat gacggctttc acgcccgata tgattgtcgc ggcaaggaat atgtctatat 3001 tatccacaac agcgaaatta aatctccttt ctatgctgat accgcataca gaagctggta 3061 tccgattgat gccgaaaagc tgaataccgc ctgcaaggat ttcatcggta ctcacgactt 3121 caaatccttc tgcgctaccg cctgcgataa agagataacc gtccgcacca tatacgactt 3181 caaggtcgaa agggaagggg accttgttaa atttactgtt tcgggcgacg gcttcttgta 3241 taatatggta cgcataatgg ttggaaccct tttgttcatc aacgacggca aattggctgc 3301 cgattcaatt cccgaaatca tttcgagcct tgatcgcacc cgtgcaggta aaaccgtgcc 3361 accacaggga ctctatttaa ataaagttta ctactgatta taattggagg tgtaatatgt 3421 cctctgttaa ttcctttgaa acggatatgc gaaagcttcg ccgcagaaga aaaaacaaac 3481 gcatacttaa a // LOCUS sequence112 3490 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence112 VERSION sequence112 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3490 /mol_type="genomic DNA" /organism="" /note="sequence112" misc_feature <1..541 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002681109.1:SLC13 family permease" /note="WP_002681109.1 SLC13 family permease (Treponema denticola) [pid:53.3%, q_cov:100.0%, s_cov:39.7%, Eval:2.5e-45, partial hit]" /note="MGA_601" /locus_tag="LOCUS_4740" CDS 694..1605 /product="aldo/keto reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_041466227.1" /transl_table=11 /codon_start=1 /translation="METRKLGNTDLHLSRVGFGCASAWGKTFYKEEDAINLFFDAYDAG INYYDTGHSYGHAEVRLGKCLAMLGSEKRKDLVISTKCGTRVDDNGHYYKDWSVDWLKR SLETSLDRLNTDYIDMLNLHSPDLPEISDEVWCLLEDFKKQKLVSAVGVSCLDDKGNEL AVNNTALDFIMVSYNLFEQHKEDVIKSLYESGKGVIAGTPLAKTLFSNDVFKVKDIKDI WYLLRALANNRGYIKKGLKCRYINHAENMSGNQIALKYVLDNPYITSAVFGTTSREHLL ENVGALDITIPDDILAKIKSMK" /locus_tag="LOCUS_4750" /note="WP_041466227.1 aldo/keto reductase (Chlorobaculum parvum) [pid:25.7%, q_cov:99.3%, s_cov:97.8%, Eval:2.0e-22]" /note="MGA_602" CDS 1809..3170 /product="Trk system potassium transporter TrkA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948929.1" /transl_table=11 /codon_start=1 /translation="MHIVIIGGGTVGSAICSQLAREGHDITVVDRDFAVLRELSNTNDV FGVVGGGADVATLKKAEVDKADLVIAVTSSDEINILCCSASKKLGAKHTVARVRNPEYT DLMQLLRNDMNLSLTINPELAAAKEVYRMLKFPAAAKIDTFFRGRVELAQFVVSKDSPL CGVTLNDLRNKLNIRFLVCGVLRNGEAHIPTGFFKIEAGDTVCVTAPDEEITRFFKAIG AYKNPVKNVLIVGGGRMTYYLQYFLEKSKINSTVIEKDPVLCQELAQAYDCTVINDSGT KQDLLLEENLEDTDAFLALSNVDEENAIVSMFAKSKNSRKVVTLISSISYLELFKGVGL DSIVSPKSSTASFILKFVRSLTNARGSEIESLHRVMDDKVEAIEFSIKENISGITDIPL KDLGPKLKQGVLIACILHNNKVIIPTGNDIISNGDTVIVVTAESQIKGIKEILK" /locus_tag="LOCUS_4760" /gene="trkA" /note="WP_011948929.1 Trk system potassium transporter TrkA (Clostridium botulinum) [pid:39.4%, q_cov:100.0%, s_cov:98.9%, Eval:5.0e-101]" /note="MGA_603" ORIGIN 1 cattgtttat aatttcatca agaacaagaa tcttgaagct gttgtcggtc ccctcaaggc 61 tatcgacttt gaaaccctcg gccttttgac cggtctgttc ttaatgatcg gcggcatctc 121 aaacatgggt gttatcgacg cggctgcagg tcttttggca aaggcaggcg gcggaaacat 181 cttcctgctc tataccgtaa tcgtttgggc gtcggtactt atctccgcgt tcattgataa 241 cattccttac gttgcaacaa tgatccccgt aatcggcggc cttgcggcac agctggctcc 301 cggtatgggt gttgatccca cgttgatcgc aattccccta tacttcggct tgctttccgg 361 cgcaaccctt ggcggtaact gcacacctat cggtgccagc gcaaacatta caggtatcgg 421 aatccttcgc cgcgagggat atgaggttaa gaacagcgac ttcttcaaga tcggtattcc 481 cttcaccttt gccgcgatca ttcccgcata tatctatatt tggcttatct acggagtttg 541 atatttcaaa aacctgccca ctctcggcaa ttgtcggggg tgggattttt tgcggaattt 601 ttcagccttg ccgttgtgat cttcggataa tcttgacatt acagtgacga tatgtcaaaa 661 tatagatata atctttaagg cggtaaatga catatggaaa cacgtaagct tggaaatacc 721 gatctgcatt tatcaagagt cggcttcgga tgcgcaagtg cctggggtaa gactttttat 781 aaagaggagg atgcaattaa tctcttcttc gatgcatacg atgcaggcat caactattat 841 gacaccggcc actcatacgg acacgcagaa gtgcgtttgg gcaagtgttt agcaatgctc 901 ggaagcgaaa agcgcaagga cttggtcatt tcgacaaagt gcggaacccg agttgacgac 961 aacggccatt attataaaga ctggagcgtt gactggctga agcgaagcct tgaaacaagc 1021 cttgatcgcc ttaataccga ttatattgat atgctcaacc tgcacagccc cgatcttccc 1081 gaaatttccg acgaagtttg gtgcttgctt gaagacttca aaaagcaaaa gctggtatcg 1141 gcagtcggcg taagctgtct ggacgacaaa ggaaacgagc ttgcagtcaa caataccgcc 1201 ctcgatttca taatggtttc atacaacctg tttgagcagc ataaagagga tgttattaaa 1261 tcgctttacg aaagcggcaa gggcgtaatt gcgggcacgc ccctggcaaa gacccttttc 1321 tcgaacgacg tgtttaaggt taaagatatc aaagacatct ggtatctttt aagagctctt 1381 gcaaacaacc gcggatacat taaaaagggc ttgaagtgca gatatatcaa tcatgcagag 1441 aatatgagcg gcaaccagat cgccctcaaa tatgttctgg ataacccata tatcacatct 1501 gctgttttcg gcaccaccag ccgcgagcat cttttggaaa atgtcggtgc gctggatatt 1561 acgattcccg atgacatact tgcaaagatt aaaagtatga aataaagaca caaagcaaac 1621 actcccgacg gatagtcagg ggtgttttta ttgttataag ttttactttt aactgcaagc 1681 ctgtatcgaa aactgcttaa tgccgcagaa aatctcctac ttgcaaagaa cgcggataag 1741 tgatatgatt taaatagata tacacttttg ttattaagct tttatttatc tcaaaggaga 1801 tgttatttat gcatatagtc atcattggcg gaggcaccgt cggctcggca atctgttcgc 1861 agcttgcaag agagggacat gacattaccg ttgttgaccg cgactttgcc gttttgaggg 1921 agctttcaaa caccaacgat gttttcggcg ttgtgggagg cggagcggat gttgcgacct 1981 tgaaaaaagc ggaagttgac aaggcagacc ttgtcatcgc tgtaacatca tcggacgaaa 2041 taaatattct ttgctgttca gcatccaaaa agcttggcgc aaagcacacc gttgcgcgtg 2101 ttcgaaaccc tgaatatacc gaccttatgc agcttttgag aaacgatatg aacctgtcgc 2161 tgacaataaa ccccgagctt gccgctgcaa aagaggttta cagaatgctc aaatttcccg 2221 ctgctgcgaa aattgacacc ttcttcagag gaagagttga gctggcgcag tttgttgtat 2281 cgaaggattc gcccctctgc ggagttaccc ttaacgatct gagaaacaag ctgaatatcc 2341 gcttccttgt atgcggagtt ttgagaaacg gcgaggctca cattcccacc ggcttcttca 2401 aaattgaagc aggtgatacc gtttgcgtca ccgcgcccga cgaggaaatt acccgtttct 2461 tcaaggcaat tggagcatat aaaaacccgg tcaagaatgt gctgattgtc ggtggcggaa 2521 gaatgacata ttatctgcaa tacttccttg aaaagagcaa gataaattca accgtaattg 2581 aaaaggaccc cgtactttgt caagaactgg cgcaagcata tgactgcacc gttattaacg 2641 acagcggcac caagcaagac ctgcttttgg aggaaaacct cgaagatact gacgcctttt 2701 tggcactttc caacgtagac gaagaaaacg ccattgtctc aatgtttgca aaatccaaaa 2761 attcccgcaa ggttgtcact cttataagct caatctcata tcttgagctt ttcaagggtg 2821 tgggacttga cagcatcgtt tctccaaagt cgtcaaccgc ttccttcatt ttgaagtttg 2881 tccgctcgct gacaaatgct cgcggctcgg aaatcgaatc gcttcacagg gttatggacg 2941 acaaggttga agcaattgaa ttttcaatta aggagaacat ctcgggaatc accgacatcc 3001 cccttaaaga ccttggcccc aagctgaagc agggtgtttt gatcgcttgc atacttcaca 3061 acaacaaggt aatcattccc acaggtaacg acatcatcag caatggcgac accgtaatcg 3121 tcgtcaccgc tgagagtcag attaaaggaa ttaaagagat tttgaaataa tgaattacag 3181 aatgcttgga taccttttga gtatcgtttt gcttattgaa gcggcgcttt tgttgcttcc 3241 catgggcatt gcgctcatat atggcgatag cccgttgcct ttcatattta caattgctcc 3301 gcttattgct gctgcattgc ccagcgtgat catgaaaccg aaaaacacca gaattttcgc 3361 aaaagaaggc ttcgtctgcg ttgcaatggc ttggatctta ctctccgcct tcggagcgct 3421 tccctttgtc ttttcgggca caattacaaa ctatttcgac gctttctttg agaccgtttc 3481 gggatttacc // LOCUS sequence113 3474 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence113 VERSION sequence113 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3474 /mol_type="genomic DNA" /organism="" /note="sequence113" CDS 171..914 /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_007051244.1" /transl_table=11 /codon_start=1 /translation="MAIIEVKDLKKTYRLGNEKVYALKKINLSVEKGEICCVLGTSGSG KSTLLNMLAGLEKPTRGSVKICGTEITSLSEKKLAKFRQENLGFIFQSYNLLNQLTALE NVSMPLMFKGVAKKRRENTAAKMLKNVGLADRMKHKPNQMSGGQQQRVGIARAFVTKPK VIFADEPTGNLDSHTTDDVMRLMVEMCRKHGLTLVLVTHDLGISAYADKIVHIIDGEIT SVESNISKYDPQKNNAERTDDNNEK" /locus_tag="LOCUS_4770" /note="WP_007051244.1 ABC transporter ATP-binding protein (Bifidobacterium longum) [pid:58.4%, q_cov:97.2%, s_cov:96.8%, Eval:3.3e-75]" /note="MGA_605" CDS 904..2679 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNRILALAVALMLALSCLSLNIFATESEGTIPDPYAWLNKNGVA ITNYSVDRDYIMAGDHFTLSFVISNTTGAYLGDVKATLPGLDSSKFLIDGGFTYKTVSI SNGAYAVVGFDLIACEGISAIRETVTVAAEYVLPDGSEGLISSDVILNCEPLSVETIPT TSLDLTVTDYKVSSDRIRPDRVFTLTIYVENSGDEDIDKARINVMNLDGHKFAVNKGLT YQDFSISAGETKKISFELVGCDGISSTREVLPIELIYGDFSDTIYCTLSCKPTEQTQAD EEQVFAPNIIITGYDFGGEFVTAGSKFPLTITFENASNDATIENLKITINGASSSIDGG IAFSAANSANSFFFEKLDTKASNSVTLEMNAKSDATPNSYPIDISFSYEYTANGKRYQA STVRETINVPLQQEDRLVVNEPYYPNWVVYVGESCYVSTSLVNMGKSGVYNVTASIVGE GFTMNETSYYIGNIESGREEYYDTEIYPSQAGEINCEIVITYEDANGNAKEKRLPFTVS AQEMYFEDVYYEEPIIDEPIYEEEPSSSSWLNLPQWAWYAIGGSALVVLIIIIITVSVK KKKARFEVDEDDEDI" /locus_tag="LOCUS_4780" /note="WP_005810017.1 hypothetical protein (Desulfitobacterium hafniense) [pid:24.9%, q_cov:69.9%, s_cov:46.9%, Eval:1.1e-26, partial hit]" /note="MGA_606" ORIGIN 1 ctgcctgcct tttttctcgg cgggcagttg tttttaacaa aaaatgtgct ataatttaga 61 caagtataca aagttttaaa tatcaacaaa attttacaaa taaatgcaat attttacaca 121 tagaaaatgt ataattgatt aaggaaacta actgccggga ggtgataggc ttggcgataa 181 ttgaagttaa ggacttaaag aaaacgtaca ggctgggaaa cgaaaaggtg tacgccctta 241 aaaagataaa tttgagcgtt gaaaagggcg agatatgctg tgtgctggga acatccggct 301 cgggcaaatc gacacttttg aatatgcttg cggggcttga aaaacccacc cgcgggtctg 361 ttaaaatatg cggtaccgag ataacctcgc tttccgagaa gaagctcgca aaattccgac 421 aggaaaacct gggattcatc ttccagtcat ataacctttt gaatcagctt acggcgctgg 481 aaaatgtgtc aatgccgctg atgtttaagg gcgttgcgaa aaaacgccgt gagaataccg 541 ccgcgaagat gcttaaaaac gtgggccttg ctgaccgaat gaagcacaag ccaaatcaga 601 tgtcgggcgg acagcaacag cgcgtgggta ttgccagagc gtttgtcacc aaacccaagg 661 tgatttttgc cgatgagccg acgggcaacc tcgactccca cacaactgac gatgttatgc 721 gtttgatggt tgaaatgtgc cgcaaacatg ggcttaccct tgttttggtc acccacgacc 781 tcggcatcag cgcttatgct gacaaaattg tacatataat cgacggtgag atcaccagcg 841 tcgaatcaaa tatctcaaaa tatgaccccc agaagaataa cgcagagagg accgatgata 901 acaatgaaaa ataggatttt ggctttggcc gttgcactta tgcttgcttt aagctgtttg 961 agcttgaata ttttcgcaac agaatcggaa ggcacaattc ccgaccctta cgcctggctt 1021 aacaaaaacg gcgttgcaat taccaactat agcgttgacc gcgactatat catggcgggc 1081 gaccacttca cgctgagttt tgttatttcc aacaccaccg gcgcatacct cggtgacgtt 1141 aaggcgactt tgcccggcct tgattcatcg aagtttttga ttgacggcgg atttacatat 1201 aagaccgtca gcatttcaaa cggcgcatat gccgttgtcg gcttcgacct tatcgcctgc 1261 gaaggaatca gcgcgattcg cgaaacggtt accgttgccg ctgaatatgt tcttcccgac 1321 ggaagcgagg gacttatttc aagcgatgtc attttgaact gtgagccttt aagcgttgaa 1381 acaattccca ccacctcgct ggatttgacc gttaccgact ataaggtcag ctcggacaga 1441 atccgtcccg acagagtttt caccctgact atttatgttg aaaactcggg cgatgaggac 1501 attgacaagg cgcgaatcaa cgttatgaac cttgacggac acaagtttgc ggtcaacaag 1561 ggacttacat atcaggattt cagcattagc gcaggcgaaa caaagaagat ctcctttgag 1621 cttgtcggat gcgacggaat ttcttccacc cgcgaggttc tgccgattga gcttatttac 1681 ggcgacttca gcgatacgat ctattgcact ctttcctgca agcccaccga gcagacacag 1741 gccgacgaag agcaggtatt tgcccccaac attatcatta cgggatatga cttcggcggc 1801 gaatttgtca ccgcaggttc gaaatttccc cttaccatca cctttgagaa cgcttcaaac 1861 gatgcaacca tcgaaaacct caagatcact ataaacggtg catcttcatc aattgacgga 1921 ggcattgcat tctctgctgc aaactcggca aacagcttct tctttgaaaa gctggataca 1981 aaggcatcca acagcgtgac ccttgaaatg aacgccaagt cggatgctac ccccaacagc 2041 tatcccattg atatttcctt ctcatatgaa tacaccgcaa acggcaagcg ttatcaggca 2101 agcaccgtaa gggaaaccat taacgtacct cttcagcagg aggacagact cgttgtgaac 2161 gagccttatt atcccaactg ggtcgtatat gtcggtgaga gctgctatgt ttccaccagc 2221 cttgtaaata tgggcaagag cggagtatat aatgtcacag catccattgt cggcgaaggt 2281 ttcacaatga acgaaacctc atattacatc ggcaatatcg agtcgggcag ggaagagtat 2341 tacgatactg aaatttaccc ctctcaggcg ggcgagatca actgcgagat cgtcatcaca 2401 tatgaagatg ccaacggaaa cgcaaaggaa aagcgtttgc ccttcaccgt tagtgcgcag 2461 gaaatgtatt ttgaagatgt ttactatgaa gaacccatca tcgacgagcc gatatatgaa 2521 gaagagcctt cttcctcaag ctggctgaat cttcctcagt gggcttggta tgcaatcggc 2581 ggctcggctt tggttgttct cataatcatc attatcaccg ttagcgtcaa gaagaaaaag 2641 gcgcgttttg aggtcgacga agacgatgaa gatatttgat atcattaaaa tggcctttag 2701 aaatctgtgg cgaagaaagg gcagaacaat gctcaccgtt atcggtgttg taatcggttc 2761 ctgcgccgta atcgtcatga tttccttggg tctgggtatg aatcttgcca tggacaatat 2821 gcttgcttca tggggagatc tgaccgcaat tacaatatat aattacagct atggcggaaa 2881 taccgacaca gttcctttgg acgacacggc agttgaatca attaagacga ttgagaatgt 2941 gtcgtatgtc atcccgcgac taagggtcga atcaaatatg gtgaccatat gtgcgggcaa 3001 aaacgaccgt taccgaatgg actggtgcga gatttacggt gttgattttg ccttgctgga 3061 taaaatgggc tattctcccg aaacgggcga attcccgagc gaggatgaat attcccgcac 3121 ggtaattttc ggcaacgaaa cggcatataa cttccgcgac acccgcaagc gcggcgacaa 3181 ggcatacacc tggaagcaat atttgagcga cggcacctat actctgccgt tcatcgatcc 3241 gcaggacgaa aagataaccc ttggaatcaa caacaccaag cagactgacg acgaaggtta 3301 ttatcagttt ggcggcaggg gatatgaata tgagctgacc tgttcgaccg tattgcagca 3361 ggaccccaac tgggaaacgg tatatagcgt tttggtggat attgatgtcg ccaaggagat 3421 tattgaggat tataaccgcc gtaacggcgt taaggatgca agcgaccctc agta // LOCUS sequence114 3450 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence114 VERSION sequence114 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3450 /mol_type="genomic DNA" /organism="" /note="sequence114" CDS 444..2201 /product="arginine--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003020254.1" /transl_table=11 /codon_start=1 /translation="MKKITTTLSGIVSEAFEKCGYDPKLGSVSVSDRMDLCQFQCNGAF AGAKLYRKAPFMIANDVKAVLESNEIFSKVEVANPGFLNLTLTDAYLVDYLNGIISDEH CGIPQAEVEETIVLDYGGPNVAKPLHIGHLRSAIIGEAIKRIARATGRKVVGDVHLGDW GTPMGLVISEYMVRYPDWACFKPDFDPEKDEIMLLDVTELNEIYPFASAKSKEDEDFKA KAHEVTALLQKKHPGYYALWKEIVKVSVADAKKSYDKLGVSFDLWYGESDADDYIDELV EILTDKGLLYESDGAMVVDVEEETDKITIPPVIIKKADGSNIYATTDLATIIQRKKDFD PDRIWYLTDKRQALHFTQVFRCAKKADIVGDDVEFKHLGFGTMNGSDGKPFKTRDGGVM RLSDLIQTATDGAYDKLADSEYVTGDKREYAQKIGVAAIKFGDLSNHPTKDYVFDLDKF LSFDGKTGTYLLYTVTRINSILKKAGLGYEDKANVGGVYTDIERELILALILSGDSYER AFEEMNPAALCDSAYNLATIFSRFYHDNHILNEADEAKKQSWLALSLLTRRMLTGLLDT LAIEYVENM" /locus_tag="LOCUS_4790" /gene="argS" /EC_number="6.1.1.19" /note="WP_003020254.1 arginine--tRNA ligase (Francisella tularensis) [pid:42.9%, q_cov:99.5%, s_cov:99.7%, Eval:9.8e-132]" /note="MGA_609" CDS complement(2297..3004) /product="SDR family oxidoreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583993.1" /transl_table=11 /codon_start=1 /translation="MNKTVLVTGTSQGLGLAFCKELISRGYKVIALDLKRSNELLALEG DMLQFVECDISDLESVKRAGKSADAETLDYIINNAGVWLEKRKPLDDADFEQEYDAMRK MFEVNSLGVLRIVREFMPRLLKGKSKKVLNVSSEAGSIGSCWRKSEYGYCMSKAAQNMA TKIMSNAYKADGVKFYAVHPGWLISPMGFASATDVDVPGDKPEYSARVFVDLLEGENKE GIYYDFHGNEMPW" /locus_tag="LOCUS_4800" /note="WP_012583993.1 SDR family oxidoreductase (Dictyoglomus turgidum) [pid:37.8%, q_cov:99.6%, s_cov:99.1%, Eval:1.2e-34]" /note="MGA_610" ORIGIN 1 cgacattgcg cggtagttgg aaatctcata accttcgatc tcgggcaagg tcatttcaaa 61 gccgactgca ctaaatgctt catcggcgtt ggtgtaatcc ttccaagggt taccaattgt 121 cattgcgccc tccgaaatct cctcatccga cggctcaagc atctcttcgg gcacgctgtc 181 aaagttgttg tccacagatg ggtcagctgt gttgtcggca caggcacaga gcattgctac 241 gctaagaagt ccgcaaagaa tgaataagat gatttttctc attttatgtc actttccttt 301 cattatataa tacaaccaag tcgataattt aattgcatta tacagctaaa tcccgaaaaa 361 tgcaaatggc tattgcgaaa aggaaatttt tatgatatga tacataattg attacaacac 421 tactaaaaat aaagagggat ataatgaaaa aaattaccac caccctttcg ggcatcgttt 481 ccgaagcctt tgaaaaatgc ggatatgacc ccaagttggg ttcagtttcc gtatccgacc 541 gaatggacct ttgccaattc cagtgcaacg gtgcgttcgc aggcgcaaag ctatatagga 601 aagctccttt catgattgca aacgacgtta aggctgtttt ggaatctaat gagatttttt 661 caaaggttga ggttgcgaac cccggatttt taaacctgac tttaacagat gcttaccttg 721 ttgattacct caacggcatt atttcggacg agcactgcgg tattccccag gcagaggtag 781 aggagaccat tgtcctcgac tacggcggac ccaatgttgc aaagcctttg catatcggac 841 atctgcgttc ggcaatcatc ggcgaagcaa ttaagcgaat tgcaagagca acaggccgca 901 aggtcgtagg cgacgttcac ctcggtgact ggggcacacc tatgggtctg gtcatcagtg 961 aatatatggt tcgctacccc gattgggctt gcttcaagcc cgatttcgac cccgaaaagg 1021 acgaaatcat gcttttggat gtaaccgagc ttaacgaaat ttaccccttt gcaagcgcaa 1081 agagcaagga agatgaggac ttcaaggcca aggcccacga ggtcaccgca cttttgcaga 1141 agaagcaccc cggatactat gcactctgga aggagatcgt gaaggtttcc gtggcagatg 1201 caaagaagag ctatgacaaa ttgggcgttt cctttgacct ttggtatggc gagagcgatg 1261 cagacgacta cattgatgag ttggttgaaa ttttgaccga caagggtctt ttgtatgaat 1321 cggacggcgc tatggttgtc gacgttgaag aagaaaccga caagatcacc attccccctg 1381 tcattatcaa aaaggctgac ggctcgaata tttacgctac caccgacctt gctaccatta 1441 ttcagcgcaa aaaggacttt gaccccgaca gaatctggta tttgaccgac aagcgccagg 1501 cgcttcactt cactcaggtg ttccgctgcg cgaagaaggc tgatatcgta ggcgatgatg 1561 ttgaatttaa gcacctcggc ttcggcacca tgaacggctc ggacggcaaa cccttcaaga 1621 cccgtgacgg cggagttatg cgactgagcg accttattca gaccgctacc gacggcgctt 1681 acgataagct ggccgattca gaatatgtca caggcgataa gcgcgaatat gcgcagaaga 1741 tcggcgttgc cgcaatcaag ttcggcgacc tttcaaacca ccccaccaag gactatgtat 1801 ttgaccttga caagttcctc tcattcgacg gcaaaaccgg cacatatttg ctttacaccg 1861 tcacccgaat caactcgatc cttaaaaagg cgggcttggg atatgaggac aaggcaaacg 1921 tcggcggagt atataccgac attgagcgtg agctgatttt ggcgttaatc ctctcgggcg 1981 actcttatga gcgcgcattt gaggagatga atcccgcggc gctctgcgac tcggcatata 2041 accttgcaac catcttctcg aggttctatc acgacaacca cattctcaat gaggctgacg 2101 aagccaaaaa gcagagctgg ctggcacttt ctttgctgac cagaagaatg ctcacagggc 2161 ttttggacac cttggcaatt gaatatgttg aaaatatgta aaaaacaggc ggccttacgg 2221 tcgcctgttt tatattcaag aggcttgctt atcatcactt cagccgtcaa agcaagctgc 2281 aaaatcggtt tttccttcac cacggcattt cgttgccgtg aaaatcgtaa taaataccct 2341 ctttgttctc accttcgagc aggtcaacaa aaacccttgc cgaatactcg ggcttgtcac 2401 cgggtacatc aacatctgtt gcacttgcaa agcccattgg cgaaataagc catccgggat 2461 gaaccgcata gaatttcaca ccgtcagctt tataagcatt gctcatgatc tttgttgcca 2521 tattctgagc ggccttggac atacagtagc catactcgct cttgcgccag caagagccga 2581 tcgagcctgc ttcggaagaa acattgagca cctttttgct cttgcctttc aaaagtctgg 2641 gcataaactc tctgacaata cgcagaacac cgagggaatt tacctcgaac attttgcgca 2701 ttgcatcata ttcctgttcg aaatcggcat catccaaagg cttgcgcttt tcaagccaaa 2761 cgccggcatt gttgatgata tagtcaagag tttcggcatc ggcagatttt cctgctcgct 2821 taactgactc caaatcggaa atatcgcact caacaaactg aagcatatcg ccttcaagcg 2881 ccaaaagctc attgcttcgc ttcaagtcaa gtgcaatgac tttgtatccc cttgaaataa 2941 gctccttgca aaaggcaagt cccaagccct gcgatgtacc tgttaccaaa accgttttat 3001 tcattgttac tccttaaaaa tcattcaaaa tacttcctgt cgaggcttct gtatctcacg 3061 gcctgggtga tatgctggcg gtcgatgaca cgggcgccgt ccatatcagc aattgttctt 3121 gcgaccttta aaatcttgtc gtatgctctg gcggaaagac ccaggcgttc aaaaacatct 3181 ttaagcttca aatttgccgc gtcggtcaga gggcagacat cacgcaagat atccgaggtg 3241 attcttgcat tgcaggaaat cttcgtgccc ttaaaacgtt ggttttgaat ctcacgggca 3301 cgcattacac gttcgcgcac ctgagcactc gattcctctt tttgagagga cgacaggctt 3361 tcatattcaa cgggagcgac ctcgatatgc agatcaaatc ggtcgagaag cggtccggaa 3421 attcgagaaa gatactgcgc aacctgcttc // LOCUS sequence115 3428 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence115 VERSION sequence115 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3428 /mol_type="genomic DNA" /organism="" /note="sequence115" CDS complement(1229..1807) /product="electron transport complex subunit RsxA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003419046.1" /transl_table=11 /codon_start=1 /translation="MTVFLEVLLAAFASITLENVIFNSAVGTSTLIECAKKPRQMFSFG LFLSVFSILASIITFFVEPLMSNDRILQRFIPSLYILSLGVVYVITLLFIWKVVNKKFK YLSRFVHLTAFNCASLGCLFMNDLSSGTLSDRVIFALSIGLGFMLATYLLSINYKRLVS SEVPIAFRGFPVTVLYIGIISMLIYACNM" /locus_tag="LOCUS_4810" /gene="rsxA" /note="WP_003419046.1 electron transport complex subunit RsxA (Clostridioides) [pid:29.3%, q_cov:92.7%, s_cov:93.2%, Eval:1.7e-13]" /note="MGA_613" CDS complement(1804..2424) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDDLRKTNLSNSVKEGFLTGNALLSSGVIIAPAVVAATDLMSAVC LAIVFTVVTYVTVALCSFVPKKVVYTARIIIYTFLASLVYVPVAILLETIMPETMTAVG IYAPLLITNSFITSKSELKFYRHERKNMLVLLAFYVLGYDTALILFGAMRGLLISGSVL GIKLLNFPLPSLSSVYGGFIFLAVSSALYRGIMRYVIRKGNAQ" /locus_tag="LOCUS_4820" /note="MGA_614" CDS complement(2417..3427) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTIDLMAFYYYGLRAVIVTLVAVVSAVLTDYICCAIMKRKFDWYD PSPAMSEILLALLMPASVPYPIMAFSCIFMVAVAKYAFGGNRNLIFSPVAVTYAFSSIT WSQYIMRYPIPEPFGNVPLDNIVTDNLVHSFTYMLDNSTAGTFSLLDIVWGKLAGPMGT SAVLIILISGVALYLFGDIEPTVFFTGIAANVLLNVLFPGNIIGWEAFLYSLVTGSYMF TLVFMAGDRRFVPKHELAQFLYALTVAVAAFLFRRFTIIENGAVFGLMFAGLMRDEFDR WSLSIHNLGLKLNAKIIDKHNASKSARDARRNSIDAAKAEMSSPESSEKEEKANG" /locus_tag="LOCUS_4830" /note="MGA_615" ORIGIN 1 ttacattgtc aacatcgtat ccgattgatt cgagcgccga gaagatttcg ggaaccgtta 61 aatcggatct gacagccgct actgttttta gccctgaatt tgcaagagca gtattcacca 121 gacgatagac ctgggcgatt ttatagtcct cagtcaagcc ctcaaaggat acaacgctac 181 cgtcagcttt ttcaactcgg ccgccgatac ttgcgccatc gtatttgaca tagagagtct 241 ttgcgttgag taaggctgtg tcacttaaaa gctcacattc acccgagatg atatcctcgg 301 catcgacctc aatggcataa agctttgcag agccgagagt atctccaaga tagtttgaga 361 agccgataag cgcttcatat cttttgggat ttttgtcgat ctcgccgata tatccaaggt 421 ccttgtttct gaaaggcggg aaatcaaact cgcctgcgat tattcccaca aagcctgcat 481 cggaaatctc tgtaacaaag gatgaaatat attccttcgc gctgtcgctg aatggggata 541 tccaaggctt tccgccgttg gcaagggagt tatcaagcca tttgcttgag ccatcttcaa 601 aaagatagca gagtgaacgg tcaaaccaag aggcgatatg gtcgctcaag gctgaaatgc 661 gggcatatgg caaaagctca gaatctgtta tcagcgaaac gcaggtcaaa aggtcgatgg 721 gtgtttttga caccgcctcc gacttgattg cggttctgtt ttgggtatta tacattacct 781 tgccgccctc ggcaacaagg tcaaggcaga tgcctttaca gttttgagca gtagcttttt 841 caatcgctct ttcaagctga gcgacataat cctcgccgtc agcgaaggat acatataata 901 taccattctt aattattatc ggctcggtgg tgacaggcgg ctgtgtggca atctcatcag 961 gtgtggtggt cgtttgcgta tcgctgacat cagcagatac atcgggatca tcatcctcat 1021 tgggcaaggg gtcattcacc gcgggaacac ttccctctcg gttatcaaaa aactccatta 1081 tcggcttgcc gatgctatat cccaaaaaga tgagcacagc cacaattatc aaggtcaaaa 1141 tgacattaag ggcagattga gccggtgtgc gctttttctt gaaaagcggt ttttgttttc 1201 ttctattaaa ggacaaacct gtgcctcctt acatattgca agcatagata agcattgaga 1261 ttattccgat atagagaacg gttacaggga atcctctgaa tgcgattggg acctcgcttg 1321 aaaccagacg cttatagtta attgaaagca ggtatgttgc aagcataaaa ccgaggccga 1381 ttgacaaagc aaatatcact ctgtccgaaa gtgttcccga gctgagatca ttcatgaaca 1441 aacagcccaa ggatgcacag ttgaacgcag ttaagtggac aaagcggctt agatatttga 1501 atttcttatt tacaactttc caaatgaaca aaagggtgat aacgtataca acgcccaagg 1561 aaagaatata caaagacggg ataaatcttt gcagaattct gtcgttcgac atcaagggtt 1621 caacaaaaaa tgtgataatg ctggccaaaa ttgagaatac ggacagaaac agaccgaatg 1681 aaaacatctg tctgggcttt ttcgcgcact caatcaaggt ggatgttccg acagcagaat 1741 tgaaaattac attttcaagg gttatcgagg cgaacgccgc caataaaact tcaagaaaaa 1801 ctgtcactgt gcattcccct ttctgattac atagcgcatg attcctctat acaacgcaga 1861 agaaaccgca aggaaaatga agccaccgta tacacttgag agcgagggca gagggaaatt 1921 aagcaacttg attcccaaga cgcttccgct gatcaataag ccacgcattg caccgaatag 1981 gataagggcg gtatcgtagc caagaacata aaatgccaga aggacaagca tatttttgcg 2041 ctcgtggcga tagaacttaa gctccgattt tgaggtgata aaggagtttg ttatgagcaa 2101 aggagcatag attcccacag cggtcatagt ttcgggcata attgtttcca aaagaatcgc 2161 cacgggtaca tacactaaag aagccaaaaa ggtatatatt ataatacggg cggtgtatac 2221 aacttttttg ggtacaaacg agcagagcgc aacagtcaca tatgttacaa ccgtgaaaac 2281 gattgcaagg caaactgcgg acataagatc tgttgcggca acgaccgcag gcgcaattat 2341 tacgcccgag gacaaaagcg catttcctgt taagaagccc tctttgacgg aattggataa 2401 gttggttttt cttaaatcat ccattggctt tttcctcctt ttcggaagat tcgggcgagg 2461 acatctcagc ctttgcggca tcaatgctgt ttcttcttgc atcgcgggcg gattttgacg 2521 cattatgttt atcaattatc tttgcattga gcttgagtcc gagattatga atcgacaatg 2581 accaacggtc aaattcatca cgcataagac ctgcaaacat caagccgaaa acagcaccgt 2641 tttcaattat ggtaaatctg cggaacaaga aggctgcaac cgcaaccgtc aaggcataga 2701 ggaactgtgc cagctcatgc ttgggcacaa agcggcgatc tcctgccatg aaaacaaggg 2761 tgaacatata tgaaccggtc acgagggagt ataaaaatgc ttcccaaccg atgatatttc 2821 ccgggaaaag aacgtttaaa aggacattcg cggcgatgcc tgtgaagaaa actgtaggct 2881 caatgtcgcc gaaaagatag agcgcaacac cgctgatgag aataattaaa acagcagagg 2941 tgcccatagg ccctgcaagc ttgccccaga cgatgtcaag gagcgagaag gtgccggcag 3001 tactgttatc cagcatatat gtaaaggaat gaaccaaatt atcggtcacg atattatcga 3061 gcgggacatt tccgaatggc tcgggaatgg gatagcgcat gatatattgg ctccatgtga 3121 tggagctgaa agcataagta accgcaacgg ggctgaagat aaggttgcgg ttgcctccga 3181 aagcatattt cgccacagcg accatgaata tacagctgaa agccatgatg ggataaggca 3241 ccgacgcagg cattaagaga gccagcaaaa tttcagacat ggcaggagat gggtcatacc 3301 agtcgaactt gcgcttcatt attgcacagc agatataatc ggttaaaact gcagaaacaa 3361 ctgcaaccag cgttacgatc acggcgcgca agccgtaata atagaatgcc atcaggtcga 3421 tggtcaaa // LOCUS sequence116 3423 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence116 VERSION sequence116 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3423 /mol_type="genomic DNA" /organism="" /note="sequence116" CDS complement(189..1043) /product="AraC family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965896.1" /transl_table=11 /codon_start=1 /translation="MMFLNNMYEFVPLSAEVICHYKKTYGYQTYKYHRHNGYEVYLFLD GNIRFYRESNCYNLSAGDMLIIPPGTAHRIDSLDNGYYERIVLNVKRSAFERISSEKSD LLSCFDISSQNTNPIHLNTEDCQKIILLSQNLSNAISSEEFGSDILADSYLTQLLLCVN QYSLGNRVSKPNIMPKVVKEVMKYIDANLAGDLSLTRLSEVFYLNSTYISQLLKKHTGF TAREYILDQRIECAKKLLMGGNNVSEACYKSGFADYSNFIRTFTKAVGMSPGKFARESR DNR" /locus_tag="LOCUS_4840" /note="WP_010965896.1 AraC family transcriptional regulator (Clostridium) [pid:28.9%, q_cov:88.0%, s_cov:88.0%, Eval:6.7e-33]" /note="MGA_616" CDS 1171..1377 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKFLSLIIALLMVFALVGCGSNKREIVKLTLSTEDSEAILAAAG ITLPDAEETLVLHQRYKLVYRYC" /locus_tag="LOCUS_4850" /note="MGA_617" CDS 1334..1867 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFFIRGTSWFTDTVENVSAIYGDIAAGELMFVPLPRDAMGDGKYY IEAVTSGYALINGAENPEGVALLASCERFKAVDPTVVSIDRRQLEETYLWTDEMLEMYD HCVDLANSMGADTIVDYSYGMGDALYSAVNSLKSQTRKATPVTWAQGKEKYSETINYYL EELNASIDEYIESH" /locus_tag="LOCUS_4860" /note="MGA_618" ORIGIN 1 aagcacccac agttacctaa tgaccttcaa gatgctcgct actgtgagct ttgcttaggt 61 gatagctctc taagggaaat atcctttcca tatgtaatct acataaaaat gaaaacagca 121 tccgtaaggg tgctgttttt gtttttgtga ggattttcgt taattggaca gtttttgttt 181 gtttttgttc acctattatc tctgctctcc cttgcaaact tcccgggaga cattccgaca 241 gcctttgtaa atgttctgat aaagttggag taatcggcaa agcccgattt atagcacgcc 301 tctgaaacat tatttccgcc cataagcagt ttctttgcac attctatcct ctgatcgaga 361 atatattctc ttgctgtaaa gcccgtatgc ttcttgagaa gctggctgat atatgtggag 421 ttgagataaa aaacctccga cagtctggtc aagctaagat cgcctgcaag gttggcgtca 481 atatatttca taacctcctt gacgaccttc ggcatgatat tgggcttgct gacacggttg 541 ccaaggctat attgatttac acacagcaag agctgagtca aatagctgtc agcaagaatg 601 tccgaaccga attcttccga tgatatagca ttgctcaagt tttgagaaag caatatgatt 661 ttctgacaat cctccgtatt caaatgtatg gggttggtgt tttgggaact gatatcaaag 721 caggaaagga gatccgactt ttcgctggat attctctcaa aagcagagcg cttcacattt 781 aatactattc tttcatagta tccgttatcc aagctgtcga ttctatgggc ggtgcccggc 841 ggaatgataa gcatatcccc tgcgctcaaa ttatagcagt ttgactcccg atagaaacgg 901 atatttccgt caagaaacag atacacctca tagccgttgt gacggtgata cttatatgtc 961 tgatagccat atgtcttctt atagtggcaa atgacctcag cacttagcgg aacaaattca 1021 tacatattat tcaaaaacat caccccaaaa catctttgat tacattataa tcaaaatatg 1081 cgattttgca atactttcag gccaaaacgc aaattttgtt gcacattctc gtgatataat 1141 attataaaat ctacaacgga gggcgaaaaa atgaaaaagt ttttatcact cataatcgct 1201 ttgctgatgg ttttcgcttt ggttggttgc ggttccaaca aaagagagat cgttaagctc 1261 actctttcca ccgaagactc tgaagcaatc cttgcagcag caggtattac cctgcccgat 1321 gcagaagaaa ctcttgttct tcatcagagg tacaagctgg tttaccgata ctgttgaaaa 1381 cgtttctgct atttacggcg acattgcagc aggcgagctt atgtttgtcc ccttgcccag 1441 agatgcaatg ggcgacggca aatattacat tgaagctgtc acatcgggtt atgcacttat 1501 caacggtgca gaaaaccccg agggcgttgc tctgcttgct tcctgcgaac gcttcaaggc 1561 agttgacccg acagtagtat ccatcgaccg ccgtcagctt gaagaaacat atctttggac 1621 agacgaaatg cttgaaatgt atgaccattg tgttgatctt gcaaacagca tgggggccga 1681 caccatcgtt gactatagct acggaatggg cgacgcgctt tattcggcag taaattctct 1741 gaagtctcag acaagaaaag cgactcccgt gacttgggca cagggcaagg aaaagtattc 1801 cgaaacaatc aattattatc ttgaagagct taatgcaagc atcgacgagt acatagagtc 1861 acactaaaat aagtttccct tggtgttaaa ccgccaaggg aaatttgcta tttgcaagaa 1921 atatatattt aaatgcaatt ttaataaggt aattttgtgc tataatgtaa tcatatacta 1981 aacactcaga ggtaatgtta tgaaacggtt aatttgtgct ttatttgcat tgataatggc 2041 aatgtccgcc tgcgttaccg tgtatgctgc tgacacagtg aagatcgata tggatacaac 2101 atatcagact attgacggtt tcggcgctgc gtatacgtgg tattccgaaa gacttttgaa 2161 tcataacaac aaagaggctc tgttggatga gatattcatt aactgcaact ttaacattat 2221 gcgctttatt cacctgcagg agaataagac aagacctacc acgatggaat cctacaagga 2281 gtattacgat gctgcagttg agcgcggaat cgatcctttg atattgatta cacattgcgg 2341 agcatacgtc acgggatatg aattcagcga atttgtcagg gacatatatt ccggcacaac 2401 attctatgct ctgaaaaagg atgaaaacgg cgaatatatg tatgacgttt ttgccgagca 2461 ttgtgttaat gctgtaaaag aatttttgga tgtgggcatt cctgttcatt atttcacctt 2521 tgcaaacgag gttgaacacc aagaaaagaa atatcagccc ggcgaagatc cgttggaata 2581 ttcaagcttc ttctggggca ccgaagagga cgaatatcac cctgcatatt ggaaagctca 2641 cgccgcgata tatgaagcat ttgagcgaga attcggagaa gatgcgcccg aaattttagg 2701 cgcagaagca atgaacggca gtgttaatat tttggcgccg tatttggatc ccctgattca 2761 aaaccatccc gatatgctta aaaccgttgc attccacctt tatggtacca acagaacaga 2821 agcaaccttt gccgctgtgg atgagcattt tgaagaatat ggcctttggc agacagaatg 2881 gtgctcggac gattattttg acaacgccga aactattatt gacgagctta atcacaacct 2941 caacgcatat ctctattgga acggcgtttg ggcacccgat ttgggtatgt gccttattga 3001 atttccttca aacagtgctg ataccgaagt tgcttttaac ggaagccact atatgatgat 3061 gcacttctcg aagttcatcg accgtggcta tcagcgggtt gagctgaccg aagagcttgg 3121 ctcgaagatg gttgcattta aggctcccga cgattccaga cttgtaattg ttgcattgaa 3181 taacacagat aatggcgaaa acttcacagt tgatttggac ggcagggaaa ttatcagctc 3241 gcagatctat cagtctaccg aagcagataa ccgattcaga aatgagtatt ggaccgattt 3301 gggcatatat acagagtcgc tcggtgtaga catccccgca ggaaccctta cgaccatcgt 3361 actggatttt gtggagcctg tgatgaaacc gacaaattca aatgcattac tttggatcgt 3421 tgc // LOCUS sequence117 3418 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence117 VERSION sequence117 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3418 /mol_type="genomic DNA" /organism="" /note="sequence117" CDS complement(202..672) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFHLKRFEKFTQGIASCYKYILKLKSHEMSSFGLKASHVMCLFFL GQNRDTGLKSGELVELCREDKAAISKALSALKKLGYVYTKDGAIIKYRKKYFISDSGME IYNKICDIVESTVEKCSVGLSEDEIAVFYSSLDKITSNLGDLCSNLEDVDEE" /locus_tag="LOCUS_4870" /note="MGA_621" CDS 1126..1353 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSRLKELRKEKGYTQIKMQHLTGIDQSDYSKLESGKRYFTFEQLK KLALALDTSMDYLSGLTDERKPYPRSDIKD" /locus_tag="LOCUS_4880" /note="WP_000737133.1 helix-turn-helix transcriptional regulator (Streptococcus) [pid:47.5%, q_cov:81.3%, s_cov:61.6%, Eval:1.8e-07, partial hit]" /note="MGA_622" CDS complement(1609..2298) /product="DUF975 family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000622462.1" /transl_table=11 /codon_start=1 /translation="MTRKELKLKAKASLSGNWGTAIGAGMLIFLVIFAAILVEALILAV LVALAGEGASSEVTYESSIASALLSGAVSVGWAWFYINIIRGNQVRVSDAFYGFKKFWR NFWANFLIGLFTFLWMLLFIIPGIIKSYSYAMTFYILADNPDMKAREAISKSREIMDGH KMELFVLSLSFLGWIILGVFTLGVLYFWLIPYMDATTAAFYESIKGESQPNVVEGEEEP AIAMLEE" /locus_tag="LOCUS_4890" /note="WP_000622462.1 DUF975 family protein (Bacillus) [pid:41.5%, q_cov:89.1%, s_cov:94.9%, Eval:2.4e-40]" /note="MGA_623" ORIGIN 1 gcaagcccat tgaaaagaga acaggacttt gccttgagac ccagttctat cccaactcgc 61 tcaagcacaa gaacttcgct cagccgataa tcgacaaggg cgaaatttac caccacgtta 121 caacatatag attcggcgtt gaaaagtaat caaacaaaac ataaaaccct atcggttctc 181 cgatagggtt tgtttttata attattcttc atcaacatcc tcaagattcg agcaaaggtc 241 gcccaaattt gaggttatct tgtccagaga ggaatagaaa actgcgattt catcttccga 301 taagccgaca gagcattttt cgacagtgct ctcaacaata tcgcaaattt tgttatagat 361 ctccattccc gagtcggaaa tgaaatactt cttgcgatat tttattatcg caccgtcctt 421 ggtgtaaaca taccccaact ttttgagcgc cgacagcgct tttgatatag ccgccttatc 481 ctcacggcaa agctcgacca actcgcccga tttcagacct gtgtcgcggt tttgtcccaa 541 aaagaaaagg cacataacat ggcttgcctt caagccaaag gagctcatct cgtgggattt 601 gagctttagt atgtatttat agcaggatgc gatgccttga gtgaactttt caaagcgctt 661 taagtggaac ataaacgcac tctccgaacg gttgatgtaa taccataatt ttacataaaa 721 tttgatgagt tgtcaacaat agacagagct attgatacgg ttttttgaaa ggatgttttg 781 caggacgact taccctttca gctttctaaa aatgaatata atcagcttga acggcaacgc 841 caaaacccag aataaaaatt caattatgta catatgccac atccaatgcg ggtatctatc 901 tctataaggt ttcaggacga cccttttgat ttttccgcat ccctcgcaca gggaatatcc 961 gtcatccatt gtcacatcaa acacggtata atcggttttg tgtagcttat tccagcactc 1021 caaacagaat tcagccatat catcaccccc cttcgcttat attttaggtc aatttcacca 1081 tattttcaat agggaaatct gccataatat ttttgggtga tgattatgtc aaggctgaaa 1141 gagcttcgca aagaaaaagg ctacactcaa attaaaatgc agcatctcac aggaattgac 1201 caaagcgatt attcaaagct tgaaagcgga aagagatatt tcacatttga acagctcaaa 1261 aagctggctc tggcgcttga tacaagtatg gattaccttt caggtctgac cgatgaacgc 1321 aagccttatc caagaagcga cattaaagat taactccttt ccgatttggg tcgaaaagga 1381 gttttctttt gctcaaaaac atttccctcg caagatgggc gttgcaaatc aatcgggcga 1441 ccacacaggg tcgcctttat aagcctaaac tataggggca ggtctgtgtg cctgcccgcc 1501 taccattatc gcgataatct ctccctacgt ctttttgctt gcaaaaagac acctccctcg 1561 tcagagggag gcataaaaaa tcccctctta cgaggggatt ttactgtatt attcttcaag 1621 cattgcaatt gcgggctctt cttcgccttc aacaacgttg ggctggcttt cgcccttgat 1681 cgattcatag aatgcggcgg tggtggcatc catataagga atgagccaga agtagaggac 1741 accgagagtg aacacaccaa ggataatcca tccaaggaag ctaagactca aaacaaagag 1801 ctccatcttg tggccgtcca tgatttcgcg gctcttggaa attgcttctc ttgccttcat 1861 atcggggtta tccgcaagaa tatagaatgt cattgcatag gaatatgact tgatgattcc 1921 ggggatgatg aacaaaagca tccagaggaa tgtgaacaag ccaataagga aattagccca 1981 gaagtttctc cagaatttct taaatccgta aaatgcatca gaaacacgaa cctggtttcc 2041 gcggatgatg ttgatataga accacgccca gcccacagac accgcaccgc tcaaaagagc 2101 tgaagctatc gacgattcat aggtcacttc gctgcttgcg ccttcgccgg ccaaggcgac 2161 taatacggcc aatattaagg cttcaaccaa aattgccgca aatatcacca aaaatatcag 2221 catacctgcg ccgattgctg tgccccagtt gcccgaaagg ctcgcctttg ctttaagctt 2281 tagttctttt cttgtcatta tgaaatcatc tcctttttgt gataaaaaac gacatattgt 2341 cataaaacat tctaatatat atggaacatc ttgtcaataa tcggctcata aatttgcctg 2401 ccgctgtcag cgatgttgta agtttgcacg aaatttcttc tcgcctattg tatatcctgc 2461 cgcgtgggta tataattatc tcaacgcact taaaagaggg ttaaaaatat gaattttcag 2521 gtaacatttg tcaccgtggc gataatgctt atgtatgctc tgcccggctg gatattggtt 2581 ggaaccaaga cgataaagcc agagtccatt tcggcgtttg caaaggtctt gctctttgcc 2641 tgtcagccct gccagacggt atattccttt atgtctgtcg atttttcgtg gcagcttttg 2701 ggcgacatcg ggctgttctt cgcgatcgtt ttggtgatgc agcttatcat tttgttcgca 2761 atatatgcaa tcatcggcaa aaaacgcacc gacaagctcc gcgttctcaa tcttgcctgc 2821 tgcttcggca atgtttcgtt tttgggcatt ccccttgtgg aagctgtttt gccccaatat 2881 ccccatgcgc ctgtattttg catcagcttc tcccttgcaa tgaacattct cggctggaca 2941 gcgggagcgt ttatcctcac gggtgataaa cagtatatct ccctcaaaaa aatcattctc 3001 aaacccggtt ttttatccgc cgctgttgca attcccctct tcattatgca gttgagattc 3061 cccgagcgtt tgcttgacgg catcaccctt ttcggccgaa tgaccacacc gatgggtatg 3121 ctgattttgg gaatgagact cgcaactgtg cccttaaaaa atgtattcgg cagcggaatt 3181 caatatgcag gcgttttgct caagcaggtc tgcctgccgt tggtcgcctt ggctttgaca 3241 tttattttgc cccttgaccc tgcatttgaa gcaacccttt atctgctctg ctgttgcccg 3301 atggccagct ttgttttgaa catctccgag atcttcggaa agggtcaaca aaccgccgca 3361 aacatggtcc ttttgggaac gcttttaagc attctcaccc tgccgataat gagtatgc // LOCUS sequence118 3402 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence118 VERSION sequence118 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3402 /mol_type="genomic DNA" /organism="" /note="sequence118" ORIGIN 1 cgttgtgctc atgtccgacg gcgcacccac ctatggcacc gcaagcttca caaatgttac 61 caccggcaac agaggcggca acggttcctc aagtgatgaa gacctcgcat ttgtaaacca 121 gcttacaggc gcatacacca agtatcgcat cgagcagaac tataacaagg atgccctcat 181 ttatactctc ggcgtaggca tttcctctga cagtattgca accagcgttt tgaaccccca 241 gaactctgtc agcgatgttt tggacctttg ggaaacatac gacaacttgt caagctacgg 301 ctcaatgtcc atcagcttcc cctggagcag tgagcagaca ctcagcaaga acgcaaacgt 361 cacaagcgct gaccgcgttt atgttgaccg ctactttgca gctaactcca catctgatat 421 ttccaacgca ttccagcaga tcgttgacca gatcatcatc cagtccaagt actatcccac 481 atatgtaacc agcggtgacc accacctcga cggcgacatc accttcgatg acgacatcgg 541 aagatatatg gaagtcaagg cgatcaaggg catcgttttg ggcgacaccc tcttctcggg 601 cgaggctctg gcacactcca tcgacatcgg acaccttgga acaccttcaa atcccacagt 661 tttgggcaac gagcttgtca gatcggttca ggaacgtatt aacgttgacc ttgcaaccgc 721 ccgcgagctg attgaccttg cttatgccac cggccagctg ttctatgaca gccccacagg 781 cgaatattcc aactacatcg gctggttttc cgatgcagac ggcaactatc tcggcttctg 841 gaacggcgat gataacgcga cagctcccgc aggcgctgtt ttcaagaaca cgtcttatgg 901 ctttatcggc gcatctggca caggtaccag cgcttcaaat atgatgtatg ttgctgttca 961 ggttcacacc agaatctcaa ccggaacatc ccaggtgatc ttccgaatcc ctgcagcttt 1021 aattcctctc atcacctacg aggtaagcct tgaaggaaca tcttatgaag atgcaaaaaa 1081 tattgaagtt accaagacaa tggcagatcc tctccgtctt gtatatgagg taggtcttaa 1141 gtcggaagtc aacgagctga ccgtcaagga cgttgttgca tccacttatg agcacgtcaa 1201 cagcgaaggc atctacagct tctataccaa ccgctgggat cacgaccagc acatccacaa 1261 ggatcaccac cccgaggagc acatcaatac cgttgcgttc tacactcctt ctgagcagaa 1321 cgagcgttac tactataccg aagacaccct catctactcc gcacagaaca ccgacagcgt 1381 atatacaggc gcgtctgctc cttccggcgg aacatattac agagcatact acgtattctc 1441 caacaccgcc gccaaggacg gcattaaagc aacattcgtt gagattcacg ccgacgcttt 1501 ggcacaggcc aagcagaata ccgacggaag ctggtatatt cccaagggcg ttattcttgc 1561 aaaccgcggc aacttctttg ttgataagac agcgaacccc accggtacat atcctttcgt 1621 taaggaacct gttgtaggcg gattcgacgg cgtgttctat gcaacctcct tcttgggcaa 1681 taacggcttg ctgacccttg atcccgcaca gggcatcaag atcaccaaga ctattgaaac 1741 cgttgaaccc aacaccaaca ccgagtttac cttcaccgtt aagaacttga ccgacacggg 1801 cgataacggc gaatatcgac ttattaagca ggctgccgac ggcactctct ccgcagagca 1861 gagcattttc ttcacaaacg gcaaggcaac ccttaccctt aacaacggcg aaagcgcata 1921 tatcgttgat ctggttgaag gccacacatt ctccgttgaa gaagctaagc acgatgatta 1981 cagagttaag tctgtaattg ttgacggcac agcaatcagc gatatctttg ctgaaatcac 2041 cgttgcaaag gacaccattg ctaaggcaca gttcatcaac acctacatcg gcaagggact 2101 ccttgtaatc accaaggatg ttatccacaa tttgggcgct gattacgaaa ttcccgcaga 2161 catcaagttc gacgtagctg tttctttggg aatcgacaac gcaggcgagg aatttgacac 2221 cgtaaccgaa actgcagacg gcaccgttac caacggcaag attttggcag atgcaaacgg 2281 cgcattcacc cttgtaattg aggacggaat gtcaattgcg agcgacggta ttgcagacgg 2341 taccgcattc accgttatag aggcagacta ctccgcaagt ggcttcatca ccaccgcaaa 2401 cggagtcgca ggaaattccg caaacggcac aatcgtggca gatgacaact cccacgttgt 2461 attcgtcaac acctatgacc ccgaagcagc agatgcaacc gttttgatcc acaacggcac 2521 caagaccatc tcgggcagag agtggcttga caccgacagc ttcgaatttg ttgttgaaag 2581 atttgacggc aacaactatg ttgaagttgc aagagttgca accacatatg cagatgcaac 2641 caacggcaca gcacccttca gctttaacaa ttacttcacc accgcggtat tcgacaccgt 2701 cggcactcat tccttccgca tcagcgaagt tttgggcacc atcggcggcg taacatacag 2761 caccgctttg tatgatgtaa ccgtcacagt taccgacacc gatatggatg gcaagctgga 2821 gatcgcagat gtaacttcag ctaccgcaac gatcaaccac agccgcaaca acggcacatg 2881 ggaaattgtc actccctttg aaaatactta ccgggcatcg ggcggcgcaa ctgttgagat 2941 cagcattgca aagactattg atgacctgac ccggcaggca cagaacctct cccttcaggg 3001 ttatcagttc ggcttatata acgcatacgg cacacttttg gaaaccctta ccaccgatgc 3061 aaacggtttg gcagtaattg caagaacata taccgccaca gatatcggca aggtattcaa 3121 ctataccatc cgcgagatcg acacaggcgt aacaggcatc aagtactcca acgcagttca 3181 cactgtttcc atcgagatcg ttgacaacct ggacggtacc atcggtgcaa ccgtgacagg 3241 cgcaaccaac gaatccactc aagaagcgac ctttgccgta agctatgaaa acgtttacga 3301 gcctgcaaag acctccatca ctcttagcgg ctccaagacc ctcacaggta tcagagatat 3361 ggttgcagga gagttcacct tctctgtaac cgagaacggc ac // LOCUS sequence119 3388 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence119 VERSION sequence119 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3388 /mol_type="genomic DNA" /organism="" /note="sequence119" CDS complement(1006..1770) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="METKDIILELRTKHGLSQEELAEKVFVTRQAVSRWENGETVPNTE ALKLLSKLFDVSINTLLGSPRKLICQCCGMPLEDSSISHEKDGIFNEDYCKWCYADGEY MYHDMDDLIEVCVANMASEAFPSEQARAYLKEMLPKLDYWKKYKNLDDGGKFEEFKRKL IDEINALGVEGMPKVEKLNALVGGYVNLEYRLPNGKTVKFLDDNATYLGNQLECEFGGD RCFGVVANMDFILICTYEANGENPELLIYKKR" /locus_tag="LOCUS_4900" /note="WP_003828945.1 zinc ribbon domain-containing protein (Bifidobacterium breve) [pid:35.5%, q_cov:59.4%, s_cov:96.3%, Eval:7.6e-22, partial hit]" /note="MGA_627" CDS 1929..3314 /product="MATE family efflux transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003437109.1" /transl_table=11 /codon_start=1 /translation="MSDNKEMLGTAPIGKLLFKLAVPTVVAQLINMLYNIVDRIYIGHM PGDGSLALTGVGVCMPIIMIISAFAALIASGGAPKASISMGKGDNDSAEKIMGGCFSLQ LVISAVLTVILLIWNKELLLTFGASENTIGYANDYMNIYAIGTVFVQLTLGMGAFITAQ GYTKISMITVLIGAVSNIILDPIFIFGFNMGVKGAALATILSQAGSCVWVLLFLCGKKT YLKLKKQNLRIDGKLVFPCIALGTATFIMQSSESVISVCFNSSLLKYGGDIAVGAMTIL TSVMQFAMLPMQGIAQGAQPILSYNFGAKNAERVKKTFKLLLISCLTYSFAIWGAIMLL PQMFAGIFTPDTALIEFTATALRIYCAVMCIFGIQIACQMTFVSVGNAPCSIIVAVVRK FVLLLPLIYIMPQLISDKTMGVYTAEPVADVIAVTFTAILFAVQFKKALKSLTIETSKE AAQ" /locus_tag="LOCUS_4910" /note="WP_003437109.1 MATE family efflux transporter (Clostridioides difficile) [pid:52.8%, q_cov:96.5%, s_cov:97.6%, Eval:2.0e-134]" /note="MGA_628" ORIGIN 1 ggccctgcaa gaggaataaa ggcaggcttc tttgtgataa aatcctccac ctccaccgca 61 tcgcctacgg cgtaaatatt gggaatattg gtctgcattt tgttgtttac aacaatgctt 121 ccacgttggt tgagttctat tccgcattcc ttggcaatag cggtttcggg acggacgccc 181 accgacataa tgatcatatc ggcggtaatt tcgccgtttt gcaatatgac ggtatttccg 241 tttatagcct ttacaccgtt attaaggtgc agataaattc ctttggattt gatataacgg 301 tgaacatctg ccgccatatc aaagtcgagg ggcgctatca gatggtcggc aagttcgacg 361 atggcgacct tcagccctgc ttcgactaaa ttttccgcca tctcaacacc gatatatccg 421 ccgccgatca ccacagccga gcgcggcttt gcggtatcga tatagttctt gatctttaag 481 gtatcgggaa tgttgcgaag ggtgaaaacg ttgccgccgt ccgccccctc gatattcggc 541 cgtatcggct cggcacccat agacaacatg aggttatcgt aggtttcttc ataggtttcg 601 cccgtgcgaa gatctttgac ggtgacggtt ttggtatcgg gtcttatctt aaccgcctca 661 ttgagcactc tgacgtcgat atgaaaacgc gccttgaagc tttggggcgt ctgcaaggtc 721 aagtccccac ggtcggtgat gacaccgccg atataatacg gcagaccgca gttggcaaag 781 gacacgtatt cgccgcgttc caaaataatg atctcggctt tttcatccag tctgcgaagt 841 cgcgccgccg ccgtggcacc gcctgcaaca ccgcctataa taatgatttt catccttttc 901 acctctatgc aatattttta tatgaacatt atatcatctt ttgcggcttt tctcaatcct 961 tttttctggt ttcggtccca tcaagtcacg acgccatccg tcacatcagc gtttcttgta 1021 aataagaagt tcgggatttt cgccgtttgc ttcataggtg cagataagaa tgaagtccat 1081 attggcgacg acgccgaagc atcggtcgcc gccgaattcg cattcaagct gattgccaag 1141 ataagtggcg ttatcgtcaa ggaatttgac ggtcttgccg tttgggaggc gatattccag 1201 attgacgtaa ccgcccacaa gcgcattgag tttttcaacc ttcggcattc cttctacacc 1261 aagggcattg atctcgtcga tcagcttacg cttaaactcc tcaaactttc cgccgtcgtc 1321 aagattttta tatttcttcc aatagtcgag tttggggagc atttccttca gatatgctcg 1381 agcctgctcc gaggggaagg cctcgcttgc catattcgcc acgcagacct cgatcagatc 1441 gtccatatcg tgatacatat actcgccgtc agcataacac cacttgcagt agtcttcgtt 1501 gaagattccg tctttctcat ggctgatgct gctatcttcc aggggcattc cacaacattg 1561 acatatcagt tttctcggag agccgagaag cgtattgatg gacacatcaa aaagttttga 1621 caggagcttg agtgcttcgg tgttgggtac cgtttcacca ttttcccaac ggctgaccgc 1681 ctgacgggtg acaaatactt tttcagcaag ctcctcctgg gagagcccat gttttgttct 1741 gagttccaat ataatatctt tcgtttccat attccttacc gcctttgatt actgcgatta 1801 cattataaca gattgccgtg cgcatcacaa gcaacgcgct gttgcacaaa agctatttga 1861 tgacttgaat tataaatgca agtgttatat aatatacatt gccatttttg attttacggg 1921 gcgtaattat gagcgataac aaggaaatgc tcggcacagc gccgatcggc aaattgctgt 1981 tcaaattggc agttccgacg gtggtggccc agcttatcaa tatgctatac aacatcgttg 2041 accgcatcta tatcggtcat atgccgggcg acggaagcct ggcgctgacg ggtgtcggcg 2101 tatgtatgcc gattattatg atcatctcgg catttgcggc gctgatcgcc tcgggcggtg 2161 cgcccaaggc atccatctcg atgggcaagg gagacaatga ttctgccgaa aaaattatgg 2221 gcggatgttt ttctctgcag cttgttattt ctgccgttct gaccgtcatt ttactgattt 2281 ggaataaaga gctgcttttg acgttcggtg caagtgaaaa caccatcggt tacgccaacg 2341 attatatgaa catctacgcc attggcaccg tctttgttca actaacgctt ggtatgggcg 2401 cgtttatcac cgcgcagggt tacaccaaaa tcagtatgat cacggtgctg attggcgctg 2461 tcagcaatat catccttgac ccgattttta ttttcggctt taatatgggg gttaagggcg 2521 cagcgcttgc caccattcta tcgcaagccg gctcttgtgt gtgggtgctt ctgttccttt 2581 gcggaaagaa gacctatcta aaactcaaga agcaaaatct ccgcattgac ggaaagctcg 2641 ttttcccttg tattgcactg ggaacggcaa cctttattat gcaaagcagt gaaagcgtca 2701 tttcggtttg ctttaattct tctctactta aatacggtgg agatattgcc gttggcgcta 2761 tgacgatcct tacaagcgtg atgcagtttg caatgctccc gatgcagggc attgcacagg 2821 gcgcacaacc gatactcagc tataatttcg gtgccaaaaa cgccgagcgt gtcaagaaaa 2881 cctttaagct gttgcttatt tcttgcctta cgtattcttt tgccatttgg ggagccatta 2941 tgctgttacc gcaaatgttc gcaggaatat tcacacccga tacagcactc attgaattca 3001 ccgcaacggc acttaggatc tactgtgcag taatgtgcat attcggtatt cagattgctt 3061 gccagatgac ctttgtttcc gttggcaacg caccgtgttc tatcattgtt gccgttgttc 3121 gcaagtttgt tttactctta ccgctgattt acattatgcc gcaactcata tcagacaaaa 3181 caatgggcgt ttacacggca gagcctgttg ccgacgtgat agccgtaacc tttaccgcta 3241 tccttttcgc cgtgcaattt aagaaggcac taaagtcttt aacgatagaa acttcaaagg 3301 aggcagcaca atgaaaattg cagtaactta ccaaaacgga gagatctttc agcacttcgg 3361 acataccgag cagtttaaga tctatacc // LOCUS sequence120 3361 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence120 VERSION sequence120 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3361 /mol_type="genomic DNA" /organism="" /note="sequence120" ORIGIN 1 aaatcaagcc gaaaataagg atgaatccga gtaccagtcc aaggtaaggc aatgagctga 61 cagcatcaac gaagaagtcc ttgaagtcct cgccgatgtc ataaagattg tcggaaaggt 121 tggatgaaat tctctgccaa acggtcttct tttcggtggt cttggtaatg cggacgacct 181 ctcttatgtc aatagtcaag gtcgaatagg agatcttgct cttatatgaa ttgagctttg 241 cggtgtatga ctccagctcg taggtcacat cagtaagata gttctgaatg gtgagaatct 301 cctcgatagt ttccgccttg tccatcagct tgaggtatgc ttcctgctgt gccttgaggg 361 cggcaatacg agcttctgtg tcaacataat ccgctgtaac gtcggcaatg tattcggtag 421 aatagctgat gttgcccata tttcccacat cggtgacaaa ctgctcaaat ctctctgcag 481 ggattctcac aacgtagttt gcgcttctgg tggaatatgt gtcatatgcc gagccatact 541 gcgaagagtt ctgaacatat ccgccgtatg cgccgactgc ctgttcaaat tccttgatga 601 atgcgtcaaa ctcggtggtc tcaagctcaa ccgtgcgata cttgattatc tttctctcgc 661 tttcggcata gctgtcggtg tcgggatttt tagaagctga gttggacatt ccgtaagaag 721 gggattccat atccgcttct tcctccatct caacggagtc ctcaacgatc cagccgtatt 781 cataatcgcc tgcggattcg gttgtgggca tcatagaatc atacatcgcg cccttgccgt 841 tataggatct tccgcaaccg gtaaacataa ccaaaacggt cataagtgct ataacaatgg 901 ataacgttct tttcatcatt ttatgtcaat cctttcaatc agccaaagcc ttggctgtct 961 ttcacttata atacaatttt tgggcattga ttattgcgtt gtcaagaaga aaatgcctca 1021 taaagaaaaa ttcggaaaaa tttccaaaaa tgcttgacat cagttgtcca ttgtgctaca 1081 ttgtaatatg tatcataatg gcgtagtgaa cgcctatttc cgaaaagtga taatttttgt 1141 gagaactttt tcaacaattt ctttatgaaa ttagcgatat tgcacaaaat catcttttcg 1201 tgaacgagag tgagggcgtt ttaaaacgcc aatacttaac gtcagttatg ttaaaacgca 1261 attttatata aggagtgata agccaatggt caatgtcaaa gacgtcaagc tcggtaagaa 1321 cagccgtaaa agcttcgcaa agatcaacga agttttggaa atgcccaacc ttatcgagat 1381 ccagaagaaa tcctataagt ggtttctcga ggaaggcttg agagaggtat ttaaagatgt 1441 agcatccatt aaggactaca acgaaaccct cgaactcagc tttattgact accgtctgga 1501 cgatcagccc aagtacacca tcgcagaatg taaggaaaga gacaccacat atgctgcacc 1561 cttgcgtgta actgcgcgac tcgtcaacct cgaaaccggc gaaatcaagg acagcgaagt 1621 attcatgggt gatttccccc tcatgactcc ttcgggaaca ttcgtcatca acggtgcgga 1681 gcgtgtaatc gtatcccagc tcgttcgttc tcccggcgta tattatgctg ttgagaagga 1741 caagaccggt aaggacctgt tcaagtccac cgttatcccc aacagaggtg catggctcga 1801 atacgaaatg gactctaacg atgtagtcta tgtccgtatc gacaagaaca gaaagatccc 1861 cctgaccaca tttatccgcg ctctcggcat cggcaccacc tatgagatcg acgagatgtt 1921 caacaacgac ctccgcctca aggcaaccag catgcagaag gatgcttgca ccaccaccga 1981 ggaaggtctt atcgaagtat ataaaaagct tcgtcccggc gaacctccga cggttgacag 2041 cgctgtaacc catttgaaca acctcttctt cgatgcaaga agatatgacc tttgcagatt 2101 cggcagatat aagtataaca agaagcttgc aatcgattcc cgacttgcag gccgcacccg 2161 ttcccgccct gtgatcaacc ccttgacagg tgagatcgtt gcagaagcag gggagaccct 2221 ttctttggca agagctaacg agatcgaggc tttgggtgta agcgaagcat acatcaccgt 2281 tgagagaaga gagaccctca catctcccac cggcgaagtt atccacaagg ttgaaaacgt 2341 tgaagttaag gttatcggca acggtatggt cgacatcaac gactttatcg actttgacgc 2401 taagccttac ggcatcaacg aaaaggtatc cttcaaggtg ctcaaggaaa ttcttgaatc 2461 tgccgctaac tccgacgaga tcgcagagca ggtcaaggca agagcagacg agctcattcc 2521 caagcacatc atcaaggaag atatcattgc aacaatctct tacttcctca acctctgcga 2581 gggtgtaggt accgttgacg atatcgacca cctcggaaac agacgtatcc gctgtgtcgg 2641 tgagcttttg cagaaccagt tcagaatcgg cttcagccgt atggaaagag ttatccgcga 2701 aagaatgaac attcagtcgc aggatatcga ggttgtaacc cccaccgcgc tcatcaatat 2761 cagacccatt accgctgcta tcaaggaatt cttcggttca tctcctttgt ctcagtttat 2821 ggaccaggtc aaccccttgg cagagcttac ccataagaga agactttccg cactcggtcc 2881 cggcggtctt tcccgtgacc gcgcaggctt cgaagttcgt gacgtacact attctcacta 2941 cggcagaatg tgtcctatcg aaactcctga aggacctaac atcggtttga tctcttatct 3001 tgcatccttt gcaagaatca acgaatacgg cttcattgaa gctccttacc gcagagttga 3061 caaggcaaca ggcgttgtaa ccgacgaagt tgtatatatg actgcggacg ttgaagataa 3121 ctataccgtc gcacaggcta acaccccctt gaccgaggac aacaagtttg ccaaggcaaa 3181 ggtaaacggc cgttaccgcg accagatcat ggagatcgac gctgaaaaca tcgacttcat 3241 ggacgtatct cctaagatgg tagtatctgt tgctaccgca atgattccct tccttgaaaa 3301 cgacgacgca aaccgtgccc tcatgggtgc gaacatgcag cgtcaggcag ttccgcttct 3361 c // LOCUS sequence121 3338 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence121 VERSION sequence121 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3338 /mol_type="genomic DNA" /organism="" /note="sequence121" CDS 441..1817 /product="altronate dehydratase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002286002.1" /transl_table=11 /codon_start=1 /translation="MRTLKIHPRDNVAVDLNTGHKVALCDIKCGENIIKYGFPIGHATA DISEGDSVHTHNLKTNLNELLDYEYIPNLTEIKAEEPRTIMAYVRPDGNIGIRNDIWII NTVGCVNKTAERLAHATGALTFSHPFGCSQLGGDHLTTQLILRGLVNHPNAGGVLVLGL GCENNNIPEFKKILGEVDENRVKFLIVQEVEDELTEGIRLINELKTYADTFTRQPVPIS KLKVGLKCGGSDGLSGITANPLVGQFSDKLIAQGGSSVLTEVPEMFGAETILMNRCLTR ELFDKTVDLINDFKRYFIRHGQEIYENPSPGNKAGGISTLEEKSLGCTQKGGTSCVVDV LGYGDTVTKSGLNLLNGPGNDIVAVTNLTAAGCHLILFTTGRGTPLGAPVPTVKISTNT KLYENKPHWIDFNAGEMINGRDLCNGLFDYVIGVCNGELTNNEKHGYREISIFKDGVTL " /locus_tag="LOCUS_4920" /note="WP_002286002.1 altronate dehydratase family protein (Enterococcus) [pid:58.3%, q_cov:96.9%, s_cov:91.8%, Eval:4.8e-152]" /note="MGA_633" CDS 1814..2701 /product="amidohydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008767091.1" /transl_table=11 /codon_start=1 /translation="MIIDAHLHLWDKQNGIVNGKPVYDIGGGRSDFGGEIRQMMPPYLY DGKNSVEALISNMNFACVSGCVVTQEYIDGNQDKYLLEAKSKYGDRIKICALYEENGVF DEEYFLSNPFDGLKICAGRLADQVLTKLLPIFKMVERSGRFISIDLSDGEAQVPAMKEL IKACPNLRIAIGHFGMVTRDGWLEQIRLACNPNVYIESGGITWLFNDEFYPYPSAVDAI KEAASICGIEKLMWGSDYPRTMTIITYLMSLDFVIKSDKMTDEEKSLFLGENARKFYGF SDLPIPEKIHHMAE" /locus_tag="LOCUS_4930" /note="WP_008767091.1 amidohydrolase family protein (Bacteroides thetaiotaomicron) [pid:52.1%, q_cov:99.7%, s_cov:98.7%, Eval:8.1e-85]" /note="MGA_634" ORIGIN 1 gaaacagtaa gtgctttttt aaatcaatgc atttttaacg agattattcc taccctcggc 61 tcgaccgatg aggatattgc cttcggtaag gctgttttgg aaagattttc caatcccttc 121 atcaagcata agcttttggc gattgctctt aactctgtca gcaagtttaa tgtaagagtt 181 ctgccttcgc ttttggctta ccgtgaaatg aacggcgtta accccaaggc attaaccttc 241 tcacttgcgg cacttatcgc attctataag acaaacgaat ccaacgatct ccctgaggtt 301 atggaatata tgaggaatgc aagcgttgat gaaattctcg ctaaggttga atattgggat 361 accgacctta gcttcctcgc cgatgatgta aatgagtatt acaataccat tcagactaag 421 ggaatgaaag aggcatttaa atgcgtactt taaaaattca tccccgcgac aatgttgcgg 481 ttgatcttaa taccggtcac aaggttgctc tttgcgatat caaatgcggt gagaacataa 541 ttaaatacgg tttcccgata ggtcacgcaa ccgctgatat ttccgaaggg gatagcgtac 601 atactcataa tttaaaaacc aacctcaacg agctcttgga ttatgaatat attcctaatc 661 tgacggaaat caaagcggaa gaacctcgta ccataatggc atacgtccgc cctgatggca 721 atatcggcat tcgcaatgat atatggataa tcaatacggt tggctgtgtc aacaaaacgg 781 cagaacgctt ggctcatgct acaggtgctc tcacattctc gcatcctttc ggttgctctc 841 agcttggcgg agatcacctt acgactcaac tgatcctccg aggacttgtc aatcatccga 901 acgcaggcgg tgtcctcgtt ttgggcttag gatgcgaaaa taacaacatt cctgaattca 961 agaagattct cggcgaggtt gatgaaaatc gcgtcaagtt tctcattgtt caagaggttg 1021 aggatgaact gactgaaggt attcgcctca ttaacgagct taaaacatat gccgatactt 1081 tcacccgtca accggtcccg atttcaaaac tcaaggtcgg acttaaatgc ggcggttctg 1141 acggactttc cggcattacc gctaaccccc ttgtcggtca gttttccgat aagcttatcg 1201 ctcaaggcgg ttcaagcgta ctcacagaag tccccgaaat gttcggagca gaaactattt 1261 taatgaatcg ttgcttaact cgagagctgt ttgacaagac tgttgacctc atcaacgact 1321 ttaaacgata tttcattcgc cacggtcagg agatatatga aaatccctct cccggtaaca 1381 aagcgggcgg aatttcaact cttgaggaaa agtcccttgg atgcactcaa aagggcggaa 1441 cttcctgcgt tgtcgatgtt ttgggatatg gcgacactgt cacaaaatcg ggtcttaacc 1501 ttttgaacgg ccccggtaac gacattgttg ctgtaacaaa ccttaccgcc gcaggatgtc 1561 atctgatttt gttcacaaca ggcagaggaa cacctctcgg agctcctgtt ccaaccgtaa 1621 agatttctac aaatacaaag ctttatgaaa acaaacctca ttggatagac ttcaatgcag 1681 gcgaaatgat taatggacgt gatctctgca acggcttgtt tgattatgta atcggcgttt 1741 gcaatggtga attaaccaat aacgaaaaac acggctaccg ggaaatttca atattcaagg 1801 acggtgtaac attatgatta tagatgctca ccttcacctg tgggataagc aaaacggcat 1861 tgtcaacggc aagccggtat atgatatcgg cggcggaaga agcgatttcg gtggtgagat 1921 ccgtcagatg atgcccccat atctttatga cggcaaaaac tcagttgaag ccttaatttc 1981 aaatatgaac tttgcttgcg tttcgggctg tgtcgtaacg caagagtata tcgacggcaa 2041 tcaggataag tatttgctcg aggcaaagag taaatacggc gacagaatta aaatctgcgc 2101 tttatatgaa gaaaacggcg tttttgatga ggagtatttc ctctcaaatc cctttgacgg 2161 tttgaaaatc tgcgcaggac gtcttgccga tcaggtttta accaagcttc tgccaatttt 2221 caagatggtt gagcgctcgg gtagattcat atctatcgac ctttcagacg gagaagcaca 2281 agtccccgca atgaaggaac tgatcaaggc ttgtcccaat ttgcgtatcg caatcgggca 2341 tttcggaatg gtcactcgcg atggctggct tgagcagatt cgtttggcct gcaacccaaa 2401 tgtatatatc gaaagcggag gaattacctg gctcttcaat gatgagtttt acccttatcc 2461 ctctgcagtt gatgccatca aagaagcggc ttcgatctgc ggtattgaaa agctaatgtg 2521 gggtagcgac tatcccagaa caatgacgat aatcacatat ctgatgagtc ttgattttgt 2581 gataaaatcc gataaaatga ctgatgaaga aaagtcactt ttcttgggcg aaaatgcaag 2641 gaagttttat ggcttttcgg atttgccgat tcccgaaaaa attcaccata tggctgaata 2701 attgtacata aggcgtagac aaaatgtctg cgcctttgtt gactaatata catcccattg 2761 ttataatgaa ttcatcaacc gaaaggagca ggattatgta cattgcaaac agtcaaagat 2821 attcaaagat gatatacaac cgttgcggca actcggggct caagcttcct gcagtatccc 2881 tcggtttctg gaaaaacttc ggaaacggtg acggaaactt tgccaatatg gaaaagatgg 2941 ttcacacagc ttttgacctc ggcatcactc attttgacct tgccaacaac tatggtaatc 3001 cccataacgg aagcgctgaa gaaaactttg gtaaaatttt aaagggtatg agcacatacc 3061 gcgatgagat gatcatctcc accaaggctg gctacgaaat gtggcccggt ccttacggcg 3121 acagaaacgg ttcaagaaag tatctaacgg cttcactcga ccaaagcttg aagcgtatgg 3181 gacttgatta tgttgatatt ttctatcatc acgtatatga tcccaatact ccgcttgaag 3241 aaactgcact tgctttggat aacgctgtac gtcaaggtaa agccctttac gtcggtatct 3301 ctaactacgg catgtatcac acaggcgaga tgattaaa // LOCUS sequence122 3336 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence122 VERSION sequence122 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3336 /mol_type="genomic DNA" /organism="" /note="sequence122" ORIGIN 1 ccaaatcagc caaaaggagg aaaacaacga tgcctaactg gacaaatgaa cagcttcgcg 61 ccataaactc ctttggcaac ccgacaattg tttctgccgc cgcaggaagc ggcaagaccg 121 cagttcttgt cgagcgcacc atccgacttc tttccgaccc tgaaaagaac atccccgccg 181 acagcgtttt ggctgtaaca ttcacaaacg actccgcatc tcaaatgcgc gagaagcttt 241 caaacgcctt tgaatcgctg gcaatatccg acccgtcaaa cgcttgggta cagcaccagc 301 aggcgctttt gcacctggcg caaatcacaa ccataaattc cttctgcttc ggacttgtaa 361 aagacaatct cgctctgacc gatttccaga cgggcctgcg aatccttgaa caaaacgaag 421 cggatatgct taccgaccgc gcacttactg atgttttaga gtgcagatat gcacacgacg 481 gcaagggcat ggaaaagctc atctcgcttt tctgcaaaga aaacgactat gagcttcgct 541 ctgtaatcaa aaagctctat gcctttttgc gtactttgcc ttatcaggag ctttggatca 601 gcgatgtcat taaatccctt cgcgacggat caaagctcgc ccaaataatg accgaattcc 661 gcgcatctgc aaaaagtgcc gccgcaaccg tcaaaagtct ttcctcaaag cttgccgacc 721 tctgtcagag ccttgaatac cactctgccg acaaagccgc atttattaag aattgcgacc 781 tcgctgacag cctttgcgat gctgttgaaa acagcgaatg ggatggtctg gttggcacct 841 ttgcaaaaat tccctgggca cgccgtacag gcaaaaccac agccgccgaa aaggctgctt 901 gctcatatgc cgaagaagca tactatcgct ctgcggtctt ggctttagat gaactcaaat 961 cctccgccga gcagataggg gactatttca aatatcctgt cagcgtgatg caaagcgatt 1021 ctttgctctg cgccgatatt ttcgaaaacc tttgtgaaat ctgccgcgag cttgaagatg 1081 ctgtacacaa agtcaaggtt gaaaagaacg ccgtcgactt tgccgacacc gagcttatga 1141 ccgtgcgcct tttgaccaac atcgaccaaa acggaaaaat cacccgcaca cccctctgcg 1201 aggagatcgt ttcctcaaag cgctataagc tgataatcat cgacgagttc caggatgtta 1261 acaatcttca ggatgtcatc ttcaaagcca tttccgatac agacgactta aatcttatcg 1321 gtaataatgt ctttgttgta ggcgatgcaa agcaggcgat ctatcgcttc cgtcgtgcca 1381 acccgatgat ttttgtcaat acccgccttg ccgctgcgga tgataataat cccgtcagtg 1441 aagtgattct ttcaagaaac ttccgctcaa gaaacgcggt gcttggcttt gcaaactata 1501 ttttttcatc gctcatgtct cgcgaggtgg gcgagatcga ctataccttt gaagaggagc 1561 ttcgtctcgg cgcgaattat gagggcaagg atcccgccgc cgagctgatt ttggtcaact 1621 ccgatgctgt ttccgacgat gacgaaggca tcgtccccga tgaattctct gccgttgcat 1681 ccaaaatcaa agaaatgctt gatgatggcg tattggttcg cgacggcgac acttatcgcc 1741 cctgcatacc atccgacttc tgtgtcctga cccgcaacaa catcaccgat gaatcgctcg 1801 tttcaagctt cgagcgtctg ggcttaaagg tgctttcaaa cgaccgttcc ggatatcttg 1861 cttcccgcga aatatctgtg cttctcaatc ttctttcctg tatcgcttcg cctatgcgtg 1921 atgtgccgat ggcaagcgta atgctatcgc ccataatggg atttaccgac gacgaacttg 1981 cacttgttaa aatggcgggc aaaaagcaca gattatataa aaatatgctc cgtataattg 2041 cgggcgaacg cgaagctggc gacattttaa aagctaagtg tgaaagtgcc gttacacttc 2101 tgaaaaagct ccgcatatat gccactgaaa tgcccttgac gaggttaatt caaaaggcat 2161 atgacttaac ggacatcttc tcgatcgcct cggcatatga agacggctct caaaagcgtg 2221 ccaacctgca cctgcttttg gaatatgccg cgagctatga agaagcatca agcgacggaa 2281 ttgcaggctt cctgcgctat atcgactata tctccaaatc gggcggcgat tttgaatcgg 2341 catatgccgt aacggaatcg gctgacgccg tatccgtcaa gacgatacat aaatccaagg 2401 gccttgaata tccccttgtt ttcatctgcc agaccaaaaa gagattcaac cgccgcgatc 2461 ttcaatgtgc gttgaactta aatgccgatg caggtgtggg aatcaacttc ctggataaat 2521 cgcagcttgt caagcataaa accgtttttg ccgaccatat ccgcctcaaa aacgaatcgg 2581 agatgctttc cgaggaatta agacttctat atgtcgcgct gacccgtgca aaggagcgag 2641 tctttgtcgt tctcaacaga agcgaaaaat ccctcgagcg tgccgcaaag tttgcatatt 2701 ccatcgacac ttataaagtg ccttccgaca tcgcccaaaa ggctgacagc tttgaagatt 2761 ggctctatat ggcgcttttg cgccaccctg cacttgagca tataagaaaa gaccttcttc 2821 ccgaggactt ggcatattgc gacggcgatt tcatctcttt ccccgatgtt gtggcgtccc 2881 atgcccgtct aatgtccgat gccgtcggcg agaaatcggc tttatccgaa tctgctcctg 2941 ccgacaggga aatggttatg agccttatgc gcagcttctc tcttgaatat gaccgcagac 3001 tcattgaaaa cgaagcaaag gtcaccgttt ccgaacttgt caaggatgat gccctcgact 3061 tcttcgtcac ccttcccgag ttgggcgaat cgctgggcga gctgaccccg gcacaaaagg 3121 gaaccgtcac ccaccgcttt atgcagttct gcaattttaa taacgcctca cgcgaccttg 3181 aaacggagat ctcccgactt gaatcgggcg gactgtttac aaagcgtgaa gctgatgcaa 3241 ttgaccgcag agcggtaggg gagttcttta aaggcgaaat atattcccgt atgcttcaaa 3301 gccgtgaggt tatgcgcgag cgcagtttca tcgtcc // LOCUS sequence123 3312 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence123 VERSION sequence123 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3312 /mol_type="genomic DNA" /organism="" /note="sequence123" CDS 1599..2705 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRFISLLLVALMLMSLSGCSGNKVICAYEEETPSLYEQFEQWFG VGAAINSWNLDGSSEQYKTITKHFNVFVYENESKPDATHPSEDRYNFANVDKFVEFGEQ TGATLRGHTLLWHSQCPDWFFFDSNGNYVAPEVLIERIDDHVTTIVSRYAGKIDTWDVV NEVISDGAGLRDSHWYNVVGDYDGDGDKYDYIEQAFRSARAADPDARLIINDYNMEWSE SKTISMYLAVKQMLSEGVPIDGVGLQMHIGPDLDVAKLRSNIEILLKLRDINPDFVIEV TEMDMNMTGSTKEDFEKQAAKYAELFQLFIDLAEEGVLDTVVFWGFYDGASWLNKSDAD NYPMLFDREFMTKPAFWSVLEVAENNKK" /locus_tag="LOCUS_4940" /note="WP_012584062.1 endo-1,4-beta-xylanase (Dictyoglomus turgidum) [pid:38.4%, q_cov:89.9%, s_cov:31.4%, Eval:9.1e-63, partial hit]" /note="MGA_639" ORIGIN 1 cgttgaactc ggcaaccttg tcttcaattg tgggccaata gctcttataa tccgatttat 61 ccaaaattac atcaatgtta tatgccagat tatcttccaa agcataagcc atgggaatgg 121 ttgcatatct tccgcttgat ttatagaagc tgtggttatc tcttaagttt ccgtcaccct 181 cagctctgta aagtccctcg gtcaatgtgt cgggaatgga atacatggca tcaatattgc 241 ccgagtcaat atcattgatg atgattacct ttgtgcgttc aacaacctct tcctttgtgg 301 gaatgtcaat agtgccgtca attaccttgt aaatgaggtc ctgtgcaaca ttcttaaata 361 cagtcaacga ttcccactgt ctggctgtcc aaccgtcctc gtctgtggtt gcgccgatct 421 ccttgaagtc gtcttcaaat accagctcgg ggccgtcaat aacggtcgca ccgttcaaaa 481 gcattctttc aaattcaaca gccaagccgg tagacattgt gtagtcgctg ctggatccgc 541 tgccgggtgt ccagcctgtt tcatcatatc ttacgcccca ctgtccgcag tagccggaaa 601 gatatgctcc caaaacaaca ctttccatat ctgcaagata gcttgtctgg gtatatttct 661 cacaaagaat gtagttttct gcataaagac ggctagcttc ttcccattcg ggaacctgct 721 tgagcattgc aagagggtta attgaagggc tccactggtt tccacaccag cttacaaaca 781 aatatccgcc gtattcatgt gtgatctcca aaaggtttgc aaaatgcaaa tatctgtcat 841 gacaggaagg ggaaatgcct tccatatcgt atccccagaa ctgctcggaa tagttaaatc 901 cgaggaagtt ggggtaatct tcaaagaatt ctctgtaaag tgtgttatca tactcggaca 961 tttccttata gtcggggaaa tggcagggtc cgccgctggc gggctgaacg gttgcccaaa 1021 caccgttctc ggcacaggtt ctcagccacg atttacaggt ttcatacgca tattcaacaa 1081 caccaaagcc ctcttccgaa tcatgtccgc ttacggacat ggaaaggttg aatatgacat 1141 aaggacggat ttcctcggga atcaattcaa ttatcctttg agggtccgga gatgtccatg 1201 tgtcaatatg tacgatccaa gcaggagctt cattattaat cactcttcgc aactcgacct 1261 tctctgcggc gtttgcttta actgaaaatg gttcaaagct aaacgcaccg accaaaatca 1321 agcatacagc aataagtgca aacagtcttt taaaattcat attaaaacct tcctttcacc 1381 ggcacttcta aaatgcttat tttaattata caacgcgttc atttaaaaat atatagcaaa 1441 aaaatacttt ttgagttcaa gagcagaaaa gtttgcaaaa tctgcactat cgccaaatga 1501 cgaccttcaa atattgcata attgacgatt gaaaaatcag cattcgctat gataaaatta 1561 ttatacttgg aactatatcg ttttgaagga gaaatgttat gaaaagattt atttcattac 1621 ttttggttgc cctgatgtta atgtcccttt cgggctgctc gggaaataaa gtaatctgtg 1681 cttatgagga agaaaccccc tcgctttatg agcagtttga gcagtggttc ggtgtcggtg 1741 ccgcaatcaa ctcttggaac ctggacggct caagcgagca gtataagaca atcaccaagc 1801 acttcaacgt tttcgtatat gaaaacgaat cgaagccgga tgccacccat cccagcgagg 1861 acagatacaa cttcgcaaat gtggataagt ttgttgaatt cggtgaacag accggtgcaa 1921 ccttgcgagg acatactttg ctttggcata gccagtgtcc cgattggttc ttctttgact 1981 caaacggaaa ctatgtcgcc cccgaagttt tgattgagag aattgacgat cacgtcacca 2041 caattgtttc ccgttatgca ggaaaaattg acacttggga tgttgtaaac gaagttatca 2101 gcgacggcgc aggccttcgc gattcccatt ggtataatgt tgtcggcgac tatgacggcg 2161 atggcgataa gtatgactac atcgagcagg cgttccgctc tgcccgtgct gctgaccccg 2221 atgcccgcct catcatcaac gattacaata tggagtggag cgagtcaaag actatttcaa 2281 tgtacctcgc agttaagcag atgctttccg aaggcgtccc gatcgacggc gtcggtctgc 2341 agatgcatat cggcccggat cttgacgttg caaagcttcg ttcaaatatc gaaattcttc 2401 tcaagctccg tgatatcaat cctgatttcg taattgaagt taccgaaatg gatatgaata 2461 tgaccggcag tacaaaggaa gactttgaaa aacaggcagc caaatatgcc gagctgttcc 2521 agttgttcat cgacctcgca gaagagggag tgcttgatac agttgttttc tggggattct 2581 atgacggtgc ttcttggctc aacaagagcg atgctgacaa ttatcccatg ctctttgaca 2641 gagaatttat gaccaagccc gccttctggt cggtgcttga agttgccgaa aacaacaaga 2701 aataatgtac aaaatcatcg gtcgcccaac ggcggccgat ttttttcgct ccgctcgcca 2761 ccatcggcgc tgccgcgctt ttcgatgacg gctcgctccg ctcctgtcgg gcgccaccta 2821 ttgtaagcct ctcctgttgg gagaggtgtc agcgtatgct gacggagagg gcaaaacggg 2881 cgaccacgca gggtcgcccc tataatagag aaaatttctc tctgttctgc cgcaccgatt 2941 ccataccgcc tgacggcgga tgccatgcac gcctgcggcg tgatttgcgc gcgggtcccc 3001 gccaccgtga accttcggtg cccgatggcc tccgccccgc gtgctctcca ttctccccaa 3061 aaccgtgccc aaaatcccgc tgaaattcta cgtgaaatct tgatgaaaat ttaacaaact 3121 acttgactat ttgacacaaa agaaataaaa tagtatttga ggaagattgg ggtttcgatg 3181 aatattgaaa cgcaaaaaac cattctttcc gaatgatcgt cttataaaaa ttagaataaa 3241 tagtaaggag attaacatgg caacattaac caagaaccct aatgtcaaca agtgggttga 3301 cgaaatgatc gc // LOCUS sequence124 3310 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence124 VERSION sequence124 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3310 /mol_type="genomic DNA" /organism="" /note="sequence124" CDS 369..1502 /product="cysteine desulfurase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009895806.1" /transl_table=11 /codon_start=1 /translation="MIYLDNAATSKVCAEAVSASSFAMTEVFGNPSSLHKLGIEAEKLI TFSKEQIASALGCAGDEIVFTSGATESNNMAILGLCENYGKRKKRIVTTAIEHPSAYEP FEKLKKMGYEVCVINPDEDGNITEDMLIDAVDDNTCLISAMLVNNENGYILPIAKAFKE IKAMYPECMTHCDCVQGFEKIKIKAKLLYCDTMSISGHKIYAPKGIGALYIKKGVRVAP LLIGGGQQKNLRSGTESVPMIYSFGKTVEALTPTIDERYEYVKGLNEYARKLISGIDTA VINSPENASPYILNISLVGLKSEIVLHFLEQSEIYVSSGSACSRGKKSSVLSAFGLNDK RVDSAIRISFSKDSTRDEIDRLCEELERAVKTLARAR" /locus_tag="LOCUS_4950" /note="WP_009895806.1 cysteine desulfurase family protein (Clostridioides difficile) [pid:42.0%, q_cov:97.9%, s_cov:96.9%, Eval:1.1e-76]" /note="MGA_640" CDS 1636..2823 /product="tRNA 4-thiouridine(8) synthase ThiI" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860948.1" /transl_table=11 /codon_start=1 /translation="MKELILCKYGEIVLKGLNRSSFESEMLKNIRRRLKPMGNFKFVSA QSTLYIEALDEDIDIDEVLEKLSKVFGIVKLCKAVEVEKDMDVIFETAKSYLGRALKKA STFKVESKRSDKRFPLKSPEIAAELGGRILEAFPHLKVDVHNPEVTVICEIRDNGAYIH GMPIEGAGGIPVGTGGRALLLLSGGIDSPVAGYMIAKRGVQISAIHFEAPPYTSERALM KVERLAQKMTDYCGKISFYCVPFTKIQEVIKDNCPEELFTIIMRRLMMEIAQRIAESHD YAALVTGESIGQVASQTMSAMVCTDAVCRIPVFRPCIGLDKKEIIDISYKIGTFDISIE PYEDCCTVFTPKHPKTRPVLADVEAAQAAYDFEPLIREAYEGITVKTFKIGGQVE" /locus_tag="LOCUS_4960" /gene="thiI" /EC_number="2.8.1.4" /note="WP_011860948.1 tRNA 4-thiouridine(8) synthase ThiI (Clostridioides difficile) [pid:46.5%, q_cov:97.0%, s_cov:98.0%, Eval:1.2e-95]" /note="MGA_641" ORIGIN 1 caaaacggta tgtggatata tatgcctaca gacacacgct cacctccttc aggttgatgg 61 ggatattgta tcataaaaca ggttgaagcg caagcgggag cggcagcccg cgcgagatgc 121 gagcgcaaag cgctcgcatc tcgcgaaccg cggctaagcc gcgggaaaaa cgccccgtaa 181 ggtagggcgt tttggctgcc gcgttgtttg gctgtgtgca aaagtttcag gtgacagggc 241 ggtaaaaaaa tgtcgataaa ctgcatattt cagttgcaat tatgcaatat ttctgctata 301 ctgattgtat ataattatag tacaatgcgg tactatgtgc tcatctgatt ttaagaggtg 361 aaacattaat gatatatctt gacaacgccg caacttcaaa ggtgtgcgcc gaagcggttt 421 cggcttcttc atttgcgatg acggaagtgt ttggaaatcc gtcgagtttg cataaacttg 481 gaattgaagc agagaagctg attactttct caaaagaaca gattgcaagt gcgcttggtt 541 gtgcaggtga cgaaattgtt tttacatccg gtgcaactga gtcgaacaat atggcaattt 601 tggggctgtg cgaaaactat ggcaagcgta agaagcgaat tgttacaacg gcgattgaac 661 atccttcggc atatgaacct tttgaaaagc tcaagaagat gggatatgaa gtttgtgtca 721 taaatcccga tgaagatgga aacatcaccg aggatatgct tattgatgcg gtggatgata 781 acacctgtct tatcagcgcg atgcttgtca ataatgaaaa cggatatatc ctgccgattg 841 cgaaagcctt caaggaaatt aaagcgatgt atcccgaatg catgacccat tgtgattgcg 901 ttcaggggtt tgaaaagatt aagattaagg caaaattgct ttattgcgac acgatgtcaa 961 tcagcgggca caagatttat gcgcccaagg gtatcggtgc gttatacatc aaaaaaggtg 1021 taagggttgc tcccctgctt atcggtggcg gacagcagaa aaatcttcgc tcgggaacag 1081 aatctgttcc gatgatatat tcgttcggta agaccgttga agctttgaca cctaccattg 1141 acgagcgata tgaatatgtc aagggactca atgaatatgc aagaaagctg atttcgggta 1201 ttgataccgc agttatcaat tcacctgaaa acgcaagccc atatattttg aacatttcgt 1261 tggttggatt aaaaagcgaa atagtgcttc attttttgga gcaatcggag atctatgttt 1321 caagcggttc ggcttgttcg agaggtaaga aatcaagtgt tttgtcggca tttggtttga 1381 acgacaaacg agttgactcg gcaatacgca taagcttttc aaaggattcg accagagacg 1441 agatcgacag gttatgtgag gagcttgagc gcgcggttaa gacgcttgcg agggcgagat 1501 aagacgttgc aggcggggcg gaggccgtcg tgccggattt aaagttgagc ctgtctaaac 1561 tttaaatgag gcgtgacgga ggggaccagc tattcgggca caacaagaat caagtaacaa 1621 gaaggaatta tcaatatgaa agaactcatt ctttgcaaat acggcgaaat tgtactgaaa 1681 ggacttaaca gatcgagctt tgaatcggaa atgctcaaaa acattcgcag acgtttaaag 1741 cccatgggca atttcaagtt tgtttctgca caatcgactc tttacatcga agcgctggat 1801 gaagatattg acatcgacga ggttttggaa aagctttcaa aggtattcgg aattgtgaag 1861 ctttgcaaag ctgttgaagt tgaaaaggat atggatgtta tctttgaaac tgcgaagtca 1921 taccttggca gagctttgaa aaaggcttca acattcaagg ttgagtctaa gcgttcagac 1981 aagcgttttc ctttgaagtc tcctgagatt gccgctgaat tgggtggaag aattttggaa 2041 gcattccctc atctcaaggt tgatgttcac aatcccgagg taaccgttat ttgtgagatt 2101 cgtgacaatg gcgcatatat tcacggaatg cccattgaag gcgcaggcgg aattcctgtc 2161 ggcacaggcg gaagagcgct gttgcttctt tcgggcggta tcgactcccc tgttgcgggt 2221 tatatgattg caaagcgcgg tgttcaaatt tcagctattc actttgaggc tccgccttac 2281 acttctgagc gcgcactgat gaaggttgaa cgcttggcgc agaagatgac cgactattgc 2341 ggaaagataa gcttctattg tgtgccgttc acaaaaattc aggaagttat taaggacaac 2401 tgccccgagg agcttttcac cattatcatg cgcagactta tgatggagat tgcccagaga 2461 attgcagaaa gccacgatta cgccgcactc gttacaggcg aaagcatcgg acaggttgca 2521 tcgcagacga tgtcagcaat ggtatgcacc gatgcggttt gccgaattcc tgttttccgc 2581 ccctgtatag gattggataa aaaggaaata attgatatat catacaaaat cggaacattt 2641 gacatttcaa ttgagcctta tgaggattgc tgtactgtat ttacccccaa gcatcccaaa 2701 acaagacctg ttttggcaga tgttgaagcg gcgcaggcgg cttatgattt tgagcctttg 2761 attcgcgagg cttatgaggg cattaccgtt aaaacattta agatcggcgg acaggtcgag 2821 taagttttgg ttagtaggat ctgcctgcgc agcagcgagc cgtagcagac acggcgatgc 2881 gacggagtgg catcggcagt ggcgtgctgt ggcgagcggt atgatgcgaa gtcatttttg 2941 gccagacatc gttttcagga gaaacatatg agcataattg attgtaaaaa ttttgaatat 3001 agttccgagt ctctgacaac ttattgcaat gagcttgccg aaaaggttgt cagctcattg 3061 aaggcaaatg gcaaaagcgt tgcttgcgcg gaaagttgca caggcggtat gcttgcacag 3121 tttattacag cagtttcagg tgcttcagag gtttttcagt ttggtgcggt gacttattcc 3181 gaaagaatga aatcgcaggt tttgggaatt cccccgcagc tgatcgagga atgcggagtt 3241 gtgagtccgc aggtagctct ttcaatggca tatggctcga agctttatac tggcgctgat 3301 atcggtgtgg // LOCUS sequence125 3305 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence125 VERSION sequence125 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3305 /mol_type="genomic DNA" /organism="" /note="sequence125" CDS 103..1005 /product="thymidylate synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003244896.1" /transl_table=11 /codon_start=1 /translation="MSVWDKKYCELCKTILEKGTEVENRTGINTVKIPSWHFHLDLSEE YPILTTKQVFIRQAILEMLWIYQAQSNDVRWLQERNVHIWDEWEIDENGFWHAKQMLPD ENGKPVLREIHKEFGKKWAHTIGTAYGYIVKKFGLTQELINKLKNNPGDRRMLMSLWQN DYLPTAVLPSCVWSSEWDVTDGKLNAWVHQRSCDVPLGLPFNVTQYATLLYMLAQVTGL KPGTLDWSIKDAHIYVNQIDGIKEQLSRFETFGDLSAPKLWLNPEVKDFFDFDSSAECK DVKLIDYKHMGKIVFPIAQ" /locus_tag="LOCUS_4970" /EC_number="2.1.1.45" /note="WP_003244896.1 thymidylate synthase (Bacillus) [pid:38.2%, q_cov:99.7%, s_cov:99.6%, Eval:1.4e-47]" /note="MGA_643" CDS 1023..1502 /product="dihydrofolate reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000637198.1" /transl_table=11 /codon_start=1 /translation="MVKMIAAVGKNLELGKDNNLMWSISEDMKFFRTTTAGHTVVMGRL TYESIGRPLPKRRNIVISRNPDYKPEGVETAMSLETALEMCEHNCFIIGGAAIYKLGLE YADEIILTEIDNAYPEADVYFPEFNKDVWNREVIGESEENGLRFSFVKYSKKENA" /locus_tag="LOCUS_4980" /gene="dfrA" /EC_number="1.5.1.3" /note="WP_000637198.1 dihydrofolate reductase (Bacillus) [pid:41.7%, q_cov:98.7%, s_cov:99.4%, Eval:1.0e-30]" /note="MGA_644" CDS 1503..1901 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_080510936.1" /transl_table=11 /codon_start=1 /translation="MKKRLIYALLPLVAIALELSPLGAVLSFANPEGKDFRETYSYFSL MPFGYANFGPFLTAILSSVLLVLMLIYAFTAKETLKTVGAVVCFVACGTSLMPLLFGVK FFSLVGLLISLALFAQLVLALFGDRVKK" /locus_tag="LOCUS_4990" /note="WP_080510936.1 hypothetical protein (Desulfitobacterium hafniense) [pid:33.6%, q_cov:94.7%, s_cov:93.7%, Eval:2.8e-08]" /note="MGA_645" CDS 1929..2315 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRRFIALVLASLLTLSMLCGCSDKVEPFNLSDFEDEIEEYAYSEN LGEIPDAETAKEKAEELWISLYGEWRDIEGEKPFKVFFDEENEVWYVKGALKQPLIPIF GTVKGGTGGLIVTTDGEVLAVWHF" /locus_tag="LOCUS_5000" /note="MGA_646" ORIGIN 1 ccttttttag aaatagtcgc attatatgcg attttcagta gacggaccgc gaaaaatctg 61 ttataatata ttggatatga caatgaaagg ttgggtaaat ctatgtcagt atgggataaa 121 aaatattgcg agctttgcaa aacgattctt gaaaagggca ccgaggttga aaaccgcaca 181 ggtatcaata cggttaaaat tccttcttgg cattttcatc ttgacctttc ggaggaatac 241 ccaattttaa ccactaagca ggtgttcatc cgccaggcga ttttggaaat gctctggata 301 tatcaagcac agtccaacga tgttcgctgg ctgcaggaaa gaaatgtcca catctgggac 361 gaatgggaga tcgatgaaaa cggcttctgg cacgccaagc aaatgcttcc cgacgaaaac 421 ggtaagcccg ttttgcgcga aattcataag gaattcggca agaagtgggc acacaccatc 481 ggcaccgctt acggatatat cgttaagaaa ttcgggctga ctcaagagct gataaataag 541 ctcaaaaaca accccggcga cagaagaatg cttatgtccc tgtggcagaa tgactatttg 601 ccaaccgctg ttttgccctc ctgcgtatgg agtagcgaat gggatgtcac cgacggcaag 661 ctcaacgctt gggttcacca gcgctcctgc gatgttccct tgggactgcc tttcaacgtg 721 acccagtatg caactcttct gtatatgctt gcacaggtca caggtcttaa gccgggcact 781 ctcgattgga gcattaagga cgcacatatt tatgtcaacc agatcgacgg aataaaggaa 841 cagctttccc gctttgaaac ctttggagac ctttctgcgc ccaaactctg gctcaacccc 901 gaggtcaagg atttcttcga ctttgactcg tcagccgagt gtaaggacgt taaactgata 961 gattataagc atatgggcaa aattgttttc ccgattgcac agtaatagtg ggggatataa 1021 aaatggttaa aatgattgcc gctgtcggca aaaatttaga gcttggcaag gacaacaacc 1081 taatgtggag catctcggag gatatgaaat tcttccgcac taccaccgcc ggccacaccg 1141 ttgttatggg cagactcaca tatgaatcaa tcggaaggcc tttgccaaag cgcagaaata 1201 ttgtaatttc ccgcaacccc gattataagc ccgagggcgt tgaaactgcc atgagtcttg 1261 aaacggcact cgaaatgtgt gagcataact gcttcatcat cggcggtgcc gccatatata 1321 agctgggcct tgagtatgcg gatgagataa ttctcaccga gatcgataac gcatatcccg 1381 aggcggatgt atatttccct gagttcaata aagacgtgtg gaatcgcgaa gtaatcggcg 1441 aaagcgagga aaacgggctt aggttcagct ttgtcaaata ctccaaaaag gagaatgcat 1501 aaatgaaaaa acgcttgata tatgcccttt tgccgctggt tgcaatcgct ttggagctgt 1561 cgcctttggg cgcagtgctc agctttgcaa accccgaggg taaggacttt cgcgaaacat 1621 attcatattt cagtctgatg cctttcggct atgccaactt cggcccattt ttaacggcga 1681 ttttaagcag cgtattattg gtgctgatgc tgatatatgc ctttacggca aaagaaacgc 1741 tcaaaaccgt cggagcggtt gtttgctttg tcgcctgcgg aacatcgctg atgccgcttt 1801 tgttcggcgt gaagttcttt tcgcttgtgg gtctgctcat atcccttgca cttttcgccc 1861 agcttgtgct ggcgctgttt ggggataggg tgaagaagta aatagcaaag agaggaagga 1921 acatttctat gagaagattt attgcattag ttttggcgtc gcttcttacg ctttcaatgc 1981 tttgcggatg ctccgacaag gtcgagcctt ttaacctttc tgatttcgag gacgagatcg 2041 aagagtacgc ttacagcgaa aatctcgggg aaattcccga tgccgaaacc gcaaaggaaa 2101 aagccgaaga actttggata tccctctacg gcgaatggag agatattgag ggtgagaagc 2161 cttttaaggt tttctttgat gaagaaaacg aagtctggta tgttaaaggt gcgttgaagc 2221 aacctttaat tcctatattc ggaactgtta aaggcggaac gggcggattg attgtcacta 2281 ccgacggcga agttttggca gtatggcact tttgaaaaag gataagaccg ctctgttctt 2341 aactaatgaa caacagggcg gggaaaatga tgcccctgct tttcggcgtg aagttctttt 2401 cgcttgtggg cttgctcata tctcttgcgc tcttcgctca gttgatgctg gcgctgtttg 2461 gggataggac gaaagaataa acagcattaa gagagaacgg tatgttctct cttttttgtt 2521 tgtattcatc aatcagcata ttacaaatat gcattgaaaa aacgccttgc atcaactata 2581 atataatcag cacatcatta tttatcattt acaaggatgg agcgttatta tgagaagatt 2641 tattgcattg gttttgacgg cagttcttat gttgtcgatg ctttgcgcct gtgccgataa 2701 ttcggcgaat tcggataagc cgagcagctc gatcaacaat gagcctaaaa acgagatcac 2761 cgttgcaagg cagacatcaa gctctgcaaa gattggcgat atcaagcttt atgcccttaa 2821 agagctgacc accacatccc ccgacgggaa tatcaaggca ctcttctggc aggatgaaaa 2881 cggtgcggta tattatagcg ttgaattcgg caaggaagaa gtcatttctc cctcaaagct 2941 tggatttgtt ttgtcaaact gcgatctttc ttcgggcatt gaaactatcc gtgcgtatga 3001 ccgccccgac gagatcgacg atgaatttga aaccgcggag acaatttctc ttaaggatgt 3061 taccttgcgc gaccattgct atgagcgaga aatattcctt gaaaagggcg aagcgggtct 3121 aaccttgcgc gtaagggtat atgacgacgg ctttgcatat agatatgaaa acgtcaccaa 3181 cggcagggaa ggcacggtat atgtcaccaa cgaggcgtcg cagatcaatc ttgctgacga 3241 taccaccgtt tttgcgggtg gatacagcgc cacctatgag gttacatacc acgaatatga 3301 tcaca // LOCUS sequence126 3285 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence126 VERSION sequence126 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3285 /mol_type="genomic DNA" /organism="" /note="sequence126" CDS complement(250..675) /product="GNAT family N-acetyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004082236.1" /transl_table=11 /codon_start=1 /translation="MTIRVYENALPEDALYIRTVVFVEEQGFRDEFDEIDKTCLHLIAY DDDKPIAVCRCFNEHDATSWHIGRMSVLKEYRKKGIGSLVMTKAEEEIVKRGGLEAVLS SQYPVKGFYESLGYTAEGDIYLDEDYPHILMRKRLEK" /locus_tag="LOCUS_5010" /EC_number="2.3.1.-" /note="WP_004082236.1 GNAT family N-acetyltransferase (Thermotoga maritima) [pid:37.9%, q_cov:100.0%, s_cov:100.0%, Eval:5.4e-18]" /note="MGA_649" CDS complement(677..1915) /product="aminopeptidase YwaD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003242515.1" /transl_table=11 /codon_start=1 /translation="MTIEQINNIFNDTAYVRMGGSDDELKCAEYIKKLCKEMNLGDAYI EPFEVDMATIKSATLTVDGIEIPCKGYFNCGSGEVSAPIYYLNNADDKYQLSQCKGKIV IFDGYLRHWLYQDLLENGALGFISYDGNANYVDEDIDQRELRAHVSNGNKILGVNINAK KAIEIINRKAEFAKIAIEQDEYKGESRNVILDIPGICDEYIVFTAHYDSTSLSQGAYDN MSGSVGLLGIAEHFMKTRHKYGLRFIWCGSEERGLLGAKAYCAAHEEELKKVVLNINLD MIGCIMGKFISCCTTEEKLVHYIDYLSLETGFGVSSHQGVYSSDSTPFADKGVPALSFA RIAPPNTATIHNSYDTKSLMSAEQMQEDIWFINQFTERMANAVFCPVAREIPDNMKDEL DVYLARKRKGAKK" /locus_tag="LOCUS_5020" /gene="ywaD" /EC_number="3.4.11.10; 3.4.11.6" /note="WP_003242515.1 aminopeptidase YwaD (Bacillus) [pid:26.3%, q_cov:85.2%, s_cov:78.2%, Eval:6.5e-12]" /note="MGA_650" CDS complement(2070..2774) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNLDEKLIQYRREREISQEALAEQLGVSRQAISKWETGESMPELS NLLAICKIFDTNPNELFGYEAVPTLTAESAKRKSPVWLTVLLVVSLVLNLLLSSAIGLY IYHAYDEHVNAVIQPQGIPEDFGFREISYRIIEVNEHQNTLEIVFRPTATKESYVYGVA VTGSLVSDLFYGELGEDGLVRTEIAIERYALAGDISLFTSSEGVNISYASYSYRFPKDG STYSVIMTETFE" /locus_tag="LOCUS_5030" /note="WP_011836492.1 helix-turn-helix transcriptional regulator (Streptococcus sanguinis) [pid:47.1%, q_cov:28.6%, s_cov:33.2%, Eval:4.5e-10, partial hit]" /note="MGA_651" ORIGIN 1 ctttaaaaac gtcctcaagg tcggcatcca aggcatatgc cgtttccgcc agataccatg 61 cgatgtcgcc aagctcttct aagaggtgct ctcggtcaag ctcgtggcct tgggcaatgt 121 gctttttaac aaggtcgata gcttcgcccg attctccgca aagtcccatc acgccgacaa 181 taagaacatc cttcttgtca agctccttgt tttgggtcac cattgcaagc ttttgatatt 241 ccgaaactgt catttttcca gcctctttct cattaaaatg tgagggtagt cctcgtctaa 301 atatatatca ccctcggcgg tgtagcctaa gctctcataa aaccccttga cgggatattg 361 gcttgagagc accgcttcta atccgccccg ctttacaatt tcctcttctg cttttgtcat 421 tacaagcgaa ccgataccct tttttcggta ttcttttaaa accgacattc tgccgatatg 481 ccacgaagtc gcatcatgct cattaaaaca tctgcaaacg gcaatgggct tgtcgtcgtc 541 ataagcgatg agatgcagac aggtcttgtc gatctcgtcg aattcatcgc ggaagccctg 601 ctcctcgaca aagacaacag tgcggatata cagcgcatcc tcggggagcg cattttcata 661 aacccgaatt gtcattttac ttctttgcgc ccttgcgttt tcttgcaagg tatacatcca 721 actcatcctt catattgtcg ggaatttctc ttgcaacagg gcagaatacg gcatttgcca 781 tcctttcggt aaactgattg ataaaccaga tgtcttcctg catctgttcg gcgctcataa 841 gtgacttggt gtcatatgaa ttgtggatag ttgcggtgtt cggaggcgca attctcgcaa 901 atgagagcgc aggcacgccc ttgtcggcga agggagtcga gtcgcttgaa tatacgccct 961 ggtgggagct cacaccgaag cctgtttcaa ggcttaagta gtcgatataa tgaacaagct 1021 tttcctctgt tgtgcagcag gagataaact tacccataat gcagccgatc atatcgaggt 1081 tgatgtttaa aacaaccttc ttgagttctt cctcgtgggc agcgcaatat gcctttgcgc 1141 ccaaaagtcc gcgttcttcc gaaccgcacc agataaagcg cagaccgtac ttgtggcggg 1201 tcttcataaa gtgttctgca attcccaaaa gaccaacaga gccggacata ttgtcatatg 1261 cgccctggga aagggaagtg gagtcatagt gtgcagtgaa aacaatatat tcatcgcaga 1321 tgccgggaat atcaagaatt acgtttctcg actcgccctt atattcatcc tgttcgattg 1381 caatttttgc aaattctgcc ttgcggttga taatttcaat tgcctttttc gcgttgatgt 1441 taacgcccaa gatcttattg ccgtttgaaa catgcgctct aagctcgcgc tggtcaatat 1501 cctcgtcaac atagtttgcg ttgccgtcat aggaaataaa tcccaaagcg ccgttttcca 1561 aaaggtcctg atataaccag tgacgcagat atccgtcaaa gatcacgatc ttgcccttgc 1621 actgtgaaag ctgatatttg tcgtcagcgt tgttgaggta ataaataggt gcgctgactt 1681 ctcccgagcc gcagttgaaa tatcccttgc aggggatttc gataccgtca acagtcaagg 1741 ttgccgactt gatggttgcc atatcaacct cgaaaggctc gatgtaagca tcaccgaggt 1801 tcatttcctt gcagagcttt ttaatgtatt cggcgcactt gagctcgtca tccgagccac 1861 ccatacgcac ataagcagtg tcgttaaaaa tgttatttat ctgttcaatt gtcatttttg 1921 tgtccctccg tttgaaagtg gttaatataa ttatatcacg gattcggaga atgtaaagag 1981 gggaagcctt cctctgacga gggaggtgcc gagcttgtcg aggcggaggg agagataaca 2041 aaagcccaca caaaggtggg cttgattgtt tattcaaatg tttcagtcat tatcacgctg 2101 taggtcgagc cgtctttggg gaagcggtat gaatatgacg cataactgat atttacgcct 2161 tctgagctgg taaacagcga tatgtcacct gcgagtgcgt atctttcaat tgcgatttct 2221 gttcgtacca gtccgtcctc gcccaattct ccgtaaaaga gatctgatac cagacttcct 2281 gtcactgcaa ctccgtaaac ataactctcc ttcgtggcag ttgggcggaa aacaatctca 2341 agtgtgtttt ggtgctcatt gacctcaatg attcgatagc ttatttctct gaatccgaag 2401 tcttcgggga tgccctgtgg ttggataacg gcatttacat gctcgtcata tgcgtggtag 2461 atatacaaac cgatggcgga gctgagcaat aaattcaaaa caaggctcac aaccagcaga 2521 acggtcagcc aaacggggct ctttcgcttg gctgattctg ctgtgagggt cggtaccgcc 2581 tcatatccaa aaagttcatt ggggttagta tcaaaaattt tgcatatcgc caaaaggttg 2641 gaaagctcgg gcattgattc tcccgtttcc cattttgata ttgcctgcct tgaaacgcca 2701 agctgttcgg caagtgcctc ctgggaaatc tcgcgttcac ggcggtattg tattaacttc 2761 tcgtccaaat tcatatttgt cgactccttt cggctgattt ctgtctttat tatacacgta 2821 actttggttg caatcaacca aaagagcctt gaagtgtatg caacttcaag ttgcaatcgc 2881 cgttttcggt ggttttaggc gtgttttaag gtgttggcag cgctccgcag gaacaagcct 2941 tccccttgag gggaaggtgt cggcgtatgc cgacggatga ggtggatacg gctgagcgcc 3001 ctctccaaaa acaaaagccc acacaaagat gggctttgta agcataaatt attctcaata 3061 gccttcaacg ctgaggcact caaggcttcc cttgccgacc agcttgatat agctgacatc 3121 gtcaagcggg aagctgttgc ctgtttgggt cgcatagctt ccgtcggtat aatacaacct 3181 cacggtcgca ttgctcgaaa gattcagcac aagctcgctt gaatcaatgt tcttatatgc 3241 aagatatgat cttaccgttt caatgttgag gtataggtct tcata // LOCUS sequence127 3236 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence127 VERSION sequence127 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3236 /mol_type="genomic DNA" /organism="" /note="sequence127" tRNA complement(1..73) /product="tRNA-Thr" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0090" /note="Aragorn_9" CDS complement(206..2344) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKNIYGEMFEQLSIPARLEPDNIAKMLDEHMAANTKRASITVSS SDNNIKRSAPKKTHSAAYRVIMSAAACAALVLGLMRYTGATDPKIVVTPPAPGNYASDY SDIHSAFQQYYVDDSDKQTLDSAIAEIEHAYNEAQANEGTDETVTEPEVTTTQPDVTEP PVTTTEAPVTEPAPEEEENVTVTDIEEPEESGVALPDMSGFDRDHGIIIENGRIFVRDG DDIRILSSVDGTLNYDGTVEMLSGVNETKELVEFYVIGNRLAAVYTVETAEVIDSAVPA QEEEFESVLDEIIGDTYAEVAHDVIRHSAEVCIYEFTDGAFYQVYNYTQCGSLVEIKET DGSIYVVTDYNDYRLSPIVGVDDLDSYVPTYSINGVKLFLEPSEILLPSRVTTTDYTVI SGINVAASSINASVQALLGYEGRTVVTDSAVYIFAYESADTSSTSVEKFKLMDGAVMHD GFEVIDGVALSGDGITHNGDTILISTLSNTELGYVTSVKAYDEALEIISKVDLPALLTK AQLDGSKLYLNGSDCAYAIDFLDPAAPALIEITGEKDVLESLVEFEDGYVILTRAEDGS IKLSKIIEDVNGDLSVCYEATVYEAADATSKALINNDVLYVGDGLVGVPYGYFDGYDYC YTYALYRSAGNAFELVGKFESHETDAAFEMGKAIESDGTLYVFSEGRVYAMNATTEALS LIGRADIIYSAYSGHNAW" /locus_tag="LOCUS_5040" /note="MGA_653" CDS complement(2370..2921) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MASGFSELVKKAKKGDSKAFAELYSAIYKELYYYALCNLNNQDDA ADAVSDAVLDAFSGIKNLRDEDAFKGWMLRILTAKIKRKQAEYVRDREYLTSTIMTDDD GEDVIMDIPTRESKYEGIELLDHIESLSQNEKMCFSLNAIYGYTSDEISKLTGINAATV RTYLARGKTKLRKLIDDDMY" /locus_tag="LOCUS_5050" /note="MGA_654" ORIGIN 1 agctggtgga cggactcgaa cccccgacct gctgattaca aatcagctgc tctaccaact 61 gagctacacc agcaagcgct gcaacgaaag ttattctaac atataagttg gctcttgtca 121 agtgcttttt gaaaatattt tttcaaaaat gaaaaccgcg gcgaagattt tttcaacgcc 181 gcgaagtcgt tccgtttttt tgaatttacc aagcgttatg tccgctgtat gccgaataga 241 ttatatctgc acggccgata agcgaaaggg cttcggttgt tgcattcatt gcatacactc 301 tgccttcgga gaagacataa agtgtgccgt ccgattcgat cgccttgccc atttcaaagg 361 cggcatctgt ttcgtgggat tcaaacttgc ccacaagctc aaacgcgttg cccgcagagc 421 gatagagcgc ataagtatag caatagtcgt atccgtcaaa gtagccgtaa ggtacgccta 481 caagtccgtc gccgacatac aaaacgtcgt tattgataag cgccttagag gttgcatcag 541 cagcttcata tacagtcgct tcatagcaaa cgctcaaatc gccgttgacg tcttcaatta 601 tctttgaaag tttgatgctt ccgtcctctg cacgggtcaa aataacgtag ccgtcttcaa 661 attcaacgag ggactccaaa acatccttct cgccggtgat ttcgataagc gcaggagcgg 721 cagggtccaa aaaatcaatc gcatacgcgc agtcgctgcc attgagatat agcttagagc 781 catccaactg tgcctttgtc aaaagcgcag ggagatcaac ctttgagatt atctccaatg 841 cttcgtcata tgccttaacg gatgtgacat agccaagctc ggtgttggaa agagttgata 901 tcagaatggt atcgccgttg tgggtgatgc cgtcgccgct gagcgcaacg ccgtcaataa 961 cttcaaagcc gtcgtgcatt accgcgccgt ccataagctt gaacttttca acagatgtac 1021 tgctggtatc agcagactca taagcgaaga tatatacagc actgtctgtg acaacagttc 1081 tgccttcata tccgagcaaa gcctgaacag aagcgttaat tgatgaagca gccacattaa 1141 taccggaaat tacggtatag tcggtggtgg taactcttga ggggagcaaa atttcggaag 1201 gttccaagaa cagcttaacg ccgttaatgc tgtaggtggg aacatagctg tccaaatcat 1261 caactcccac gatgggagaa agtctgtaat cgttataatc ggttacaaca tagatgcttc 1321 cgtctgtctc cttaatttca acaagacttc cgcactgggt atagttgtat acctgataga 1381 atgctccgtc ggtaaattca taaatgcaga cttcggcgga atgtctgata acatcgtgag 1441 caacctcggc ataagtgtct ccgattatct catccaaaac agattcaaat tcttcttcct 1501 gtgcaggaac agcagagtcg ataacttcgg cagtttcaac ggtatataca gccgccaagc 1561 ggttgccgat aacatagaac tcaaccagct ccttggtttc gttaacgccg gagagcatct 1621 caactgtgcc gtcatagtta agtgtgccgt caacagatga aagaattctg atgtcgtcgc 1681 cgtcgcggac aaagatgcga ccgttttcaa tgatgatgcc gtggtcgcgg tcaaatccgc 1741 tcatatcggg aagcgcaaca ccgctctcct cgggttcttc aatgtcggtg acggtgacat 1801 tttcttcctc ttcgggagca ggctcggtga caggagcttc ggtggtggta acgggaggct 1861 cggtcacatc aggctgagtt gtggtaactt cgggttcggt gacggtctcg tcagttccct 1921 cgtttgcctg tgcttcatta tatgcgtgct cgatctctgc gatggcagag tcaagtgtct 1981 gcttatccga atcgtcaaca taatactgct ggaaggcgct gtgaatatcg ctgtaatcgg 2041 aagcgtagtt gccgggtgcg ggaggtgtga ctacgatctt gggatctgta gcgccggtgt 2101 aacgcataag tcccaatacc aaagcagcac acgcagcagc cgacatgatc actctgtatg 2161 cagcagagtg ggtcttcttg ggtgccgatc tctttatatt gttatcggag gaagaaacgg 2221 ttattgatgc gcgcttggtg tttgcagcca tatgctcgtc gagcatcttg gcaatgttgt 2281 ccggctcaag gcgtgcggga atgcttaact gttcaaacat ttcgccgtaa atattttttg 2341 ccatttatct tcctcctttc tgatgatttt taatacatat cgtcgtcgat tagtttacgc 2401 agcttggttt tacctcttgc aaggtaagtt cttacagtcg ccgcgttgat tcctgtaagt 2461 tttgatatct cgtcgctggt gtagccataa atagcgttca gcgagaagca cattttttcg 2521 ttttgcgaca ggctttcaat atggtccaaa agctcgattc cctcatactt cgactcgcgg 2581 gtgggaatgt ccataattac atcctcgccg tcatcatcgg tcataatggt tgaggttaag 2641 tattcgcggt ctcttacgta ttccgcttgc ttgcgcttga tcttcgccgt gagaattctt 2701 agcatccagc ccttgaaggc gtcctcatcg cggagattct tgatgcctga gaatgcgtcc 2761 aaaacagcat cgctcacagc atcggcggcg tcatcctggt tattcaggtt gcacagcgca 2821 taataataga gctctttata tatagccgaa tagagttcgg caaaagcttt actgtcgcct 2881 ttctttgctt tcttaacaag ctcggaaaag ccggaagcca ttctctcacc tcgaatcata 2941 gacacataga catacagacc cgtggcttgg gcttctgtat attaagtgtc aaatttttgc 3001 gattttgttg catcgattga taaaaaattt tcaaaaatct tcttgtgcaa aatctgccat 3061 tacagtatat cggaaactga gccgacatac acattcatta tacaccaaac gatgtcgaat 3121 tacaagtgat attgtataaa aagcgttttt tgcccgcgcc accgccgccg cacagccgct 3181 catcgcggcg cagcggctcc gacggcgctc accgactgcg aacgccgcac catagg // LOCUS sequence128 3223 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence128 VERSION sequence128 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3223 /mol_type="genomic DNA" /organism="" /note="sequence128" CDS complement(207..809) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MMPEDEYDLAGFAVGIVDKKKILDNTKMAEGDVVIALASSGVHSN GFSLCRKVFDIDNNNPALYVPREELGGKTVAETLLTPTKIYVKSVLALLEQVDVKGISH ITGGGFYENIPRSIPKGLTAKIDKSAVKILPIFELIAKEGNIPERDMFNTYNMGVGMSI TVPADEVDTALEILRACGEDAYVIGHIVKGDEGVIIC" /locus_tag="LOCUS_5060" /note="WP_002209777.1 phosphoribosylformylglycinamidine cyclo-ligase (Yersinia pseudotuberculosis complex) [pid:48.4%, q_cov:96.0%, s_cov:54.2%, Eval:6.6e-51, partial hit]" /note="internal stop codon at [957:959](-),[960:962](-)" /note="MGA_656" CDS complement(960..1256) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MHNQSKSDSYAAAGVDITAGYKAVELMKKHIARTKNEGCLDDVGG FGGCFGLNLMGMEEPVLVSGTDGCGTKVKMAILMDKHDTIGIDAVAMCVNDII" /locus_tag="LOCUS_5070" /note="WP_003242485.1 phosphoribosylformylglycinamidine cyclo-ligase (Bacillus) [pid:62.0%, q_cov:93.9%, s_cov:26.6%, Eval:4.9e-29, partial hit]" /note="internal stop codon at [957:959](-),[960:962](-)" /note="MGA_657" CDS complement(1293..2717) /product="amidophosphoribosyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005795565.1" /transl_table=11 /codon_start=1 /translation="MGGFFGAVCKRDVIEDVFFGTDYHSHLGTRRGGMAAFDRKIGLQR DIHNIENSPFRTKFEHIFEEMKGFSAIGCISDSDPQPLLIRTKLGAYAIATVGKINNAD ELIEKYLFSSNGHFSAMTGGKINSTELVAALIGVKETLAEGIAFAQDVIEGTANILILK NGGDIVAARDKLGRLPVIIGKSEDGYCVSFESFAFQKLGFETVKELGPGEIVELTADKF VQLKAPGEEMRVCAFLWTYYGYPTSKYEGINVENSRYRNGEIIARDDALGGNIPHIDYV GGVPDSGTPHAIGYSAQSKIPFARPFIKYTPTWARSFTPAKQSERNKVAKMKQMPVVEL IKDKDLLFVDDSIVRGTQLRETVEFLYSNGAKSVHMRSACPPIMYGCKYLNFSRATSEM ELITRQTILELEGEEGFKYLEEYSDSKTERGKKMRQAICDKLHFASLEFQSLEGAIESI GLEPCKLCTYCWNGKE" /locus_tag="LOCUS_5080" /note="WP_005795565.1 amidophosphoribosyltransferase (Bacteroides) [pid:47.7%, q_cov:99.6%, s_cov:99.1%, Eval:4.0e-125]" /note="MGA_658" ORIGIN 1 atttcgcttg gtatgttcgc ttgttccgct cttgtgattg caaacgcgtc gggattgttc 61 gatataacga gagatatctc tccgtgtttg ataatgccgg acttttgcgc atcaataaga 121 gcttggaggt ttgttcctcc gccagatacg agaacggcaa cttttacttt tttagtatta 181 ttcatttaga tacctccgac gtgttattaa cagataataa cgccctcgtc gcccttgacg 241 atatgtccga taacatatgc atcctcgcca caagctctga gaatttcaag cgctgtatca 301 acctcatcag cgggaacggt tatactcata ccaacaccca tattgtaggt gttaaacata 361 tctctttcgg gaatgttgcc ttcctttgcg ataagctcga aaatggggag aattttaacc 421 gccgacttgt caatttttgc ggtcaagccc ttggggatgg atctcgggat gttttcatag 481 aatccgccgc ctgtaatgtg gctgatgccc ttgacatcta cctgctccag aagcgccaaa 541 acgctcttaa catatatctt tgtgggggtt aaaagggtct cggcaacggt cttgccgcca 601 agctcttcac gagggacata aagcgcgggg ttattgttat caatatcaaa cacctttctg 661 caaagcgaga agccgtttga atgtacgccg ctggaagcaa gtgcaattac aacatcgccc 721 tctgccattt tggtgttatc caaaatcttt ttcttgtcaa caatgcccac agcaaatcct 781 gcaaggtcat attcatcttc gggcatcatc ttggggtgct ctgcagtttc accgccgatg 841 agcgccgcgc ctgactgaac acagccttca gcaacaccgc tgacgattga atcaatcttt 901 tcgggaatat tattgaagca agcgatatag tcgaggaaga agattggctt cgcacctcat 961 cagataatat cgttaacaca cattgcaacg gcgtcaatgc cgatggtatc gtgcttatcc 1021 attaaaattg ccattttgac cttggtgccg cagccgtcgg tgcccgaaac caaaacgggt 1081 tcttccatac ccataaggtt cagaccgaag caaccgccga agccgccgac atcgtcaaga 1141 cagccttcgt ttttggttct tgcaatgtgc tttttcatta attcaactgc tttgtagcct 1201 gcggtaatgt caacacctgc ggctgcatag ctgtcggatt tggattgatt atgcatagtt 1261 tttctcctcc gaatttattg taaatgttta tattattcct tgccgttcca gcagtatgtg 1321 caaagcttgc agggctcaag tccgattgat tcgatcgcgc cctccagcga ctggaattcg 1381 agcgatgcaa agtgaagctt gtcgcaaatt gcctgacgca ttttcttgcc gcgctcggtc 1441 ttgctgtcgc tgtattcttc gagatattta aagccttcct caccctcaag ctccaaaatt 1501 gtctgacggg tgataagctc catttcgctt gttgcacggg agaagtttaa atatttgcat 1561 ccgtacatta tcggcgggca ggcagagcgc atatgcacac tcttggcacc gttggaatac 1621 aaaaattcaa cagtctcgcg aagctgagtt cctctgacga tcgagtcgtc aacaaagagc 1681 aagtccttgt ccttaatcag ttcaacaacg ggcatctgct tcatttttgc aaccttgttt 1741 ctttccgatt gcttcgcagg agtaaagctt ctcgcccagg tgggggtata tttgatgaaa 1801 ggtcttgcaa aggggatctt tgactgcgcc gaatagccga ttgcgtgggg tgtgcccgaa 1861 tcgggaacgc cgcccacata gtcaatgtgg ggaatatttc cgccgagcgc atcatctctt 1921 gcaataattt cgccgttgcg atagcgggag ttttcaacat ttattccttc atatttggaa 1981 gtggggtagc cgtagtaggt ccaaagaaat gcacacaccc tcatttcctc gccgggtgct 2041 ttaagctgaa caaatttgtc agcagtaagc tcaacgatct cgcccgggcc aagctcttta 2101 accgtttcaa agcccagctt ctggaaggca aaggactcaa aggaaacgca gtagccgtcc 2161 tcgctcttgc cgatgatcac gggaagtcgg ccgagcttgt cgcgtgccgc aacaatgtcg 2221 ccgccgtttt taagaattaa aatgtttgcg gtgccttcaa taacatcctg cgcgaaagcg 2281 atgccctcgg caagagtttc tttaacaccg atgagtgccg caaccaattc ggttgaattg 2341 atcttgccgc ctgtcatcgc gctgaagtgg ccgttgctgc taaaaagata tttctcgatc 2401 agctcgtcgg cgttgttaat tttgccgacg gtggcaatgg cgtatgctcc cagcttggtg 2461 cgaattaaaa gcggctgggg gtcactgtcc gagatacagc cgatggcgga aaagcccttc 2521 atctcttcaa aaatatgctc aaattttgtt ctgaaagggg agttttcaat gttgtgaata 2581 tccctttgca ggccgatttt tctgtcaaat gccgccatac ctccgcgtct tgtgccgagg 2641 tgagagtgat agtcggtgcc gaagaaaaca tcttcaatga catcacgctt gcagacagct 2701 ccgaaaaagc ctcccataga tatttgcctc ctatgcaaaa aagtgattat gcgttaagcg 2761 atgctgtaag tgctgcgtcc ttggctaaaa ctgcctcggc atcggctttt cttttggcgt 2821 caagcttgct tgcaagctcg gcgtcctcaa tagccagcat ctgaatacaa agcaaggcgg 2881 cattaacggc accgtttatc gcaacagttg caacaggtat gcctgaaggc atctgtactg 2941 tggacaaaag ggcgtcaata ccgtccaaat tagttgattt acaggggatt cccacaacgg 3001 gaagggtggt gtttgcggca attgctcccg caaggtgcgc agccatgcct gcggcggcaa 3061 taattgcgcc gaagccgttt gctcttgcat tgagggcgaa atctcttgcc tcaacagggg 3121 ttctgtgagc ggagtaaatg tgtacttcat agggcacgcc gaagctttca agggtatcca 3181 tcgccttttt aacgatgggc atatcgctgt cgctacccat tac // LOCUS sequence129 3222 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence129 VERSION sequence129 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3222 /mol_type="genomic DNA" /organism="" /note="sequence129" CDS 602..2269 /product="DNA mismatch repair protein MutS" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_138361510.1" /transl_table=11 /codon_start=1 /translation="MRITDKVNLFYPDATKQKYAYDRRMALSQYPCSYIDDLEASRVAL MLLPQNPDRVLSLMLELNDDIDTLNYRLDCLEDFLRQPRLSDSFRKIIRRLSDNNKQLE SGETAPNSFMELKMRMDELEVYLNCIDEINFFYDKNRHTIKSQAMTNLFGFFESLPKTT EFTAVKTNLSELREIFSKTIKSVKIGINFTHDMTPDVCGILEVSSKKIYPKGNVLDRLI FKTYQGFEQFEGEEHINSATRHQPSDMDTVLFKELDKYTKDFTRRISTAIKSYRELFFS DIYELEHQLDFYDGVVNFIGFVRSRGLEMTRPKLMPKSERKLSLTNAFDLCFFRQAVSS DYKKMGDELIVRNDLDMQDEQFYLITGANNGGKTTFARGVGLCQLLAQIGVYVPAESAE ISPVDYIFTHFPKEEEIGIDSSRFTTEIKQLRTICDLITPDSMVIMNESIQSTTPDECL EIAYRHLEILSAVGVRGMYVTHLNGLYDKALEINKKDYPSKIGSLVSAVDEATGKRLYK MEKKPPVLGSMAYTVYDNFGAKLDDVMRRLGKFERCPQ" /locus_tag="LOCUS_5090" /note="WP_138361510.1 DNA mismatch repair protein MutS (Klebsiella indica) [pid:25.2%, q_cov:89.5%, s_cov:93.8%, Eval:1.8e-26]" /note="MGA_661" CDS 2266..2472 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLVTILMALFCAIILFFTFFGEMLFYEAKPQVTTHSVYSMYTA DGNIAPIIPKECLIDGKYIYVVT" /locus_tag="LOCUS_5100" /note="MGA_662" CDS 2521..2646 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTQEYDEGYYLVIEGNLRNGEKVIVTADRPFENGDKVTVVE" /locus_tag="LOCUS_5110" /note="MGA_663" ORIGIN 1 cccgaacgag cttattgatt gcacagcctt ggaaacaaca tccgttttca aaactttccg 61 ttatgctgtt atcccacaaa ttaaacctgc aattgtatcg ctggcaatcc tcatcttctg 121 tgagagctgg aatatggttg atcaagcact catcttctcg atggaaaacg acgagataat 181 gccactttcg gttatgctct cggagattcc ggcagatgtt tcctacgccg gcggagcagt 241 atatatgttc ccgataatca tgctgtttgt aatgttccgt gaaaccttgg aagaatccat 301 ggagagttat aagttttagc cttccccttg agggaaggtg tcggcggatg ccgacggatg 361 aggtgaaacg tttggtaagt ctcaaactct tcgcccaccg ctcggcgcca cctgcttcga 421 ctcgccttct gctcacctcg cagacggcgc cacgctcctt cgtcatccct accaattcgc 481 ccttgaaatt ttgtacgaaa cgcagatttt cacctcccat ttgccaactc ccgcaacctt 541 tgccctcaaa aagttgttat attatatgac aagccacgta ccgtccgcaa aggagaatgt 601 tatgagaatt accgacaaag ttaacctttt ctatcccgat gctacaaagc aaaagtatgc 661 ctacgaccgc cgtatggcac tttcgcagta cccttgttcg tacatcgacg acctcgaagc 721 gagccgagtt gcgcttatgc tcctgccgca aaatcctgat agggtgctga gcttaatgct 781 cgagctaaac gacgacatcg acacgcttaa ctaccgcctt gattgcttgg aggatttttt 841 gcgccagccg aggctgtcgg actcctttcg caagataatc cgccgacttt cggataacaa 901 caaacagctc gaatcgggcg aaactgcgcc caactcgttt atggagctga aaatgcggat 961 ggatgagctt gaggtctacc ttaactgcat tgacgaaatc aactttttct atgacaaaaa 1021 ccgccacaca atcaaatcgc aggcaatgac aaacctcttt ggcttttttg aatcattacc 1081 caaaacgaca gagttcaccg ctgtaaaaac caatctttcg gagcttcgcg agattttctc 1141 taagactata aagagcgtca aaatcggcat caacttcacc cacgatatga cccccgacgt 1201 atgcggaatt ttagaggtct catcaaagaa gatctacccc aagggcaacg tcctcgatag 1261 gctgattttc aagacctacc aaggcttcga gcagtttgag ggcgaggagc atatcaactc 1321 cgcaacaagg catcagccgt cggatatgga caccgtactt ttcaaggagc tcgacaaata 1381 caccaaggat tttacccgcc gtatttcaac cgcaatcaaa agctaccgtg agctgttttt 1441 cagcgatatt tatgaacttg aacaccaact cgacttctac gacggagtgg ttaatttcat 1501 cggctttgtc cgctcccgcg ggcttgaaat gacaagaccg aagcttatgc caaaaagcga 1561 gcgcaagctc agtcttacaa acgcctttga cctctgcttc ttcaggcagg cggtatcttc 1621 ggactataaa aagatgggcg atgagctaat cgtgcgcaac gatcttgata tgcaagatga 1681 gcagttttat cttatcacgg gtgccaacaa cggcgggaag accacctttg caagaggtgt 1741 gggtctttgt caactccttg ctcaaattgg tgtttatgtc cctgctgaaa gtgccgagat 1801 ctcacccgtt gattacatat tcactcactt tcccaaggaa gaagagatcg gcatcgacag 1861 cagtcgattc accactgaaa ttaaacagct ccgaaccatc tgtgacctca tcacccctga 1921 cagcatggtg ataatgaacg aatctatcca atcgaccacg cccgatgagt gcctcgaaat 1981 cgcataccgc caccttgaaa ttttgtcggc ggtgggagta agaggaatgt acgtcaccca 2041 cctcaatggg ctctacgaca aagccctcga gataaacaaa aaggactacc catcaaagat 2101 aggcagtctt gtttctgcag tagatgaagc gacgggcaag cgcctttata aaatggagaa 2161 aaaaccgcct gttttgggaa gtatggctta cacagtatat gataactttg gcgcaaagct 2221 tgatgacgtt atgagaaggc ttggaaaatt cgaaaggtgc ccccaatgaa aaaactagtt 2281 acaattctaa tggcgctctt ttgcgcgatc atactcttct tcaccttttt cggcgaaatg 2341 ctcttctatg aagccaagcc ccaggtgacg actcactctg tatattcaat gtataccgct 2401 gacggcaaca tagctcctat aattccaaaa gagtgtctta ttgatggtaa gtatatctat 2461 gtggtgacct agacccaagg tttctctgct gagatatgct ccgcagaagc gcgtgaagtc 2521 gtgactcaag aatacgacga aggctactat ctcgtcatcg aaggcaacct tcgcaacggc 2581 gagaaggtca tcgtcactgc cgatcgacca tttgagaatg gagataaagt aactgtagta 2641 gaatagaaac aaaatccccg agaggagtac tctcggggat tttgaatgcg attatgtatt 2701 actgtatacg ttacaaaact cctttttgag tctcaacata acttttgaat atatcgccaa 2761 ctactatcgt tcttgtcgtt ttttgaccat ttgtgtaaac ctcgttgaat tacaaattat 2821 acatcattaa agtgatagtg agactgattg acaaattggt tgagcttatt tgtgaagcgg 2881 agcgtgatga caatgcggcg tgatacatat acagccgatg ccgagtcata cagaactccg 2941 atgctcgttt gtgaaatgat tgtgcgtcag gaatattcat ttgcagtatg cccgagatgc 3001 aaggtttcgt tagaaagaga atatcagaac tattgcgaca gatgcggcca ggcactcaaa 3061 tggagccggt ataggtatgc gaaggtgata actttaggta atggatgtta ggggagaggg 3121 gttacttttc gctggttcat ttccggtcag gaagaaaata tatctatgga aacgaacgtt 3181 taaattctat attcgtgcaa tgaaaaaagc ccgataaatc gg // LOCUS sequence130 3216 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence130 VERSION sequence130 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3216 /mol_type="genomic DNA" /organism="" /note="sequence130" CDS 188..1963 /product="aspartate--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004454140.1" /transl_table=11 /codon_start=1 /translation="MDTMGNLRRSHYCAEIPLTPCEVVVCGFVQKIRDLGNLIFIDLRD RTGIVQLAFGDDTARDVFEKASTIRNEYVIMARGNVTPRESINKDIKTGTVEIRVTELK ILAKSQTPPFEVANSGKVNDELKLKYRYLDLRSRELTENILMRHKIAKVTREYFYENDF VEIETPMMIRSTPEGARDYLVPSRVHEGKFYDLPQSPQIYKQLLMVSGFDRYIQLARCF RDEDLRADRQPEFTQIDLEMSFVDVEDILQIGEGFMKRLFKEVKGIDIETPLPRLTFAD AMNRYGSDKPDTRFGMEIQDLSETVKDIDFVVFKSAIENGGSVRAIVAKNAAGVYTRKE IDKLTEHAKGIGAKGLAYIRWVDDEPNCSFAKFLKEGELDEIINKLGAKKGDVVLFVAD KNKVVLPVLGALRLIVAKRLDIIPKDKFNLLWIVEMPFFEYNEETGNWDAMHYPFTMPL DECIEYLDTDPGAVRAKCYDLVLNGVELCSGSIRITDYELQQRMFRSLGLTDEEIEAKF GFLVEAYKYGAPPHGGMGLGLDRITMLLCGADSLRDVLAFPKVQNASELMSACPATVDD IQLKDLHIAVVKDEK" /locus_tag="LOCUS_5120" /gene="aspS" /EC_number="6.1.1.12" /note="WP_004454140.1 aspartate--tRNA ligase (Clostridioides difficile) [pid:51.6%, q_cov:100.0%, s_cov:100.0%, Eval:8.3e-179]" /note="MGA_665" CDS 2196..2315 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MCATVLIDDYSASAFSALALLLIHNRTSVAKCKNTLIQV" /locus_tag="LOCUS_5130" /note="MGA_666" CDS complement(2403..3188) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNITNFGCGSICGGNNDCNKGKGCNCKDHDRFPGCGHGCLACCIG PQGPAGPTGPQGPQGETGPQGPAGATGATGATGPQGPVGATGATGPQGPAGATGATGPQ GPAGPVGPTGPQGPAGVTGYASVYNLATQTVASDEEVLFDSNGANSTIVTHTAGASDIT FNEAGVYLVYVRTVAQTNARFALYLNTDPVTGGIFSSGPVGTTTEGMAIITADEGDVLT LVNLEVDNIVLNGATTGTGSTINTVNGQIVILKLADTTE" /locus_tag="LOCUS_5140" /note="MGA_667" ORIGIN 1 atatctacag ccaaaaagcc gatagaatcg cattcacgtt atgccaaaaa atcaaactga 61 cattggcaat ctcggcatta ttgcttttcg ggcgaccacg cagggtcgcc cctgataatc 121 aactataggg tcgggcctgt gtgcccgacc aataacccca cactacaata taaaggagaa 181 taacactatg gacactatgg gtaaccttcg ccgcagccat tactgcgccg aaattcctct 241 taccccctgc gaagtcgttg tttgcggctt tgtgcagaag atcagagatt tgggaaatct 301 cattttcatc gacctgcgcg accgcacagg cattgttcag ctcgcttttg gcgatgacac 361 cgcacgcgat gtctttgaaa aggcatcgac catccgcaac gaatacgtaa ttatggcacg 421 cggtaatgtc acacccagag aaagcatcaa caaggatatc aaaaccggta ccgttgaaat 481 tcgcgttacc gaactgaaga tccttgcaaa gagccagacc cctcccttcg aggttgcaaa 541 ctccggaaag gtaaacgatg agctcaagct caaatatcgt tatcttgacc ttagaagccg 601 tgagctcacc gagaacattt tgatgcgcca taagatcgca aaggtcacca gagagtattt 661 ctatgaaaac gacttcgttg aaattgaaac acctatgatg atccgttcaa ctcccgaggg 721 cgcacgcgac tatctcgttc cttcccgagt tcacgagggc aagttctatg atcttcccca 781 gtcaccccag atatataagc agcttttgat ggtttcggga tttgaccgct acattcagct 841 tgcccgttgc ttccgcgatg aggacttgcg cgctgaccgt cagcccgaat tcacccagat 901 cgaccttgaa atgtcatttg ttgacgttga ggatattttg cagatcggcg aaggctttat 961 gaagcgcctc tttaaggaag ttaagggcat cgacattgaa actcctttgc ccagactcac 1021 ctttgccgac gctatgaacc gttacggctc cgataagccc gacacccgct tcggaatgga 1081 gattcaggac ttgagcgaaa ccgttaagga tattgacttt gttgtattca agtcggcaat 1141 cgaaaacggc ggctcggtaa gagcaatagt tgcaaagaat gccgcaggcg tatatacaag 1201 aaaagagatc gacaagctga ccgagcacgc aaagggcatc ggcgcaaagg gacttgcata 1261 catccgctgg gttgacgatg aacctaactg ctcatttgct aagttcctca aggaaggtga 1321 gcttgatgaa ataatcaaca agctcggtgc caaaaagggc gacgttgttc tctttgttgc 1381 agacaagaac aaggtagtgc tccccgtttt gggtgcgctc cgtctgatcg ttgcaaagcg 1441 tcttgacatt attcccaagg ataagttcaa cctgctctgg atcgttgaaa tgcccttctt 1501 tgaatataac gaagaaacag gcaactggga tgctatgcat taccccttca caatgccttt 1561 ggacgaatgc atcgaatatc tcgacaccga tccgggcgct gtaagagcca agtgctatga 1621 ccttgttttg aacggcgttg agctttgctc cggctcaatt cgtattaccg actatgagct 1681 tcagcagaga atgttccgct cgctgggact tacagacgag gaaattgaag caaagttcgg 1741 cttcttggtt gaagcttata agtacggtgc accgcctcac ggcggaatgg gcctcggcct 1801 cgacagaatc acaatgcttc tttgcggcgc tgattctctg cgcgacgttc tcgccttccc 1861 gaaggtgcag aatgcaagcg agcttatgtc cgcttgcccc gcaacagttg acgacattca 1921 gcttaaagac ctgcatattg cagttgttaa ggacgaaaag tgatataaaa agtccactcc 1981 caagagtgga cttttttaat taataatgaa tgatgaataa tgaatagaga ataataaata 2041 gtaggggcag gcctgtgtgc ctgcccacct aatcaacgat aagtggcgat taacaagcaa 2101 acggttgcaa gggttatgac agaaaagata atttccatcc atatgcgcaa tttgcggaat 2161 tcttcgttgc ttaaccacgg agtagcgcag ccgcaatgtg cgcaacggtt ctgattgatg 2221 actacagtgc ttccgcattt tctgcacttg cgctcttgct tattcataat cgaacctccg 2281 ttgcaaaatg taagaatact ctaatacaag tatagatagc aagcggccga ttgtcaatgg 2341 acgggattgt ctttttggag ggtctttatg tgggcgggga cacagccccg cccgtttttt 2401 gattattccg tggtgtctgc cagtttcaaa attacgatct ggccgttgac tgtgttgatg 2461 gtggagcctg tgcctgttgt tgcgccgttg aggacaatgt tatcgacctc gaggttgaca 2521 agtgtcaaca cgtcgccttc atctgcggtg atgatcgcca ttccctcggt ggtggtgcca 2581 acggggccgg acgagaagat tccgcctgta acagggtcgg tgttgagata aagagcgaat 2641 cttgcattgg tctgtgcaac cgttctgaca tatacaagat atacgcctgc ttcgttgaag 2701 gtgatgtccg atgcacctgc ggtatgggtc acaatggtgg agtttgcgcc gttggagtca 2761 aacaaaacct cttcgtccga tgcaacggtc tgggttgcaa ggttatagac agaggcatag 2821 cctgttacgc cggcagggcc ctgaggacct gtgggaccta cgggaccggc agggccctgg 2881 ggacctgttg ctcctgttgc acctgcgggg ccctgggggc ccgttgctcc cgttgcgcct 2941 acaggaccct gaggaccggt cgcaccggtg gcacctgttg cacctgcagg accctgggga 3001 cctgtttcac cctgaggtcc ctgaggaccg gtggggcctg cgggaccctg aggaccgata 3061 caacaagcca gacagccgtg tccgcagccg gggaatctat cgtgatcttt acaattacag 3121 cccttgccct tattgcagtc attatttccg ccgcagatac tgccgcagcc aaaattggtg 3181 atattcataa ttgattaaac ctttcctttc gcagtc // LOCUS sequence131 3166 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence131 VERSION sequence131 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3166 /mol_type="genomic DNA" /organism="" /note="sequence131" CDS 357..1052 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKALNIVKSILVWAICIFTVMIMIFTVISVTTFDRNDRSIFGYK AFIVLSDSMAATDFNAGDVVLVKEVDPTTLEAGDIICFSSADPDNYGETVTHKIRALTT DKDGNPAFITYGTSTDTDDKTPVTYPFIKGQYFGRIPYAGTFFRFLKTTPGYICCILVP FMLLILSQAVNSIKLFRAYKNEQSEAIEAERAKLAAERAESMEMLKELQALKAQLAAMK GDGESKPEE" /locus_tag="LOCUS_5150" /note="MGA_668" CDS complement(1098..1286) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIECTCTHCIYQENNRCMLDNIEVSYGGMCHSAILIYIEDEELEA RKKAQRDYLDMVDDELE" /locus_tag="LOCUS_5160" /note="MGA_669" CDS 1398..1577 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFKVDNELKSANVPRTVRFTEPLFEKLNEVASENGISFNLLVLQC CKYALDNMENNGDK" /locus_tag="LOCUS_5170" /note="MGA_670" CDS 1745..3118 /product="MATE family efflux transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002682366.1" /transl_table=11 /codon_start=1 /translation="MRTHEIRMTEGSIASNMIRFAIPLFLGNLFQQLYNTADTFIVGKL IGNDALAAVSSTGSLVFLLVGFFGGIAAGGGIVISQRFGAKNYEEMSRAIHTNLALSLT AAVILTLFGTLFTPQILIWMDTPADVLPRSIEYIRVYFAGCTGMVMYNCCMGIMQAVGD SRHPLYYLIISSCFNVVLDIAFIALFKMDVGGAALATIISQFLSVFLCLRRLVKTDAEY KVSFKKIRLYPDMAKLIIRYGLPSGLSNSMIALANVMVQSNINAFGKMAMAGNGAYAKL EGFAFLPVNCFTSAITTFVGQNLGAGEIERAKKGVRFGVACSMAIAEIIGVILFVGSPF LIGLFTEEAESVAYGVMKSNACSLFFFMLAATHCLSAVMRGAGKATVPMATMLICWCAV RVISLSVLVPITQSIHIVNWIFPITWSLSTVVLLIYYLKVDWIGDFAKNKASAKVSEP" /locus_tag="LOCUS_5180" /note="WP_002682366.1 MATE family efflux transporter (Treponema denticola) [pid:34.5%, q_cov:95.4%, s_cov:97.6%, Eval:1.3e-72]" /note="MGA_671" ORIGIN 1 cacgtatttt ttgttctaac aaaactttgg cgcgaaattg ggtcaaaacc aattccaagc 61 atagcgagga atttgttttt agaatcccca aattgtttca tttttaaatc acattgaact 121 ctggcaaaaa attgggtcaa aaccaattcc aagcatagca aggaatttgt ttttagaatc 181 cccgaatatt tgatgcaccc aacagggtgc cttttgggct tattgcaaga ttattcgatt 241 tgagccccga gtttgcaaaa aacgctattt ttttcacacc tctttacaaa ttacactaaa 301 gtgtgttatt ataataaaaa tatacttgga ttaactatgc aaggggatac ataaatatga 361 aaaaagcatt aaatatcgtc aagtcgatac tggtttgggc gatctgcatt tttacggtta 421 tgataatgat attcactgta atttccgtta ccaccttcga ccgcaatgac cgtagcattt 481 tcggctataa ggctttcatc gttttgtccg actcaatggc agccaccgac ttcaacgcgg 541 gcgatgttgt attggtcaag gaagttgacc ccactaccct tgaggcaggg gatatcatct 601 gcttcagctc tgccgacccc gacaactacg gcgaaaccgt aacccataag atcagagctt 661 taactaccga taaagacggc aatcctgctt tcatcaccta cggtacatcc accgataccg 721 acgataaaac tcccgtgaca tatcccttca tcaagggcca gtatttcggc agaatccctt 781 atgcgggaac attcttccgc ttcttaaaga ccactcccgg atacatctgc tgtattcttg 841 tgccgtttat gcttttgatt ctgtcgcagg ctgtcaactc aatcaagctc ttccgcgctt 901 ataagaatga gcagtcggaa gcaattgagg cagagcgtgc aaagcttgct gctgagcgtg 961 cggaatcaat ggagatgctc aaggagcttc aggctctcaa ggctcagctt gccgcgatga 1021 agggcgatgg cgagagcaag cccgaagaat aataaaaaat agcaaaatcc ccgactacgg 1081 tcggggattt ttatgcacta ctcaagctcg tcatcgacca tatccagata gtccctttga 1141 gccttttttc ttgcttcaag ttcttcatct tcaatgtata tcagaattgc gctgtgacac 1201 attccgccgt aacttacttc aatattgtcc agcatacatc gattattttc ttggtatatg 1261 cagtgtgtac aggtacattc aatcattgat atcatcctcc ttataatgta atataacaca 1321 ttgtcccaac taatgcaacc ataaatggtt atattattat aaccgaaatt ggcataatat 1381 attattgggt gatgaaaatg ttcaaagttg ataatgaact caaaagtgcc aatgtgccga 1441 gaaccgtcag atttaccgag cctttgtttg aaaaactgaa tgaagtcgct tctgaaaacg 1501 gcatatcttt caatctgctt gttttgcaat gttgcaaata tgcattggat aatatggaga 1561 ataacggcga taaataaatc aatccccgac tgcggtcggg gattattttt ttgtgtgccc 1621 cgccgctcgg ccacctgccg cacgccttcg gcacctcggc agacggcctc gctttttctt 1681 gcattccccg acacatagtg ctataatatc ccttgtatat ttatagaaag accggtttta 1741 tcctatgcgc acacacgaaa ttagaatgac cgagggctcg atcgcctcaa atatgattcg 1801 ctttgcgatt cctctgttct tgggaaacct cttccaacaa ttatataaca ctgcggatac 1861 cttcattgtc ggcaagctta tcggcaacga cgctttggcg gctgtttcat caacgggaag 1921 ccttgtcttt ttgctggttg gcttctttgg cggtattgcc gcaggtggcg gcattgtaat 1981 ttcccaacgc ttcggagcga agaattacga agaaatgagc cgtgcgattc acaccaatct 2041 ggcgctttct ttaactgccg ccgtaatact cacacttttc ggcaccttgt tcactccaca 2101 gatactcatc tggatggaca ctcccgccga tgttttgccc cgctcgatcg aatatatcag 2161 ggtctacttc gcgggctgta caggtatggt tatgtataac tgctgtatgg gcattatgca 2221 ggctgtcgga gattcccgcc atccgttata ttatcttata atttcctctt gctttaatgt 2281 cgttctggat atcgcattca ttgctctgtt taaaatggat gtcggcggcg cggctttggc 2341 gacaattatt tctcagtttt taagcgtttt cctctgtctg cgcagacttg ttaaaaccga 2401 cgcggaatat aaagtcagct tcaaaaagat tcgcctatat cccgatatgg ctaagcttat 2461 aatcaggtat ggcttgcctt cgggtctttc aaattcaatg attgcccttg caaacgtaat 2521 ggtacagtca aatatcaatg ccttcggcaa aatggcaatg gcgggcaacg gcgcatatgc 2581 caagcttgag ggctttgctt tcctgcctgt aaattgcttc acctctgcaa tcaccacatt 2641 tgtcggtcag aatctcggcg caggggagat cgaacgagcc aaaaagggcg ttcgcttcgg 2701 cgttgcctgc tcaatggcaa ttgccgagat aatcggtgtg attttgttcg tcggctctcc 2761 cttcttaatc ggtttgttca ccgaagaggc tgaatcggtt gcatacggtg ttatgaaatc 2821 caacgcttgc tcgctgttct tctttatgct tgcggcaact cattgccttt ctgcggttat 2881 gcgcggcgca ggcaaagcaa cagttccaat ggcaacaatg ctcatttgct ggtgcgcggt 2941 gcgcgtaatt tctctttccg tgctggtgcc gataacccaa tccatacata tcgtcaactg 3001 gattttcccg ataacatgga gccttagcac ggtagttctc ttaatctatt acctcaaggt 3061 cgattggatc ggcgactttg ccaaaaacaa agcttctgcc aaagtcagcg agccataatc 3121 accgggggat gtatcactcg tacctgcgct gattgactat ggcgcg // LOCUS sequence132 3162 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence132 VERSION sequence132 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3162 /mol_type="genomic DNA" /organism="" /note="sequence132" misc_feature <1..676 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012048395.1:radical SAM protein" /note="WP_012048395.1 radical SAM protein (Clostridium botulinum) [pid:48.6%, q_cov:98.2%, s_cov:74.2%, Eval:2.2e-56, partial hit]" /note="MGA_672" /locus_tag="LOCUS_5190" CDS complement(711..1220) /product="AAA family ATPase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000767065.1" /transl_table=11 /codon_start=1 /translation="MTVGQELMKITDLRLFHNHMTIEPVLEIFNDFNVNAILRMREVIF EEFAKSNNYGMIFTFMWAFDCEEDWKIHDSVLSIFDNYNTEYYYVELTAPLEVRLARNS TENRLANKASKRNIEASNARLISMDQTHRFESYDGELKFDNYIKIDNTDKSPMEVAKLI KETFNL" /locus_tag="LOCUS_5200" /note="WP_000767065.1 AAA family ATPase (Bacillus cereus) [pid:48.6%, q_cov:100.0%, s_cov:92.5%, Eval:7.2e-36]" /note="MGA_673" CDS complement(1265..2122) /product="16S rRNA (adenine(1518)-N(6)/adenine(1519)-N(6))-dimethyltransferase RsmA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003226751.1" /transl_table=11 /codon_start=1 /translation="MDNLSNIGVIKQILSDHGFTFSKKLGQNFLINPSVCPRIAEMGNA KEGFGVIEIGPGIGVLTNELAKRADRVVAIEIDDRLPPILEKTLEEHKNVKVINDDVLN VDLHKLIEEEFAGLDVAVCANLPYYITSPIIMMLLESRLPIKSITTMVQKEAGQRLCAQ MGTRDTGAVTVAVNFYAEAKILFNVSRGSFMPAPNVDSCVIRFDLREQTPSVSDEKFFF KVVRGMFSQRRKTLLNCVSGSLGIGKETVLEAIEKSGISPTARPEQLSMDEMIRLSENL KEVM" /locus_tag="LOCUS_5210" /gene="rsmA" /EC_number="2.1.1.182" /note="WP_003226751.1 16S rRNA (adenine(1518)-N(6)/adenine(1519)-N(6))-dimethyltransferase RsmA (Bacillus) [pid:47.9%, q_cov:96.5%, s_cov:95.9%, Eval:1.4e-65]" /note="MGA_674" CDS 2237..2413 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGPITKLYHLQNMSMADISAMMSSSEFKNYIELHHRTKRVMPENI AKTENEDEANDKI" /locus_tag="LOCUS_5220" /note="MGA_675" misc_feature complement(2465..>3162) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003384678.1:translation elongation factor Ts" /note="WP_003384678.1 translation elongation factor Ts (Clostridium) [pid:42.6%, q_cov:99.6%, s_cov:75.2%, Eval:1.3e-46]" /note="MGA_676" /locus_tag="LOCUS_5230" ORIGIN 1 aataagccag cttgacaagg gatatgccat tactgttaat gaactggcag atatattcct 61 gcagttgcag gaaaaaggcg cacacaatat aaaccttgtc agtccgaccc catatgtgcc 121 acatatcatc aaagcgcttg atatggttaa aggaaagctg acaattcctg tggtatataa 181 ctgcggcgga tatgagagaa ttgaaaccat taaaacgctc gagagttatg tgcagatata 241 tctgcctgat ttgaaatatt ttgacgatac atatgccaag gaatattcgg gcgcaaacga 301 ctattttgaa actgcaatgg gagcaatcaa agaaatggtc agacaggtcg gtaagccgag 361 atttgatgat aacggaataa tgcagagcgg cgtaattgtt cgccacttgg ctctcccctc 421 cttgcggcag gactcagcaa aggttattga tgcacttggc aaagaatttg cgcgtgatga 481 gataatgctc agccttatga gccaatacat tccgatgcat aaggccatag gacacccaaa 541 gctcggcaga agaatatcaa catttgaata taataaggtt ttggaaacag cgagcaagtt 601 tggttacgag ggcttttcgc aggagcgaag ctcatccagc gaggtttacg ttccgccgtt 661 tacagacaaa aaataatgca gtaccacggt ttcgggtact gcatttatac ttatagatta 721 aatgtttctt tgattaattt tgcgacttcc atcggagatt tgtcagtgtt atcaatttta 781 atatagttat caaacttgag ttcaccatca tagctttcaa atctatgggt ttggtccatt 841 gaaatgagcc gtgcgtttga tgcctcaata tttcgcttag aggccttgtt tgcaagcctg 901 ttttcagttg aattccgtgc aagtctgact tcaagcggag ctgtcaattc aacataataa 961 tattcggtat tatagttatc gaaaattgaa agaacactat catgaatttt ccaatcctct 1021 tcgcaatcaa aggcccacat aaatgtaaaa atcattccgt agttatttga tttggcaaat 1081 tcttcaaata tcacttcacg cattcttaaa atcgcgttca cgttgaaatc gttgaaaatt 1141 tcaaggacag gttcaatagt catatgattg tggaacagcc ttaaatcagt aatcttcata 1201 agctcttgac cgacagtcat tttcccgaca gccccatcgc caaataagaa taccaacttc 1261 aaatttacat cacctctttg agattctcgc ttaagcggat catttcatcc attgaaagct 1321 gttcaggacg agcggtggga gaaatgcccg acttttcaat cgcttcaagt acagtttctt 1381 ttccaattcc caacgaaccg ctgacacagt tgagaagcgt tttacgacgc tgagagaaca 1441 ttcccctcac gactttgaaa aagaactttt catcgctgac cgaaggagtc tgttcacgca 1501 gatcaaatcg gattacacag ctatccacat tcggcgcggg cataaagctt ccgcgggaaa 1561 cattaaacaa aatcttcgcc tcggcataga aattaacagc aactgtcaca gcgcccgtat 1621 ctcgggtgcc catttgtgcg caaaggcgct ggccggcctc tttttgaacc attgtcgtga 1681 ttgatttgat cggcaagcgg gattcaagaa gcatcattat aattggcgat gtgatgtaat 1741 atggcaagtt cgcacagaca gcaacatcaa gacctgcaaa ttcttcttca ataagcttat 1801 gcaggtctac attgagaacg tcatcattta tgaccttaac gtttttatgc tcctcaagtg 1861 tcttttccag aattggcggc aaacggtcat caatttcaat tgcaactacc ctatcggcgc 1921 gcttagcaag ctcgtttgtc aaaactccga tgccggggcc gatctcaatt acgccaaagc 1981 cttcttttgc attgcccatt tcggcaattc tcgggcaaac agaaggattt attaaaaagt 2041 tctgacccag cttttttgaa aaggtaaaac cgtggtcgga aagaatttgt ttaattacac 2101 cgatgtttga aagattatcc ataatttact ccatttgaag aattatatat tgattatagc 2161 aagcattttc atttaagtca ataaagcata tttttgcttc atttgttaat aataaatcaa 2221 aaacaaagga gcaaatatgg gaccgattac aaagctttac catctccaaa atatgtccat 2281 ggcagatata tcggcgatga tgtcgtcaag tgaatttaaa aactatatcg agcttcacca 2341 tcgcacaaaa cgagttatgc ctgaaaatat cgcgaagact gagaatgaag atgaggctaa 2401 cgataagata taaaaaacaa ggcaaccgcg gttttgcgat tgccttgatt cttttgcttt 2461 aaaattactt catcatggaa gctacttcag ctgcaaagtc atcggatctc ttctcgattc 2521 cttcgcctct ttcgtagcga acatattcag caaccttgat ggagccgccg aggtccttag 2581 cgcacttgtc aacgtacttg ccaacagtgt agtcgccatc cttaacgaat tccatatcta 2641 cgaggcagtt ttcagagtag tacttgccaa ccttgccttc aacgatcttg accattacag 2701 cctcaggctt gttagccatc ttgggatctt ccttcatctg agcaagcatg atgttctttt 2761 cgttttcaag aacttctgca ggaacatgat ctctgtcgag atatgcaggg ttcatagcag 2821 cgatctgaag agcaacgtcc ttaccgcaag caagagcctt gtcgcccaaa tcggtatcaa 2881 gcttaaccat aacgccgatt ctgccttcac cgtgaatgta agataccaag gtgccttcca 2941 ttcttgtgaa tcttctgatc tgaatgtttt ctctgatctg gaggaatact tcctgaacct 3001 cttcgtcgat ggttctgtca gagtcaacag acttgcaagc cttcaaagct tcaacgtcag 3061 cagggttgca agcaatcagg ttctgagcga tggtgttaac caagcccttg aactgatcgg 3121 tgttagcaac gaagtcggtt tcggagttaa cctcaacaac aa // LOCUS sequence133 3145 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence133 VERSION sequence133 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3145 /mol_type="genomic DNA" /organism="" /note="sequence133" CDS 68..289 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTYTLLAVSSITYAMKGKRLLNGMGYYCEIEKTPKGLSSGCGHSL RVRDDPEVICSLLRRNGIDTRDRMTVNR" /locus_tag="LOCUS_5240" /note="MGA_677" CDS 389..1438 /product="aminotransferase class V-fold PLP-dependent enzyme" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_041272645.1" /transl_table=11 /codon_start=1 /translation="MGGNPGRGGHSFSRVSSEIIFNCREEAASLFGASPENVVFTANCT HALNAAIKGVCSRNDHIVISSMEHNSVARPCYRLAKEGARVEVAMVGRSDDETISNFTR LITDDTKCVICTAASNVTGRIMPLREIGEICKRKGVCFIVDAAQAAGSVPISLDHGINF ICCAGHKGLYGPTGTGLLISDGKYLPDTVIEGGTGATSLELDQTPDMPERLESGTLNTV GVCGLLAGIKFIKRIGISRIYDHERLLCNILLDGLKTVDGAKVYRRGESFVPIVSFNIE GFDPTALSTALDGEGFALRGGLQCAPLAHHTIKTLPAGPIRFSPSCHNTQKEVISLVNA LKKFSKQGI" /locus_tag="LOCUS_5250" /note="WP_041272645.1 aminotransferase class V-fold PLP-dependent enzyme (Desulfitobacterium hafniense) [pid:43.0%, q_cov:98.6%, s_cov:91.4%, Eval:2.2e-66]" /note="MGA_678" CDS 1524..2420 /product="diadenylate cyclase CdaA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003360232.1" /transl_table=11 /codon_start=1 /translation="MDYIANFMSRLVSTISTVGIVDIIDMLILAFIIYKGIKIVRETKA QQLITGVVIIVGIYLVSSAFELKVMSFLLENFLQIGILAIVIVFQPELRRILERVGRAN VKSLKIINDTHSDNAYQHWSNAIDAIGEAVSQLSDTTTGALIVIEREIRLGDQIDTGTI LDCIPSVSTLGTIFFPKTPLHDGAVIIRDARIIAAGCFLPTPQKEETINKLLGSRHRAA IGMSENSDAIVIVVSEETGTVSVAENGELTRGYTKERLISLLRSKLIPEKGQGESKLFE IIKSGKERLNGRKNKKD" /locus_tag="LOCUS_5260" /gene="cdaA" /EC_number="2.7.7.85" /note="WP_003360232.1 diadenylate cyclase CdaA (Clostridium) [pid:44.9%, q_cov:91.9%, s_cov:94.0%, Eval:6.5e-58]" /note="MGA_679" ORIGIN 1 agcctaccag tgtcaagccc tctcatttgc cgtaatatgt aaaaatacta ttacgaggtg 61 atccactttg acatacacac tcttagctgt ttcgtccata acctacgcta tgaagggcaa 121 acggcttctc aacggcatgg gctactactg cgaaatcgaa aagaccccaa agggtctctc 181 aagcggctgc ggacattctc tgcgcgtgcg cgacgacccc gaagttatct gctcgctttt 241 gcgccgcaac ggaatcgaca cccgcgaccg tatgaccgta aacaggtagg gtgagcttat 301 gaagccgaaa atatattttg acaacgccgc cacaaccttt ccgaaacctg cctgcgtttg 361 ttccgctgtc tgccgcggag tcagcgtctt gggtgggaat cccggcaggg gaggtcacag 421 cttttcacgt gtctcatccg aaataatctt caactgccgc gaggaagcag catctctctt 481 cggagcatcc cccgaaaatg tcgtattcac agccaactgt acccacgctc tcaatgctgc 541 gatcaaaggc gtatgctccc gcaatgacca cattgtaata tcttcaatgg agcataactc 601 tgttgcccgt ccatgctatc gccttgcaaa agagggcgca agggtggagg ttgcaatggt 661 tggcagatct gatgacgaaa ccatatccaa cttcactcgc cttataaccg atgacaccaa 721 gtgcgtcatc tgcaccgccg catcaaatgt cacaggcaga attatgcccc tgcgcgaaat 781 aggtgagatc tgcaaaagaa aaggcgtttg tttcattgtc gatgccgcac aggcggcggg 841 aagcgttcca atctcgcttg atcacggcat caatttcatc tgttgtgcgg gccacaaggg 901 gctttatggc ccaacaggca ccggacttct aatatccgac ggcaaatatc ttcccgacac 961 ggtaatcgaa ggcggaacag gcgcaacatc tttagaactt gaccaaactc ccgatatgcc 1021 cgagcgactt gaaagcggca ctctcaatac cgttggcgtc tgcggacttt tggctggcat 1081 caaattcatc aagcgcatcg gcatcagccg aatatatgac cacgagcgcc ttttgtgtaa 1141 cattctcctt gacggtctca aaaccgtcga tggcgcaaag gtatatcgac gcggcgaaag 1201 ctttgttccg atcgtatcat tcaacattga aggcttcgac cccacagccc tctcaaccgc 1261 ccttgacggc gagggctttg ctcttcgcgg cggtcttcaa tgtgcacctt tggcacatca 1321 taccataaaa actctccccg cgggaccaat cagattttcg ccttcctgcc acaacactca 1381 aaaagaggtt atttctttgg taaatgcttt gaaaaaattc tcaaaacagg gcatttgact 1441 attgaatttt cctgtgtaaa ctgctaaaat ataagtatga atgcaaagat gtcccaaatg 1501 gacatacagg aaggagaatg accttggatt atatcgccaa ttttatgtca agacttgtca 1561 gcaccatcag cactgtcggt attgttgata taattgatat gctcattctc gcctttatca 1621 tctataaggg catcaagatc gttcgcgaaa ccaaagccca acagcttatc acgggcgttg 1681 taataattgt tggtatctac cttgtttcct ctgctttcga gctaaaggta atgagcttcc 1741 ttttggagaa cttcctccag atcggaattt tggcgatagt aatcgtattc cagccggagc 1801 tgagaagaat tctcgaacgt gtcggccgag ccaatgtaaa atcccttaaa atcatcaacg 1861 acacccattc ggataacgca tatcagcatt ggtcaaatgc cattgatgcc atcggcgagg 1921 ctgtcagcca gcttagcgat accaccacag gtgccctaat tgttatcgag cgcgagattc 1981 gcctcggtga tcagatcgat accggtacta tccttgactg tatccccagc gtatcgactc 2041 tcggcaccat cttcttcccc aaaacccctc tgcacgacgg tgctgttata atccgtgatg 2101 ctcgaattat cgcggcaggc tgtttcttgc ccactcccca aaaagaggaa acaattaaca 2161 agcttcttgg ctcgcgccac cgtgccgcca tcggtatgtc cgaaaattcc gacgccatcg 2221 taattgtcgt atccgaggaa acgggaacgg tttccgtcgc tgaaaacggc gagctcacca 2281 gaggttacac caaagaacgt ttgatttcat tgcttcgctc caagcttatc cccgaaaagg 2341 gacagggcga gagcaagctc ttcgagatta tcaaatcggg aaaggagcgt ctgaatggca 2401 gaaaaaacaa aaaagactga gcgtaagcct ttaaacaata acctcatcct gatgattgta 2461 tcgggcatag ttgctgtaat aatctggttt tcgctggtgc ttaccgcctt ccccgaaacc 2521 accgtcataa ttaaagacgt tcctatcgac tatgcgctcg acggctccta tgctgacatt 2581 tcgggacttt caatcatcgg cgaggttatc cccaccgtca acgtgcgagt atccggactt 2641 cgctatatca tcggtgacta taagcctgaa gatcttatcg taagcccgaa tctcgattct 2701 gtccgtgcat ccggtcagta tgaacttagc ttggatgtaa gaagtgccca cggtgaccag 2761 atcacggttg atttggttga accgagcacc gttcacgccg agtttgacta tttcgtcacc 2821 aaaactctct ctgttgaaca gggtaccctt gttgccgacc tttcaaacat ctccgcaggc 2881 tcgggctata ttctcgattc ggaggatata accctcaatc cttccgaaat caccatttcg 2941 ggaccgaagg attatgtgga ccaggtcacc tcatgtgtcg tttcctttga ggattcaaga 3001 accttgcgcg aatcagcaaa catcagcgcc accaacatta agctatattc gggcaatgcc 3061 gtatatgacc atccccgtgt tgcgatcgaa accgaatcgg tcaacatctt gattcccgta 3121 tatatgaaga aaacgttgaa cttag // LOCUS sequence134 3133 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence134 VERSION sequence134 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3133 /mol_type="genomic DNA" /organism="" /note="sequence134" CDS complement(1103..1939) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPKIRYATLSDKSFWYTLDKHLPECEFERKVRDNEAYVMFVGDKP IGILRYNLFWDNTPFCNLIYIDENYRGMSYGKSLMEYWENDMLSLGYDMVLTSTQTDES AQHFYRKLGYRENGCLMLDIKGHEQPMEMFFVKALSSPLTLETERTVLRPWRGTDADYL YELASDPDVGPSAGWRIHDSVEDSLGIIYTVLALPHTMAVVLKENGLAVGSIGLMPGNR ANAPIPEDEAEVGYWIGKPYWGRGLIPEAVRELMRFGFEDLGFKKLWCCHFDGNEK" /locus_tag="LOCUS_5270" /note="WP_003384928.1 GNAT family N-acetyltransferase (Clostridium botulinum) [pid:45.7%, q_cov:49.3%, s_cov:99.3%, Eval:2.6e-29, partial hit]" /note="MGA_682" CDS complement(1951..2994) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPDIYTLTKNYLALRDAIANHPDLDSLLLLQPSVRELEEYLDADF QRDYEADERGELPNDFPRALISQDGLYNLLCENDRLLRELAMEKHTVPTNAEIIKIAMA QSAIDLNCSPDDFTVSENKVVISAPNPDAHRYLSLPFALNLLSYGSNIVASVSPELEQV ARDYINKYPVEHCFETPNLHALDDALAPYGYKTCFMAEYFLPDVNALVLHPCKYQTKML TQPDFKNLYTPEWSNALCERRRHLDVLGIGAYDGDKLIGLAACSADARDMWQIGIDVLP DYRRQGIASALTSALAYEILNRGKVPFYCAAWSNIKSVRNALKCGFKPAWAELTAKPAT TVNEMNK" /locus_tag="LOCUS_5280" /note="MGA_683" ORIGIN 1 aagattccga cggagaaacc gcagatcgca cagccgataa gacccagcac agggttttga 61 gaaagcacag ccacaagata gcacgcaacg cacaaaaccg cactcgcaag cattgctttc 121 tttaagggaa gcttatcgct gaatttaccg tacaatgcgc gggacgagcc catacagatt 181 gcaaaggcac aagggcctgc aaggtctccg attgtttttg aaacgcccaa gcctgcttca 241 gcgaaagctg atgcccactg gctcattgcc tgttcgcttg cacctgcaca aatcattatt 301 accattaaga gccagaatat tttgtttttg acaagaccat tgattgaatt ttcctcaccg 361 tgggtttcca ttgtatatat cggcacaagg ctgaaatata tgcagttaaa gatcggcact 421 attgcccaca cgaccgcgag gatttcccag ttgtcgatgc cgaagattgt gaagaatgcc 481 gttgaaatga gcacaacgcc aacgtgtccc caacaataga acgaatgaag aaggctcatc 541 gcggcttctt ttttctctgt ggggcaggct tcaacaattg ggctgatgag cacctcgatt 601 atgcctccgc cgacggcata aagcacaacg gatgccataa tgcctgcgta agcattgccc 661 aaaagtgagg gtaaaaacgc aagacccaaa agccccagag ctgagaatac atgggctgaa 721 attattgcgg tgcggtagcc gattttatca ataaacttgg cgcaaaggaa gtcaaccgtg 781 agctgaacgg caaagtttat cgttgtaata aggtttatct caacaagcga gagggagaag 841 cttcgcgaaa aggttaaaaa caaaaggggc gcgaagttgt tgattatcgc ttgggttatg 901 tatcctaagt atgaggcata aatggtatgc tcatagcttt gtctgatttt tgaaaacatg 961 attatgtcct gccttagttg tttttccact cttcgcgggt gatggagtaa taatgttcag 1021 ttttgtactc gcccatcata gcccaatatt tatcatattc ggtgtggctg aatttaaatc 1081 cgaatttttc aattacccgc ttttattttt cattgccatc aaaatgacag caccagagtt 1141 ttttgaagcc taaatcctca aagccaaagc gcataagctc ccgcacagct tcgggaataa 1201 gtcccctgcc ccaatatggc tttcctatcc aatagccgac ctcggcttca tcctcaggaa 1261 tcggtgcgtt tgcgcgatta cccggcataa gcccgatgct tccgacagca aggccgtttt 1321 ccttcagcac gacagccatt gtgtgaggca aggcaaggac ggtgtatatt atgcccaaac 1381 tatcctcaac gctgtcgtgt atgcgccaac ctgcagaggg cccaacgtcg gggtcggatg 1441 caagttcata taggtaatcg gcatcggtgc cacgccaagg gcgcaaaacg gtacgctcgg 1501 tttcaagggt cagcggtgaa gataaagctt tgacaaagaa catttccatc ggctgttcgt 1561 gtcctttaat atcaagcatt aggcaaccgt tttcgcggta gcccagcttg cggtaaaagt 1621 gctgtgcact ctcatccgtt tgagtggatg ttaagaccat atcgtatccg agggatagca 1681 tatcattttc ccaatactcc ataagcgatt tcccatagga cattccacgg tagttctcgt 1741 caatatagat caagttgcaa aagggtgtgt tatcccaaaa taggttataa cgcaggatac 1801 cgatgggctt atcgccaacg aacattacat aagcttcgtt atcacgcacc ttgcgctcga 1861 attcgcactc gggaaggtgc ttatctaaag tataccagaa agacttgtcg cttagcgttg 1921 cgtatctgat tttgggcatt aaatcacttc ctatttgttc atttcgttca ccgttgtggc 1981 aggctttgca gtaagctctg cccaagcggg cttgaaaccg cattttagag cattgcggac 2041 agattttata ttgctccagg ctgcgcaata gaacgggacc ttgccgcgat ttaaaatctc 2101 atatgccaga gcacttgtca gcgcggaagc tatcccctgc ctgcggtagt cgggcaaaac 2161 gtcgatgccg atctgccaca tatcgcgggc atccgcagag caggcggcaa gaccgatgag 2221 tttatcgccg tcatatgcgc cgatacctaa gacatcgaga tggcggcgcc tttcacaaag 2281 ggcgtttgac cactctgggg tgtataaatt tttaaaatcc ggttgggtga gcattttcgt 2341 ttgatatttg cagggatgta gcacaagggc attaacatcc ggtaggaaat actccgccat 2401 aaaacaggtt ttataaccat atggtgcaag agcatcgtca agtgcatgaa ggtttggggt 2461 ttcaaagcaa tgctcgacag gatatttgtt tatatagtcg cgggcaacct gctcaagctc 2521 aggcgaaaca gatgcaacga tattcgagcc ataagataag agattgagcg caaaaggcag 2581 gcttaaatag cggtgagcgt cggggttcgg tgcggagatg acgaccttgt tctcacttac 2641 ggtgaagtca tcgggtgagc agttaaggtc aatggcagat tgcgccattg caattttaat 2701 aatctcggcg ttggtgggca cagtatgctt ctccattgca agctcacgca agaggcggtc 2761 gttttcgcaa agaaggttat atagcccatc ttgagatatt agagcacggg ggaaatcatt 2821 aggcaactct cccctttcat ctgcctcata gtcgcgctga aaatcggcat cgaggtattc 2881 ctcaagctcg cggacagatg gctgaagcaa caagaggctg tcaaggtcgg gatgatttgc 2941 aatcgcatcc cgcagggcga gataattttt ggtgagggtg taaatgtcag gcatatggac 3001 tccttttgga aaattaagcg gagaaagcta atattcattt atatttacag gttcggaatt 3061 tgccttcgat ccaaaatgtg gcttcagttg tgtggaattt cagcagtcgg aatttcgggt 3121 cgtcgattcc ctt // LOCUS sequence135 3123 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence135 VERSION sequence135 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3123 /mol_type="genomic DNA" /organism="" /note="sequence135" CDS complement(877..1326) /product="MarR family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011022043.1" /transl_table=11 /codon_start=1 /translation="MSQQKFTDKQVIGKLICVNRMHRTITENKVGQLGIHRSQHHMLMA IGNREGISQKEIAEKMEISPAAVAVTLKKLEVAGFIERSTSADDSRVNNIHLTEKGREI TKITSELFGGIDAAMLESFTDEERETLCSLLDKLKGNLKAQFECL" /locus_tag="LOCUS_5290" /note="WP_011022043.1 MarR family transcriptional regulator (Methanosarcina acetivorans) [pid:30.2%, q_cov:86.6%, s_cov:84.3%, Eval:2.1e-13]" /note="MGA_686" CDS 1544..2947 /product="MATE family efflux transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002681807.1" /transl_table=11 /codon_start=1 /translation="MKEFLSKYIGDKKFYTMLLRVCLPIIIQNAISNFVNLLDNIMVGQ TGTDSMTGVSVANQLNFVFNIIIFGAVAGAGIFTAQYHGKNDSDGIRFTLRFKLIICLI MAILGITVFWFFKEPLVSLYMTDGDAAVDPVAVLDYGKRYISVMIFGLLPFAISQAYSG TLRETGETFVPMVSGISAVVVNLCLNYILIFGKFGAPELGVVGAAIATVISRYVEMLIV IIWTHTHKERNPFAVGLFKGFHIPADVTKKIIIKGFPLLVNEALWSFGIAAVNQCYSTR GLDVVSANNISVTISNLFNVVFLSLGSAVAIIVGQALGSGEVEKAVDLDRKLIVTSVLS SLVMGAGLCAISPLFPELYNTEPQIKELAAQLIRVVAFSMPFHAFVNACYFTLRSGGKT FITFMFDSVAIWVLNYTVAFTLTRYAPALSVPAIMLLEQSTNALRCAIGWILVKKRIWV HKLVADNAE" /locus_tag="LOCUS_5300" /note="WP_002681807.1 MATE family efflux transporter (Treponema denticola) [pid:31.5%, q_cov:97.9%, s_cov:97.4%, Eval:2.0e-60]" /note="MGA_687" ORIGIN 1 agcgagaaga ggatctgtga ggtatatgtt acaaacatcg aaaggtcgcc gacctccatg 61 ccgccctcaa gaatgattcc gcttccgaac cagatgacac aaagggtggt cacattcata 121 accagcgtca taacagggtg catcataatg atgatcttca ttgctttcag gtgggtatcc 181 ttcaaatcct tgtttgcaaa agcaaatttg ccctcttcgt gcttttctct aacaaagctc 241 ttaacaactc gcacgtttgt gacattttcc tgaacggtgg agttaagcgc gtcaagcttc 301 ttctgcacaa gagcgaacat cgagaagcca aagattatta ccagcgcgat agctgtaaca 361 agaatcggaa ttgccaccgc ataagtaacg gaaagtctgg gctgaatgga aatggtcata 421 accaatgccg ccaccagcat accgggggag cggatagcca ttcgcaggat catattgatg 481 aagttctgca tctgggtgat gtcgttggta agtcttgtta ccatcgaacc tgtagagaac 541 ttgtcgatgt ttgcaaagga aaacttctga accttgctga aaacatcaag tctaaggtct 601 gcagcaaagt taacagatgc cttcgcaccg aaatatgagc cgccgacacc gcccgccatc 661 atcataacag cgcacaggat cattccgatc atcgtgccga ggcttcctgc aatggtcagg 721 gtgccgctgt tcgctccgtt aattacagtc gccaaaagtc tcggcattac aacttcgccg 781 atgacctcaa cgaccataca caaggggccg agaatgaaat atggccaata gggtttaata 841 tatttaaacc atcttttcaa gtgatatcat cctttcctat aagcattcga actgagcctt 901 taagttgcct ttaagtttat ccaaaagcga gcagagagtt tcgcgctcct cgtcggtaaa 961 gctctcaagc attgccgcgt cgataccgcc gaaaagctcc gatgttattt ttgtgatctc 1021 ccgacccttt tccgttaagt gtatgttgtt aacgcgggag tcgtctgcag atgtcgaacg 1081 ctcaataaat cccgcaacct caagcttttt caaggttact gcaactgcgg caggggatat 1141 ctccattttt tcggcgatct ccttttgaga aatgccttct ctgtttccga tagccatcag 1201 catatggtgc tgagagcggt gaattccaag ctgtccaacc ttgttttcgg ttattgtgcg 1261 gtgcattctg ttgacacaga taagcttgcc gataacctgt ttgtcggtga atttttgttg 1321 actcatgttc gctcctttca ttttggttaa aaaatagtta gtcaattaac gattaacacg 1381 ttaattatat tccctcccca agcaaatgtc aattgtcggt ttggtgaaat attctcacat 1441 attcgcgcca tattcgttga aataatcaat gaccccacag ttgcattttt tcgcagattc 1501 tgttaaaata tagcgttgag ataatattga acggagaaaa ataatgaaag agttcttaag 1561 taagtatatt ggcgacaaaa agttctatac aatgctttta agggtctgcc ttccgataat 1621 cattcaaaat gcaatttcaa actttgtaaa tcttctcgat aacatcatgg tcggacagac 1681 gggcactgat tcaatgaccg gtgtttccgt tgcaaaccag cttaactttg tatttaatat 1741 aattattttc ggcgctgttg ccggtgccgg tatctttacc gcccaatatc acggcaagaa 1801 cgacagtgat ggaattcgtt tcacccttcg cttcaaactg ataatctgtc ttattatggc 1861 aattttgggc atcaccgttt tctggttctt caaagagcct ttggtttcat tatatatgac 1921 cgacggcgat gcagcggtcg atcccgttgc ggttttggat tatggcaagc gatatatttc 1981 cgtaatgata ttcggccttt tgccatttgc aatttcccag gcatattcgg gcacacttcg 2041 cgaaacaggc gagacctttg tgccgatggt ttctggcatt tcggcggttg ttgtcaacct 2101 ctgtctcaac tatattctca tcttcggcaa gttcggtgct cccgagttgg gcgttgtggg 2161 cgcggctatc gcaaccgtaa tctcccgcta tgttgaaatg ctcatcgtca tcatctggac 2221 acatactcac aaagagcgca acccctttgc agtcggtctt ttcaagggct tccatattcc 2281 tgcggatgtt acaaaaaaga tcatcatcaa aggcttcccg cttcttgtta acgaggcttt 2341 gtggagcttc ggtatcgccg cggttaacca gtgctattcc acaagaggcc ttgatgttgt 2401 aagcgcaaat aacatcagcg tcaccatttc aaaccttttc aatgttgtgt tcctctcgct 2461 gggaagcgcc gttgcgatca tcgtcggaca ggctctcggc tcgggcgaag ttgaaaaggc 2521 agttgacctt gacagaaagc ttatcgtcac atcagttttg agcagtcttg taatgggcgc 2581 gggactttgc gcgatttcgc ctcttttccc cgagctttac aataccgagc cccaaattaa 2641 agagcttgcg gctcagctca ttcgcgtcgt tgcattttca atgcccttcc acgcatttgt 2701 caacgcctgc tatttcaccc tgcgctcggg cggaaagaca ttcatcacct tcatgttcga 2761 cagcgtggcg atatgggtgc tcaactatac cgttgcattc accctcacaa gatatgctcc 2821 tgcactcagc gtacctgcga ttatgctttt ggagcagtcg acaaatgcgc tccgctgcgc 2881 aatcggttgg atacttgtta aaaagcgcat ctgggtacat aaacttgttg cggataatgc 2941 ggaataaaac tgttgtattt ttctttaaag tgtgttaaaa tcaaaataat aaatgacaag 3001 gggtggacac ctgatgatta aaagcagact ggaagccaaa aaccttaggg tctggctgac 3061 ctgtatcttt atagttttgt gtattgccgt tggtgctttt gcattcatcg gttttatcgg 3121 cga // LOCUS sequence136 3122 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence136 VERSION sequence136 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3122 /mol_type="genomic DNA" /organism="" /note="sequence136" misc_feature <1..545 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012047940.1:phosphoribosylglycinamide formyltransferase" /note="WP_012047940.1 phosphoribosylglycinamide formyltransferase (Clostridium botulinum) [pid:48.8%, q_cov:92.2%, s_cov:80.0%, Eval:2.3e-38]" /note="MGA_689" /locus_tag="LOCUS_5310" CDS 568..1284 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKVSTIANELNSLAYHGRGIIIGKSADGKKAVTAYFIMGRSENSR NRVFVAEGEAMRTKAYDESKMVDPHLIIYYPVRVLGNKTIVTNGDQTDTIYELMDKQMT FEQALRTREFEDDKPNFTPRISGIIHHENGEMNYAMSILKSAEGDDSSCERFTYAYSNP IAGRAKFIHTYNGDGNPLPSYEGEPKTLELPDTDIDTLTDLIWTNLNEDNKVSLFVRYI DLASGETETRIVNKNV" /locus_tag="LOCUS_5320" /note="MGA_690" CDS 1308..2492 /product="phosphoribosylaminoimidazolecarboxamide formyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860970.1" /transl_table=11 /codon_start=1 /translation="MKEFELKYGCNPNQKPSKIFMHDGTDLPIEILNGRPGYINFLDAF NSWQLVKELKEALGLPAVTSFKHVSPTSAAVGIPLSDKLKKACFVDDIEGLDESPLACA YARARGTDRMCSFGDWVALSDVCDVTTALLIKREVSDGVIAPGYEPEALEILKSKRKGS YNIVKIDPNFVPDPVERKQVYGITFEQGRNEFKINRELLSNVVTANKELPESAVRDLII SLITLKYTQSNSVCFAYDGQAIGVGAGQQSRVHCTRLAGGKADTWFLRQCDKVLNLPFK DTLGRPDRDNVIDGYINKNEEDVCAEGNWQKYFTTRPEPLTDEEAKAYLATIDGVALGS DAFFPFSDNIERAKKSGVKYIAEPGGSIRDDLVIECADKYGMAMAFTGMRLFHH" /locus_tag="LOCUS_5330" /EC_number="2.1.2.3" /note="WP_011860970.1 phosphoribosylaminoimidazolecarboxamide formyltransferase (Clostridioides difficile) [pid:71.5%, q_cov:99.7%, s_cov:99.5%, Eval:1.6e-161]" /note="MGA_691" ORIGIN 1 cacaaaactc cggaatcatc aaaagcggcg agatttcact tgtaatttcc aacaaggcgg 61 aggcttacgc tttgacaaga gcgcagaacg caggaattaa gaccgcagtt gtgcttaaaa 121 gcatctgggg cgacagcttt gaatcgagaa ttatggagat tttggacgaa aacgaaatcg 181 acttcattgt tttggcagga tttatgtcga ttctcacgga gaatttcaca aagtcatatc 241 ctaagcgcat cattaatgtt cacccctcgc ttatcccctc tttctgcggc aaaggatttt 301 atggacttaa agttcacgaa gctgccctca gttacggcgt taaggtgacg ggcgcaacgg 361 ttcactttgt caacgaaatt cccgacggcg gcgaaataat catgcagaag gctgtcgaca 421 tcgaccctga ggacaccccc gaaaccttgc agaagcgggt tatggaaaac gcggaatgga 481 taattcttcc aagagctgtc gaaaaggtct gctatgattt tcacttcggt aaaaatgaca 541 actgacaata tataaaggag atttaaaatg aaagtttcaa caatcgcaaa tgagctgaat 601 tctttggcat atcacggcag aggaatcatc atcggcaagt cggctgacgg caaaaaggca 661 gttaccgctt acttcatcat gggcagaagc gaaaacagcc gtaaccgcgt tttcgttgcc 721 gaaggagaag caatgcgcac caaggcatat gacgaatcga agatggttga cccgcacctt 781 atcatctact atcctgtaag agttttgggc aacaagacaa ttgttaccaa cggcgaccag 841 accgacacca tttatgagct tatggacaag cagatgacct ttgaacaggc actcagaacc 901 cgcgaatttg aggacgacaa gcccaacttc acccccagaa tctccggcat tatccatcac 961 gaaaacggtg agatgaacta tgcaatgtca attttgaaga gcgccgaggg tgacgatagc 1021 tcctgcgaga gatttacata tgcttactcc aaccccattg caggtagagc aaagtttatt 1081 cacacctata acggcgacgg caacccgctc ccctcatatg aaggcgagcc caagaccttg 1141 gagcttcccg acaccgatat tgacactttg accgatctca tctggacaaa cctcaacgaa 1201 gataacaagg tttccttgtt tgtaagatat atcgacctcg catcgggcga gaccgaaaca 1261 agaatcgtta acaagaacgt ttgatttatt taaggaggac acacaaaatg aaagaatttg 1321 aactcaagta tggctgtaac cccaaccaga agccctcgaa aatttttatg cacgacggca 1381 ctgaccttcc catcgagatc ctcaacggca gaccgggata tatcaacttc ctggatgctt 1441 tcaactcctg gcagctcgtc aaggagctta aagaggcttt gggacttccc gctgtaacct 1501 cctttaagca cgtttccccc acctccgcag cagtcggaat tcccctttcc gacaagctta 1561 aaaaggcttg ctttgttgac gatattgaag ggctggatga aagccccctc gcttgtgcat 1621 atgcaagagc aagaggcacc gacagaatgt gttcctttgg cgactgggta gctttgtctg 1681 atgtctgcga cgttaccacc gcacttctca ttaagcgcga ggtttccgac ggcgtcatcg 1741 ctcccggata tgaacccgaa gctctcgaaa ttctcaagtc caagagaaag ggctcttaca 1801 acattgttaa gatcgacccc aacttcgttc ccgaccctgt tgaacgcaag caggtatatg 1861 gcatcacctt tgagcagggc agaaacgaat tcaagatcaa ccgtgaattg ctctccaacg 1921 ttgtaaccgc aaacaaggag cttcccgaaa gcgctgtaag agatctcatc atctccctca 1981 tcaccctcaa gtacacccag tccaactctg tttgctttgc atatgacgga caggcgatcg 2041 gtgtcggagc aggacagcag tcaagagtac actgcacacg tcttgcaggc ggcaaggctg 2101 atacatggtt cttgcgccag tgtgacaagg tcttgaacct ccccttcaag gatactttgg 2161 gcagacccga cagagataac gtcattgacg gttacatcaa caagaacgaa gaggacgttt 2221 gcgcagaggg caactggcag aaatacttca ccacccgtcc cgagcccctc accgacgagg 2281 aagccaaggc atatttggca actatcgacg gcgtagccct tggttccgac gctttcttcc 2341 ccttctctga caacattgaa agagccaaga agtcgggcgt taagtatatc gctgaaccgg 2401 gcggatccat cagagatgat cttgtaatcg agtgcgctga taagtacggt atggcaatgg 2461 cattcacagg aatgcgcctg ttccaccact gatttaaagg tgacttaata tgaaaatatt 2521 agttattggc ggcggcggac gcgagcacgc catcatcaag aaaattaaag aaaacagaag 2581 cgttgaaaag atatatgctc ttcccggcaa cggcggaatt gctgccgatg ccgagtgcgt 2641 gagcatttct gcgaccgaca ttgatgcaat cgttgaattt gccgttaaca acgctatcga 2701 ctatgcagtt gttgctcccg atgacccgct tgttcttggc gcagttgatg cgctttccgc 2761 aaagggtatc ccctgctttg gtcccgaggc taaagcggca ataatcgagg gcagtaaggt 2821 cttttcaaaa gagcttatga aaaaatacgg tattcccacc gcggcttttg aggtgtttaa 2881 cgatgccgac aaggcgcttg aatacctcaa gaccgcgccc attccgacag ttattaaggc 2941 agacggcttg gcgctgggca agggcgtaat catcgccacc acccgcgagg aagcatacga 3001 tgccgttaag agcattatgc ttaacaagca gttcggaaaa tcgggagaca atattgtaat 3061 tgaagaattc ttaacaggcc ccgaggtatc ggttttggca ttcaccgacg gcaaggtcgt 3121 ta // LOCUS sequence137 3119 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence137 VERSION sequence137 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3119 /mol_type="genomic DNA" /organism="" /note="sequence137" misc_feature <1..700 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010965395.1:Xaa-Pro peptidase family protein" /note="WP_010965395.1 Xaa-Pro peptidase family protein (Clostridium) [pid:49.6%, q_cov:99.1%, s_cov:64.6%, Eval:5.3e-64, partial hit]" /note="MGA_693" /locus_tag="LOCUS_5340" CDS 827..1384 /product="elongation factor P" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003358905.1" /transl_table=11 /codon_start=1 /translation="MITAGDFRNGVTFEEDGNVLQVIEFQHVKPGKGAAFVRTKTKNVI TGSVIEKSYNPTAKFPTAFIERKDMEYSYNDGDIYYFMDTETYEMTPVNASDLGDSFKF VKENMVCKVLSYKGKVFGVEPPTFVVLAITQTDPGFAGNTATNALKPATLETGAEIKVP LFIEEGELVQIDTRTGEYLARA" /locus_tag="LOCUS_5350" /gene="efp" /note="WP_003358905.1 elongation factor P (Clostridium) [pid:59.8%, q_cov:99.5%, s_cov:99.5%, Eval:2.4e-62]" /note="MGA_694" CDS 1469..1972 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTLTEKAAYVKGLMDGLDIDTTTDEGKILVALYDLVAEMAETVDD IDGDIDDIVEFCNVLDEDLQVVEEYLMDEEELEDDCDCGCHCHCDDDCDCDCDCCCDDD CDCDCCDPDDDTYECVCPTCGDTIELTLPMIEEGSIECPGCGELLEFDIEEECDCEDCA DDEE" /locus_tag="LOCUS_5360" /note="MGA_695" CDS 2217..2876 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKTKTAYLTLAALFSALAYLTVFVFRIPFIPAVGWLKFEAKDCV IALESLILGPSYGVMTSLIVSLLEMVTISDTGPIGALMNFLSTCSFVLPVGLMYKYKKS AKTAVIGLCFSVVLTTALMLMWNYFITPLYLNTPRELIVPLLLPGFLPFNLIKYTINAC LTYILYKPLITVLRKSRMLPESSHKTPSTKGAVAVYIICSIVVLASIVGAIVISIK" /locus_tag="LOCUS_5370" /note="WP_012583215.1 ECF transporter S component (Dictyoglomus turgidum) [pid:33.1%, q_cov:74.4%, s_cov:90.4%, Eval:1.7e-21, partial hit]" /note="MGA_696" ORIGIN 1 tacccatctt cgaatcgtca agactcagga tgagatcgac aagattatca aggcccagcg 61 tattgctgaa gctgcatttg aagacgtttt aaacttcatc cgtcccggtg tcaccgagcg 121 tgagatcgga cttcgccttg attactatat gctctctcac ggtgcagaag ctctttcctt 181 tgataccatc gccctcatag gtgcaaacac ctcgcttcct cacggcgtac ccggcgaaac 241 tgttgttgaa aacggtatgt tcgtgcttat ggactacggc gcaatgtatg agggatacca 301 ctcggatatg accagaactg tctgtgtcgg taagcctacc gagaaaatgg agcttgtata 361 taacacggtt ttgaaagcac agctcgatgc tcttgatgcc atcaaggcag gagttatcgg 421 caaggatatc gacaagatcg cccgcgatgt tattacaaac gcaggctatg gcgacaagtt 481 cggccactct ttgggtcacg gtgtaggtgt tgaaattcac gaagccccaa atgccgctcc 541 ttcaagtgaa cacatcttca aggaaaatat gatcgtaacc gttgagccgg gtatctatct 601 gcccgatgaa ttcggcgtta gaatcgaaga tttcgttgta attaaggaaa atggttgcga 661 aaatatgact ttagctaaga aatctctcat ttctttgtaa aaagggcttg cattatttct 721 aaatataggt taaaatagac tgtaactcat tgtaagatac aaagtcttgc ggtgaaactt 781 attaacattg gcgatattcg tctcaaaata aaggaggata cacattatga tcacagctgg 841 tgatttcaga aacggtgtaa catttgaaga agacggtaac gtattgcagg taatcgaatt 901 ccagcacgtt aagcccggca agggtgctgc tttcgtaaga accaagacca agaacgtcat 961 taccggttcc gtaatcgaaa agtcttacaa ccctactgct aagttcccca cagcattcat 1021 cgaaagaaag gatatggaat attcttacaa cgatggcgat atttactact tcatggatac 1081 tgaaacctac gaaatgaccc ccgtaaacgc ttccgacctt ggcgacagct tcaagttcgt 1141 taaggaaaac atggtttgca aggttctttc ctacaagggc aaggtattcg gcgttgagcc 1201 tccgacattt gtcgttttgg ctatcaccca gaccgacccc ggcttcgctg gcaacaccgc 1261 taccaacgct ctcaagcctg caactttgga aaccggcgct gagatcaagg ttcccttgtt 1321 catcgaagag ggtgagcttg tccagatcga caccagaacc ggtgaatatt tggcaagagc 1381 ttaattgact caatttttca aacacaatat cgctgccaat aaaacggcag cgttttgtct 1441 atcaacataa tgtattggag gatttatcat gactttaacc gaaaaggctg catacgttaa 1501 gggacttatg gacggtcttg acattgacac caccaccgac gaaggcaaga ttttagtagc 1561 tctttatgat ctcgttgctg aaatggctga aactgttgat gatatcgacg gcgacatcga 1621 cgatatcgtt gaattctgca acgttttgga cgaagatctt caggtcgttg aggaatacct 1681 tatggacgaa gaagaactcg aggatgactg cgactgcgga tgccactgcc attgcgatga 1741 tgactgcgac tgcgattgtg attgctgctg tgatgacgat tgcgactgcg actgctgcga 1801 tcccgatgat gacacctatg agtgtgtttg ccccacctgc ggcgacacca ttgagcttac 1861 tcttcccatg atcgaagaag gttctattga atgccccggt tgcggcgagc ttttggaatt 1921 tgatatcgaa gaagagtgcg attgcgaaga ttgtgctgac gacgaagaat aattcaaaat 1981 aaaaccaaat aatcaaattg ttgtttcgag gcgaggcgaa attcctcacc ggcggtaaag 2041 tccgcaaaca aggctataaa tatgccttgc cgacagggtg aaactccctg accgacggtt 2101 atagtccgga tgaaagaaac gggcaaaatg ccatcaatgc gtcctcttaa cacatattaa 2161 ggggacgctt tttcatatca tttgaaacag caaacaattt gaaatgagtg atagatatga 2221 aaaaaacaaa aaccgcatac ttgaccttgg cagctctatt ttctgcctta gcatatttaa 2281 ccgtattcgt tttccgaatt ccgttcattc ctgcagtcgg ttggctaaaa ttcgaagcga 2341 aagattgcgt cattgccctt gaatcgctga ttttagggcc atcctacggc gtaatgacct 2401 cgcttatcgt ttcgctcctc gaaatggtca caataagcga tacaggcccg ataggagcgc 2461 tgatgaactt cctttcaacc tgctcctttg tgcttcctgt gggtttaatg tataaataca 2521 aaaagagcgc gaaaaccgct gtgatcggcc tatgcttcag cgttgtttta actactgctt 2581 tgatgctgat gtggaactac ttcatcaccc cgctgtatct taataccccc cgcgagctga 2641 tcgttccgct tttgcttccg ggctttttgc ctttcaatct cattaaatat accatcaatg 2701 cctgcctgac ttacattctt tataagccgc tcataaccgt tctgcgaaaa agccgaatgc 2761 tgcccgaaag ctcgcacaaa actccgagca ccaaaggtgc tgtggcggta tacatcatct 2821 gcagtattgt ggttttggcg tcaatagttg gtgcaatagt aataagtata aagtaaaagg 2881 agaataacca tgctcgatta cagatatgac acacagcttt taattgaagg cgaagatctt 2941 gacgaagatg agatctatga ttacatcaca gacaactttg aaggcgactg ccttttggcg 3001 gtaggggatg aggacttgat caagatccac ttccacacca acgagccttg gaagattttg 3061 gaatattgct ccaccttagg cgagatttat gacatcgtcg ttgaagatat ggacagaca // LOCUS sequence138 3114 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence138 VERSION sequence138 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3114 /mol_type="genomic DNA" /organism="" /note="sequence138" misc_feature complement(1698..>3114) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002294013.1:ABC transporter ATP-binding protein" /note="WP_002294013.1 ABC transporter ATP-binding protein (Enterococcus) [pid:44.8%, q_cov:97.7%, s_cov:80.7%, Eval:4.7e-110]" /note="MGA_699" /locus_tag="LOCUS_5380" ORIGIN 1 cgccctttgc catcagctcg gtatgggttc cctgttcaat aatgttgccg tccttcatca 61 ccaaaatgac atcggcgctc ataattgttg aaagtcggtg tgcaacaata aagctggtct 121 tgcccttcat cagcttgtca aaggcgcgct gaacgcgctg ttcggtcttg gtatcgatat 181 tcgaggtcgc ttcgtccaaa atcagcatcg gaggctgaca gagcattact cttgtaatgc 241 aaagaagctg tttttggcct gcggaaagat ttccgccgtc ctcgccgatg ggtgtgtcat 301 atcccaacgg cagacgttta ataaagctgt gagcgtgggt ggcctttgcc gcttcaacaa 361 tttcatcatc tgtggcatcc ggcttgccca tcgttatatt atctctgatc gttcccgatt 421 tcagccaggt ttcctgcaaa accattccgt atcctcggcg gaggctttca cgggtgattt 481 cgcggatatc atttccctcg acacttatcg cacccgagtc gacatcataa aatctcataa 541 gcaggttaat aagcgtagtt ttgccgcaac ctgtcgggcc gacaatttcg accttcgatc 601 cgggcttgac attaaggtta acattttgaa tgagcggtct ttcggggaca tatgagaagc 661 tgacattttc aagggccaca tttccgttta tgccgtcaag ctccttattg ccctcatcgc 721 ttatctgcga gggggtgtcc aaaagctcaa acattcttcc cgcgcaggca aaagcgttct 781 gcaactcggt gataactccg cttatctcgt taaacggctt ggtatattgg tttgcatagt 841 tcaaaataca agtaagtccg ccgacggtaa cgcttcctgc gataacgcca aatgcgccca 901 taagtcccac cgccgcatat acgatcgcgt ttacaaagcg ggtggaggga tttaccaaag 961 aagacaggaa tatggccttg acggaaattt tctgaagatc ggtgttgatc ttatcaaacc 1021 tgtcgtggga tctggtctga tagttatatg ccgcgacggt cttctggttt ccgaccatct 1081 cgtcgataag cgcggtctgt tctccgcgta ttttcgattg ctttccgaaa aggtcatagg 1141 tatttttgga aatatatctt gccacaaaca gcgacattgg ggtcaaaaca accgcaacaa 1201 gggtgatctt ccagcttatt gtgagcataa agcaaagggt tgcaacaatt gtcacaacac 1261 ctgtaaagaa ttgggaaaat cccaaaagca ggccgtcggc aaaggtgtca acatccgata 1321 taactcggct gacaaggtcg ccgtggggat gtgagtcgat atatgatagg ggcaagtctt 1381 caatttttct gaatgccgca tcgcggacat ctcttacagt ctggaaggtg atcttgttgt 1441 tgataacgcc catcacccat tgcattaagg caacggcaat gccgacgatg cccgcacggg 1501 tcaagaacat tataaccgtg tcaaaatcga ccttgcccgc ttcaacgatg ttatcaatcg 1561 cgttgccgaa gagtatgggg acatacaaag aaagcaccga tgagcctgcc gccagcaaga 1621 tcgacaaaac caacagcgga atatattttt tgaggagctt cagcactctg agcgctacag 1681 atgcggaggt tttgttttta gccattgctt acgccctcct ccgatttgat ttgcgattca 1741 taaatctcgc ggtattcggc acaggattcc aaaagctcgc tgtgtgtgcc gatgccgacg 1801 gcatcgccgt catcgagaac taaaatctcg tcggcgtgca taacgcttga aacgcgctga 1861 gatacgatta tgacagcagg attaaaatta agctcccgca gggatatgcg aagacgtgca 1921 tccgttgcat agtcaagggc agaggagctg tcatccagaa tgagaatttc gggctttgtg 1981 accaatgcgc gggcgatgga caaacgctgt tgctgtccgc ccgagaggtt tctgccccgc 2041 tgttcaattt caaagtcaag tccgccgtcc tttgccatga caaagtcata tgcctgagca 2101 gctttgagcg ccgaaacaat ttcgtcgtcc gttgcgtatt ctgcgccgag gcgcatatta 2161 tctctgaccg agcctttgaa aagcgctgtt ttttgcatta caacgccgac cttttcgcga 2221 agcgcttcaa ggtcatattc ttttgcgtct acaccgtcga taagcacttc accctcagtc 2281 gcatcataaa aacggggaat gagatttata agtgtggact ttccgcagcc ggtcggaccg 2341 ataatgccca aggttttgcc cttttcaagg cggaaagcaa tgtttgaaag ggattcctca 2401 gccgcagaac catatttaaa ggacacattt ttgaattcaa ctgccgccga gccgtctttt 2461 ccgctgatta aagcgccgcc ttccattgaa ggcgtgacct ccataactgc ggagattcgc 2521 ttagcgcagg agtatgactt agtaatagtg attatcagat ttgcaagctt aacaagctcg 2581 accaagatct gtgacatgta gttataaaga gcaatcacca tgccctgagt cagaactccc 2641 gtttcaactt tgattgcgcc tatatagatc agcaaaatta cgcccacatt cacaataaca 2701 tatgtaagcg ggttcataac accagatatc cagccgacat gcttttgggt cttggtcaag 2761 tcctcgttgc ggatgatgaa ttcatccgtt tcctcgtcct ccttgcaaaa tgcgcggatg 2821 acacgagcac ccgtcaagtt ttcacgggtg atggaaagaa ctctgtcaag cttcgactgc 2881 acctttgaat ataacgggat gcaccacagc attattccga aaacaaccac cgacaaaacg 2941 ggaatcacgc cgacgaatat caatgccgcc ttgacatcaa tggtgaatgc catcgccatt 3001 gcaccgaaaa cgataaaggg cgagcgcatc aaaaggcgca gggtcagatt tattcccgtc 3061 tgcacctggt tgaggtcgct ggtgagcctt gtgataagcg tggatgagcc gagc // LOCUS sequence139 3107 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence139 VERSION sequence139 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3107 /mol_type="genomic DNA" /organism="" /note="sequence139" CDS complement(1409..1993) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MHCIESNMITVKLKNLTLKFCFGFFFILAVSTIDPDSYAVLSLMF CILHEFGHLAFMLIFKIKVSEINLYGAGIKICANGVDELNRICQTLIYFGGCLMNLLLY LIFINIGLVDYALINLIICVFNLLPIAHFDGGKIFELYMPRLSFLRKVFSVLFSCFLFG IVISVSVIEFEIISTYYIIAFVFIILCEMLE" /locus_tag="LOCUS_5390" /note="MGA_701" CDS complement(2200..3105) /product="ribosome small subunit-dependent GTPase A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002287379.1" /transl_table=11 /codon_start=1 /translation="MNMITLNGTIISSLGGTFKVAARGNEYICKARGVFRNRQITPICG DNVTVEIDPVTNEGVITDVSDRKNEIIRPPLANLDQLVFVISTCEPYPNLLLLDKFLAV SVYKNISPAIVFTKTDKAPADEYVEIYSPIFPTFCVDNSTGEGVEQVKELLHDKFSAFT GDSGAGKSTLLNNICPDLNLTTNEISRKLGRGKHTTRRVDIYPLDGGGYVADTPGFSTF NTQMYDTIMKQDLADCFPEFDEYLGNCRFQDCSHTKEQGCAVLEALRSGIIAKSRHNSY CEMYAESALIKPWEVKNAKR" /locus_tag="LOCUS_5400" /gene="rsgA" /note="WP_002287379.1 ribosome small subunit-dependent GTPase A (Enterococcus) [pid:41.8%, q_cov:98.0%, s_cov:98.0%, Eval:1.1e-55]" /note="MGA_702" ORIGIN 1 aacgttgatg ctcaaatact tgcctttgac tcccctattg acttcataga acagatcttg 61 aattttacgg gcaagtgtag caattccgat gatgtcttca tcggtttctg taggatgacc 121 catcatgaaa tatagcttaa catttgagta accacccata aacgcaagct tgcaggtgtc 181 catgatctct tcttcggtga tgttcttgtt aattacatcg cggagtcgct gagtgcctgc 241 ctctgcagca aatgtaagac ccgattttct gatacggctg attttctcga gaatctcttc 301 gctgaagcta tcaacgcgca acgaaggcaa agacaaattt accttttcac cgtcggtata 361 atcaaccaag gttgtaagaa gattttcgat gtcggggtga tcgctggttg aaagagaaga 421 aagagacact tcctcatatc cggtttgttc gcaaagcgct tttgtctgtt tggcgatggt 481 ttctgtcttc ttctcgcgga agggacgata tatataccca gcctggcaga aacggcaacc 541 acgaatgcat ccgcgcagaa cttcgacaac agctctgtcg tgaacaatat cagtgaacgg 601 aacaacgaaa taatcagggt aataaacctt gtcgaaatcg gcaatgatgc gctttttaat 661 aggcatcgga gcatagtttt gaggaacaat tgcattaaca gttccgtcat cgttataaat 721 tacatcatag aataaaggaa catatatacc ctcgattttg caggcttctt tcaaaaactc 781 ggactttgtg catccgcatt ttttcatttc gcagtataga tccatcagtt caaggtttac 841 ctcttcgcct tcgccgagaa tgaacagatc aacaaaatca caaaggggtt cgggattgca 901 aacgcaaggt cctccggcaa ctacgatcgg gtcgttctcc cctctttcgc aagttctaac 961 tttaagccct gcaagatcga gcatatttaa tacgttggta tagctcagtt catattgcaa 1021 tgtgaaacca atgaaatcaa attccttaat agggtcgaga ctttcaagtg catacagcgg 1081 gatattattc tcgcgcatta tcttttcaaa gtccttttca ggcgcaaaaa ctcgttcaca 1141 ccaataattc tcacgcgaat ttttaagtcc gtaaagaatc ttcattccaa gatggctcat 1201 tccgacttca tatgtatcgg ggaaacagaa ggcaaatctt acatccacct ttgatttatc 1261 ctttataaca cttcccactt cgccgccgat atatcttgag ggtttcattg agcgaagggc 1321 aaggcgttca attttatctc ttaaatccat aaacatcctc cgtttagtta tccgatatat 1381 tgtaacacac tttttgaaat aatgcaaatt attcaagcat ttcgcaaagt ataataaaaa 1441 cgaatgcaat aatatagtaa gtggaaataa tttcaaattc gattacggat acggaaatta 1501 cgataccaaa caagaagcaa gaaaataaaa cagaaaagac ttttcgcaga aatgataatc 1561 gcggcatata tagttcaaaa attttcccgc cgtcgaaatg agctattggc aacagattaa 1621 aaacgcatat gataaggtta atgagtgcat agtcgactaa tccgatgttg atgaatatca 1681 aatataaaag caggttcatt aagcatccgc caaagtatat gagggtttgg catatgcggt 1741 ttagctcatc tacaccgttt gcacagattt taattcccgc tccgtaaaga tttatttcgc 1801 tgactttgat tttgaatata agcataaatg caagatggcc aaactcgtga agaatgcaaa 1861 acatcagcga taaaacagcg tatgaatccg gatcaattgt cgaaacggca agtatgaaga 1921 aaaatccaaa acagaatttg agtgttaagt tttttagctt tacagtaatc atattggatt 1981 ctatgcaatg catttataaa tataacaaaa tcccctcggt aaaccgaagg gatcagtttc 2041 aatatgatga ttctttttct tttttgattc cgaaaatcat ccgtaaaatt ccgccaagga 2101 atttgcccgg cttagcaaca acaaccttca taagatatgc ctcccatatg tattttgcaa 2161 cgaatgctaa taacttaata ttcaggcagg ctgaatttgc taacgcttgg cgttcttaac 2221 ttcccaaggc ttgatcagcg ctgattcagc gtacatctcg caatagctat tatgacggga 2281 ttttgcaata ataccgctcc ttaaggcttc caaaacagca catccctgct ctttcgtgtg 2341 ggagcaatcc tggaaacggc agttgcccaa gtattcatca aattcaggga aacagtcggc 2401 aaggtcttgc ttcatgatgg tgtcatacat ctgcgtgttg aaggtggaaa agccgggggt 2461 atctgcaaca tatccacctc catcgagtgg gtagatatct acgcgtcgag tggtatgctt 2521 tcctctaccg agctttctgc taatttcatt tgtcgtcaaa ttcaaatcgg gacaaatgtt 2581 gttcaaaagc gttgattttc ctgctccaga atcacctgta aaggcagaaa acttgtcgtg 2641 aagaagttcc tttacctgct caacgccttc gcctgtactg ttatcaacgc agaaagtcgg 2701 gaaaatcggt gaataaatct caacatattc gtcagcaggt gccttatcag tcttggtgaa 2761 aacaattgca gggctaatgt ttttatatac tgacacagcg aggaatttat ccaacagcaa 2821 aagattcgga tatggctcgc aggtggatat tacaaacaca agctgatcaa ggttggcaag 2881 cggcggacgg ataatctcat ttttgcgatc agaaacatcg gtaattacgc cttcattggt 2941 gacagggtcg atctcaaccg tgacattatc accgcagatc ggggtgatct ggcggtttct 3001 gaatactcct cttgccttgc agatatattc gtttccccgg gcggcaactt taaatgtgcc 3061 gcccagagag cttattattg ttccattcaa tgttatcata ttcatat // LOCUS sequence140 3100 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence140 VERSION sequence140 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3100 /mol_type="genomic DNA" /organism="" /note="sequence140" CDS complement(562..819) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEEKIFVGYRYGRFTDDKTGEIKDYCQVFVLEDFAGNQSNDYHYD GKAAVKYSCVSPEVFKDIKVNSKVRCFFDSRKKISFMQAI" /locus_tag="LOCUS_5410" /note="MGA_703" CDS 978..2357 /product="MATE family efflux transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861455.1" /transl_table=11 /codon_start=1 /translation="MTNSHIKDFTKGNITKDLIIFAWPLLLSNILQVVYSMVDMIVVGK VMGKVGTSAVTVGGDVTNLLTFIGMGFASAGQVLIARYVGAKQRDKIGKFVGTMTSFLF IMAIVVSIFGLVSQDLILRLMNTPAEAYDGAAAYSSICISGLVFIYGYNVTSAILRGMG DSKHPLLFIAIAALINIVLDLIFVAGFNMGAGGAALATVVSQAISFILCLIFLIRKKEM FSLNIAKNDFIHWNRDMLSAFVKLGVPMAIKFAAISVSRMFVNSWINGYGVAVSGFAGI ANKLASVVNLFSNAMNTAGSTMVGQNIVAGQFDRVNKILKNLLIITLSIAIAFSIAMVL FPQEIFALFTDSSETEVLELADVYVPIALMMFLSSSLRATMNALINGSGNVKTNFLTAI LDGIVLRIGLSLLFGVALKMEYFGFWLGDAIAGYTPFFIGLVFYLTGSWKKGVKPREQT E" /locus_tag="LOCUS_5420" /note="WP_011861455.1 MATE family efflux transporter (Clostridioides difficile) [pid:28.8%, q_cov:96.7%, s_cov:97.5%, Eval:2.9e-56]" /note="MGA_704" misc_feature complement(2599..>3100) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_009887791.1:elongation factor G" /note="WP_009887791.1 elongation factor G (Clostridioides difficile) [pid:56.3%, q_cov:95.2%, s_cov:24.5%, Eval:1.5e-46, partial hit]" /note="MGA_705" /locus_tag="LOCUS_5430" ORIGIN 1 aagcgaatga gtgacgaggg agagccaaca aaaacagatg aacctttaca tgatttaatg 61 acttcccaaa agtcagatcg ggaaacaaaa ttgctgtcaa tcgtatcctg gcaaatcttg 121 tctatatcaa gtattccagt gtgatcatca aaagccacat caagacgagt tatttttaag 181 tcattttcat ttatccaagc aaagagttta tcccaaccta ttgaagaaca agtttcaaag 241 gttcggcacc cttgaccaga catttcaacc catactccca tatccgggcg accgttgaag 301 tgaattgaaa tagaagaaaa atagagcctg tcacggtatc ctcttgcacc tttgacaact 361 tcaaagggac aagacatcaa gcctaaagca gatacgattt cttctgggct atgctttttt 421 gtggtaaagc ttagccagtc ataaagaacg atgttttcag tatacaaaac agtaaccccc 481 gtgtgttttg taggtagtac ccccctgtta gcggaggggg gtaaccccga ggagctacct 541 cggggctttt aagcggtagt attagattgc ctgcataaag gaaatcttct tgcggctgtc 601 aaagaaacaa cgcaccttgg aatttacctt gatgtcctta aagacttcgg gagaaacaca 661 cgaatacttc acggcagctt tgccatcgta atggtaatca ttgctctggt tccctgcgaa 721 atcttccagg acaaagacct gacaataatc tttgatttca ccagtcttgt catcagtaaa 781 tctgccatag cgataaccta caaaaatttt ttcttccatt tttcataact cctttgtgag 841 taaaatttta ggactttgtt tgtccaaatt tattataaaa cttaccttcc actttttaca 901 atcaatcttt cccttgataa tcctctcaaa aagtggtata atatataatt gaagtttaaa 961 ttttgaagga acctgaaatg actaattcgc acattaaaga ttttacaaaa ggtaacatta 1021 caaaagacct gattattttt gcctggccgt tgcttctttc caacatcctg caggttgtat 1081 acagtatggt ggatatgata gtcgtcggca aagtcatggg caaggtgggc accagtgctg 1141 taactgtcgg aggtgacgtt acaaacctgt tgaccttcat cggtatgggc tttgccagcg 1201 cgggacaggt tttaattgcc cgatatgtcg gcgcaaaaca gcgggataag atcggcaaat 1261 ttgtcggcac aatgacctca tttttgttta ttatggcgat cgtcgtcagt attttcggac 1321 ttgtctccca ggacctcatt cttagactta tgaacacccc tgccgaagca tatgacggtg 1381 cggcagcata ttcatccata tgcataagcg gacttgtgtt tatctatgga tataacgtca 1441 ccagtgcgat cttgcgcggt atgggtgact cgaagcaccc tcttttgttc attgcgattg 1501 cggcactgat aaacattgtt ctcgacctta ttttcgttgc gggattcaat atgggtgcgg 1561 gcggtgcagc tttggcgact gtcgtcagcc aggcgataag cttcattttg tgcttgattt 1621 tcctcatccg caaaaaggaa atgttctcgc ttaacatcgc caaaaacgac tttattcact 1681 ggaaccgcga tatgctttcg gcatttgtca agctgggtgt gcctatggcg atcaaatttg 1741 cggcaatttc agtttcccgt atgtttgtta actcctggat caatggctat ggcgttgcag 1801 tttccggatt tgcaggaatc gcaaacaagc tggcatctgt tgttaacctg ttctcaaatg 1861 ctatgaacac cgccggctcc accatggttg gacagaatat cgttgcggga cagttcgacc 1921 gagtcaacaa gattttgaaa aatctgctga tcatcacact ttcaatcgcg atcgcattca 1981 gcattgcaat ggttctgttc ccgcaggaga tctttgcgct gttcaccgac agctccgaaa 2041 ctgaggtgct tgagcttgca gatgtatacg ttcccattgc gctgatgatg ttcctttcaa 2101 gctcgctccg tgcaacgatg aatgcgctca tcaacggaag cggaaacgtc aagaccaact 2161 tcttgaccgc aattctggac ggcattgttt tgcgaatcgg attgtcgctt ttattcggcg 2221 tggcgctgaa aatggaatac ttcggcttct ggctgggcga cgcgattgcg ggatatacgc 2281 cattcttcat cggtcttgtg ttctatttga ccggcagttg gaaaaaaggc gtcaaacccc 2341 gagaacaaac agaataattg aaaagcaaat cccctctgcc ttgttgcagg ggggattttg 2401 tgcgcgtatg cctccctctg acgagggagg tgctgagctt gtcgaggcag agggagagaa 2461 gatatatgcc accaacgcat ccacgcattg gtctctccct cagtcgcctg cggcgccagc 2521 tccctcatca gaaggagcct ttttgcacaa aaaatccccc gctctttcga acgggggtga 2581 tttttatttg atattcaatt attcgtcgtc aaccttgaac ttggtgatga catcatcaac 2641 aagcattgcg ggaagctgtt cataacggag ctttgaaagg gtgaattcgc ctctgccgcg 2701 ggtcatctgg cgaacgagca ttgcaaagtc gtgaacttcg ctctcgggaa cttctgcttc 2761 gatggtggtg ttgcccttct tagcagcagg agccataccc aaaacgcgtc ctcttctctt 2821 gttgagttcg cccatcatat cgccggtgtt ttcatccgga acggttacag aaagcatatc 2881 aatgggttcg agcaagatgg ggttagcaag cttcatacct tccttgaagg cgatggatgc 2941 tgccatcttg aaggacattt cgctcgagtc aacatcgtgg tatgaaccgt caacgagggt 3001 tgcctttacg ccgacaacag ggaatcctgc aagaacgccc ttcttcatgc aatcctgcaa 3061 gcccttttca actgcaggga agaagttacg gggaactgcg // LOCUS sequence141 3083 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence141 VERSION sequence141 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3083 /mol_type="genomic DNA" /organism="" /note="sequence141" CDS complement(510..1631) /product="D-alanyl-D-alanine carboxypeptidase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003428267.1" /transl_table=11 /codon_start=1 /translation="MKKLLCIFTSIILLTASFSAEEISSPSYSYVLMEGSTAALLYADN GNYVFEPYHFSKLMTLLLTVEAIERGELSFDTVVTVSNHANAMPDPQIWLRVGEEIAVS ELIMSITVGNANDACVCLAEAVSGTEEAFVIQMNKRAEELGMSQTYYADSTGLTDGSYT SACDLAILASELSHYGELTEYFTTWLTYVRGDEAQLVNNNKLVRNYDGITGMKAFSSKS LGNCVVSTAKREDLTMVCVIIGEQEKDEQFSTAKEKMTVGFSAYMLYRPKATDIYCRPV KVSKGVENELETYVGNLDKFVIRKSREDDVEVHAEYFDGIIAPINCGDSVGRIVYTLDG EEVYSAPILAKDSTRKITFFSAFKKLFLNLIKM" /locus_tag="LOCUS_5440" /note="WP_003428267.1 D-alanyl-D-alanine carboxypeptidase family protein (Clostridioides difficile) [pid:29.7%, q_cov:99.5%, s_cov:100.0%, Eval:4.3e-44]" /note="MGA_707" CDS complement(1798..2028) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNSVMIRLETINDVKKFVNCVSLCDYDVDLVSGRYAIDAKSIMGI FSLDLSKPIELRAHTDDSRDFMEQIADFLVK" /locus_tag="LOCUS_5450" /note="MGA_708" ORIGIN 1 acgttaacgc aaatgtcctt gccttcgcaa atggaaagga tctcgttaag ataagtgggg 61 ctgatgttgt taccaacgaa gtaaatgtcg ggggtatcct ttttgaggtt gttgtagaag 121 gggctcttca aaagctcgat agcggcacgc gcaccgagat atgaaccgcc gattccgata 181 acgattaaga tatcagcctt ctctttaatt ctttctgcgg cggctttaat tcttgcgaat 241 tcttccttgt catagttaac aggaaggtca acccaaccaa gaaaatcatt tcctgcacca 301 gatcttgttt caacaagatt atgagccagg gtgatctgat cgcgacaagc atcatattca 361 tgtgcgccga cgaacttatc ggtatacttt gttaccaatc tgatcgacat ctatgtcatt 421 tcctctctaa tagtttattt gtaagcttat tttagcataa agcacacaat attgcaagaa 481 attttcgaga aaaatatgcg aatcttttat cacattttta tcaagtttag aaacagcttc 541 ttaaaagccg agaaaaaggt gattttcctt gttgagtctt ttgctaaaat cggtgcggaa 601 tatacttctt cgccgtcaag tgtatataca attcttccaa cactgtcgcc acagttgatc 661 ggagcaatga tgccatcgaa atattcagcg tgaacctcaa catcatcttc cctactcttc 721 ctgatcacga atttgtctaa atttcctaca tatgtttcca gttcattttc gacacctttt 781 gaaactttaa caggtctgca atatatatcg gttgcctttg gtctgtagag catatatgca 841 gaaaaaccga ctgtcatctt ttccttggct gttgaaaact gttcatcctt ctcctgttca 901 cctattataa cacacaccat tgtcagatct tctctttttg cggtggaaac aacgcaattc 961 cctaaagatt tactgctaaa ggctttcata cccgtaattc cgtcatagtt ccttacaagc 1021 ttgttgttat ttacaagctg tgcttcatcg ccacggacat atgttagcca cgttgtgaag 1081 tattcggtca gctcgccgta atgggaaagc tcgctcgcta atattgcaag atcgcaggcg 1141 gaggtatacg aaccatcagt caaaccggtt gaatcggcat aataagtttg gctcattcca 1201 agctcttcgg cacgtttatt catctgtatt acaaatgctt cttctgttcc ggaaacggct 1261 tctgccaaac acacacaggc atcgttggcg ttaccgacgg ttatggacat tatcagttcg 1321 cttacagcaa tttcctcacc aacgcgaagc caaatctgag ggtctggcat agcgtttgcg 1381 tgattcgata cggttacaac ggtatcaaac gaaagctctc ccctttcaat cgcttcgaca 1441 gtcaggagca aggtcatcag cttcgagaag tgataaggct cgaaaacgta gtttccgttg 1501 tcggcatata agagtgctgc cgttgaacct tccattagaa cgtatgaata tgacggcgac 1561 gaaatttctt ccgcgctgaa agacgctgta agcaatatta tcgatgtaaa tatacacaaa 1621 agctttttca ttatttcctc cacagccttt tttagtattt tattttatag actgcaaaaa 1681 aatgatagct tgtgtgtggt tgaaaaaact tatgatgtat gataaaatca taaaaaagaa 1741 aagcccctcc gaatttggag aggctgacat attcgagagt tgctcaaatc gcgctgatta 1801 ctttacgagg aaatcagcga tctgttccat gaaatcacga gagtcgtcgg tatgagctct 1861 gagttcaatg ggcttgctga ggtcgaggct gaatatgccc atgatggatt ttgcatcgat 1921 agcgtatctg ccggaaacaa ggtcaacatc ataatcgcaa agagatacac agttgacaaa 1981 tttcttaacg tcgttgatgg tttcaagtct gatcattaca gaattcatta caaataacct 2041 cctaatttaa atttgttttt gctctgcacc ctcaatatag cagttttgcc taaaattgtc 2101 aatagttttt tgtatatcat ttctaataat ttttcacaat ttacgaggaa ataattatgc 2161 atattcatta tcacaccttc ggttgcaagg taaatcagta tgaaaccgaa aatatccgcc 2221 aagcaatgga agctgatggc catacaagtg taaacaatct tgaagaagct gatgtttgca 2281 ttatcaacac ctgcaccgtt acccatgagg ccgaccgcaa gctgattcag cttgtaaaca 2341 gaattaaacg tgttaatccc aaagcgataa ttgttatgtg cggatgctat tctcagataa 2401 atgaaaatgc aaatcagctt gccgatatcg ttgtcggaac atccaacaaa tcgaggatac 2461 cgcagcttgt tgcagaatat aattcgcaga aaacagcaga agttttgccg cactataagg 2521 gcgaacactt tgaaacaatg gcaaatatcg gatcagcgag aaaaacaagg gcggtaatta 2581 aaattcaaga cggctgtgac cgattctgca cctattgcat aatcccctat gccagaggca 2641 gggcacgttc gaagccgata aacgagattg aagcggaagc taaggcattg gttaaagcag 2701 gacacaagga gcttgacctg gttggtataa atctttcctg ttatggtcat gatttgggac 2761 tgaaccttgc cgatgcagtt gaaagagtct gcaaaaccag cggtgccgaa agagtacgac 2821 tcggttcact tgaagctgaa ctgatttccg aggaaataat aaagcgattg tccgaacttg 2881 acaacttctg ccctcatttt catctttcgc ttcatagcgg atgtgacaaa acccttaggg 2941 aaatgggcag aaagtatgac aaggcagaat actttacaat agtcaataac ataagaaaat 3001 atttccccga ctgtgcaatc acaacggata ttatggttgg attcccggga gaaactgatg 3061 atgactttag tgagtcactg gag // LOCUS sequence142 3059 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence142 VERSION sequence142 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3059 /mol_type="genomic DNA" /organism="" /note="sequence142" CDS complement(998..2479) /product="alpha-L-arabinofuranosidase AbfA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004398747.1" /transl_table=11 /codon_start=1 /translation="MRAKININAENVIGKIDDRLYGSFIEHLGRAVYGGIYEPTHPTAD DMGFRTDVLELISKLGVPMVRYPGGNFVSGYNWEDGTGDRTKRPKKLDLAWSSVETNEV GIDEFQEWTKRANSQVMMAVNLGTRGAQDAANLVEYCNLETDTYYANKRRENGFDKPFG IKTWCLGNEMDGPWQICAKTPYEYARTACEAAKMMKWVDPSIELVACGSSHIYMPTFGE WERTVLRECYDHVDYISLHNYYGNRNDDTPEYLASAVDMNRFIKTVASICDEIKAEKGS HKTVNLSFDEWNIWFHSNEQDKLIPRWSVAPPLLEDIYNLEDALVLANLMMTLINNCDR VKIACLAQLVNVIAPIMTENGGAAWAQTIYYPFMYTSMNGRGNAIMTTCECPTYDAGNK KNVPLVDSSAVLSEDTNKLSLFVFNRSMDEVCELDIDALGFEDYKLCEHISLEGDDLKA VNTKDEPNKVVPVCKEIGDVITLAPHSWSMLVFEK" /locus_tag="LOCUS_5460" /gene="abfA" /EC_number="3.2.1.55" /note="WP_004398747.1 alpha-L-arabinofuranosidase AbfA (Bacillus) [pid:55.6%, q_cov:99.8%, s_cov:99.2%, Eval:3.8e-166]" /note="MGA_711" ORIGIN 1 tagaataagc aaaggccttc cttaatgcct gcgccttcaa tgtcatttct gagggtccag 61 ccgttttccc aaacaggata gatacagtcg ttcttcttga ggttataaat aaggtcagca 121 gctctttcaa ggccggggtt gccaaggtcg gattcataaa gaccggtctc ggtgttataa 181 acaactgtgg ttgttccgct ggattccata atgttggtgt catagtacca accgtcaaga 241 gcatatctgt cttcgtcagg atcgctgaaa tctacgcaca ttgaatagaa ttcatcccaa 301 gtccattcgt cgttatagta aagctctgcg ggatcgtcaa agccccattc gtcgatgact 361 cttctgttga atatacaaac atcgtcgaac tgagtttcgc agcagataac atatctgttg 421 cctgcaaggc tcaaatatgt atcaacgaaa tccttggtgc cctgccaaag gggatcgtca 481 tagtcaacat agtcgttaac cggctggaac atacccttaa tggtgtaagt ggggaagtag 541 tcaatatcgt ctgcggggaa gaagtcggga gatgtacctg ccaaaatgag gttagcaagt 601 ccgtcatatc tctgatccca tacacattcg atccaattga tctcaccgcc gtatttttcc 661 ttaaaggtaa agaaaccggt gctgacaatt tcctcttcag aatagttgtg gaaaggatcg 721 tgccaggaat accaatcaat aattgtgttt gcgccggcag cttcgctaac gtcaggcaag 781 gtgatacctg ctgctcccaa aatagcttca gcgtcttcgg ttgaaagagt aacttcaacg 841 atttcacgct tgttgccacc gcaaccgaca agagcaaata ccatcaaaag agtaagtgca 901 attgccaaca gtctcttaat tttcataatc gtcctcctaa aaaatttttt atataaatct 961 gcatcaacag aaaatatata ctatttgttg cttaaaatta cttctcaaac accagcatac 1021 tccaagaatg aggagccaat gtgataacgt caccgatctc cttgcaaaca ggtacaacct 1081 tgttcggttc gtccttggtg ttgaccgcct tgaggtcgtc accttcaaga gaaatgtgtt 1141 cacaaagctt atagtcttca aatcccaaag catcaatatc aagctcgcaa acttcatcca 1201 ttgaacggtt gaaaacgaac aggctgagct tgtttgtgtc ctccgaaaga acagcagatg 1261 aatcaaccaa aggaacgttt ttcttgttac ctgcgtcata tgtagggcat tcacaagtag 1321 tcataattgc gttaccgcgg ccgttcattg atgtatacat aaatggatag taaattgtct 1381 gtgcccatgc ggcgccgccg ttttcggtca ttatcggcgc gattacattg acaagctgtg 1441 ccaagcaggc gattttaact ctgtcgcagt tgttaatgag ggtcatcatc aagtttgcca 1501 aaacaagggc atcctctaaa ttgtaaatat cctcgagcag cgggggagca accgaccatc 1561 tgggaatgag cttatcctgc tcgttactgt ggaaccagat gttccattca tcgaaggaaa 1621 ggttaactgt cttgtgtgaa cccttttctg ccttaatttc atcgcaaatg cttgcaactg 1681 tcttaatgaa tctgttcata tcaacagcgc ttgcgagata ttcgggggtg tcgtcatttc 1741 gattgccata gtagttgtgg agcgagatat aatcaacgtg atcataacac tcgcgcaaaa 1801 cggtgcgttc ccattcgccg aaggtgggca tatatatatg tgagctcccg caggcaacca 1861 attcaattga agggtcgacc cacttcatca tctttgcggc ttcacaagca gttcttgcat 1921 attcatacgg tgttttcgca caaatctgcc aaggtccatc catttcattt cccaagcacc 1981 aggttttaat gccgaatggc ttgtcgaatc cgttttcacg gcgcttgttt gcataatatg 2041 tatccgtttc aaggttgcaa tattcaacca aatttgccgc atcctgcgca cctcttgtgc 2101 cgagattaac agccatcata acctgggaat tagctctctt tgtccattcc tggaattcat 2161 caattccaac ttcgtttgtt tcaaccgagc tccaggcaag gtcaagcttt ttcggacgct 2221 ttgtcctgtc gcccgtgccg tcctcccagt tatatcccga aacaaagttt ccaccggggt 2281 atctgaccat gggaactccg agctttgaaa tcagctctaa aacatcagtt ctaaagccca 2341 tatcgtcagc ggtggggtgg gtcggctcat atataccgcc gtaaactgct ctgccgaggt 2401 gttcaataaa tgagccataa agacggtcat caatttttcc gatgacattt tctgcgttaa 2461 tatttatttt agctctcata gtgactcctt gtggtattat taattataat atagcacaca 2521 gcttgcaata aagcaaatga acaattacgc taaaaaacta acttattgtg ttcagacgcg 2581 ttttcttatc cgaaaacagc gatgtatagc aataaactga cattttctgc taattcattg 2641 atattttctg cgactaacgg cttttgactt gatttttcaa aaaacttttg tatataatca 2701 aattaacaaa acttcggagg gaagataatg caaattaaca acatcggata taaccatcac 2761 cacgatgctg atttctgtgt taaccgtcct gtcggctcgg gagaccatct gcttttgctt 2821 ttaaagacac ctgcaatttt tagctttaac ggtgttgaag aaaagactct gtcaaattcc 2881 ttcattctct atgacaaagg tgcgccacag tattatcgag ccctcggctc tcagtttgca 2941 aatgactggt tccatttttt gatcgacgaa gccgacatta gctttttcca ggctcttgat 3001 attcctatga ataaagttgt ccctcttgat gatatcaacg gtctgtcaat gctgattaa // LOCUS sequence143 3046 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence143 VERSION sequence143 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3046 /mol_type="genomic DNA" /organism="" /note="sequence143" CDS complement(244..486) /product="TIGR03905 family TSCPD domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008761253.1" /transl_table=11 /codon_start=1 /translation="MVINYKTQGTCSRQINITVEDGIVMEVEFIGGCNGNLKGISKLVK GMKVEDVIERIEGTTCGFKNTSCPDQLAQALKQAL" /locus_tag="LOCUS_5470" /note="WP_008761253.1 TIGR03905 family TSCPD domain-containing protein (Bacteroides) [pid:63.5%, q_cov:92.5%, s_cov:91.4%, Eval:5.2e-23]" /note="MGA_714" CDS complement(508..1461) /product="RluA family pseudouridine synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964333.1" /transl_table=11 /codon_start=1 /translation="MKEFIIEKNDAGQRLDKFIKKAVPDLPQNLMYKYIRLKRIKLNGK RCEISSRLNVGDKLEMYINDEFFSSEKVQDFTSAPAQIDIVYEDDNILLVNKKCGLVVH EDDDNTLDTLINRMTHYLYDKGEYDPEREQSFAPALCNRLDRNTEGIVICAKNAESLRL LNDIIKEREITKKYLCITLGTPKPVEATITAYLEKDEFKKQVYISDKKTPANKTIVTKY KVLETRGELSLCEIELITGRTHQIRAHMAYIGHPLLGDGKYGRNDDNRRYGVKYQALCA YHLSFDFKSDKGILNYLNGKSFSVAVPWFAKEFFDK" /locus_tag="LOCUS_5480" /note="WP_010964333.1 RluA family pseudouridine synthase (Clostridium) [pid:42.0%, q_cov:96.5%, s_cov:95.6%, Eval:4.5e-60]" /note="MGA_715" CDS complement(1462..2223) /product="SDR family NAD(P)-dependent oxidoreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003436810.1" /transl_table=11 /codon_start=1 /translation="MNIAIITGASSGLGVEFLKEISAVYPSLDEIWLVARREDRLIELA AQYTKPVCVPVALDLTSDSAYEALKAKLEEKQANVSILINNAGMGKMGNVADMDCASQT MMVDLNCRGLTAVTSICLKFMSRGSQIINICSIASFCPNTRLNTYSATKAYVMSFTKGL REELKPLGINCMCACPGPMKTEFLSVAAIETGTSKTFDTLPYSDSNTVAKNTLKASAKG KCVYTHLFLFKLFRVLAKILPHNLVMKWCRV" /locus_tag="LOCUS_5490" /note="WP_003436810.1 SDR family NAD(P)-dependent oxidoreductase (Clostridioides difficile) [pid:37.3%, q_cov:97.6%, s_cov:94.2%, Eval:6.6e-34]" /note="MGA_716" ORIGIN 1 ctgttacgcc aagcaaagtc tgacgctttt tgccttcctt tatgccttta acaagggcag 61 ttatcgcttc gggctggtcg cctgtcggct taaattcact tttgattttg aactgatcca 121 taactcgcac ctcgctttag aacatttgtt cacattatac cacttatatt tttaatagtc 181 aacgatttat gataaagttt gagcaaaaaa gcaggaagtt ttcttcctgc tttatgtcac 241 aaattaaaga gcctgcttga gagcctgtgc caactggtcg ggacaagagg tgttcttgaa 301 gccacaagtg gtgccttcaa ttctttcgat tacatcttca accttcatac cctttacgag 361 cttggaaatg cccttgaggt tgccgttgca accaccgatg aattcaacct ccataactat 421 gccgtcctca actgtgatgt tgatctgtct tgagcaggtg ccctgtgtct tgtaattgat 481 taccatttta ttttctcctt tacgttgtta tttatcaaaa aattctttag cgaaccacgg 541 tacggcaacg ctgaagcttt ttccgttgag atagtttaaa atacccttgt ccgatttgaa 601 atcgaaactg agatggtatg cacagagtgc ttgatatttc acgccgtagc gacggttatc 661 atcatttctg ccatacttgc cgtcgcccaa aagcggatga ccgatatatg ccatatgagc 721 gcgtatctgg tgggttctgc cggttataag ctcaatctcg caaagagaaa gctctcccct 781 tgtttcaaga actttatact ttgtgacgat agttttgttt gcaggcgttt tcttgtcgct 841 gatatatacc tgttttttaa attcgtcctt ttcaagatat gcagtgatgg tcgcctcgac 901 gggcttagga gtgccaaggg tgatgcaaag atacttcttt gtaatttcgc gttctttgat 961 gatatcattg agcaaacgaa gactttcagc gttctttgca caaatcacaa tgccttcggt 1021 gttgcggtca aggcggttac acaaagcagg agcgaaagat tgctcgcgct cgggatcata 1081 ttcgccttta tcatatagat agtgcgtcat tcggttgatg agtgtgtcga gggtgttgtc 1141 atcatcctcg tggacaacca atccgcattt tttattgacc agcagaatgt tatcgtcttc 1201 atacacaata tcaatttgtg caggtgcaga tgtaaagtcc tgcacctttt cagatgagaa 1261 gaactcatcg ttaatataca tttcaagctt gtcgccgaca ttaagccgcg aagaaatttc 1321 gcaccgcttg ccgttgagct taattcgctt tagacggatg tatttataca tcagattctg 1381 cggcagatcg ggaacagcct tcttgataaa tttatcaaga cgttggcctg catcgttctt 1441 ttcaattatg aattctttca tttatactct gcaccatttc atcacaagat tgtgaggcaa 1501 gatttttgca agaactctga agagcttgaa caggaataag tgtgtatata cacacttgcc 1561 ctttgctgat gctttcaaag tattttttgc aactgtgtta gagtcgctgt atgggagcgt 1621 gtcaaatgtc ttggatgtac ccgtttctat tgcagcgaca gaaaggaatt ctgttttcat 1681 aggtcccgga caggcacaca tacagttgat gcccaagggc ttaagctctt cgcgcaagcc 1741 tttggtgaag ctcataacat atgcctttgt tgcggaatat gtattgaggc gggtatttgg 1801 acaaaatgat gcaattgaac agatgttaat tatctgcgag ccgcgggaca taaacttcaa 1861 gcatatgctt gtcacagcag ttaaaccgcg gcagttaaga tcaaccatca tagtctgcga 1921 tgcgcagtcc atatcagcta cattgcccat tttgcccata cctgcattgt taataagtat 1981 tgaaacattt gcttgcttct cttcaagctt tgctttgagt gcttcgtatg ccgaatcaga 2041 tgttaaatcg agcgcgacgg gaacacaaac aggtttggta tattgagctg caagctcgat 2101 aagtctatcc tctcggcggg cgacgagcca gatctcatca agtgatggat acaccgcgga 2161 aatttctttt aaaaattcaa ctcccaggcc gctggaagca cctgtaatta tagcaatgtt 2221 cataagtctg ctccttaaat gaaagttcat ttactattat atctattgag cacagtttgt 2281 caaatgaaat gctgaaaata tttaccgtat tgtaatctat gcgctattga aattaggcac 2341 aagctgtgat aaaatattat tagacaacat aatccggcgt aaagcgagtt tgctttacac 2401 cttctcaaca tataaggagc aaaataatga agaacatttc aaaatctgcg cttattttgc 2461 tgattgcaac ttcaatgttt atgagtgctt gcggtcagca gattgaaaat attaccgacc 2521 cgccggttac tactccgcct acggtcagtg aagaggaatc gaccacaaca aaggaaaaga 2581 atgtcccctc tttcacagtt gcaacaacca ctgaaaccac tcctgcaacc accacacagc 2641 cttcggtttc aagcgaaagc caaacttcgg caacaagtga atcaacctca cagacatcag 2701 ttacacctgt aactgaacac acgacagaag cgacaacccc tgcaagcacc aatgaatcgg 2761 gcgagatcgt tgatgatcct tatgagggac ttgttttcaa cacagaagac cccgatgagc 2821 tttatgagtt gtttgggctt tcaaggagcg aacgtcaggc ttactattcc aaaatctcgc 2881 aagaatgcga actgccaatt attcacattt ccacagaaaa tgagaaaaac gttgtatccc 2941 gcgagaagta cgtcaactgc ttggttgagg tattcaactg cgatgagttt tacgttatgg 3001 acgcaacaag cgcgggcata agagtaagag gtaacgcttc agctta // LOCUS sequence144 3040 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence144 VERSION sequence144 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3040 /mol_type="genomic DNA" /organism="" /note="sequence144" CDS complement(48..1280) /product="DNA polymerase IV" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011461101.1" /transl_table=11 /codon_start=1 /translation="MRDILHCDLNNFYASVECRDNPSLRGKPVAVCGSVEDRAGIVLAK NDLAKAYGIKTAEKIYEAKQKCHDLVIVPPRMEEYSAVSKQVRKIYARFTDMVEPFGMD ECWLDITGSHYLFGSSEKIANDIREAVKKETGLTISVGVSFTKALAKLGSDMKKPDAVT LLPYETFRERISGLDVCELIGIGPATGRRLNKLRIHTLGELANSDPEMLSRALGKAGIW LWRAVNGLDDEVVHEIGYESVSKSIGNSTTLREDLYTNGQVWQVMLSLAEEVCRRMRKE ALCAGGVCISIKTKDLDYHEFQAQLDMPISSALMLAEAGFKLFLERFDWHLPIRAVGIR GINLVSANLARQYSLFADAKRVDKLDALSEVSDKLRDRFGRDVIYPARLKSDLFLTHEK VTCFTDVSFRR" /locus_tag="LOCUS_5500" /note="WP_011461101.1 DNA polymerase IV (Desulfitobacterium hafniense) [pid:37.5%, q_cov:94.1%, s_cov:92.8%, Eval:3.3e-56]" /note="MGA_718" CDS complement(1899..2348) /product="8-oxo-dGTP diphosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011837587.1" /transl_table=11 /codon_start=1 /translation="MKRTENAELTVLCLVYRDDEILLQNRIKKDWQGYTLPGGHVEQGE SITEAVKREMKEETGLDIYEPKLCGVKQFPIDDGRYIVFLYKTDKFSGELISSDEGKME WVKRSEIAKIETVSDFELMLRVFDEDSLSEFQYVIENGEWIAKIY" /locus_tag="LOCUS_5510" /note="WP_011837587.1 8-oxo-dGTP diphosphatase (Streptococcus sanguinis) [pid:50.7%, q_cov:100.0%, s_cov:100.0%, Eval:7.2e-38]" /note="MGA_719" misc_feature complement(2335..>3040) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010964226.1:tRNA threonylcarbamoyladenosine dehydratase" /note="WP_010964226.1 tRNA threonylcarbamoyladenosine dehydratase (Clostridium) [pid:49.0%, q_cov:97.4%, s_cov:96.8%, Eval:4.4e-58]" /note="MGA_720" /locus_tag="LOCUS_5520" ORIGIN 1 gtctgcggac gtgttccgca ggaacagtgt cgcaggtgcc gcggtcttta tcttctgaag 61 ctcacatcgg taaaacaagt caccttttcg tgggtcaaaa acaggtcgga tttcaacctt 121 gcgggatata taacatccct cccgaacctg tcgcggagct tatccgaaac ctcgctgagc 181 gcatcgagtt tatccaccct tttcgcatcg gcaaaaagag aatattgccg cgcaagattt 241 gcgctgacta aatttatccc ccgaattccg actgcgcgga tgggcaaatg ccaatcaaat 301 cgctccaaaa acagcttgaa gcccgcttca gcaagcatca acgccgaaga tataggcata 361 tccaactgtg cttggaattc gtgatagtca aggtccttcg tcttgattga tatgcacact 421 ccgcccgcgc aaagcgcctc ttttctcatt cggcggcaga cttcttcggc cagcgacagc 481 atcacctgcc aaacctgccc gttggtgtaa agatcctccc gcagggtggt ggagtttccg 541 atcgacttgc tgaccgactc atatccgatc tcatgcacca cctcatcgtc cagtccgttg 601 accgccctcc aaagccatat tcctgccttg cccagcgccc ttgaaagcat ttcgggatcg 661 gaatttgcca gctcgccaag ggtatgaatg cgaagcttgt taagtcttcg ccccgttgca 721 gggccgatgc cgataagctc gcatacatca agccccgata ttctctcgcg gaaggtttca 781 tatggcaaaa gggtgactgc atcgggcttt ttcatatccg agccaagctt tgccaaagcc 841 tttgtgaagc tgacaccaac ggaaattgtc agccccgttt cttttttgac cgcttcgcgg 901 atatcgtttg caattttctc gctggaaccg aaaagatagt ggctccctgt aatatcgagc 961 caacattcgt ccattccgaa cggctccacc atatcggtga agcgggcata aattttccgc 1021 acttgttttg acacagcaga gtattcttcc attctgggcg gaacaattac caaatcgtgg 1081 cacttctgct tggcttcata tattttctcg gcagtcttaa tgccataggc ttttgcgagg 1141 tcgttttttg caagaacgat tcccgcccga tcctcaacac ttccgcagac agcaacaggc 1201 tttccgcgta atgacgggtt gtcgcggcat tcaacagatg cataaaaatt attcagatcg 1261 caatgtaaaa tatctctcat atgcgcctcc aaaacaagaa catatgttcc gatttgatta 1321 tatattagca catatgttcg catttgtaaa cagggaattt ttgaaatgag ggagattttt 1381 gggacggtgg gggaatagcg aagcgagccg tggcagacac ggcggcgcgc cgaaggtgcg 1441 gcgatttgtg gcttgccgtg gcgagcgaaa cgggaatttc caaatgcgga ggtaaagggc 1501 cccaaccgcg gcacctgcga cactgttcct gcggaacacg tccgcagacg ccgctgcaaa 1561 tgcgcatcgc caaaccttag cggcatatga ttgggaaatc tgcttatgcg atattgtcgc 1621 ataagcagat ttcatagcga ccgtcagcaa cttcatctat attgcaaact ttgtcggtcg 1681 cttggcggca gcccacgtgc gccttcggcg cacgcgcccc gcgcttcgcg cggggactcc 1741 gttgcgcata aagcgcaacg gagtggctgc cgccctctgt aggcgcccga caaatgtagc 1801 tgagggcgtc gggcggtctg ctccgaatgt aatgaggctg tgaccgcgcg gtgccaaaag 1861 cgacaaaaaa cggacgaggt ttccctcatc cgcaaatatc agtatatctt cgctatccat 1921 tcgccgtttt caatgacata ttggaactcg ctcaagctat cctcatcaaa cacccgaagc 1981 atcagctcaa aatcgctgac cgtttcaatt tttgcgatct cgcttcgctt gacccactcc 2041 attttgccct cgtcggagga gatcagctca cccgaaaact tgtctgtctt ataaagaaaa 2101 acaatgtatc gcccatcgtc aattggaaac tgcttgacgc cgcagagctt cggctcatat 2161 atatccagtc ccgtttcctc tttcatttca cgtttgacag cttcggtgat gctctcgccc 2221 tgctcaacgt gcccgccggg cagagtgtag ccctgccaat cttttttgat gcggttttgc 2281 aggagtattt catcatcgcg atagacaagg cagagcaccg tcagctccgc gttttcagtt 2341 ctcttcatct ttgatcaggt cctttataat ctcgcttgcc ataattatcc ccataaccga 2401 cgggcaaaaa gcaaccgatg cgggtatatg cctgccaaac tccttaggca cttccctttt 2461 gggcttggcg ggttcttctt ttgaataaac gcatttaaga tgcttaactc ccctcttgcg 2521 aagctcatat ctgagcgttt ttgccaaggg gcaaacggag gttttaaata tatcgctgac 2581 ttcaaacttc gtcgggtcaa gcttatttcc tgcgcccatc gcgctgatta tcggtgtatc 2641 ggccgcctgt gctcttaaaa taagctcgat tttagcggac atcgtgtcga tgcaatctgc 2701 gatgtagtca tactttgaca gatcaaactc gtctgcgttc tcgggagtgt agaacacctc 2761 gtgtgtcaca acttccgccg cggggttgat gtcaagaatg cgtgccttca tcgcttcgac 2821 cttggggtgc cccgtggtgc tctcaagggc aataatctgg cggtttcggt tggatatgct 2881 caccttgtcc gaatcgaaga gttcaaaatg cataatacct gtgcgtgcca aaatctcaca 2941 gacatatccc ccaacgccgc cgacgccgaa caccgcaact ttcttatttt taagcgatgc 3001 tatcgcctgc tcgcccaaaa gcaactcgct tcttgaaaac // LOCUS sequence145 3038 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence145 VERSION sequence145 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3038 /mol_type="genomic DNA" /organism="" /note="sequence145" CDS complement(141..731) /product="ribonuclease M5" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000700080.1" /transl_table=11 /codon_start=1 /translation="MLHINGAIVVEGKYDKIHLSPLVDCPIITTEGFGVFKNDETKELI RFYAKNGGIIILTDSDFAGFKIRGYIKGIVTDGVVKNVYIPDILGKEKRKTAPSKEGKL GVEGIDVATLEQAFVTAGVISEREDEPRRKITRLDLYDDGYFGKPDSKAKRILLLDSLN LPTRLSTSGLLDVLNFAVTFEEYKQITEKIREP" /locus_tag="LOCUS_5530" /gene="rnmV" /EC_number="3.1.26.8" /note="WP_000700080.1 ribonuclease M5 (Bacteria) [pid:31.6%, q_cov:96.9%, s_cov:98.9%, Eval:3.1e-13]" /note="MGA_721" CDS complement(944..1993) /product="DNA polymerase III subunit delta" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010942847.1" /transl_table=11 /codon_start=1 /translation="MPNLTDTELIKSIRSGKIAPIYYFYGKDVATLESITKKLIAKLCP DRDNDMNYHFFSGGSFDMSQFADACEALPMFSDRVLIAVNDLNAEILRADDTKYLFEIL SNIDSETTTVIFYSTGVDLYGGKKTISTKNKKLADHISKVGGAVTEFAFKRPNELVKYI QSRCSDELCVIHPREAEYLASVCLCNVLAINNEIAKLTAYVGKGEITQEIIDELVSGQL DTDAYKLASAVVSGNSREVFKILPELYAKQAEPIPLMSVISASFIDLYRAALAYSTGRT QSDILEDYNYRGRDFVVRNAFRDCRKLSLDKLRACIDIMSQCDIDMKSKRVDSKLLLET AIMQMLALK" /locus_tag="LOCUS_5540" /gene="holA" /EC_number="2.7.7.7" /note="WP_010942847.1 DNA polymerase III subunit delta (Geobacter sulfurreducens) [pid:23.4%, q_cov:97.7%, s_cov:97.3%, Eval:5.6e-14]" /note="MGA_722" ORIGIN 1 cattttccca ctttttggca ggttgtgttt ttatgcacaa aatcacgctt ccaaactgtg 61 taagttgcac aaacgatgta tatgactata ctgcattata cccaaaacag gtgcgaatat 121 accatataaa ataaggaagc tcaaggctcc cttatttttt cggttatttg tttatattct 181 tcaaaggtca cggcgaagtt gaggacatcc aaaagtcccg aggttgaaag ccgtgtcggg 241 agattgagcg aatcgagcaa aagaattcgt ttggcctttg agtcgggctt gccgaaatag 301 ccgtcgtcat ataggtcaag gcgggtgatt ttccttctcg gttcatcttc gcgctcggaa 361 attacccccg cggtgacgaa ggcttgctca agcgtggcaa catctatccc ctcgacgccc 421 agtttgccct ccttggacgg cgcagtcttg cgcttttcct tgccgaggat gtcggggata 481 tagacgtttt taacaacgcc atcggtgact atacctttaa tatagccgcg gatcttaaaa 541 cccgcgaaat cgctgtcggt aagaattata attccgccgt ttttggcata aaaacggata 601 agctctttgg tttcgtcatt tttaaaaacg ccgaagcctt cggtagtgat gattgggcaa 661 tcgaccaagg gagaaaggtg gatcttatca tattttccct cgacgactat agcgccgttg 721 atgtgaagca aggttggatc tccttattta tatagtatgt tggaaagtgg agcgagagcg 781 caagacaatc cagttgggag aggtgtcaaa agcttcgatg aaatcgaagt tttgcagccg 841 tgacggagag ggcatacgcg agcagtaagc attgcaatta tacaaaccgt tccacctcat 901 ccgtcggcat acgccgacac cttgccctca aggggaaggc tatctacttc aaggcaagca 961 tctgcattat tgcggtttca agaagcagtt ttgaatctac cctcttggat ttcatatcaa 1021 tatcgcactg cgacataatg tctatgcagg cgcggagctt atcaagcgaa agcttgcggc 1081 aatcgcggaa agcattgcga acaacaaaat ctctgccgcg atagttataa tcctccaaaa 1141 tatcgctctg ggttctgccg gttgaatatg ccaacgccgc gcgataaagg tcgatgaatg 1201 atgcagaaat aaccgacata agcggaattg gctcggcttg ttttgcatac agctcgggga 1261 gaattttgaa cacctcgcgg gagtttcccg aaacaactgc acttgcgagc ttatatgcat 1321 cggtatctaa ctggccggaa accagctcgt caatgatctc ctgagttatt tcgcctttgc 1381 ccacatatgc cgtaagttta gcaatctcat tgttgattgc caaaacgttg caaaggcaga 1441 cggatgccaa atactccgcc tcgcggggat gaattacgca aagctcatca gagcaacggg 1501 attgaatata tttcaccagc tcattgggac gcttgaaagc aaattccgtt actgcgccgc 1561 cgacttttga aatatggtct gcgagctttt tgtttttggt gctgatcgtc tttttgccgc 1621 cgtaaaggtc aacgcctgtg gaatagaaaa tgacggtggt ggtttccgaa tcaatgtttg 1681 aaagtatctc aaagagatat tttgtgtcat ctgcgcgcaa gatttcggca ttaaggtcat 1741 taacagcgat aagtaccctg tcggaaaaca tcggcaacgc ctcgcaggca tcggcgaatt 1801 ggctcatatc gaaactgccg ccgctgaaaa agtgatagtt catatcgttg tcgcggtcgg 1861 ggcaaagctt tgcaatcagc tttttggtta tgctctcaag ggtggcaacg tccttgccgt 1921 agaaataata tatcggtgcg atcttgcccg agcgaattga ttttatcagc tcggtatctg 1981 ttaaattcgg cactatgcca cctccaataa ttacagttta aattcaatca gcacatcgcc 2041 cgtgtggctt tcgccgttta tgaccagcgt gccgtcgaaa acagagatgt tgatatcccc 2101 acccttggca gcgccgtttt ggacgtatat gctcatatct cccctctcga taaccgtgcc 2161 tgaggcggat atggtcagcg tacagtcggc aaattcaatt tgtgtcactt cgcccaagta 2221 gtcataagga atatctgcgc caaagatata gcttcctgcg ggcagaagaa gcttttcggg 2281 acgtgcagaa attcctgcat agcgagaata tgccgactcg ccgtttttgc tggcagttgc 2341 caaacgaagc cgcgagattc cgtatcgttc gcagagcctt tcaagctcgt aatcgagcga 2401 agctccgccg ttaacatcaa ttataataca ttcttcgttt tttcgcaata gcaatgcaca 2461 atctccgcct gctgatatga cggtgagttt ggtttcatca ttcgatgcaa cagactgtgc 2521 ggaataaatg cagccgaaaa caagtgttgc aacaagaacc agaccgatta ccccacgctt 2581 atttttcata aacacggcaa agcctataac aatcagtgag attatcaccg ccgcaattat 2641 cggcgcggta tggctaagcg gaagatatgt aagatgtaca cttgaaatct tttcgcaggc 2701 aaaaatgaca gcattcatta tcagccccgc aattttcgga atcagcgaca aaagcggcga 2761 gcatccaaaa agaacaaata ccaacgccaa caccagcccc gcagagcaca agggcagaag 2821 caggaagttt gatatgggag cgatgagcga cagctcggtg aaatacagca tcattgcggg 2881 tgcggtggaa atgcttgcac aaatcgcgga cacaaaggtt gtgccaagct tcgatttgat 2941 ttccagagca tcgttgacat agggcgcgaa aacactcacg ccgaacacac cgctgaggga 3001 taggatgaag gacgaatcgg cagcaacata tgggttga // LOCUS sequence146 3028 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence146 VERSION sequence146 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3028 /mol_type="genomic DNA" /organism="" /note="sequence146" CDS complement(205..2448) /product="glycoside hydrolase family 2 TIM barrel-domain containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011107432.1" /transl_table=11 /codon_start=1 /translation="MRKIVNFNAKWAFTKQCNAVPESMPNNWNWVNLPHTWNAIDGQDG GNDYYRGTCYYAKTLDKLDLPEADRYYLEIRGANSSADVYLNGKHMAHHDGGYSTWRVD ITEDLTRDNLFVIAVDNAPNDRVYPQVADFTFYGGLYRDVNIICVNEAHFDLDYYGTPG IKITPAINGADADVEVEVFTTNTQMGHTVRYTIYDKEENVVASVTTNDTKVNLTIPEVH LWNGRKDPYLYCCEAELLDGETVLDNVCSRFGCRTYKVDPENGFILNGEEYPLRGVSRH QDRLGIGNALLPEHHEEDIDLIMEVGATTIRLAHYQHDQHFYDLCDEKGLVIWAEIPYI SQHMPNGRENTISQMKELVTQNYNHASIVCWGLSNEITMKGDRDPDLLENHRILNDLVH EMDKTRPTTIAAVSPCPLVSPYIQIPDLVSYNHFFGWYGGDTTMNGPWFDKFHKTHPNI PIGCSEYGCEALNWHTSNPMQGDYTEEYQAFYHEELIKQLFSRKYMWATHVWNMFDFGA DARSEGGENGQNHKGLITMDRKYKKDSFYAYKAWLSDEKFVHLCGKRYIDRVEDTTKVT VYSNMPEVELFANGVSLGKKTAEDHFFYFDVPNVGETHLVAVAGEFKDEGDIRKVEEFN TAYRLVEKNAVLNWFDIEAPEGYFSLNDKMGDILATVRGKLLFAGIMAKMMPKGKASAA GFDIDMAGPMMDMLGGFTVLRLTGMMGSMNINFTKEQLLDLNAQLNKIKKKEK" /locus_tag="LOCUS_5550" /note="WP_011107432.1 glycoside hydrolase family 2 TIM barrel-domain containing protein (Bacteroides thetaiotaomicron) [pid:38.4%, q_cov:80.1%, s_cov:90.2%, Eval:7.9e-121]" /note="MGA_724" CDS complement(2581..3006) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRNILNLNKDWLFIKDCADISAREGENVCLPHSWNAIDYSEWKFG KREEGTVYSLHSFFRKLAQGVGPSIVIFVLGLLGYVSDLGTTGQSPEVAYRACWLVAGL YLFSAVMQFVGIGLIFNLDKKTLATMNEEIAARKAAE" /locus_tag="LOCUS_5560" /note="WP_002289668.1 MFS transporter (Enterococcus) [pid:34.6%, q_cov:70.9%, s_cov:21.4%, Eval:9.6e-07, partial hit]" /note="MGA_725" ORIGIN 1 gcgcttcata tctgagggtc taacgttgca catatttata tctcctttta tccccgtcag 61 ggttaattta cactcaaaaa tgatataaaa tcacaaaatt attatacgct atcggcatga 121 taaaatcaac tgtcattttt gctaatgatg atattttttt tgacaaaaac tcccgccaaa 181 ttgacgggag ttttctgcgt taaattactt ttcctttttc ttgatcttgt tgagctgtgc 241 gttaagatct aaaagctgtt ccttggtgaa gttgatgttc attgagccca tcatacctgt 301 caaacgcaaa acggtgaagc cgccgagcat atccatcata ggacctgcca tatcaatgtc 361 aaatcctgcg gcacttgcct tgcccttggg catcatcttg gccataatac ctgcaaagag 421 gagcttgcct cttacagtgg cgagaatatc acccatctta tcgttgaggg agaagtatcc 481 ctcgggagct tcaatatcga accagttaag aactgcgttc ttttcaacaa ggcggtaagc 541 ggtgttgaac tcttcaacct tgcggatatc tccttcatcc ttaaactcgc ctgcaacagc 601 aacaaggtga gtttcaccga cgttgggaac atcaaagtag aagaagtgat cctctgcagt 661 cttcttgcca aggcttacgc cgtttgcaaa gagctcaacc tcgggcatat tggaatatac 721 agtgaccttg gttgtgtctt caactctgtc aatatatctc ttgccgcaaa ggtgaacgaa 781 cttttcgtca gagagccatg ccttgtaagc atagaaggag tccttcttat actttctgtc 841 catggtgatg agacccttgt ggttctggcc gttttcgccg ccttcgcttc ttgcgtcagc 901 gccgaagtcg aacatattcc aaacgtgggt agcccacata tattttcttg agaagagctg 961 cttgatgagt tcttcgtggt agaatgcctg atattcttcg gtatagtcgc cctgcatggg 1021 attggaggtg tgccagttga gagcttcaca gccatattca gagcagccga tcggaatatt 1081 ggggtgagtc ttatggaact tatcaaacca agggccgttc attgtggtgt cgccgccgta 1141 ccaaccgaag aagtggttat atgaaaccaa atcggggatc tgaatgtaag gcgagacgag 1201 cgggcatgga gaaacagcag caatggttgt ggggcgggtc ttatccatct cgtgaacgag 1261 atcgttaaga attctgtggt tttccaaaag gtcggggtcg cggtcgccct tcattgtgat 1321 ctcgttggaa agtccccagc aaacgattga agcgtggtta tagttctgag ttacaagttc 1381 cttcatctga gaaattgtgt tttcgcggcc gttgggcata tgctgagaaa tgtaaggaat 1441 ttcagcccag atcacaagac ccttttcgtc acatagatca taaaagtgct gatcgtgctg 1501 atagtgggca agacggatgg ttgttgcgcc cacttccata atgaggtcga tgtcctcttc 1561 gtggtgttcg ggaagcaaag cattaccgat gccgagtctg tcctggtggc gggatacgcc 1621 gcgcaaagga tattcctcgc cgttgaggat aaagccgttt tcggggtcta ccttataggt 1681 gcggcagccg aatctggagc aaacattatc caaaacagtt tcgccgtcca aaagctcagc 1741 ttcacagcag taaagataag gatcctttct gccgttccag agatgaacct cggggatagt 1801 gaggttgacc ttggtgtcat tagttgtaac ggatgctaca acgttttctt ccttgtcata 1861 gatggtgtag cggacagtat gacccatctg ggtgttggtg gtgaatacct caacctcaac 1921 gtcagcatca gcaccgttga tcgcgggagt gatcttgatg ccgggagtgc cgtaataatc 1981 aaggtcgaag tgcgcttcgt ttacacagat gatgttaacg tctctgtaaa gaccgccgta 2041 gaaggtgaag tcagcaacct ggggatatac tctgtcgttg ggggcattgt caacagcgat 2101 gacgaaaaga ttgtcccttg taaggtcttc ggtgatgtca actctccagg tggagtaacc 2161 gccgtcgtgg tgagccatat gcttgccgtt gaggtaaaca tctgcagaag agtttgcgcc 2221 tctgatctca aggtagtatc tgtcagcctc gggaaggtcg agcttgtcca aagtcttggc 2281 ataatagcag gtgccgcggt aataatcgtt gccgccgtcc tggccgtcaa ttgcattcca 2341 ggtgtggggc aggtttaccc agttccagtt gttgggcatt gattcgggaa cagcgttgca 2401 ctgcttggtg aatgcccatt tagcgttaaa attcacaatt tttctcaatg tggtttcctc 2461 ctagtctatg tgataaaatt gtttatagaa ttaaagcggc agacgaaata attccgcctg 2521 ccacccaatt atatcttatt taatttccga ttacaagcgc atcataagat atgatacaaa 2581 ttattctgca gcctttcttg cagcgatctc ttcattcatg gttgcaagag tcttcttgtc 2641 aaggttgaag ataagaccga taccaacgaa ctgcataaca gcactgaaga ggtaaagacc 2701 ggctacgagc cagcaagctc tgtaagcaac ttcgggagac tgaccggtgg ttccgaggtc 2761 ggaaacgtaa ccgagcaagc caagtacgaa gataacgatg gaggggccta cgccctgagc 2821 gagctttctg aagaaggagt ggagagagta aacggtacct tcttcgcgct tgccgaactt 2881 ccattcgctg tagtcgatag cgttccaaga gtgaggcaga catacgttct cgccctcgcg 2941 agcggagata tccgcgcaat ccttgatgaa aagccaatcc ttgttaagat ttaagatatt 3001 tctcattttt ttctcctttg ctaaggta // LOCUS sequence147 3000 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence147 VERSION sequence147 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3000 /mol_type="genomic DNA" /organism="" /note="sequence147" CDS complement(728..2050) /product="SLC45 family MFS transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010867389.1" /transl_table=11 /codon_start=1 /translation="MKLNTKRTVLIGFAFMSVLAFWQFYDQVVPVILENHFSQSTLLTN MIMSLDNLLAVFMLPLFGTLSDKTRTPLGRRTPYILFGTIVAVVLMFIMAFLTEAHNFI GFIICLMLLLVTMSIYRSPTAAYMPDVTPKPLRSKGNAIINLVGYIGGIFFTIIMMFLV TSEAQPDGSLKYNSFIPIFLTVAVFMLVSVLIMVFTVNENKVVAEANIEEEDEESPVAK GEKLPRDVKISLIFILLSVFMWFTAYNGVTTSFSRYFENKFGVDAGSSSLYLTVATVVA IISFIPLGTISSKLGRKKTIIAGVVLMTLCYGAMIFIGEVSVLMYVVFCLVGIGWAAIN VNSFPMVVEMCSSADVGKYTGYYYAFSMAAQIVTPILSALIISKTQFMGISLGLGLGYG SLFPYAVFFSALAIVTMIFVKHGDSKPVAKKDLLESFDVDD" /locus_tag="LOCUS_5570" /note="WP_010867389.1 SLC45 family MFS transporter (Pyrococcus abyssi) [pid:32.5%, q_cov:99.8%, s_cov:100.0%, Eval:2.3e-63]" /note="MGA_727" CDS complement(2318..2953) /product="HAD family hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_015943184.1" /transl_table=11 /codon_start=1 /translation="MKKGILFDLDGTMWDSSENVCLSYNLGLEQLGYSLRLTVDDVMGA MGKTMYDIAHIFFDCIDPEKAESIMDYCTAVENEYIKTHGGDIYNGLEQTLERLHSDGW FVACVSNCQCGYIEDFLEYSGLGHLFDDTECWGNTLQLKAYNISLVAKRNSLDKVVYVG DTMGDYTSACEAGAEFIHASYGFGNVPDGTPAVSSLCEVPDLANSLVE" /locus_tag="LOCUS_5580" /note="WP_015943184.1 HAD family hydrolase (Desulfitobacterium hafniense) [pid:42.0%, q_cov:92.4%, s_cov:88.4%, Eval:1.1e-33]" /note="MGA_728" ORIGIN 1 acaagccaac atccgccgcc ggggagccag ttatcgggga gctcgacctg ccagccgtca 61 tcaagcttct ggcagaaaat gccgtattca tacaaaatgg aatagccggt tgcgggatag 121 ccatcagttg caagaccgtc aagatagcat gcagcaagac gacccaagcc accgttgccg 181 agacctgcat cgggttcctg ctcatataca cggctgatac ttacgcccaa atctttaagg 241 gcagcttcag cggcagttac cattcccaag ttataaagac tggtcttcat tgaacgtccc 301 attaagaatt ccattgagat ataataaacc tgctttttgc ctccggaatg caccttggta 361 atatacttgc gacgcttatc tttaaggtcc tcaacaatta cagaggaaag tgcttcataa 421 aattgcttgt cggaagcgtt ttcgggagaa acatcataga tcttctcgag cgctgcaaca 481 atgcgacttt tgagctcttc cttggtatac tttttatttg acaaaatata ttcactcctg 541 ttcggaaaga ttatcgcttt ggtgcggtta acgaaatgta atatccatta accatattat 601 tatacttttt ttgtgatttt atgtcaatga gtagatttga caaagaaaaa agtgcctgct 661 cacaagatgc aggcactttg ccgaaaaaca actatatata ttgttgaaat tgcgaaattt 721 cgaatgctta gtcatcaaca tcgaagctct caagcaagtc cttctttgcg acgggctttg 781 agtcgccgtg cttgacaaaa atcattgtga caattgcaag tgccgagaag aatacggcat 841 aagggaacaa agaaccgtag ccaagaccga gaccaaggga gatgcccata aactgggttt 901 ttgagatgat gagtgcagag agaatgggtg taacgatctg agccgccatt gagaatgcgt 961 aatagtatcc tgtgtattta cccacatcgg cacttgagca catttcaacg accatcggga 1021 aggagttgac atttattgcc gcccaaccga tgcccacaag gcagaaaaca acatacataa 1081 gcacgctgac ttcgccgatg aagatcattg cgccatagca aagggtcatc aatacaacac 1141 ctgcaatgat ggtctttttt ctgccaagct ttgaggagat agtgcccaga gggatgaagg 1201 agattattgc aacaacggtt gcaacagtaa ggtagagcga ggaggagcct gcatctacgc 1261 cgaacttatt ttcaaagtag cgggagaagg aggtggtgac gccgttgtag gcggtgaacc 1321 acataaagac ggagagcaaa atgaagataa gggagatttt aacgtcgcga gggagctttt 1381 caccctttgc gacgggagat tcttcatcct cttcttcgat atttgcctcg gcaaccacct 1441 tgttttcgtt gacagtgaat accattatca ggacggaaac aagcataaag acagcgactg 1501 taaggaatat cgggataaag ctgttatatt taagtgagcc gtcgggctga gcctcggagg 1561 ttacgaggaa catcattatg atggtgaaga agattccacc aatatagcca accaaattga 1621 taattgcgtt gccctttgaa cgcaagggct tgggggtgac gtcgggcata tatgccgctg 1681 taggcgagcg gtagatgctc attgttacga gcaggagcat taagcaaatg atgaagccga 1741 tgaaattgtg agcttcggtc aggaatgcca ttatgaacat taaaacaacg gcaacgatgg 1801 tgccgaagag tatgtacggt gttcttctgc ccaagggggt gcgggtcttg tcactaagcg 1861 tgccgaacag cgggagcata aatacggcaa ggaggttatc cagcgacatg atcatattgg 1921 ttaaaagggt ggactgagag aagtggtttt ccaaaattac gggaactact tggtcataaa 1981 actgccagaa agcgagaacc gacataaatg caaagccgat caggacagtg cgcttggtgt 2041 tgagtttcat agagttacct ccaaatgttt aacattacgc aaacatttta gcatattatg 2101 gcaggtgttg tcaaaccttt agggtttgat gagcggcaac ccgccgagct tgctcggcgc 2161 ttcgcgccgc aggcgcgaaa aaaacgcccc gtatggtagg ggcgttttgg ttgccgcgtg 2221 cgggatgcgc aaaagtttga ggaacagaaa acgagagcga gccgtcgagt gttcgcgcaa 2281 cggagttgca gtgaacaagc ggtggcgagc ggtgacgtta ctcgaccagc gaatttgcca 2341 gatcaggaac ttcacagagc gaagaaaccg caggtgtccc atcagggaca ttgccgaagc 2401 cataagaagc atggataaac tcggctcctg cttcgcaagc ggaggtatag tcccccatcg 2461 tgtcaccgac atatacaact ttatcaagag agtttctttt tgcgacaagg ctgatgttat 2521 atgccttgag ttgtagggtg ttgccccagc attcagtgtc atcaaacaga tgaccgagtc 2581 cggaatattc caaaaaatcc tcgatatatc cgcactggca gtttgatacg caggcaacaa 2641 accaaccgtc actatgcaga cgttcaagcg tctgttcaag gccgttgtat atatcaccgc 2701 catgtgtttt aatatattcg ttttcaactg ccgtgcaata gtccattatg ctttcggctt 2761 tttcggggtc gatgcagtca aagaaaatat gcgcaatatc gtacatcgtt ttgcccattg 2821 cgcccatgac gtcgtcgact gtcaggcgga gcgaatagcc aagttgctcg agccccaagt 2881 tatatgagag gcaaacattt tctgaagagt cccacattgt gccgtcgaga tcgaaaagta 2941 ttcctttttt caaagatatc attcctttgc tgttttctat ctgtgattat agaacaataa // LOCUS sequence148 2998 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence148 VERSION sequence148 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2998 /mol_type="genomic DNA" /organism="" /note="sequence148" misc_feature complement(1619..>2998) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011107432.1:glycoside hydrolase family 2 TIM barrel-domain containing protein" /note="WP_011107432.1 glycoside hydrolase family 2 TIM barrel-domain containing protein (Bacteroides thetaiotaomicron) [pid:43.1%, q_cov:62.3%, s_cov:40.5%, Eval:9.0e-58, partial hit]" /note="MGA_730" /locus_tag="LOCUS_5590" ORIGIN 1 atcgtacatt tcaagcatct cgtctgtcca gagatatgta tcctgaagct gacggcggtc 61 gatggaaatt acggtaggat ccaagatctt aaatctttca caagctgcaa acaaagcaac 121 gccatcggga ttctgagttc cggaaacgag gcaatagccg gacggattgg tctgcatata 181 gtatataccg tcgccattgg ggtcgcgagg caagggagca aacataactt cattttgagt 241 aacatcgccc caaagtgcac taatgctttc aactgttcct gtaaaaccaa aggtttcaac 301 aatatagaac aaggttaagc cttccttaac gcctgcaccg attgtgccat ttcttatgtt 361 ccagtttctc caaagaggat agaagcattc gttcttggaa aggttataga tcatatcaga 421 tatacgttca agtctgggat cgtcaaggtt agagacaaat ctgccgcttt ctgtatcaag 481 atgtactatc tgtgctcctg aagagtcgaa aagcgctctg ctggagcccc aaccgtcaac 541 tccgtaacgg tcttcatcgg gatctgtaaa ttccagacac atttcataga atacatccca 601 agtccattca tcgttgtagt aaagctcagc gggatcgtca aagccccatt cttcaagaac 661 tcttctgtta taaggaacta ccataccgaa agagttgtcg gtacagatta cgtagtgctt 721 gtcgccaagc ttgaagtact tgtcagcaaa gcccttcatt cctgcccaaa gcggatcatc 781 atagtcaata tagtcatcaa ccggtacgaa aattcccttc atgcagttgg tggggaaatt 841 ctcactgtat gcgggataga agtcagggga attacccgac aaaacaaggt ttgcaagccc 901 gtcaaagcgt gctccccatt cacattcgac ccattcgata tcgcagccgt atttttcttt 961 gaatgtccag aaaccggtgt taacgatctc tgcttcatca tagttgtgga aactgtcaaa 1021 ccaagcatac cacttgattg ttgttccgga aacgggtgtt gcttcagcgt ccggcagtac 1081 aatacctgct gctgccaaaa tagcttctgc gtcttctgtc gaaagcgtta cttcaacaat 1141 aggtctttta ttgttcgagc atccgaagag agccacagtc attacaacaa ccagtgctat 1201 cgccaatatt cgtttcatgt cgttgcctcc gtttaaaatt tgtgtttgtt ttttgcaaat 1261 tcatgcataa tttgaaacaa tatttgctaa acactgtttc acgctcaata atatcataaa 1321 caaaaacgtg ctgtcaatta taaaaaatgc aaatcgtgtg atttttaata tggatttatg 1381 catccattta tcgttttaca ttaattttcg ctttaaaaaa catacagttt actttcgtct 1441 gcgctgtcgc aagtgtatat cacccaaagg ctcagcggtt aaataaccgt ttgtatattc 1501 gctcgcaatt taatttcttg atttttgtat atacaggcag gagccacata agcggtattt 1561 tcgctcatat ggctcctatc gtttcttatt ttagaggttg atcggtaaaa tctgtcaatt 1621 attctgcttc ttcgggaaca ggctcatatg cttcgatttc ccaaatgcag gggaatccgt 1681 tggcatctcc acagctgaca acctcaatct tcaaatatct gccgcttacg ggattttcaa 1741 tcacatcggt gaagtatccc gaagtgctgg tgttatcgct gcggtcaaca attacggtat 1801 attcaccgtc aagctcattt gagatactta caataaagcc atatgctctg cttccgggct 1861 tgtgtgtaac tgtatagatc ttagaaggag tatgaacttc ttcaaggtcg atgataacag 1921 tagcgggata atcagcagca gatgcagcac accaacgaga tgcgtctgat gcaataccgt 1981 cgttgatctt gccggcaggg ttgcctgctt caacagaaga atagtaagca attggtttgc 2041 caagggctat gttaacaagc tccttctcgg gttcaacata aaagcccttc caagtagcgg 2101 tatcttcaag tgtggtgccg tcagcaaggg ttgctacaac cttaatttca gtgtccttat 2161 caataccgat atccacattc tcccaggtga agacggtgga atagtattca ttaagaacag 2221 cacgtaaaac aacgccctgc gatttgccgt taacaaacag ctcaacgctt tcggcattac 2281 tgtacgcctt aacaatcgga acaatgctct gtctctcggc aaagcgtttt tcggtgaggt 2341 ataccatagg ttcttcgttc caaacagact tatagaagta gtatgaatcc tttgccacac 2401 gttctctggt cattacgccc ttgtcgttct ggcccttggt gtcgccttcc tgtctgccgt 2461 cagatgcaaa gtcaaacata caccagatat acttgcccca gaggtatttt ctctgcgcaa 2521 actgtgccca gatctcttcg tgcattgcgc tctgatagtt ttcatagtga cgggttcccc 2581 aagtatcaat atcttcgccc cagactatgt tatccttgtg ctgagagata gccgcaccgc 2641 cgccatactc ggaaacagca attcctctgt cttccttaga gttgtgatat tggtccagcc 2701 acttgccaaa ggcgccgtca gcgccgtcga tataccaacc gaagtatctg ttatagccta 2761 caacgtcgcc ggggagatcc ataaacctgc cccagaactg agagtcagcg aaggaaataa 2821 gtcttgtttc gtcctctgca tttgcaagct cattaagctc tgtatatata ccgaaaattt 2881 catcattcat ctgatgtagc tcgttggaaa taccccaaac aataatcgag ggatgattat 2941 agtgctgtct gataagctcc atgatctgtt gttttgcatt atcaacaaat ccgtcagc // LOCUS sequence149 2976 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence149 VERSION sequence149 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2976 /mol_type="genomic DNA" /organism="" /note="sequence149" CDS complement(18..515) /product="NAD(+) diphosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002262000.1" /transl_table=11 /codon_start=1 /translation="MRYKYCPECGEKAVLREIGDEGLIPYCEKCQRPWFDIFPTCVICA AVNEFGEVALIKQGYVTDANYICVAGYMKSGESAEDAAAREVEEEIGLEATSVEYIRSY PYAKKDMLMLGFKVNVKKAELKLSCEVDSARWFSLDEARDFMREGSIAWQLVGEVAKGI KK" /locus_tag="LOCUS_5600" /note="WP_002262000.1 NAD(+) diphosphatase (Streptococcus mutans) [pid:34.0%, q_cov:90.3%, s_cov:91.4%, Eval:1.2e-16]" /note="MGA_731" CDS complement(505..1476) /product="Gfo/Idh/MocA family oxidoreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964789.1" /transl_table=11 /codon_start=1 /translation="MSQFRYAIIGAADISNKFANAVKLVDGAQVCAIAARDLSRAQAFA DRHGIPAAYGDYEEMLIKEKPDGVYIGVVTSKHFELTMLCLKHRIPVICEKAMFTDLKQ ARECFEYAKEQNTFCMEAMWSRFLPAILKAKSWIDEGKIGNVRYITCNIGWTCEVDMNN RFYSKELGGGAAYDLLVYSYELATFMHPAEIVKKQVVAEFAPTGVDTLSQVSLKFSDGV IASLSASINTVLEEALVICGDKGFIRVPCAHFAWEAYLHDSGRRVVEHFVDSVTKNGFT YEAQELIDCVKAGKLESEVIPHSETLASCEIYDMIFEGNNEI" /locus_tag="LOCUS_5610" /note="WP_010964789.1 Gfo/Idh/MocA family oxidoreductase (Clostridium) [pid:35.1%, q_cov:97.2%, s_cov:98.1%, Eval:2.6e-47]" /note="MGA_732" misc_feature complement(2014..>2976) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000105059.1:23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD" /note="WP_000105059.1 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD (Bacillus) [pid:39.9%, q_cov:96.2%, s_cov:67.2%, Eval:1.8e-69, partial hit]" /note="MGA_733" /locus_tag="LOCUS_5620" ORIGIN 1 agcaaatctt gttcttatca tttctttatc cctttagcaa cctcgccgac aagttgccaa 61 gcgatgcttc cctctcgcat aaaatcgcgc gcttcgtcaa gagaaaacca tcttgccgaa 121 tccacctcgc aggagagttt aagctccgcc tttttaacat tcaccttaaa cccgagcatc 181 agcatatctt ttttggcgta gggatagctt cgaatatatt caacgcttgt tgcttcaagg 241 ccgatttcct cttcaacctc gcgcgcggcg gcatcctctg ccgattcgcc cgacttcata 301 taccctgcaa cacagatata attggcatcg gtgacataac cctgcttgat aagcgcaact 361 tctccaaatt cattcaccgc tgcgcagatg acgcaggtcg ggaaaatatc aaaccaaggc 421 cgctgacatt tttcgcagta tggaatcaga ccttcgtcgc cgatctccct taaaactgcc 481 ttttcgccgc actcgggaca gtatttatat ctcattattt ccctcaaaaa tcatatcgta 541 gatctcgcag gatgcaagcg tttcgctgtg gggaatgacc tcgctttcaa gcttgcctgc 601 cttaacgcag tcaataagct cctgcgcttc atatgtaaag ccgtttttgg ttacgctgtc 661 aacaaagtgt tcaacaaccc gtctgcccga gtcgtgcaaa taagcctccc acgcgaaatg 721 agcgcaaggc acacggatga agcccttgtc accgcagatt accagcgcct cctccaaaac 781 ggtgttgatg cttgcagaaa gcgaagcaat aacgccgtcg ctgaatttaa gcgacacctg 841 cgacagagta tccactcccg taggtgcaaa ttcggcaacg acctgcttct tcacaatttc 901 tgcaggatgc ataaatgtgg caagttcata tgaatataca agcaggtcat atgccgcacc 961 gccgccaagc tcctttgaat agaagcgatt gttcatatct acctcgcagg tccagccgat 1021 attgcaggtg atgtatcgaa cattgccgat ctttccttcg tctatccagc ttttcgcctt 1081 taaaattgca ggcaaaaagc gcgaccacat ggcttccatg caaaatgtat tctgctcctt 1141 ggcatattca aagcactcgc gtgcctgttt taagtcggtg aacatcgcct tctcgcatat 1201 gacaggaatg cggtgcttga ggcaaagcat cgtcagctca aagtgcttgc tggtaacaac 1261 gccgatatat actccgtcgg gcttttcttt tatcagcatc tcctcatagt cgccgtatgc 1321 cgcaggaatt ccgtggcgat cggcaaaagc ctgcgcacgt gacaaatctc ttgcggcaat 1381 tgcgcagacc tgtgcgccgt caaccagctt aactgcattg gcaaatttgt tcgatatatc 1441 tgccgcaccg attattgcgt atctgaattg ggacatggta attcctcctt tggtttggtc 1501 aattattctt tgctgttgtt atggatgcaa tcaactttct ccgtatagtt ccgcacttat 1561 tatgcagttg tttatatgta acttcatcaa tcgcgttgac cctcaacagt atttcgagcc 1621 aatactctgt ttcataacac tctttcaagg ctatctccat tttatttatg aaatcagctt 1681 tactctgtgc atattttgct tcatatgagt ttgcacctat tgatgaacaa gacctaagaa 1741 tctgattcgt aaaaacactt cggcctttaa ttcgatcaca aatagcagtc agttcaactg 1801 ttaactcaac agctaattct tttatagttt tattatccac aattaaagcc tcctttagcg 1861 atatactcgc ttcgctcgtg cgatatattt ttgacaaatg cgatataact tcgcttcgtt 1921 cagttgcgag atgatataaa ttctcgtccc gaagggacat atcgcatcac agatatatcg 1981 cgttgataaa catatcgcaa attccgcagg aatttatatc gcggtgcggc aaagccgcac 2041 tatgcattcg caatggagtg taaacgggaa catatccacc ggctgaactt ttgtcgcctt 2101 atatccgccc ttgatgagtg ccttgatatc cctctcctgg gtttcggggt tacaggaaat 2161 ataaacgatg cgtctgggca tcattttcaa aagtgcgtcc aaggtcgctt tatcgcagcc 2221 tgcgcgcgca gggtcaagca aaaccacatc cgcgccctcg ccttcctcgg caaggcttgt 2281 caaaagcttg cctgtatccg aacaaacaaa gcctgcattt ttaaccttgt tgagggcggc 2341 gtttttcttc gcgtccttaa tcgcctgcgg gttcgattcg acccccagaa cctcgcctgc 2401 tttatcgctt gcaataagcc cgattgttcc gattccgcag tagcagtcca aaactctgtc 2461 ggtcttcttg atatccgcca tttcaatggc aaggctatat agcttttccg tttgagtggg 2521 gttgacctga tagaacgagc gaggagaaat tatgaatttc tttccgcaga gggtgtcggt 2581 gatgtagcca tcccccaaga gcaccttttc gcgctcaccg agcatcattt tatcccgtga 2641 atcgcttatc gactgcacga cagtcttaat ttcggggtac ttcgtctgca gcgctttggc 2701 aagctcattg ccctttggca aaatcggcgt ggcggtgacc aaaaccacca tatattcccc 2761 gcttgtcttg ccgtatctta ccattacgtg cttgaggttt cccttgcccg tatagtcatc 2821 atacggatat agcttaaact cgggcatcag cttacgcaaa tgcttgatta tcgcgcttga 2881 gcgtttgttt tcaagaacac attcatcgtt ggtgacgatt ccgcccgtcg aggactgata 2941 tacccccgag atgattcggt tgttgggctt tgtcag // LOCUS sequence150 2974 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence150 VERSION sequence150 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2974 /mol_type="genomic DNA" /organism="" /note="sequence150" CDS 583..1323 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNNKANLFSDTEDTKLKRFLKGNNIYIMLGTAIVSFLIFILTLIP ILNINSNIKTAENLVALKDINVHADLHDQYVQGDVYKFVGRLGYIAASEAAATEYYYLM YLDNADGNQYAVLVEVPIAGDADLQNIVTAYLNYAKDPDAGYQGNIIQLGGRFRKMSND EETLFSEGLSKCAVTVPYLTYTLEVGQLPEASQTVAYYFFCVPFGIIMIVAAVLFLYGQ KLEAMREKANESPYPYLNRKNKKK" /locus_tag="LOCUS_5630" /note="MGA_735" CDS complement(1529..2974) /product="alpha-L-arabinofuranosidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003245027.1" /transl_table=11 /codon_start=1 /translation="MTISQNLIPSKDNGILPGKTLAVSHKPMAEHNPVSSNIYFADPTV VEYNGRLYVYGTNDSQEYDKCDGSRPNSYGGINSLVCYSTADMVNWTYENTIKVTEICT WAGCSWAPSIVSRVEADGLTHFYLYFCNSGNGIGVLTSTSPVGPWSDPNGKALMHNGLL GNDPTCWCFDPGVCIDDNGVGWLAFGGGNPLHEGENALYTGNSRIVKLGADMVSLDREV VVLKSPYHFEANELNFINGTYVLTYCSNWAKRELWEDKFKFDKPHVCSMCYCVSKDPLN PDSWEYMGEYLLNPDQFGYPGSNNHTHMHKFGDKYYIFYQNVSLAENKGEQIRGYRSIG VDEIEVDENAVVIKSGRMTDAGCTQLKNFDPYAVNSANTSAHSAGVKYDAQFKATVTDG SYIALKNVDFLGGAAKFAATLCGNGAIEVRLDDVTSEAVCTLQFDSADFITVVNDMCKS AEGVHDLYLVCGGEFTFDCWQFA" /locus_tag="LOCUS_5640" /gene="xynD" /EC_number="3.2.1.55" /note="WP_003245027.1 alpha-L-arabinofuranosidase (Bacillus) [pid:34.6%, q_cov:94.6%, s_cov:93.0%, Eval:8.7e-67]" /note="MGA_736" ORIGIN 1 cccgagttta tgattttgga cgaggcgact gcgaacatcg acaccgaaac cgaggttttg 61 attcaagatt cactcgaaaa gatgatgaat atcggtactc tcttaatcgt tgcgcacaga 121 ctttcgacca ttcagcacgc agacaacatt atatatcttt ctcacggcag gatcatcgag 181 cagggctcac acgccgagct tcttgaaaag aagggacgct attatgggct ttatatgctg 241 cagtatgata agcagaagtt gaaatagagc taataataaa gacaaataat tcctcttcgg 301 atttcggaga ggaatttttg ttggcggggc tgaggccgtc gtaccgcgaa gcggtgtgac 361 ggaggggacc cgtatgcgag ctttggaaaa tgacttgaca gcgaccgaca taaaagttgc 421 ctccatcgcg agctttgacg gtcgctcgga gcgacgtccg tcggattgtg ttgccgtaag 481 gtaatccgac gggtggagcg attaagcaga ttttatagtt attgactgtc aagaaaattt 541 atgatataat gtcaaaagac tattttttgc gaggtaatgg caatgaacaa caaagcaaat 601 ctcttttccg atactgaaga cactaagctt aaacgctttc ttaaaggcaa caacatatac 661 attatgctgg gcacggcgat agtttctttc ttgattttca ttttgactct catcccgatt 721 ctcaacatta attcaaacat caagactgct gaaaacttag tggcgctcaa agatattaac 781 gtacatgccg acttgcacga tcagtatgtt cagggtgatg tatataagtt cgtcggcaga 841 cttggctata ttgccgcaag cgaagccgcc gcgaccgaat attactactt gatgtatttg 901 gacaacgctg atggcaacca gtatgcagtt ttggttgaag ttcccattgc aggagatgcc 961 gatttgcaaa acattgtaac agcatattta aactatgcaa aggaccccga tgcaggatat 1021 cagggcaaca ttattcagct gggcggacga ttcagaaaga tgtctaatga cgaggaaacc 1081 ctcttctcgg aaggcttgtc taagtgtgct gtaactgttc cttatcttac atatacgctt 1141 gaggtcggtc agcttcccga agcaagccag actgttgcat actacttttt ctgcgttccc 1201 tttggaatca ttatgatcgt tgcggctgtt ttgttcctct atggccagaa gcttgaagca 1261 atgcgcgaaa aggcaaacga aagtccttat ccttatttga atagaaagaa caagaaaaag 1321 taaaatttta aaacaaaaac aaatccctgc cacggtgtgt gacagggatt tttgtttgtg 1381 ccttgagcgg tagcctgcgg gggcaaagcc cccgcacttc gcgcttctgc gcgaagaatc 1441 ccctctgagc gcctataggt cgctcagggg ggatggctgc cgcgaaaaac gcgcgaagcg 1501 cgcaccgacc gcgcggatgc gtatcggatt atgcaaactg ccagcagtcg aaggtgaact 1561 cgccgccgca gacaagatac aggtcgtgaa cgccctctgc gctcttgcac atatcgttta 1621 caactgttat gaagtcggca gagtcaaact gcaaggtgca aacagcttcc gaggtcacat 1681 cgtcaagtct gacttcaatt gcgccattac cgcacagagt tgcggcaaac ttagcagcac 1741 cgcccaagaa atcaacattt ttgagcgcga tatagctgcc gtcggtgacg gttgccttga 1801 actgcgcatc atatttaaca cctgcggagt gcgcacttgt gttagcagaa ttgacagcat 1861 atggatcgaa gtttttaagc tgagtgcaac cggcatcagt cattctgccc gacttaatta 1921 caactgcgtt ttcgtcaacc tcgatttcgt caacgccgat actgcgatag cctctgatct 1981 gctcgccttt gttttctgca agggaaacgt tctgatagaa gatataatac ttgtcgccga 2041 acttgtgcat atgggtgtgg ttgttggagc ccgggtaacc gaactgatcg ggattgagaa 2101 gatactcgcc catatattcc caactgtcgg ggtttaatgg gtctttcgac acgcaatagc 2161 acattgaaca aacgtggggc ttatcgaact tgaatttatc ctcccaaagc tcgcgctttg 2221 cccagttgga gcaatatgta agcacataag ttccgttaat gaagttaagc tcgtttgctt 2281 caaagtggta aggcgacttc aaaacaacta cttctctgtc caaagatacc atatcggcgc 2341 ccagcttaac aattctactg ttgcctgtat agagcgcatt ttcgccctcg tgcaaggggt 2401 tgccgccgcc aaatgcaagc cagccgacgc cgttgtcgtc gatgcataca ccggggtcga 2461 agcaccagca ggtggggtca tttccgagaa ggccgttatg cataagtgcc ttgccgttgg 2521 ggtcggacca ggggccgacg ggagaagtcg aggtcaatac accaattccg ttgcccgagt 2581 tgcagaagta aagatagaaa tgggtaagtc cgtcagcttc aacgcgggag acgattgaag 2641 gtgcccagga gcagcctgcc caggtgcaga tctcggtgac cttgatggtg ttttcatatg 2701 tccagttgac catatccgca gtggaatagc agacaaggga gttgattccg ccgtatgagt 2761 tgggtcttga gccgtcgcac ttatcgtact cttgggagtc attggtgcca tagacgtaaa 2821 gtctgccgtt atattcgaca acggtgggat cggcaaaata gatatttgag gaaacggggt 2881 tgtgctctgc catcggcttg tggctgacag cgagtgtctt gccgggaaga attccgttat 2941 cctttgaggg aatcaagttt tgggaaatgg tcaa // LOCUS sequence151 2958 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence151 VERSION sequence151 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2958 /mol_type="genomic DNA" /organism="" /note="sequence151" CDS 3..1283 /product="L-fucose/L-arabinose isomerase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965898.1" /transl_table=11 /codon_start=1 /translation="MVVFLGNFGPETPETLIAQKFDGPVMYIAAAEGDGDMINGRGDAY CGVLNCSYNLGMRHLKAYIPEYPVGTADECAEMIKKFVPIARAIIGVKNLKIITFGPRP QDFFACNAPIKGLYELGVEIEEISELDLLLSYKAHANDPRIPEVCADMATELGEKGNIW PELLPRMAQFELTLLDWAEAHKGAREYVAFADKCWPAFPEQFGFEPCYVNSRLASKGIP VACEVDIYGALSEYIGACITGDAVTLLDINNSVPQYIYDEDIKGKYDYTLTDTFMGFHC GNTPECKMCDDRAVKYQLIQHRLLEPVDSEPDFTRGTLEGDIAAGDITFYRLQCDSEGT LRAYIAEGEVLDVPTRSFGGIGIFAINEMGRFYRHVLIQKRYPHHGAVAFAHCGEALFE VLKYFGVCDIAYNQPKGVLYKTENPFA" /locus_tag="LOCUS_5650" /note="WP_010965898.1 L-fucose/L-arabinose isomerase family protein (Clostridium) [pid:66.7%, q_cov:99.8%, s_cov:86.3%, Eval:4.7e-170]" /note="MGA_737" CDS 1509..2153 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLFSVLLAICMVLAMSINVFADEMKEVYFESANRTPNDLGVGA DVPWDGFGIGCIVNDHGLIENVTLADVIEQAKNGGILVMKFSSTGCWGTAPRPEIQFNC WENEETYQVLFDIIDNLDGTYTAYADLSEVLNNFIDAGNTVEDIANCGVQVWAENFGLL EMYVSDTAPVVEVAEDVDVTETDNEPADTGIGLSLIPLAVAASVVVSSKKR" /locus_tag="LOCUS_5660" /note="MGA_738" ORIGIN 1 ctttggtagt attccttggt aacttcggtc ccgaaactcc cgaaacactc attgctcaga 61 agtttgacgg ccctgttatg tatattgctg ctgctgaagg cgacggcgat atgattaacg 121 gcagaggcga cgcttactgt ggcgttctca actgctctta caacctcggt atgcgccacc 181 ttaaggctta cattcccgag taccctgttg gcactgctga cgaatgtgct gaaatgatca 241 agaagtttgt tcctatcgca agagctatca tcggcgttaa gaacctcaag atcatcacct 301 tcggtccccg tcctcaggac ttcttcgctt gcaatgctcc catcaagggc ctttatgagt 361 tgggcgtaga aattgaagaa atctccgagc ttgacttgct cttatcctac aaggcacatg 421 ctaatgaccc cagaattccc gaagtttgcg ctgatatggc aaccgaactc ggcgaaaaag 481 gaaatatttg gcccgagctc ttgcccagaa tggcacagtt cgagcttact cttcttgact 541 gggcagaagc tcacaagggc gctcgtgaat atgttgcatt cgctgacaag tgctggcctg 601 cattccccga acagttcggc ttcgagcctt gctatgttaa ctcaagactt gcttccaagg 661 gtatccccgt tgcttgcgaa gttgacattt acggcgcact ttccgaatac atcggcgctt 721 gcatcaccgg cgacgctgta accttgctcg acattaacaa ctccgttcct cagtatatct 781 acgacgagga catcaagggc aagtatgact atactctcac cgacaccttc atgggcttcc 841 actgcggtaa tactcctgag tgcaagatgt gcgatgacag agctgttaag tatcagctca 901 ttcagcacag acttctcgag cccgttgatt ctgagcctga cttcaccaga ggtactttgg 961 aaggcgacat cgctgcaggt gacatcacct tctacagact ccagtgcgat agcgaaggca 1021 ctcttcgtgc ttacatcgca gaaggcgaag ttttggatgt tcctactcgt tccttcggcg 1081 gtatcggtat cttcgcaatc aacgagatgg gtagattcta ccgtcacgtt ctcatccaga 1141 agagatatcc tcaccacggt gcagttgcat ttgcacactg tggcgaagca ctcttcgaag 1201 ttctcaagta cttcggcgtt tgcgacatcg cttacaacca gcctaagggt gttctttata 1261 agactgagaa tcctttcgca taatttgtac ataataaggc ccctccggaa acggaggggt 1321 tttgtttttt tgtaggggat acacggagcg agcgacgtca gcgaagcgtg cccgaacggg 1381 cgtgcgagca ggtggagcga gcggtaattg atgcgtgaag ttgtctgttg ctaccctctt 1441 gactctaaaa gcaacatatg ttataattta tttgcaatta gccacattac aacaaaggag 1501 tgtcaattat gaaaaagctg ttttctgttc tactcgcaat ctgtatggta ttggcaatga 1561 gcataaatgt ttttgcggat gaaatgaagg aagtatattt tgaatctgca aacagaacac 1621 cgaatgacct gggcgtaggc gccgatgtgc cgtgggatgg cttcggaatc ggatgcatcg 1681 ttaatgacca cgggctgatt gaaaatgtaa cactggcaga tgttattgag caagccaaaa 1741 acggcggaat tctggttatg aagttttctt ctacaggttg ctggggtacc gctccccgcc 1801 ctgaaattca gtttaactgt tgggaaaacg aagaaaccta tcaggtattg tttgatatca 1861 ttgataatct tgacggaaca tataccgcat atgctgacct gtccgaagtg ctgaacaatt 1921 ttatagatgc aggaaacacc gttgaagaca ttgccaactg tggtgtacag gtttgggctg 1981 aaaacttcgg acttctcgaa atgtatgtca gcgataccgc tcctgtcgtt gaagttgccg 2041 aagatgtcga tgtgacagaa actgacaatg agcctgctga tacaggaatc ggtttgtcgc 2101 ttattcccct tgcagttgcc gcgtcagtgg ttgtgagttc aaagaagaga taattttaac 2161 aaagaaaagc tcccacgagg tgggggcttt tttgttttac acctcatgcg tcggctccgc 2221 cgacaccttc ggctaccaca tgccacctct tgcatttttc cacagatgtg ttaaaatata 2281 tgaaacgaca tttttacgga gagcacaata tgatcaaacg atttatcaaa tattataagc 2341 catataaact gctttttgcg gcagatatgc tggcttgcat actcattgcc tgctgcgacc 2401 tgttctatcc gatgataaca aaaaatatca tcaacgacta tgttccaaac aaaaagctgg 2461 agcttctttt gatatggagt ggaattttgc tgggcattta tgccattaaa tgggcgctga 2521 actattttgt cagctactat ggacatatcg taggtcttaa aatgcaggcg gatatgagaa 2581 gagatctgtt taatcatctg cagaagctcc ccttctcata ttttgacggc acaaaaaccg 2641 gttcggttat gtcccgcctt attaacgacc tcaacgaggt cagcgaactc gcccaccacg 2701 gccctgacga tttgttcctc tcggttttaa tgttcatcgg ctcgtttatt atgctttcga 2761 gcattaactt tgcgctcacg ctgattattt tcgcgtttgt tccgtttatc ctgctctttg 2821 cggtgctcat tagaaacagg atgaaaaacg cttcccgccg ttcgcgcgag cagatcgcgg 2881 aagtaaatgc aaacattgaa actgccgttt cgggcgttag ggtttcaagg gcttacacct 2941 cggaagaata tgaaatta // LOCUS sequence152 2956 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence152 VERSION sequence152 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2956 /mol_type="genomic DNA" /organism="" /note="sequence152" misc_feature <1..936 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011017097.1:ABC transporter substrate-binding protein" /note="WP_011017097.1 ABC transporter substrate-binding protein (Fusobacterium nucleatum) [pid:33.1%, q_cov:99.0%, s_cov:61.2%, Eval:1.5e-44, partial hit]" /note="MGA_740" /locus_tag="LOCUS_5670" CDS 958..1899 /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010973851.1" /transl_table=11 /codon_start=1 /translation="MKYIIKKSFTLIITLFIVSLLAFLAFAVIPGDPTTRILGTEATEE AVIALREELGLNKPVVQRYIDWLLGFVKGDLGISYSYNMPVEEMISDKLPITALLTVIS FGLTVLISIPLGVALSAVKNKGTELAFTSINQVAMSVPAFFIGMIILYICGNFLKLFVP GGFISPDDSFGGSIYYLLFPAISIAIPRIAMTVKMLRSSVLSELDKPYVITARSRGKSE AGILFGHVLKNALIPVITFLAVSAAEIMTGSIIIEQVFNIPGIGRLLLSSISSRDYPVV QAIVVILAAWIVIVNFVADVLYKLVDPRIRIK" /locus_tag="LOCUS_5680" /note="WP_010973851.1 ABC transporter permease (Agrobacterium tumefaciens complex) [pid:34.7%, q_cov:98.4%, s_cov:97.5%, Eval:7.0e-58]" /note="MGA_741" CDS 1911..2714 /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583225.1" /transl_table=11 /codon_start=1 /translation="MKTKKSFFTYAGAIISILTVLMILIGYVWTPYDPEAMSAVDKLKA PSFTHIMGTDNFGRDIFSRVLDGAGTSLLIALCVVIIGCVFGIIIGALCGYYGGVADAI LTRVCDSITAFPSFLLALVIVSVIGEGTYNIIIALGILFIPSFARVVRAEFAKQRERKY VANARLMGVKDIRIIICHILPNLKSVLIPTIIIGFNNAILSESSMSFLGIGIQPPQASL GSMLSDSQTYLSSAPWYALGVGGVIALLILGFSLLSEGLSRDRVI" /locus_tag="LOCUS_5690" /note="WP_012583225.1 ABC transporter permease (Dictyoglomus turgidum) [pid:40.4%, q_cov:93.6%, s_cov:87.1%, Eval:3.5e-52]" /note="MGA_742" ORIGIN 1 agaagtgtgc aggaaaatat catcctcgaa aagtttgatg actactacgg cgaaaaggcg 61 catcttgaca aggtgacata taaggtatat gaggatgcga atgcaatgtt caccgctctc 121 aatggcggag cattggacct tgtagcgcat cttactgttg atcagatcaa caacctttca 181 aacggataca acgttttaga gggcacaatg aatctggttc aggcgatata tcttaataat 241 gcagttaaac ctttcgacaa cgaactggta agacaggcgc tgtgctatgc tgtagatgtt 301 gattcgatgc tggctctgac ttcagacggt cacggaacaa aggtcggttc ttcaatgtat 361 cctgcattca aaaagtattt tgatgaatcc cttgcgaatg catatccata tgatcctgaa 421 aaggcaaagg atctgctgaa gcaggcagga tatgcaaacg gaattgaatt tacgattact 481 gttccttcaa actatactcc ccacgttgat tcggcgattg ttttggctga acagttgaag 541 gcatcaggaa ttaaagcaaa cattcggctt gttgattgga acacttggct ttcggatgta 601 tatcagggac gagattttga agcaacactt gtcggattcg attcaagcat gctaacagcc 661 agcggaatgc ttgcaagatg ggtttcgggc aacggcaaga atatgatcaa ttattcaaat 721 tctgagtatg atgaaacata cgccaaggcc caggcaagtg ccgatgatga ggaacagacc 781 cgtctataca agagatgtct tgaaattttg agtgaaactg ccgcgaatgt atatttgcag 841 gaccttgccg atttcgttgc cgtcaatccg aatcttgaag gattcgaatt ctacccgctg 901 tatgtaattg atatggcaaa acttagattt aagtaaattt gaaaaggagg tgcgggcgtg 961 aaatatataa ttaaaaagtc ttttactctc attattacat tgttcattgt ttcattgctc 1021 gctttccttg catttgctgt tattccgggc gatccgacaa cgagaattct cggaacagaa 1081 gcaacagaag aagcggtaat agcattaaga gaagaactcg gacttaataa gcctgttgtg 1141 caaagataca tagactggct tttaggcttc gttaaaggcg atttgggaat cagctattca 1201 tacaatatgc ctgttgagga aatgatttcg gacaagctac cgataaccgc tcttttgact 1261 gttatatcct ttggacttac tgtgcttata tcaattcctc tcggcgttgc tttgagcgcg 1321 gtcaaaaata agggcactga gcttgcgttt acatcgatca accaggttgc tatgagcgtt 1381 cccgcgtttt tcatcggtat gatcatattg tatatctgcg gaaactttct aaagctgttt 1441 gtgcccggcg ggtttatttc gccggatgat agctttggag gatctatcta ttatcttttg 1501 ttccccgcca tttcaatcgc aattccccga attgcaatga cagttaagat gcttagaagt 1561 tccgttttgt ctgagcttga taaaccatat gtcattacag caagaagcag aggcaaaagt 1621 gaagcgggaa ttctgttcgg tcatgttctc aaaaacgcgc tgattcctgt tatcacattt 1681 ttggcggtct ctgccgcaga gattatgaca ggatcgataa tcattgagca ggtattcaac 1741 attcccggta tcggaaggct tttgctttca agcatatctt cacgagatta tcccgttgtt 1801 caggcaattg ttgttattct ggcggcgtgg atagttattg tcaactttgt ggctgacgtt 1861 ttatataagc ttgttgaccc aagaataaga attaagtgag gaggctgatt atgaaaacaa 1921 agaaaagctt cttcacatat gcaggcgcga ttatttcaat tttaacagta ctgatgatac 1981 tcatcggtta cgtctggacc ccttacgatc ctgaggctat gagcgctgtt gacaagctta 2041 aagcaccaag ctttacacac attatgggta cagacaattt tggacgggac attttctcac 2101 gcgttttgga cggcgcagga acttcccttt tgatcgcact ttgtgttgta ataatcggat 2161 gcgttttcgg aattataatc ggagcgctat gcggatatta cggcggagtt gccgatgcga 2221 ttttaacaag agtttgcgac tctattaccg cgttcccaag ttttctgttg gcacttgtta 2281 ttgtcagcgt aatcggagaa ggaacatata acattatcat tgcgcttgga attttgttta 2341 ttcccagctt tgcaagagtt gtaagagcag agtttgcaaa acagcgtgaa cgaaaatatg 2401 tcgcaaacgc acggcttatg ggcgttaagg atattagaat cattatttgc catattctgc 2461 cgaaccttaa atctgtattg ataccgacta tcataatcgg gtttaacaat gcgatcttga 2521 gcgaatcaag catgagcttt ttgggaatcg gaattcagcc gccgcaggcg agtttgggtt 2581 cgatgctcag tgattcgcag acttatttat cctctgcacc ttggtatgcc cttggtgtgg 2641 gcggagttat tgcccttttg attttaggct tcagtctttt aagcgaagga cttagccgcg 2701 accgagttat ttgaggaggg cgagaatgag aaatttgctt agtgttaagg acttgtcgct 2761 ccgtttcatt aacgaggcaa tcgagcgaaa cgccataaat ggcatcagct ttgatatcgg 2821 aagaggcgaa attgtcggtc ttgtgggcga atctggaagt ggaaaatcgg tgaccgcaat 2881 gagtatctgc ggactgactt cgcataagcg cgcagatata ttcggaagca tagtttttga 2941 gggcgaagat gttctc // LOCUS sequence153 2915 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence153 VERSION sequence153 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2915 /mol_type="genomic DNA" /organism="" /note="sequence153" CDS complement(4..804) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSNRRICAGVSAACGYPETPEVFVKELCRAGVGKIELFVNCEAET RPEYIREIKKILDGEGAKCISLHPYTCAIDTYALFSAYERRTEEYLDYHKRYFEAMNIL GAEYFVFHGSKVNYGDEIVFGRFARLAEIAKSFGVKALQENVDKRVTGELETLKRMKAH FGSDAGFVLDTKQAVRMGWEPMDGARALGNSIKHVHLSDHGAKGDCLLPGVGEMDIMGF IKTLDDVGFDGCLMLELYRRNYGDISDLIKALRDVENMIDEVCG" /locus_tag="LOCUS_5700" /note="MGA_744" CDS complement(884..1828) /product="protein translocase subunit SecF" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048082.1" /transl_table=11 /codon_start=1 /translation="MTDMKIYNVVGKRKIFYTVSLIVIAVALVLTFVLGTDVAIEFKGG TIVTYSYTGTIDEDAVASVARDVTGQNANITLGESLADSLTTVALSFPASQGLTADVQS DLTDALTAQFADNSLELYSSQDVNPSTGIGFFGKCMMAVGVSAVAMIIYIAIRFRNIGG LVAGLCAVVALIHDMCFVYASLVIFRFEINSNFMAVLLTILGYSINATIIIYDRIRENR RIHGDRMTLAELVNLSVSQSVGRSIHTTVTTVIAMSAICVVALIAGVESILSFAFPLVI GLLTGVYSSNCIAPSLWVLWQNKIDAVKAKKKD" /locus_tag="LOCUS_5710" /gene="secF" /note="WP_012048082.1 protein translocase subunit SecF (Clostridium botulinum) [pid:31.0%, q_cov:93.6%, s_cov:95.8%, Eval:1.1e-37]" /note="MGA_745" misc_feature complement(1821..>2915) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011144152.1:protein translocase subunit SecD" /note="WP_011144152.1 protein translocase subunit SecD (Gloeobacter violaceus) [pid:32.8%, q_cov:95.9%, s_cov:75.1%, Eval:2.8e-40]" /note="MGA_746" /locus_tag="LOCUS_5720" ORIGIN 1 aatttatccg caaacctcat ctatcatatt ctcaacatcc cgcagagcct tgataagatc 61 gcttatgtca ccgtaatttc tgcggtaaag ctcaagcatc aaacagccgt caaacccaac 121 atcgtcaagt gtcttgatga atcccataat gtccatctcg ccaactcccg gtaaaagaca 181 atcgcccttc gcgccgtggt ctgaaaggtg cacatgcttg atgctgttgc ccaaagcgcg 241 agctccatcc atcggctccc aacccatgcg tacagcctgc tttgtgtcga gcacaaatcc 301 tgcatccgag ccaaaatgcg ctttcattcg ctttaaagtt tcaagctcgc ctgtaactct 361 tttgtccaca ttttcctgca aggccttaac gccgaagctt ttcgcgatct cggcaagtcg 421 ggcaaaccgc ccgaagacaa tttcatcgcc gtaatttacc tttgaaccgt gaaaaacgaa 481 atactcagca cccagaatat tcatcgcttc aaaataccgc ttgtgataat ctaaatactc 541 ctcggttctt ctctcatatg ccgaaaacag agcgtaggta tcaattgcac aggtgtaagg 601 gtgcaatgat atacactttg cgccctcgcc gtcaagaatc ttcttgatct cgcggatata 661 ttcgggtctt gtttccgcct cgcagttgac aaacagctca atttttccaa ctcctgcgcg 721 acatagctct ttaacgaaca cctcaggcgt ttcgggatat ccgcaggcag cagacactcc 781 tgcacatatt cttctatttg acattttcag ccactcctta aatataagag ttatgcaaaa 841 gggtgccgtg ttttaaatgc acagcacccc gaagttttaa atatcaatcc tttttctttg 901 ccttaacggc atcaatctta ttctgccaga gcacccaaag tgagggagcg atgcagttgg 961 aggaatatac acctgtcaaa agaccgatta ccaacgggaa agcaaagctc aaaatcgact 1021 caacacctgc aataagcgca acaacgcaaa tggcagacat tgcaattact gttgtaacag 1081 ttgtatgaat gcttcttccg accgactgag aaaccgaaag attaacaagc tcagccaaag 1141 tcattctgtc gccgtgaatt ctgcggtttt ctctgatacg gtcataaata atgatggtcg 1201 cattgatgga ataacccaaa atggtgagca aaactgccat aaagtttgag ttgatctcaa 1261 agcggaagat aacaaggctt gcatatacaa agcacatatc gtgaatgaga gcaacaacag 1321 cacaaaggcc tgcaaccaaa ccgccgatat ttctgaatcg aattgcgata taaatgatca 1381 ttgcaactgc agaaacgccg acagccatca tgcatttgcc gaagaagcca atacctgttg 1441 aggggttgac atcctgggag ctgtaaagct caagagagtt atctgcaaac tgcgcggtaa 1501 gggcatcggt caaatcagac tgcacatcag cagtaaggcc ctgagatgcg gggaaggaaa 1561 gcgcaacggt tgtcaaactg tccgcaaggc tttcaccaag ggtgatattt gcgttttgac 1621 ctgtaacgtc gcgtgcaact gaagcaacag cgtcttcatc aatagttccg gtataagaat 1681 atgtgacaat ggtaccgccc ttaaattcaa ttgcaacatc cgtgcccaaa acaaaggtca 1741 aaacgagcgc aacagcgata acgatcaagg aaacggtata gaaaatcttt cttttgccga 1801 caacattata aatcttcata tcagtcattg ctctcacctc catagaactt gggatctctg 1861 aagcacttga actttgacag agaagtcagc attactcttg tcgagaatac tccgaagaca 1921 aagttaagga ttacgcccac aagcaaggta tagccgaagg agtaaattgt tccttcaatt 1981 gttgcaggga acataaagta gagccagctc atagcacgtg ccaacaagct gtccggaggg 2041 ccaaatgcac ccataaggat tattgcaacg atcaccattg tgatatttcc gtcaacaaca 2101 gctaccaaag ctctcgaata accgcttgtg agagcggcat tgatggtctt gcctgcccta 2161 agctcttcct tgattctttc gaaggttaca acgtttgcgt caacgcccat accaacagcc 2221 agaatgatac cggcaatacc gggaatggta agggtgaagc tggggataac accaaagaag 2281 cctgtgatgc aagcgatggt gccgacaacc tgtcccacca aagcgatgga cgcaacgaca 2341 ccgggaagct tatagatgac gatcatataa atgcagatga ttacaaatgc gattgcgcct 2401 gccaaaacca ttgcgtttct tgcacccgaa cccatggttg cggaaatggt ggagaagttg 2461 gatgtaacca gcttataggg caaagcacct gcagagatct tatcggcaag ctcctttgca 2521 ccgtcatagt caaattccgg gttggtgatc atcgcgctgc cgtctgtgat agcctcatta 2581 acgatgggcg cagaaatgca ggtgtcatcc atccagatcg agattgaacc ctcggtttcg 2641 gcaagagccg cagttgcttc agcaaacttt gccttgccct cttcgttgaa ttcaagggaa 2701 acggcaaact ttgttgcact gtcctcttca taccagatgg cagttgcact tacgacctgg 2761 tcaccggaaa caatgatgtt ttcggcggtc acaccggtgg gcagaccgta ttcatcgacc 2821 tcgtatccct cacggaaggt aagctcagcc atttcgccaa gctccttaac agcagcctca 2881 gggtcgaagt tttcttcgcc tgcctgccag gggaa // LOCUS sequence154 2913 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence154 VERSION sequence154 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2913 /mol_type="genomic DNA" /organism="" /note="sequence154" CDS 937..2406 /product="glycosyl hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012582688.1" /transl_table=11 /codon_start=1 /translation="MKRFIAVLLSALLLCGCAPAQKENTVKDDIVRVEVDDILIEAESG ELLGGTTVAKSKNGFSGEGYVTGFKNGEDGVELSVSIPYGCHYDFVFYINSNGQYKENK IWIDGEKAADVSTESNSFEECIVEKLWLDEGDHKIKLTKGWGWVDFDKLIIRQSELLSN EIYDLSTELSNPNATKAAKSLYNYLLSIYGEYTLAGQHSTEGMNSTEFDSIKEKTGKVP ALIEIDIMKISTPFSADYNNIDLYFDRIKEFDKKGGIVALNWHWHAPPPYIYNDSERPW WRGFYAEATSIDIEKIMNGEDPEGLELLNEDIDVVAKLFKKLQDKNIPVLFRPLHEAGG GWFWWGAKGAEPFKALYIHLYDRLTNYHGLNNIIWVWNGDDAEWYPGDEYVDIASTDIY ADSGEYSSQINDFIAVGKASNGTKPVALSENGVQIDPDMMTRDNVYWLYFCTWGGDYCT SDKYTSGEMFHKVFNSEKVITLDELPNWRRY" /locus_tag="LOCUS_5730" /note="WP_012582688.1 glycosyl hydrolase (Dictyoglomus turgidum) [pid:39.8%, q_cov:92.0%, s_cov:94.5%, Eval:2.6e-87]" /note="MGA_748" ORIGIN 1 tgaagaccct gcagaactct attatagcga cgaatggact tgggataagt tctatgatat 61 gtgcgttgaa ttctccgatt tcgatgagga cagatttgct ctcgacggtt ggtcatggga 121 ctctgcattt atggcttcaa gcggtacaca cgtttacgga tataaccctg aaaccagcag 181 atttgaatct cacgctgatg atcccagact tgaacttgca gcagatgtag tatataatct 241 ttgcaagaac gaatgtgtat atcctttgtg gaagcgcggc tggaagctcc gtaacgaagt 301 tgacggcggc ggaatgaagg aaggacagct tttgttctac attgaaggta catatgcatt 361 tacaggaccc gttgacgaga tctcgagcgt ttggggcgac attaccgcca atgaaattat 421 gttctgccct ctccccagat atcaaaacgg cgacggcaca tattatcttg aatccacaca 481 gaccggattt gcaattgttt cgggcgctga aaaccccgag ggcgttgcgc ttttggcaag 541 ctgtgaaaga ttcaaggcga tcgaccccac tgttgttgac attgacagaa agcatcttga 601 agaaacatac ctttggacag aagaaatgct cgaaatgtac gatatctgct atgagcttgt 661 aactgcgggc gatgttgcaa ttttggactt ctatgacggc gtcggcacaa agctcaacga 721 cgttggcaac aagttcaaga agttcgcaag aagcagtaat gtatcgtctt gggcacagat 781 caaggaaaac aacatggaac aacttgatta ttatctcgac gagctcaacc agttgctcga 841 tgaatttgca ggctaaatct ctctcctaaa aaatagatgt gttaaaagcc tgtaccatat 901 ggtgcaggct tttgcataat gaaaggcgga aaccaaatga aacggtttat tgcagtgcta 961 ttatcagctt tgctcctttg cggctgtgcg cctgctcaaa aagaaaacac agtaaaggat 1021 gatatcgtca gagtggaagt agatgacatt ttgatcgagg ctgaaagcgg agagcttttg 1081 ggcgggacaa cggttgccaa gagcaaaaac ggcttcagcg gcgaaggtta cgttaccggc 1141 tttaagaacg gcgaagacgg cgttgagctc agcgtttcaa taccctatgg ctgtcattac 1201 gactttgttt tttatatcaa ctcaaacggg cagtataaag aaaacaagat ctggatagac 1261 ggcgaaaagg cggcagatgt ttcaaccgaa agtaacagct ttgaggaatg tatcgttgaa 1321 aagctttggc ttgatgaggg cgaccacaag atcaagctga caaaaggctg gggctgggtc 1381 gattttgata aactcattat ccgccagtcg gaactgctca gcaacgagat ctatgatctt 1441 tcaacagagc ttagcaatcc caacgcaaca aaggcggcaa agagcctata taactacctt 1501 ttgagcattt acggcgaata tacccttgcg ggacagcact ctaccgaggg aatgaattct 1561 accgagtttg actcgatcaa agaaaaaaca ggcaaggtgc ctgctttgat cgagattgac 1621 ataatgaaga tctcaactcc tttttcagcc gactataaca atatcgactt gtatttcgac 1681 cgcatcaagg agtttgataa aaaaggcgga atcgtagccc tcaactggca ttggcacgcg 1741 cccccgccgt atatctacaa tgattcggaa aggccttggt ggagaggctt ttatgccgaa 1801 gcaacaagca ttgacattga gaagatcatg aacggcgagg accccgaagg gcttgaactt 1861 ttgaatgagg atatcgacgt tgttgcaaag cttttcaaaa agctgcagga taagaacatc 1921 cccgttttgt tccgcccgct tcacgaagca ggcggcggat ggttctggtg gggtgcaaag 1981 ggtgctgagc ccttcaaggc tctttatatt cacctttacg accgcttgac aaactatcac 2041 ggtctgaaca atatcatctg ggtgtggaat ggcgacgatg ccgagtggta tcccggtgat 2101 gaatacgttg acattgcctc aactgatatt tatgccgatt cgggagaata ttcatcacag 2161 ataaacgatt tcatcgcggt aggcaaagcc tcaaacggca caaagcccgt cgctttgtcg 2221 gaaaacggcg ttcaaatcga ccccgatatg atgacaagag ataatgtata ttggctttac 2281 ttctgtactt ggggcggaga ttactgcaca tcggataaat acacctcagg tgaaatgttc 2341 cataaagtgt ttaactccga aaaggtcata acccttgatg agctccccaa ctggcgaaga 2401 tattgataca aaaccacaat agcattttat aacaacttga cctccaaaca agaaacagcc 2461 gtcttggcaa aaggattgtg ccctaaagga cagttttcaa aaactcggca tatctcgaaa 2521 gagatatgcc gagttgtata tttgtgggca caaatgcagt gcttgtcatg aaaattggca 2581 agtcaaaatt tatcggctgt tctttttgta aagtctaaaa acccccactc caagaaaaag 2641 aatgcttatg aataaaaacg atattaaaca tataaagtga acatttccat ttgagcattg 2701 ttgccaatcg ttaaaattca ccagatagga gctgttattt gtacctaaca gtttatccac 2761 aacgtaattc gtgaaataat acacaaccgt gctgaaagca atacaaatgc ccgcttttag 2821 aaaagcgtcc aagcgaagcg cgcaaatgac ggcgcaaatg attgcaggag tgaaagcata 2881 gcacgttatc aatatcgcgg aaacgacttt gaa // LOCUS sequence155 2860 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence155 VERSION sequence155 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2860 /mol_type="genomic DNA" /organism="" /note="sequence155" CDS complement(196..402) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKDFFKGMAAITLALVLIPAMPLLFQADFVAPSAPVMTETTPIEK EYTLIETVSVYDVVKRGTFTMSI" /locus_tag="LOCUS_5740" /note="MGA_750" CDS complement(510..1295) /product="sporulation transcription factor Spo0A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011460261.1" /transl_table=11 /codon_start=1 /translation="MAKRLKVRIGDDSKEFGGNCAETLRSMGFFCITRPKDGAVMLDAI KDEVPDVAVVDLSMANFDAIELIKRINKSGVKKPLFIVTSVYDNAFAQKTLMQIGVSYF LLRPFDVKMLGSRINELMGYDILEDYSIGTPTHTGTAPDLEVVVTEMIHQLGVPAQVKG YHYIRSAILHCIADKEMLECVTKMLYPTVAKEFDTTPSRVERAIRHAIELAWDRGDLEI LNSFFGYTVNTGKGKPTNSEFIALVTDKIKLKFKGAAIA" /locus_tag="LOCUS_5750" /gene="spo0A" /note="WP_011460261.1 sporulation transcription factor Spo0A (Desulfitobacterium hafniense) [pid:42.0%, q_cov:96.9%, s_cov:98.5%, Eval:1.3e-53]" /note="MGA_751" tRNA complement(1532..1606) /product="tRNA-Arg" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0100" /note="Aragorn_10" ORIGIN 1 gtggggaagc atcagcgaaa gatatttgga tgaatcggtt gaaatgtctg caccgtaaag 61 ctcgggtgtt ggcgactgtg tttcatcaat tcttctgccg aggatatatg tatacattat 121 caccgtctgt gccttgatca gctcgggatg agcacctttt tcaaggtggg aaaataacga 181 tgcaacaagg taatcttaaa tgctcattgt aaaggttccc cgcttgacaa catcatatac 241 cgatacagtt tcaataagcg tatattcttt ttcgattggt gttgtttctg tcattacagg 301 agcgctcggc gccacgaaat cagcttgaaa aagcaatggc attgcgggaa tcagcacaag 361 cgccagagtt attgccgcca ttcctttgaa aaagtctttc atatatctgc cctccgtttt 421 gttttgggac aagtatagca ctgttaatgc gaagcaaatg tcgaatatgc aaaacacccg 481 ccaaagaaca gctttgacgg gtgagttttt tatgctattg cggcgccttt gaatttaagc 541 tttatcttat ctgtcacaag cgcgatgaat tcggaattgg tgggcttgcc cttgcctgtg 601 ttgacggtgt aaccaaagaa agagttgaga atttcaagat ctcccctatc ccacgccagt 661 tcgattgcat gacgaattgc gcgttcaacg cgagaaggcg ttgtgtcaaa ttcctttgca 721 acggtgggat agagcatttt ggtcacacat tcaagcatct ccttgtcggc gatgcaatgc 781 aagatcgcac tcctgatata gtgataacct ttgacctggg caggtacgcc aagctgatga 841 atcatttcgg tgacgaccac ttcaaggtcg ggtgctgtgc ctgtatgcgt gggcgtgcct 901 atggaatagt cctccaaaat atcgtagccc ataagttcat tgatgcggga gccgagcatt 961 tttacatcga acgggcgcag aagaaaatag gacacgccta tctgcatcaa cgttttttgg 1021 gcaaatgcgt tgtcataaac ggaagtgacg ataaacaaag gctttttgac ccccgatttg 1081 ttgatacgct tgatgagctc gattgcatcg aaatttgcca ttgaaaggtc aaccaccgcc 1141 acgtcgggga cctcgtcctt tattgcatca agcatcaccg cgccgtcctt ggggcgggta 1201 atgcagaaaa agcccattga gcgcagagtt tccgcgcaat ttcctccgaa ttcctttgaa 1261 tcgtcaccta tacgtacttt taatcttttt gccatgattt ttcctcctta ttttgtgttt 1321 gcgcgacttt tgtcgtgctg tatttgcaag tataaggcga gatgacaaaa aagtttgtcg 1381 aatgggggca cgtgaaaaga aaaaatcttg taaaggtggt tagcttgtcg aagagggagc 1441 catacaactg cgttgattcc atacgctttg gcgattccat gcaaatcctt cggatttgat 1501 aacaaacagc aagtcttgcg acttgctgtt ttggcacccg cagcgagaat cgaactcaca 1561 actaaccctt aggaggggtt tattatatcc atttaactat gcgggcatat tcgattacca 1621 agtcattata caccaacagg gcagcgaaat caagtagaga ttggaatttt gggtgcggag 1681 cgagccgtgg ctgacacgac gccgcgccaa aggtgtggcg gttcgtggcg tgccgtggcg 1741 agcggtcaag tggtacgaaa atttggaatt cggcggtttg cttgcaaatt tgcggcgatg 1801 ccgcaaaagc cgaatttaca gcggccgtca agatttttcg ggttccgcaa aagtgattcg 1861 gccgcttggg ccgtggctga cacgacgccg cgccaaaggt gcggcggttc gtggcgtgcc 1921 gtggcgagcg gagcgttggc ggtgcgcttt cgtaatcttt cacaaaacat aacaccactt 1981 attgtcgaag tttacatatt caaagatgcg cggttttgtg ataaaatata tgttaatcta 2041 attttgtttg gaggaacatt atgaaaaaga tcatatcact tatgcttgca cttatcatgg 2101 ctttgagcct tgtttcctgc ggcgaaccca aggtagagga acccgaattt gacgttgcaa 2161 ccttgactaa tcaggagctt acatattctt tggaagaact tgagactctt gcagctcaag 2221 acctattgat gaactcattt gaagcacctg ctttgtataa gtattttgac aacatggatc 2281 tcggtgttgc tttcggtgtc ggacagatca aggactacaa cactgatcct gtaactcaag 2341 gcattttgaa gcatttcaac gtttatgttc tcggcaatga gtgcaagcct gcatacattc 2401 accgtggcga aggtcagttc tattgggatg acgttgacag atttgttgaa tttggcaaga 2461 tcaacgatgt taccttgcgc ggacacaccc ttttgtggca ctctcaggtt cccgattggt 2521 ggttcaaggc agatcctaac gacacaagat ctgtaagaga atgctatgat cagggtgctt 2581 tagcgacccg cgaacagctc accgaaagac ttaccacctt catcaccgaa tatgtcacca 2641 gatataagga tgatattgag gtttgggatc tttgtaatga ggttctcaat gccgattcaa 2701 tcagaacagt cagagacgat tcctattggg ctgagatcat cggcgacgtt gacggtaacg 2761 gcttcaagga tgactatgtt gagattgctg caaatgccgc aagagctgct gatgaggacg 2821 ctgttcttat tatcaacgac ttcaatatgg aatggcagaa // LOCUS sequence156 2830 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence156 VERSION sequence156 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2830 /mol_type="genomic DNA" /organism="" /note="sequence156" CDS 34..1083 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTSNAESPMTELRKKNGREKPWNVKYIGIGNENWGCGGSMTDEYY SDTYKRFGEYLRGPYQKIACGPSSGDYNWTNVMMDKCAGWGRMKGLSLHHYTIPTNNWG KKGSSTDFDKQEYYHTLSNTWYMETLLRNHKAVMQRYDDVKDPKVGLCVDEWGIWTDVI PGTNPGFLYQQNSMRDAILASINLNLFNLHSDRVKMANIAQVVNVLQAIILTEGDKMVK TPTYHVFDMYQGHMEAELVYSNVENKLIDGVNYLPAVSQSVSVDADGKMHITISNASLD EEFEIEALMPRAEYTSVCAKILTGEYNQCNTFEAPEAVKPECYDGVCLNGEKLTIKLPK CALVSIELA" /locus_tag="LOCUS_5760" /note="WP_004398654.1 alpha-L-arabinofuranosidase AbfB (Bacillus) [pid:46.6%, q_cov:99.7%, s_cov:70.9%, Eval:1.9e-86, partial hit]" /note="MGA_754" CDS 1087..1341 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSKPFCKRCLLIDIDIDGLYKEVAELISLIPEDRKTDDELYRERL DICRSCESLQNGMCGKCGCFVELRAANKSNYCPSYPKKW" /locus_tag="LOCUS_5770" /note="MGA_755" CDS complement(1382..2095) /product="TraX family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010774239.1" /transl_table=11 /codon_start=1 /translation="MSALILKLIASLSMLIDHAGLMLFNDNPTMRMIGRLAFPIFAFFI AEGFKYTRNRGKYFMRVFLLGVICQIVYTIADGSVYIGILLVFSLSIILMYLLDCLKTA VKGQKSDLCAKLFDSKEVSRKLDILMCAVLFAVAVGGCYLLCENVAVDYEFWGIMLPVA MSAFSNKWARLGAFSAVLIVLCITANFHWQPLSLFTLPLLAIYNGKPGKYRMKYFFYVF YPAHLVVLYLIDMLM" /locus_tag="LOCUS_5780" /note="WP_010774239.1 TraX family protein (Enterococcus faecalis) [pid:28.2%, q_cov:97.9%, s_cov:95.8%, Eval:1.0e-14]" /note="MGA_756" CDS complement(2198..2437) /product="PspC domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010957794.1" /transl_table=11 /codon_start=1 /translation="MNGKKLYKSKTDKKICGVCGGLAEFLGIDVTIVRLIWVLVILFAG FGLLAYIVCALILPEKPDGTVTVVNEDDYTGPEV" /locus_tag="LOCUS_5790" /note="WP_010957794.1 PspC domain-containing protein (Coxiella burnetii) [pid:47.4%, q_cov:94.9%, s_cov:92.7%, Eval:9.6e-17]" /note="MGA_757" ORIGIN 1 actgttcagg aagctgttga atgggtcgaa tatatgacat caaacgctga atctcccatg 61 accgaactga gaaagaaaaa cggcagagaa aagccttgga acgttaaata tatcggcatc 121 ggcaacgaaa actggggctg cggcggaagt atgaccgatg aatattattc cgatacatat 181 aagcgcttcg gcgaatattt gaggggtcca taccagaaaa tcgcttgcgg acccagcagc 241 ggcgactata actggacaaa tgttatgatg gataagtgtg ccggttgggg cagaatgaag 301 ggactttcgc ttcaccacta cactattccc acaaacaact ggggcaagaa gggttcatcc 361 accgacttcg acaagcagga atactatcat accctttcca acacttggta tatggaaaca 421 ctcttgcgca accataaggc tgtaatgcag cgctatgacg acgttaagga ccccaaggtc 481 ggtctttgtg ttgatgaatg gggcatctgg acagacgtca ttcccggcac taatcccggc 541 ttcttatatc agcagaactc aatgcgtgat gcaattttgg catctatcaa cctcaacctc 601 ttcaacctcc attcggacag agttaagatg gctaacatcg ctcaggtcgt aaacgttttg 661 caggctatca tcctcaccga gggtgacaag atggtcaaga cccccacata tcacgtattt 721 gatatgtatc agggccatat ggaagctgag ctggtttact ccaatgttga aaacaagctg 781 atcgacggcg ttaactatct ccctgcggtt tcccagtcgg tttctgtcga tgctgacgga 841 aagatgcata tcacaatttc caatgcatcg ctcgacgagg aattcgagat tgaagcactt 901 atgcccagag cagaatatac aagcgtttgt gcaaagatcc tcacaggcga atacaaccag 961 tgcaacacct ttgaggctcc tgaggctgtc aagcccgagt gctatgacgg cgtttgtctt 1021 aatggcgaaa agctcaccat taagcttccc aagtgtgcac ttgtttcaat tgaattggca 1081 taagccatgt ccaaaccctt ttgcaagcgt tgcctgctga ttgatatcga cattgacggg 1141 ctatataagg aagtcgctga gctgatctcc cttatccccg aggataggaa gactgacgac 1201 gagctatatc gcgagcggct tgacatctgc cgcagttgcg aaagccttca aaacggaatg 1261 tgcggaaagt gcggctgttt tgtcgagctt cgcgccgcca acaaatccaa ctactgtccg 1321 tcctatccga aaaaatggta acaaaaatct ccctttcctt taaggaaggg gagatgcttt 1381 tttacatcag catatcaatt aaatataaaa caacgagatg tgcgggatag aaaacataga 1441 agaaatattt cattcgatat ttccccggct tgccgttata aatcgccaaa agcgggagcg 1501 taaacaggga gagaggttgc cagtggaaat ttgccgttat gcaaagcacg attagcaccg 1561 ccgagaatgc gcccagcctt gcccatttgt ttgaaaaggc tgacattgca acgggcaaca 1621 taattcccca aaactcgtag tcgaccgcca cattttcaca aagcaggtaa catccgccaa 1681 ccgcaacagc aaacaaaact gcacacatta aaatgtcaag ctttcgggaa acctctttac 1741 tgtcgaacag cttcgcacag aggtcacttt tttgaccttt aacagcagtt tttaaacaat 1801 caagcaggta catcagtata attgaaagcg aaaataccag taaaattccg atatataccg 1861 agccgtcagc aattgtataa acaatttggc atattacacc cagcaggaaa acgcgcataa 1921 agtattttcc acggtttcgg gtatatttga agccctcggc aatgaaaaag gcaaaaatcg 1981 ggaacgcaag ccttccgatc attcgcattg tcgggttgtc gttaaaaagc ataagccctg 2041 cgtggtcaat gagcatcgac aaggatgcaa taagctttag aattaacgct gacatttaaa 2101 ttactcccta atgttattat ccgaattata gcacttatgc ttttcaaatg caagaaaaaa 2161 cgcccccact ttgagggcgt tttcttctta tcaattatta aacctcggga cctgtgtaat 2221 cgtcttcatt aacaacagta acagttccgt ccggcttctc gggaaggatc aatgcacata 2281 cgatgtatgc caaaagtccg aatcctgcga aaagaattac cagaacccag ataagacgaa 2341 cgattgttac gtcaattcca aggaactctg ccaatccgcc gcaaacgccg cagatcttct 2401 tatcagtctt agatttataa agctttttac cattcatagc taaacgcctg cctttctgac 2461 agtattatat catattctat ctgcttttgc aacacttagt taatcgtagt acttgttctc 2521 gaaatcatac caatctattc ggtttttgtt tgcacataat tcaagtgttc ttccatatac 2581 atccaaatat agattcatat atttggttat atattcgtat gatgataccc atctaccact 2641 aatacccaga ataccgtcaa tatagtactc tggaatgttt acattgttct cattatatgt 2701 tccagtttct tcaattagga acgcagtatg gtgagaatgt tcagaaattg agccgtagtt 2761 gtaatcctgc tcgatattaa ataccatgtc tttaaataca atcgtgtcag gataatcact 2821 gtattctgat // LOCUS sequence157 2806 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence157 VERSION sequence157 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2806 /mol_type="genomic DNA" /organism="" /note="sequence157" CDS 269..1201 /product="methionyl-tRNA formyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010940806.1" /transl_table=11 /codon_start=1 /translation="MNIVFMGTPDFAIPTLKALIESEHNVIAVFTQTDKPKGRGMKLTP SPVKELALSYDIPVYQPNSLKKETETYTPILKELNPDCIVVVAYGKILPPVVLEIPRLG CVNVHGSLLPKYRGAAPIQWTVLNGDEYGGVTTMLMAEGMDTGDMLLKSAVKVGENETS YELYDRLSYIGAELLIETLNKLEKGEITPEAQNEAEATLAPMLSKELCPVDFSKTAKEV HSQICGLSDWPCATAMLDGKKLKLYRCEIVNCTASNHHPGEIVNEKDFTVACGEGCIRI TELQAEGSKRMPTNAYLLGRPVKKGAVLN" /locus_tag="LOCUS_5800" /gene="fmt" /EC_number="2.1.2.9" /note="WP_010940806.1 methionyl-tRNA formyltransferase (Geobacter sulfurreducens) [pid:49.5%, q_cov:99.7%, s_cov:96.5%, Eval:3.5e-78]" /note="MGA_760" CDS 1214..1912 /product="zinc metallopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012047881.1" /transl_table=11 /codon_start=1 /translation="MPFFYFDPTYIVLLPALIFAAYAQFKVSSTYNRFSRVDNRNGWTA AEVARRILDSNGLHDVQIQRISGNLTDNYNPSTNIISLSDSVYSSKSVAAIGVAAHECG HAVQYALGYAPIRIRSALVSVTNFGSNAGMILLLIGLLFSSYTLAMVGIVMYSTVAVFQ AVTLPVEFNASRRALDTLEADEILCSDEIPYAKKVLSAAAMTYVAALLSSLSTIFRFLL IVGGGRRRRN" /locus_tag="LOCUS_5810" /note="WP_012047881.1 zinc metallopeptidase (Clostridium) [pid:48.6%, q_cov:94.8%, s_cov:96.9%, Eval:1.6e-57]" /note="MGA_761" ORIGIN 1 aagaaacgca gtacggcacc gaaggctgtt tgtcatatcc cggcctttac ggctacgtta 61 caagacctat gacggttaag tttaaggcac aagaccgttt cggtgaatgg tatgagaagg 121 aagtaagcgg tttgtttgca agatgtgttt gccatgaact caatcatctt gacggcatta 181 cacttcctgc aaacatcgaa gctccttatg tgcctgagga tgaggaagaa gattccgaag 241 aataatttga atattaagga gaaatccgat gaatatagta tttatgggaa cacctgactt 301 tgcaattccg acgcttaagg cgctgattga aagcgagcat aatgtcatag cggtgttcac 361 ccagactgat aaacccaagg gcaggggaat gaaactaaca ccatctcctg taaaggaact 421 tgccttgtca tatgatattc ctgtttatca gccaaattct ctcaagaaag agaccgaaac 481 atacaccccc attctcaaag agctgaatcc cgattgcatc gttgttgttg catacggcaa 541 aatcttgcct cccgtggttc ttgaaattcc ccgactcgga tgtgttaatg ttcacggctc 601 gcttctgcct aagtacagag gcgccgcacc cattcaatgg acggttttaa acggcgatga 661 atacggcggt gtaacaacaa tgcttatggc cgagggcatg gatacaggcg atatgctcct 721 caaaagtgca gttaaggtcg gcgaaaacga aacctcttac gagctttatg acagattgtc 781 ttacatcggc gcagaattgt tgattgaaac acttaacaag cttgaaaagg gcgaaatcac 841 ccccgaggcg cagaacgaag ccgaggcaac tcttgctccg atgctctcga aagagctttg 901 tcctgttgat ttttccaaaa ctgcaaagga agttcattcc caaatttgcg gtttgtccga 961 ttggccttgc gcgaccgcaa tgctcgatgg taaaaagctc aagctatatc gttgcgaaat 1021 tgtgaactgc actgcttcca atcatcatcc cggcgaaatt gtaaatgaaa aagactttac 1081 agttgcctgc ggtgaaggtt gcatcagaat taccgagctt caggccgaag gctcaaagag 1141 aatgccaaca aatgcctatc ttctcggcag acccgttaag aaaggcgcag ttttaaactg 1201 ataaaggaga aatatgcctt ttttctattt tgatcccacc tatattgtcc tgcttcctgc 1261 cttgattttt gcggcatatg ctcagttcaa ggtcagctcg acatataaca gattttcccg 1321 tgttgataat cgaaacggtt ggacagccgc tgaggttgca agacgaattc tcgattcaaa 1381 cggacttcat gacgttcaga tccaaaggat ttccggaaat ctgacagata actataatcc 1441 atcaaccaat atcatttcgc tttcggacag cgtatattca agcaaatctg ttgcggcgat 1501 cggcgttgcc gcccacgaat gcggtcacgc tgtgcagtat gctttgggtt atgcacctat 1561 aagaatcaga tctgcgctcg tatctgttac taatttcggg tcaaatgcgg gtatgatact 1621 gcttttgatc ggcttgctgt tctcgagcta tactcttgca atggtgggaa ttgtgatgta 1681 ttcaaccgtt gcggtattcc aggccgtaac tcttcctgtt gaattcaacg ccagcagacg 1741 cgcacttgat acccttgagg cagacgaaat tctctgttct gatgaaattc cctatgctaa 1801 aaaggttctt tctgcagcgg cgatgaccta tgtcgcggca cttttatcga gcctttcaac 1861 aattttcaga tttttgctta ttgtcggcgg cggaaggaga agacgtaact gatgcagaca 1921 ccccgcgaaa tttgcttgaa attgcttgtg tcaaccttca agaatgcaag ctattccaac 1981 atcgctctcg ataagaccct taatcgatat cctgctttga gtgatgttga taagcgcttt 2041 atctccgccc tgtattacgg cgttatcgag cgcgcaataa ccctcgatgc gataattgca 2101 aaatactctt cacgccctgt ggataagctt tccgacgctg tacgcgaaat tctgcgaatg 2161 ggtatctatc agcttttata tatgaactct gtgccagaca gcgcggcggt aaatgaaagc 2221 gtaattctaa caaaatcaaa caaaaaccct gctgtttcgg gatttgtaaa cgctcttttg 2281 cgcagtttca ttcgtgatga caaaaagctt cccttaaacg gaaataagct ccacgatatg 2341 tcaattgagt attcctgccc cgaatggctt gtttcaatgt ggctggatga ttacggcgaa 2401 aagactgcag tttcaatgct ttcttcgtca attggcaaac cgcctgtaac cgcaagactc 2461 aatacttgca atttttcctt cgatgatatt gtttcatcat tagagtccga gaacgtcagc 2521 tggcgcaaag tcgatgcggt tgatgactgt atcgagctgt ttggcgtcgg ctcagttgag 2581 aagcttgatg cttacaaaaa aggaatgttc cacattcaag atgtttcctg ccagatctgc 2641 tgtcacgagc ttggtgcaaa gcccggtgaa accgttttgg atatgtgctc agctcccgga 2701 ggaaaagcat ttaccattgc ccagatgatg aataatgaag gcaaggttct tgcatttgat 2761 ttgcaccaaa aacgagctga ccttatcaaa tcgggtgcag aacgat // LOCUS sequence158 2795 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence158 VERSION sequence158 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2795 /mol_type="genomic DNA" /organism="" /note="sequence158" misc_feature <1..840 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010965033.1:23S rRNA (adenine(2503)-C(2))-methyltransferase RlmN" /note="WP_010965033.1 23S rRNA (adenine(2503)-C(2))-methyltransferase RlmN (Clostridium) [pid:51.1%, q_cov:99.3%, s_cov:80.6%, Eval:1.7e-81]" /note="MGA_763" /locus_tag="LOCUS_5820" CDS 861..1589 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFVLGKTDIGKFRDENQDRFRVSMIDDNTSVAVVCDGMGGAKSGG LAGDIASDIVYERLCLSYRADMEPKSVKSLLVSAFSAANSVVYRRSHEEEVNRGMGTTC VAALVHNDIASIASVGDSRAYLLNESGITQITNDHTVVEYLHSKGVINEDEMRSHRMKN LITRAIGIEESVDVDYFEIDIPHGSVILICTDGLTNYCSDELIYSIVYKRPLEQATNEL IEYSNTRGGKDNITVVLISR" /locus_tag="LOCUS_5830" /note="WP_012257018.1 protein phosphatase 2C domain-containing protein (Chloroflexus aurantiacus) [pid:38.7%, q_cov:96.7%, s_cov:68.8%, Eval:1.6e-37, partial hit]" /note="MGA_764" ORIGIN 1 ggttcgctca aggttgtcag acagcttgaa tcgaaaattg acggcactgt taaaatgctt 61 tatgagcttt cggacggaaa ccacgttgaa accgttttga tgagctatga gcacggagat 121 tccctttgtg tatcaacgca ggtcggatgt aaaatgggct gtcgcttctg tgcatccact 181 attgcaggat ttaaaagaaa tctcgaagct tcggaaatac tattacagct atatgaaaca 241 gagcgcgcca caaagagaaa agtttcaagt attgttttaa tgggaatcgg agagccgctg 301 gataattacg acaatgttgt aaagtttctt aatattcttt caagtgaaaa gggaacaaat 361 atgagcctgc gccacgtgtc gctttcaacc tgcggacttg ttgatcgtat ctatgatctt 421 tctgcactcg atttgggact tacactgtca atatctttac acgcgactaa cgacaaaaag 481 agaagcgaac tgatgcctgt caataacagg tatcatattg aagagctgat gaaggcttgc 541 cgcgactatt tcaaaaagac cggcagaaga atttcatttg aatatgcttt aattgacggc 601 gaaaacgatt caatggacga tgcaaaagca cttagccgac tcatcggcgg aatgccctcg 661 cacgttaata taatccctgt aaataaaatt aaagaaagag agtaccgttc cgatcgctct 721 gctgcccaga gattttgcaa aatgctctgt gatttgggtg ttaatgcaac tgtgagaaga 781 acacttggct ctgatataga cgctgcctgc gggcagttaa gacgtgaata cgaaatttaa 841 atgaaaggcg gtgagagatc ttgttcgttt taggaaagac agatatcgga aaattccgag 901 atgagaacca ggacagattc cgagtttcga tgattgatga taacacctct gtcgctgtag 961 tgtgcgatgg tatgggcggc gcaaaaagcg gcggccttgc gggcgatatc gcatctgaca 1021 tcgtatatga aagactgtgc ctcagctacc gcgcagatat ggaacccaaa agtgttaagt 1081 cgttgcttgt ttctgcattt tctgccgcta acagcgtggt atacagaaga agccacgagg 1141 aggaagtaaa ccgcggaatg ggtacgacct gcgtcgcggc acttgtacat aatgacattg 1201 caagcattgc cagtgtcggt gattcccgtg catacctgct taatgaaagc ggaattaccc 1261 agatcaccaa tgatcacaca gttgttgaat atctccactc taagggcgta attaatgagg 1321 acgagatgag atctcaccgt atgaaaaatc tcatcacccg tgcaatcgga attgaagaat 1381 cggttgatgt tgattatttt gaaattgaca ttcctcatgg ctcggtaatt cttatatgta 1441 cagacggtct gactaactac tgttctgacg agctgattta cagtattgta tataaacgcc 1501 cgcttgagca ggcaaccaac gagcttatcg aatattcaaa tacccgcggc ggcaaggata 1561 acatcactgt agttcttatt tcccgctgaa actgatcaga agatttgcaa aaggaattga 1621 taaaatggat aaatatatcg gtatgaaact tgacggaaga tatgaagtcc ttcaacttat 1681 cggcgtcggc ggtatggctg acgtttataa gggtatcgac ataatggaaa accgtgtcgt 1741 tgccgtcaag atacttaaaa acgaatactg tgagaatgaa gagttcatca aagccttcag 1801 aaacgaaagc aaagccattg ctgtcctttc tcatcctaat atcgttaaga tttacgatgt 1861 tggctatgaa aacaagatgc agtatatcgt aatggaatat atcgacggaa taactctcaa 1921 ggaatttatt gaggagcaag gtcttttaaa atggcgcgac tgtgttcact ttaccatcca 1981 gattttaaga gctcttcagc ttgcacatga taggggaatc gttcaccgcg atatcaagcc 2041 tcagaatgtt atgatcatgt ctgacggcag tatcaaggtg atggactttg gaattgccag 2101 attctcccga tccgactcag gtaattctga tgaaaaaacc atgggatcag ttcactatgt 2161 ttctcctgaa caggcaagcg gatcaagaac tgatgaacgt agtgacattt actctgttgg 2221 cgtaatgatg tatgaaatgc ttactggcag aaaacccttc gacggcgaaa caccagttga 2281 agttgccctg aagcatatga acgatgcgcc gaaaatgccc accgaatatg ttacttcact 2341 ttatgcaggc cttgaagaga tcatattgca cgcaatggaa aaagagcctt caaagagata 2401 tcagtctgca tcaagcatga tcagagatat tgaagctttc aaacaggatc agagcatcgt 2461 tttcggatat aaagaaaccg acattgcaaa atccaagaac tccactgcta tagattctat 2521 caaaaataag cttccaagca ttaacttgcc ttcatttaag cttcctgcaa agaagaaaaa 2581 gaaggaagaa ccaatcgttg aagagcctgt tgatgattac tactatgatg aatatgagga 2641 ttacgatgag gatgattatg atgaacccag attctcattt gttcttccga ttcttgcatc 2701 agttgcatgt acagtcataa ttgttgcaac tttgtttgtc gcaaacgtta ttttgggagc 2761 tttcaaaacc gctccgtcat cttcaaacga ctata // LOCUS sequence159 2788 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence159 VERSION sequence159 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2788 /mol_type="genomic DNA" /organism="" /note="sequence159" misc_feature <1..959 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_080241138.1:glycoside hydrolase family 2 TIM barrel-domain containing protein" /note="WP_080241138.1 glycoside hydrolase family 2 TIM barrel-domain containing protein (Spirosoma rigui) [pid:44.1%, q_cov:87.4%, s_cov:24.1%, Eval:1.6e-57, partial hit]" /note="frameshifted, insertion/deletion at around 911" /note="MGA_766" /locus_tag="LOCUS_5840" CDS 940..2688 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MWSIGNETSSRTQLYYDLIAELKEMDSTRPVHYESLGESGGVDIS SVMYWDIYGTNLKGNASNNMPFMQCEYVHAMGNSVGNIYEYWEAIRSHDNIVGAFIWDF VDQSIWTEYDEGEFDYYGNGKYLAYGGCWGDANNQGNFCQNGIISADRTIQPEAYEVKY VYQSVWATAENLDLTNKTVEFYNEFNFTDLNAYDISYELLENGKVIDSGKLDINCAPRE TVKVEIPYNAPEKAAADGEYFLNIYVKLPEDTLWAEKGHLVASEQFKVDLDVTEHIGLD VSAMPNVTVLDEENKTTVSSDNFEATFSSKTGLLLSYTYNGEKVINEGPELTYTRATLD NDRDLSWDSAKAKETTSFGVIPDASGKFVTIEAAIAVSNDGGIQYMTYTVYGSGEITVK STLDTVSGSDEMHRYGATMTLPGEYENITFYGAGEWDTYNDRRKGAHIGIYETTVSDSF YPYPQPQDTGTKTGVRYFALTSDEHETGLLFVSDSEMEAQALHFSSLQLRIESRVPKLR DMGRTYVTLSHGSRGTGGASCGPDTLDQYRITANGKDYTYIYTIVPFNKEADDISELWL MFADNE" /locus_tag="LOCUS_5850" /note="WP_011108747.1 glycoside hydrolase family 2 TIM barrel-domain containing protein (Bacteroides thetaiotaomicron) [pid:32.1%, q_cov:97.3%, s_cov:40.0%, Eval:8.3e-75, partial hit]" /note="frameshifted, insertion/deletion at around 893" /note="MGA_767" ORIGIN 1 aggtcggata cagcgaggac tcatatgaca cctcgacctt cgatattacc gcatttttaa 61 atgatgatgg acaggacaac ctgattgccg ttaaggtata ccgttggtgc gacggcagct 121 attttgaaaa tcaggacttt ttgcgccttg caggcatctt ccgagatgtt tatgtgtatt 181 ctgttcctgc tgtcaacatc tgtgattata aggttgaaac cgatctcgat gaggacttca 241 ccgatgcgga gcttttaatt gaagcgcaaa tatataactc taccgttgct gatgttgaat 301 cgggcttcta ttctctggat gtaagacttg ttgatgccga gggcaattcg ctgtttgcaa 361 gcgacccgtt aagagaagat gtaagcgcag ttaaatcggg aaagacaaaa tccgtcagca 421 tttcccgact tgttgaagca cctcaccttt ggagcgacga ggacccgtat ctttacactc 481 taatcatcag tttatatgac aaaaacggcg tatactatgg cagtatctcc caacaactcg 541 gcttcagaga gataaccttt acaaaaactg agggaattga gcccaacaag gataaatatg 601 acataatgct cttaaacggc aagtccctcg tctttaaggg cgtcaaccgc cacgaaacca 661 gccccgacac aggcaaatat gcttcccgcg agctgatcga gcgtgatgtt aagattatga 721 agaaccttaa catcaatgct gtccgcacat ctcactatcc cgatgccaag tatttctacg 781 atatgtgcga taagtatggc ctgttggtgc ttgccgagtg caatatcgaa tcgcactacg 841 gcgttaacga agccgaaacg gaagaatact tcaagggaac tatcaccgac cgcgtcaaat 901 cattcacaga gcttgcaaaa aaaccgcacc tgcgttgtaa tgtggtcaat cggaaatgaa 961 acaagctccc gcacccagct atattacgac ctcatcgccg agcttaaaga gatggactcc 1021 acacgtcctg tccactatga atctttgggc gaatcgggag gtgtggatat ctccagcgtt 1081 atgtattggg atatttacgg aaccaaccta aagggcaacg cttcaaacaa tatgcccttc 1141 atgcagtgtg aatatgttca cgcaatgggc aactcggtcg gaaatatcta tgaatactgg 1201 gaagcaataa gaagccacga caatattgtc ggcgcattta tctgggactt tgttgaccag 1261 tccatctgga cggaatatga cgaaggcgag ttcgattatt acggcaacgg caaatatctg 1321 gcatacggcg gctgctgggg agatgcaaac aaccagggca acttctgcca gaacggaatt 1381 atcagcgccg acagaacgat ccagccggaa gcatatgaag tcaagtatgt ttaccagtcg 1441 gtctgggcaa cagccgaaaa ccttgatttg accaataaaa ctgtagagtt ctataacgaa 1501 ttcaacttca ccgaccttaa cgcatatgac attagctatg agcttttgga aaacggcaag 1561 gtgattgatt cgggcaagct ggatatcaac tgtgcgcccc gcgaaacagt taaggttgaa 1621 attccttata acgctcccga aaaagcagcg gccgacggtg aatatttcct caatatatat 1681 gttaagctcc ccgaggacac cctctgggcg gaaaagggtc accttgttgc aagcgaacag 1741 ttcaaggtcg acctggacgt aaccgagcat atcgggcttg atgtttcggc aatgccgaat 1801 gttacagttt tggatgaaga aaacaagaca accgtttcct ctgacaactt tgaagcaaca 1861 ttcagcagca aaacaggtct tttgctcagt tatacctata atggtgaaaa ggttatcaac 1921 gaaggacccg agcttacata tacaagagca actcttgaca acgaccgtga cctcagctgg 1981 gatagtgcaa aagctaagga aaccacctcg tttggtgtaa ttcccgatgc ttccggcaaa 2041 tttgtcacca ttgaagcggc gattgccgtt tcaaatgacg gcggcatcca gtatatgacc 2101 tataccgttt acggaagcgg tgagatcacc gtcaaatcga ccctcgacac cgtcagcgga 2161 agcgatgaaa tgcaccgcta tggcgcaacc atgaccctgc ccggtgagta tgagaacatc 2221 accttctacg gtgcaggcga gtgggatacc tataacgaca gacgcaaggg cgcccatatc 2281 ggaatctatg aaaccaccgt aagcgattcc ttctatccct atcctcagcc gcaggataca 2341 ggcaccaaga cgggcgtaag atacttcgcc ctcacatccg atgagcacga aacgggtctt 2401 ttgtttgtca gcgacagcga aatggaggct caggcacttc atttctcaag cttacagctc 2461 agaatcgaaa gcagagttcc aaagctccgc gatatgggcc gaacctatgt aacgctcagc 2521 catggttccc gcggaacagg aggcgcttcc tgcggacccg acacgctgga tcaatacaga 2581 atcaccgcaa acggcaagga ttatacctat atctatacca tcgttccctt caataaggaa 2641 gcagatgaca tcagcgagct ttggttgatg tttgccgaca acgaataacc aaataaaaaa 2701 cagccatatg aacaggatct aatgtgcccc ctgtcaagta gacagactaa aaaacaaaaa 2761 gaataggtta attgaataga ttctttca // LOCUS sequence160 2780 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence160 VERSION sequence160 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2780 /mol_type="genomic DNA" /organism="" /note="sequence160" CDS 2..169 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MVYEVFRAVKCKNEYIFLAASIIMAIIAPMSVLAEVSAVHCVLAV TIYISVSVGV" /locus_tag="LOCUS_5860" /note="MGA_768" CDS 215..703 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFETLLIISAMFSLCYIEHNTEDYGLVFVILTLCGAWFADTGAYF AGTFFGKHKLCPKISPKKTVEGLIGGFVANAVLFVIYIRVFMGFLNTSWYIIFAVLGIV CCILSVIGDLQASVIKRKYDIKDYGRIMPGHGGAMDRFDSVLFVAPFMATVLSLLFKV" /locus_tag="LOCUS_5870" /note="WP_003384675.1 phosphatidate cytidylyltransferase (Clostridium botulinum) [pid:43.0%, q_cov:87.7%, s_cov:53.2%, Eval:2.9e-28, partial hit]" /note="MGA_769" CDS 715..1854 /product="1-deoxy-D-xylulose-5-phosphate reductoisomerase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861463.1" /transl_table=11 /codon_start=1 /translation="MKSVCILGSTGSIGTQALEVVRAHGLWISGLAAKSNIKLLAEQAK EFKPKVVCVYDEDKREELCELLKDTGITVLSGMDGLCEIASLPETDIVLNSVVGMVGLK PTLAAINAGIDIALANKETLVVGGALVIDAARKRGVKIYPVDSEHSAIFQSLRGSKQSE VSKIILTASGGPFFGKTKTELESVTLKDALKHPNWDMGAKITIDSATLMNKGLEFIEAM WLFDVSPDMIEIVVHRESVIHSAVEFNDGAVIAELGVPDMKLPIQYALLYPNRLDCPTR RLSLTDYGTLSFYKPDYDTFDCLRACIKAAQIGGTAPAIVNGANEEAVRLFINGKIGFL DIGRAVTKALECIPSQKIACLDDVLDADKKAREFVLASY" /locus_tag="LOCUS_5880" /EC_number="1.1.1.267" /note="WP_011861463.1 1-deoxy-D-xylulose-5-phosphate reductoisomerase (Clostridioides difficile) [pid:53.4%, q_cov:98.9%, s_cov:98.4%, Eval:4.1e-106]" /note="MGA_770" ORIGIN 1 aatggtatat gaagttttcc gagcagttaa gtgcaagaat gaatatatct ttttggcagc 61 aagtattata atggcaatta ttgcgccaat gtccgtactt gccgaagtta gtgccgttca 121 ttgtgtttta gctgtaacta tatacatatc cgtttcggtg ggtgtataaa ttctgcgcca 181 tgagcacatt gattttgaaa cctgtgctct tttgatgttt gaaactcttc ttattatctc 241 tgcaatgttc tcgctttgct atattgagca taatactgaa gattacggac ttgtgtttgt 301 aattttgact ttatgcggcg cgtggtttgc cgatacaggt gcatactttg caggtacatt 361 tttcggtaag cataaacttt gtcctaaaat cagccccaaa aagacagttg aaggtttgat 421 tggcggcttt gttgcaaacg ctgttttgtt tgtaatatat atccgcgtat ttatgggctt 481 cctaaacacc tcttggtata ttattttcgc agttttggga atagtatgtt gtatactcag 541 cgttattggt gaccttcagg cgtctgtcat taagcgcaaa tatgatatta aggactatgg 601 aagaattatg cccggtcacg gcggggcaat ggatcgcttt gatagcgttt tgttcgttgc 661 gcccttcatg gcaacggtgc tttcgttatt atttaaagtt taatcggagt taaaatgaaa 721 tcagtttgta ttttaggctc gaccggctcg atcggtaccc aagcgctcga agttgttcgt 781 gctcacggtt tgtggatatc cggtcttgcg gcaaaatcaa atattaagct tttagcggag 841 caagccaaag agtttaagcc aaaagtcgtc tgtgtatatg acgaagacaa aagggaagag 901 ctttgcgagc ttttaaaaga cacaggcatc actgttttaa gcggcatgga cggtctatgt 961 gagatcgctt ctctgcccga aacggatatt gtgttgaaca gtgttgtggg aatggtggga 1021 cttaaaccca cccttgccgc gattaacgcg ggaattgaca ttgctcttgc aaacaaggaa 1081 acacttgttg tgggcggtgc tttggtcatt gatgctgctc gcaaaagggg agtcaagatt 1141 tatcccgttg acagcgaaca ctctgcaatt ttccaatctt tgcgcggctc aaagcaatct 1201 gaggtttcaa aaataatttt aactgcttcg ggcggacctt tctttggaaa aacgaagacc 1261 gaacttgaaa gtgttacact taaagatgcc cttaaacatc ccaactggga tatgggcgcg 1321 aagattacta ttgattcagc tacgcttatg aataaaggac ttgaatttat cgaggcaatg 1381 tggttgttcg atgtttcacc cgatatgata gaaattgttg tacaccgcga gagtgttatc 1441 cattctgctg ttgaatttaa cgatggtgca gttatagctg agctcggcgt tcccgatatg 1501 aaactgccca tacaatacgc gcttttgtat ccaaatcggc ttgattgccc aacaaggcgc 1561 ttatcgctta ccgattacgg aactttgagc ttctataaac ccgattatga tacgttcgat 1621 tgccttcgtg catgcattaa agcggcgcaa atcgggggaa ctgctcccgc aatcgtcaac 1681 ggagcgaatg aagaagctgt aagattgttc ataaacggca aaatcggatt tttggatatc 1741 ggcagagctg taactaaggc gcttgaatgt ataccctcgc agaaaattgc ctgtcttgat 1801 gatgttcttg atgctgacaa aaaagcaaga gaatttgttt tagcgtccta ttaatttgga 1861 gttgatattt tgaatttatt atatattgtt attgcaatct taattttcgg tgtaatcatc 1921 gtcattcatg agttgggtca ctttctcgtt gcaaaatcct gcggcgtaaa ggtcaatgaa 1981 tttgcaatcg gaatgggtcc gaagattttc agttttggta aaggcgaaac caaatattct 2041 cttcgagcac ttcctatcgg aggatatgta tcgatggaag gcgaggacga cgaaagcaac 2101 gatccaagag catttggcag aaagaaagtt tggcaaagac ttttggttgt tcttgcaggc 2161 gcaacaatga atcttatcct cggatttgtg attctcataa ttgtgacatc ctgcagtgat 2221 gacattatca ccacccagat cgccaagttt gaatcggaaa ctgcagcatc acatatgaca 2281 ggacttgagg tcggagataa aatcatcaat gtcaacggtt cgcggatttt cagtgacgcc 2341 gatttgtcct atcagttcca ggttgatgag gatatgacct ttgatatgac cgttattcgc 2401 aacggcgaaa aggtgaatct ccccgcagtt aagttcgatg ctgtaactct tgaggacgga 2461 acacaaactc tgcacataga tttctatgta gtgggtgaaa aggtaaatcc cttgtcagta 2521 attaaatatt catcaggtaa gtttgtatct gtttcaaaga tgattattca gtcggtagtc 2581 gatttagtaa gaggcaaata tggattgaac gacctttccg gtcctgttgg tattgtcggt 2641 gcgatcggcg atgttgtcgg ctccacccag cagggtgttg ctgtcggcga tatgcttttg 2701 aatcttgctt cttttgttgt atttataacc ataaacgtcg gcatattcaa ccttttacct 2761 attcccgcgc ttgacggttc // LOCUS sequence161 2771 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence161 VERSION sequence161 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2771 /mol_type="genomic DNA" /organism="" /note="sequence161" CDS 770..1555 /product="AAA family ATPase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009898851.1" /transl_table=11 /codon_start=1 /translation="MGKIIAVSNQKGGVGKSTTVVNLAAAMGGCGKKVLVVDIDAQGNT TTGFGVRKSAIENTVYEVMIGLCRAQDAVVPTAFKGVSLITSAQKLAGAEIELANVDNR LMRLKMELLTVKDRFDFILIDCPPSLSLITLNALAACDSVLIPIQCEFYSLEGLVQLMD TIKRVKDGYNPNMYIEGILFTMYVSRYNLTAQVVNEVRKYFPNDVYNSVIPRNVALSEA PSYGRPIMYYDRSSKGAQAYEEFCKEFLERSRKLSKKRK" /locus_tag="LOCUS_5890" /note="WP_009898851.1 AAA family ATPase (Clostridioides difficile) [pid:52.6%, q_cov:96.2%, s_cov:97.7%, Eval:8.7e-77]" /note="MGA_773" CDS 1574..2419 /product="stage 0 sporulation protein Spo0J" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003226832.1" /transl_table=11 /codon_start=1 /translation="MAKAKGLGMGMDALFSQNETKKQASTLRLTEIFPNKAQPRTDFDD EAIKELSDSIKQHGVLQPLLVRPMPTGGYQIVAGERRWRASRLAGLTEVPVYIKELTDE QTAQLALVENLQREDLNPVEEAVGYKELMEAYGYTQEQVAKIVGKSRPAVANSLRLLTL DETTLGLVREKEISVGHAKVLAGVEDKELRAELALKVKRDLLTVRNLEELLKKASKPKK TAEPPKKDVYFKEVEISLAETMGRKVNVSGKNGKGKLEIEFYSNDDLGAIAKALAEMNK " /locus_tag="LOCUS_5900" /gene="spo0J" /note="WP_003226832.1 stage 0 sporulation protein Spo0J (Bacillus) [pid:45.9%, q_cov:97.9%, s_cov:98.6%, Eval:7.5e-61]" /note="MGA_774" ORIGIN 1 atgcggcact aaggctcggc tatgcacaat cgaccttggc aaacaaactt cggcttttga 61 agctcggggc ggatgaacgc agactgataa tagataaaaa cctgacagaa cgccacgcaa 121 gagcgctttt gcgccttaac gataaggaaa aaaggctcga tgtcatacat aaaattgcgc 181 gggataagct gagcgttgaa cgaacagagc ggcttattga cacgatgacg gaatatgagc 241 gtcattgcga gcgaataaga aaaggttcgg tgcttttcaa agacctgcga ttgtttatga 301 atacggtcaa caaagcggtg gaaacaatgc aaattgccgg ggtcgatgtg aatatggaca 361 aggttcaacg ggaggacgcg gtggaatttc ggatcgtggt gccgttggag aagaaagaaa 421 tgcagtaaat tttgcaacac aaacagcaac tgcaacttgc tgttggtaat tgttccatgt 481 ggaacaatgt caccgtcatt attcatcagc cttcccctcg agggggaggt gtcggtgtcc 541 gccgacggat gaggtgaact aaggttaatt caaagctttg tggtatgagc gaggccgtct 601 gacgtcttgc gttgccgaag gcgacagtag acgtcaggtg gccgagcggt caaatggcag 661 aaaagtttag ttgacggcaa tttgccgtca attttttgtt ttcctcttgc aatctcatta 721 tattattgtt atactgttta tatgtataat attttgaagg agggggatca tgggcaagat 781 tatcgccgtt tcaaatcaga aaggcggcgt tggaaaatca acaaccgttg taaacctggc 841 ggcggctatg ggtggttgcg gaaaaaaggt gcttgttgtt gacattgatg cacagggaaa 901 taccaccaca ggttttggtg taagaaaaag tgcaattgaa aacacagttt atgaggtgat 961 gatcggactt tgcagagcac aggatgctgt tgttccgacg gcattcaaag gcgtatcgct 1021 gataacctct gctcagaagc ttgcaggcgc ggaaattgaa ctggcaaatg ttgataaccg 1081 cttaatgcgc ctgaaaatgg agcttttgac cgttaaagac cgttttgact ttattttgat 1141 cgactgtccg ccgtcgctga gcttgataac actaaatgct ctggcggctt gcgactctgt 1201 tttaataccc attcaatgtg aattctactc tctcgagggc ttggttcagc ttatggatac 1261 cattaaaaga gtcaaggacg gatataatcc gaatatgtat attgagggca tcctctttac 1321 aatgtatgtt tcaagatata atttgacagc acaggttgtg aatgaggtta gaaagtattt 1381 cccaaatgat gtttataaca gcgtcatacc gagaaatgtt gcactcagcg aggctcccag 1441 ctacggcaga ccgataatgt attatgaccg aagctcgaag ggcgcccagg catatgaaga 1501 attctgcaaa gaatttcttg aacgatcaag aaagctttca aagaaaagaa agtaaacgaa 1561 agcgaggtta aacatggcta aagcaaaagg actcggaatg ggcatggatg ctctgttttc 1621 gcagaatgaa acgaaaaaac aggcgagcac cctgcgtttg acggagattt tccccaacaa 1681 ggcacagccc agaaccgatt ttgatgatga agcaattaag gagctttccg attcaattaa 1741 acagcacggc gttttgcaac cgcttttggt cagaccgatg cctaccggcg gatatcaaat 1801 tgttgccggc gagcgcagat ggcgtgcatc ccgcttggcg ggattgaccg aggttcctgt 1861 atacattaaa gagctgacag acgagcagac agcacagctg gcattggtgg aaaaccttca 1921 gcgtgaggat ttaaaccctg ttgaagaagc tgttggatat aaagaactga tggaagctta 1981 tggatacact caggagcagg ttgcaaagat cgtcggcaag agccgacctg cagttgcgaa 2041 ttcgttgcgt cttttaactc ttgatgaaac aacactgggt cttgtcagag agaaagagat 2101 ttccgtcggc cacgcaaagg ttttggcagg cgttgaagat aaagaactcc gcgcagagct 2161 tgctctcaag gtaaagagag atctgctgac ggtgcgaaat cttgaggagc ttttgaaaaa 2221 agcttcaaag ccgaaaaaaa cagctgaacc gccgaaaaag gatgtatatt tcaaggaagt 2281 tgaaatatct ctggcggaaa caatgggccg aaaggtcaac gtttcgggca agaacggcaa 2341 gggcaagctt gaaattgagt tttactctaa cgatgacttg ggcgcaattg ccaaggcatt 2401 ggcggagatg aataagtaag agcagacgga gcgagccgtg gctgacacgg cggctcgccg 2461 aaggtgaggc ggatcgtggc gtgccgtggc gagcggtctg tgtagaatta gctaagcaaa 2521 actccctccg tcacgcttcg cgtgccacct ccctctaaga gggaggcaat cggaaatgtt 2581 gttccatgtg gaacaatcgc catcaacgct tgcacaaagc gctattaaaa ctgcacatta 2641 tccaaaaatg tattgaaacc gacgtttgcg cgggcggcag cctgtcgcgc gcacctgcgg 2701 tgcggacagc tgccgcggcg cacaaagctt ggtgcgcttt ggcaagctga tatataaaca 2761 aaaaatcaaa t // LOCUS sequence162 2771 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence162 VERSION sequence162 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2771 /mol_type="genomic DNA" /organism="" /note="sequence162" CDS complement(1297..2001) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTSPTHIAVLFDGEHQNPRALLDENYKANRPDYSDTPEEETPFSQ LPDVYSALDFLGILYAETLTCETDDWISGYVSKYKPDCEIVISSFDSDFFQLIDDNVKV LRYRGDSSTLCDEKYINQKLGISPSLYADFKSLTGDTADNIKGADKVGPKTAAWLINQF GSLENILANAENISKPAVKKSIISNSERLLKNYQLIKLSGECELPFELSKLEYSYTGIT TTEVLRAIGLKR" /locus_tag="LOCUS_5910" /note="WP_002355755.1 DNA polymerase I (Enterococcus) [pid:33.0%, q_cov:92.7%, s_cov:24.3%, Eval:2.1e-23, partial hit]" /note="internal stop codon at [2017:2019](-)" /note="MGA_776" CDS complement(2017..2142) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEKLLLVDGMNLLFQMFFGMPARIVNHEGKAIQGTLGFVGA" /locus_tag="LOCUS_5920" /note="MGA_777" ORIGIN 1 ctcttgaagc tcgatttcgt tggatattga gaaataatgt atagggatgc ctgcatcgat 61 gaaatactga acagactgta cgcagaaatc agcaagctcg tcatacatat attcgccgtt 121 tttatccttg gcaagggtat agtagctgta tccgtttgcg gcttttgcgg tatatgcaac 181 aaaaggcaaa gtgcggtcat actgtcccca gcttgtgacc aaaactatcg gctcgattcc 241 gcgctcgatt gcggcatcgt aatatgcttt atatttggga tagccctgaa tcggagcata 301 cttttcatcg cctgcaagtc cgtgctgatc tctaaaacgc aggatgttga actcggcttc 361 gttgaaaata taatcatagc cctgttcttc ggcatcaatg ccgaccatcc agtcagagta 421 ccaggtgtac gatgcgccga agccgtcaat ggtctgatag gtggtatcca tatcaatgtg 481 ggcggtggtt aaaacagttg gatcggaggg gaccgattca acaacatata cgccatagat 541 aacatcatct ttgccgtcaa ccgccattgt catgggttct ttgatgttgc cgttgccgtc 601 aatatttccc gaatttgcgg catattttgt gaacattgat tttacggctt cgacatcgaa 661 ataagcatag ttatagccgc cctcaacaat aacatcggta catccgacac cgctgacggt 721 gccccaatgg ccgaaggtga cagacgggtc aacatttcct atatatttta ttataagctc 781 tgcaccctct gtttcaagcg cggaatataa gtcagcaaaa ccatcagaat tcagggtaat 841 ccaatggtac cagttggtta ttttgatacc gtcggcaagt ttttccgatt tgtcatatgc 901 gtgggaagtc acctgctcga agatgacggt ttttccgagc acctgcgact gtgcgcttag 961 gcaaacagtc agcgaaagaa tcagcactaa gcttatgagt aaagccgaaa atcttttcat 1021 aatgcacctc gtaaatttga taattaaatt ataccactaa ttaggagtta aaacattgac 1081 caattgagag aaaatgtttg acggattgtg taaaaacgca tatagcggaa agcaaaattc 1141 cgaagcttct gtttcggaag atgaattcag cgcggccgac actaaagctg cctttttcac 1201 gaactgcggc ggccgcttgg cgaggcgtct gccgggcatc acgcacggcg aagatgtgcg 1261 ggatggctgc aggtgccgag ccgcatttgc ggcgaactat cgtttcaagc ctatggctct 1321 taaaacctct gtagttgtga ttcccgtgta tgaatactca agctttgaaa gttcaaaggg 1381 aagttcgcat tcgcccgaca gcttgataag ctgatagttt ttcaaaagcc tttcagaatt 1441 tgaaattatt gactttttaa cggcaggctt tgaaatattc tcggcatttg cgagaatgtt 1501 ttcaagtgag ccaaattggt ttatcagcca cgccgcggtt ttgggaccga ctttgtcggc 1561 tcccttgatg ttgtcggcgg tatcccctgt caaagacttg aaatcggcat atagagatgg 1621 cgaaatgccg agcttttgat ttatgtattt ctcgtcgcat agtgtagagc tatctccacg 1681 gtagcgaagg actttgacat tatcatcaat cagctggaaa aagtcgctgt cgaaggatga 1741 aataacgatc tcgcagtcgg gtttatattt tgaaacgtag ccggaaatcc aatcatccgt 1801 ttcgcaggtg agagtttcag cgtataagat gcccaaaaaa tcaagggcgg aatatacatc 1861 gggaagctga gaaaagggcg tttcctcctc gggagtgtcg gaataatcgg ggcggttggc 1921 tttatagttt tcatcaagca aagctctcgg gttttggtgc tcaccgtcaa ataatacagc 1981 aatgtgagtg gggctggtca tacggataat tttaagctat gcaccgacaa agccgagtgt 2041 gccttgaatt gcttttcctt cgtgatttac aatgcgggcg ggcataccaa aaaacatttg 2101 gaacaacaag ttcataccgt caaccaatag aagcttttcc atatataccc ccaaaaagaa 2161 atgttaaaaa caaattgcca gatgcgacaa aatgttgtat aataagctta gctatatttt 2221 aattataact aaagccaatt aaggacgcaa cgactttttg gttgcaactg tccaaaatat 2281 ataaacagcg aggaaaaata atgtttaatt cgattttaaa tgcaattaag gaacacgaca 2341 ctatcatcat tcacagacac acaaagccag acggcgatgc tttgggatcg caggttggtt 2401 tgaaatatat cataaaggaa aacttccccg aaaaggcggt atataccgtc ggggacggtg 2461 cgggacatta cagctttatg gacggcaccg taatggatga gattcccgac tcgttttatg 2521 acggcgcatt ggcaattatt ttggactgcg gcggggcgca tttgataagc gatgagcgat 2581 ataagcttgc aaaaacaact gtgcgatttg accaccactt gtttgccgaa aagattgcag 2641 atattgaagc aatcgactct tcatatgaaa gctgctgcgg acttttgaca gcgtttgcaa 2701 tggatatggg gctgaggctc tcccctattg cggcaaagtc gcttttcaca ggtatggtca 2761 ccgactcggg c // LOCUS sequence163 2752 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence163 VERSION sequence163 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2752 /mol_type="genomic DNA" /organism="" /note="sequence163" CDS complement(334..576) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFINKTNDGKNNICGDNIARIRKGMKISQRELADRLQIAGLDVDK NAIQRIECGKRFVTDIELVVLAKVLEQSVEELLNI" /locus_tag="LOCUS_5930" /note="MGA_780" CDS 689..1624 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRNSQLIQQEISETAAKLKALEAEYNVLSDAFSSETKAIYAKIDQ ENRKLDTLKEPKVSPLFLLGIIVMIALGILGGNLGLILQIPCFVIAIILVIIRSSKKKS LKAQFEKQKDEINNQIFEYEFEVNEIESKNPRIHELKEGISELEYALRSLKQEFSDAFA AEKSAREEAEIIKTLGVNNVLVHVSPTVEGPMYKLSTAYITIDGTSRGIVAQPFSIISL SPGIHSISITFDIEPVFSSYSAQTITTHDVQFSVRDDNKYFTFKLIFNYDTLRNKLSYN IDATKPSELSGFLTESKLSRSDFNSYLSNL" /locus_tag="LOCUS_5940" /note="MGA_781" CDS complement(1666..2280) /product="cytidylate kinase-like family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435157.1" /transl_table=11 /codon_start=1 /translation="MSVITISREFGSGGRELGKRLADELGFAYFDKEIVTMIAQSSKLD ENYVESMLEKHSWNIPITYGTSFSHITYSHGYSPQTAIISEQQKIIKQLASSGNCIIVG RNADVILEELNPLRLFVYADMDSKLARCRQRAKEGENLTDVQMKRYIKKIDRDRARNHL LLSDIPWGDRRGYDLMINTTGANIKAMVSAVAEYAKAHFGI" /locus_tag="LOCUS_5950" /note="WP_003435157.1 cytidylate kinase-like family protein (Clostridioides difficile) [pid:45.1%, q_cov:99.0%, s_cov:97.6%, Eval:7.9e-47]" /note="MGA_782" ORIGIN 1 aagactattt ggatgaaaag gtatttgcct ctatggcaag cattaccgaa cagcccgatg 61 aacgtgatgt tgatggcttc aacgcctata tcgagcgcta taagggtatg cttgaagccg 121 aaaaggcagc agttaagaat ctcaagtaaa cagatattga gaaaggcggg gaaacccgcc 181 ttttttgttt gattttcaaa ttttggcggg gcggaggccg tcgtgtgcca tttttagttg 241 agcgatagca aaactaaaaa tcaggcacgt gacggagggg acccgcgctt cgggcctcaa 301 caaaaaagga cagcacttgc tgtcctttta tttttatata ttgagcaatt cttcaacgct 361 ctgttcaagt accttggcaa gcaccacaag ttcaatgtcg gtaacaaatc gctttccgca 421 ctcgattcgt tgaatggcgt ttttatcaac atcaagaccg gcaatctgta atctgtcggc 481 aagctctctt tgagagatct tcattccctt tcggattctc gcaatattgt cgccgcagat 541 attgtttttg ccatcattcg tcttatttat gaacatattt ttctcctttt tgacatttag 601 tgcttgtcaa taaaagaatt atatgctata atgactgcag atatgacatt cggtgaatgt 661 catactacaa ttttttggag gtatcaaaat gagaaatagt caactaatac agcaagagat 721 ttccgagacg gcagcaaaac ttaaagcctt ggaagctgaa tacaatgttt tgtctgatgc 781 gttcagttct gaaaccaaag caatttatgc aaaaattgat caagagaatc gtaaactcga 841 tacattgaaa gagccaaagg tatctccatt atttttgctt ggcattattg taatgatcgc 901 tttaggcatt cttggtggca atcttggttt aattcttcaa ataccttgct ttgttattgc 961 aattatatta gtcatcattc gatccagcaa gaagaaatca ctcaaagcac aatttgaaaa 1021 acaaaaagat gaaatcaaca accaaatctt tgaatatgag tttgaagtaa atgaaattga 1081 atccaagaat ccaagaatcc atgaattgaa agagggaatt tccgaactcg aatatgccct 1141 tagatctctt aagcaggaat tttcggacgc tttcgccgct gagaagtccg cgcgtgagga 1201 ggcagagatt atcaaaactc ttggcgtgaa taatgttctt gtgcatgtat ctccaactgt 1261 tgagggacct atgtataagc tttccacagc atatataacc attgatggaa cttctcgtgg 1321 tatagttgct caacctttta gcatcatttc gctctctcct ggaatccact cgatttctat 1381 cacttttgat atagaacctg tttttagttc ctattcggca caaaccataa caacgcatga 1441 tgttcagttc tctgtaagag atgacaataa gtacttcaca ttcaaactga tattcaatta 1501 tgatactctt aggaataagc tctcatataa tattgatgct acaaagccgt ctgagttaag 1561 tgggttctta acagaatcaa aactcagtcg atccgatttt aattcgtatc tatcaaatct 1621 ataaaacaaa aaaggacagc aagcgctgtc cttttgcttt ttgtcttaaa ttccgaaatg 1681 tgcctttgca tattctgcaa cggcggatac catagctttg atatttgcac ctgtggtgtt 1741 tatcatcagg tcatatccgc ggcggtcgcc ccaggggata tccgacaaga gcagatggtt 1801 gcgcgctctg tcacggtcga tctttttaat atagcgcttc atttgaacgt cggtcaaatt 1861 ttcgccttcc ttggctcttt ggcggcatct tgcaagcttc gagtccatat cggcatatac 1921 gaacaggcgc agaggattaa gctcctccaa aatcacatcg gcatttcgtc cgacgattat 1981 gcagttgccg gaagaagcaa gctgtttaat aattttttgc tgttcgctga tgattgcggt 2041 ctggggagag taaccgtgag aatatgtaat atgggaaaag ctggtgccat aggttattgg 2101 aatattccag gaatgctttt caagcataga ttcaacatag ttttcgtcaa gcttgctcga 2161 ctgcgcgatc atggtgacga tctctttatc gaagtaagca aagccgagtt catctgcaag 2221 gcgcttgcca agctcacgtc ctcccgaacc gaattcacgg ctgatggtta taacactcat 2281 aacatcactc ccaaagatta tttttacaaa taaattttag cacaggataa gccttgtcgt 2341 caagaagcaa aatatcagtc cacttgcaat tggcagggta atggtgtaaa atagtcataa 2401 taaaccgaaa gaagtgattg cgtgtcgcaa agatacatat gttttgacgt tgaaacgccg 2461 aataacgaca acaactgtat gagctcaatc ggtatcagtg ttgttgaaaa cggcgagatc 2521 atatatgatt tttattccct tgtaaatccc gaggcgagat ttgatgcttt caatattgaa 2581 tttaccggta tcactcccga gatggtcgct gacagcccga attttgccga gctttggcag 2641 gtcattgagc cgataatgtc aagcggaatg cttattgcac acaacgcacc atttgatatg 2701 agcgtgttgg caaagtgcct taaaagatac gaaatatatt gtgaagaaat aa // LOCUS sequence164 2733 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence164 VERSION sequence164 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2733 /mol_type="genomic DNA" /organism="" /note="sequence164" CDS complement(231..791) /product="sigma-70 family RNA polymerase sigma factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393343.1" /transl_table=11 /codon_start=1 /translation="MNDREIVSLFLRRDEQVLALVKQKYEKLLYSVSYNILQSECDAEE CVADTITRLWQTIPPNEPENMAAYAIRIVKNLSLNKLRFSSAEKRAGDTYSLVLDELSE IIPSDENIEAYVDAKELGRLLNRFLEKLSPEYRVIFVKRYWLFRSVEEIATELGITTTK VTTSLHRTRKKLKDYLKKEGYEI" /locus_tag="LOCUS_5960" /note="WP_011393343.1 sigma-70 family RNA polymerase sigma factor (Moorella thermoacetica) [pid:24.4%, q_cov:97.3%, s_cov:90.2%, Eval:7.0e-09]" /note="MGA_785" CDS 979..1254 /product="autorepressor SdpR family transcription factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000006512.1" /transl_table=11 /codon_start=1 /translation="MGLQNTLKALADPTRREILNMLKQGSLSAGEIVERFDMTGASISR HLSVLKDADLIHDRREGKFIYYELNASVLEEIMLWISNLKGVNEDD" /locus_tag="LOCUS_5970" /note="WP_000006512.1 autorepressor SdpR family transcription factor (Streptococcus mitis) [pid:59.3%, q_cov:100.0%, s_cov:95.8%, Eval:6.6e-26]" /note="MGA_786" CDS 1247..1888 /product="SdpI family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002262698.1" /transl_table=11 /codon_start=1 /translation="MIKKNLGLIILTSVIILLPIIAGLIMWNYLPEQIPTHWNAVGEVD GWSGKTFAVFGLPLFILAVHIVCILATAADPRNKNIAKKPLTLVLWICPIISVLCNSLI YCAAFEIPLSIEIIMPLLFGALFVIVGNYMPKCKQNYSIGIKLPWTLNDEENWNRTHIL AGKLWVAGGFLEMMTAFFGGFILFFIISIAMIIIPTVYSYVLYKKTCDDL" /locus_tag="LOCUS_5980" /note="WP_002262698.1 SdpI family protein (Streptococcus mutans) [pid:43.8%, q_cov:94.4%, s_cov:95.8%, Eval:3.5e-48]" /note="MGA_787" ORIGIN 1 aatgtcgata gcgtaacctt cgtttgtgat gccaagattt tcgacctcaa ctgaaagact 61 tgaaataaac cacgcactgc cggttgcaaa caatataaga agcaccgcag cgatgagcaa 121 ggctgtcttg cgtttaattg tgtgcttaat tgcaggctta tgctcagtga ttgcttcttg 181 catatacttt tcatcaatga aatccatagc ggaaatcagt ttgttttcct tcatatttcg 241 taaccctcct ttttgaggta gtctttaagc ttcttacgtg ttctgtgaag tgaagttgtt 301 acctttgttg tcgtgatgcc aagctcggtt gcaatttctt cgacagatct gaacagccaa 361 tagcgcttga cgaagatgac ccgatattca ggtgataatt tttcaaggaa acgattaagc 421 agtctgccca gctctttggc atcgacatat gcttcgatgt tttcatccga cgggatgatt 481 tcgctaagct catcgaggac taatgaatat gtatcccctg cgcgtttttc ggcagatgaa 541 aagcggagct tattgagcga gaggtttttg acaattctga tggcatacgc tgccatattt 601 tccggctcgt ttgggggtat ggtctgccaa aggcgagtta ttgtatcggc aacgcattcc 661 tcggcatcac attccgattg caggatgtta tatgaaaccg aatatagcag tttttcatac 721 ttttgcttga caagtgcaag tacctgctca tctcgcctaa gaaacaggct tactatttca 781 cggtcgttca ctttcttcac tcctttcttg aaggtacctt tcaccatata tgacacggca 841 gaagacgtgt ttgtcacaat gattttacaa gttttgaaaa attgtgtcaa attccctatt 901 gacaaatgga tttgcggatg ctataataca tttagcattt aggctaaatg ttaaatgatg 961 gcacaaagga gagaggaaat gggacttcag aatacactta aagcccttgc tgatccaaca 1021 cgcagagaga tactcaatat gctcaaacag ggcagcctct cggcgggtga gatcgtcgag 1081 cggtttgata tgacaggtgc atcaatatcc agacacttat cggtgctcaa ggatgccgac 1141 ctgattcacg atagacgtga gggtaagttc atttattacg agctgaacgc atcggttttg 1201 gaagagatta tgctttggat aagcaatttg aaaggggtta atgaagatga ttaagaagaa 1261 tttgggattg attatactca cgtcggtgat tattcttctg ccgataattg cgggactgat 1321 aatgtggaat tatctgcccg agcagattcc cacccattgg aatgccgtcg gtgaggttga 1381 cggttggagt ggcaagacat ttgcggtttt cggtttgccg ctgtttatac tggcggtgca 1441 tattgtttgc atactcgcaa cagccgccga cccgagaaat aaaaacattg ccaagaagcc 1501 gcttacactt gttttgtgga tatgccctat tatatcggtt ctttgcaatt cgctgattta 1561 ctgtgcggcg tttgagattc ccttgagcat tgagatcatt atgccgttgc tctttggtgc 1621 gctgtttgtt atcgtcggca actatatgcc caagtgcaaa cagaattaca gcatcggaat 1681 caagctcccc tggacactca acgacgagga aaactggaat cgcacacaca tacttgcagg 1741 taagctctgg gttgcaggcg gatttttgga aatgatgaca gcgttcttcg gcggatttat 1801 tctcttcttt atcatttcga tagcgatgat aattattccc acagtttatt catacgtact 1861 gtataagaaa acatgtgatg acttataagg tcaagaaaga cggcaaagtg taaaactttg 1921 ctgtcttttt tgcattttaa gaaaaaattc tccttgataa aaaggcttct ttatgatatg 1981 attataatgt taagttatgg tcacttattg tggcttttga aaggatgatt gttgaatgaa 2041 gatgacattc cgctggttcg gaaagaacag cgacagcgtt actcttgaac agatcagaca 2101 gatacccggc ataaccggtc ttatgggctt tttggattat aaagacgcag gtgagatctg 2161 gacagaagaa gagatcaagg aatatatcga cggcgttcac gaagccggtc ttgagtgtga 2221 ggtaattgaa agcgtcaatg ttcacgagga cattaagctt ggacttccca caagagataa 2281 atacattgaa aactattgca tcaccattag aaaccttgca aagtacggcg tcaagtgcat 2341 tgtatataac ttcatgcccg ttttggactg gttgagaacc gatcttgcaa agcctaatcc 2401 cgatggctcc acaagtatgt attatgacga agctgagctc ggcacacttt cccctttgga 2461 tattgttaag agaactgctg aaaactgcaa cggtttctcg cttcccggct gggagcctga 2521 aagactttct cagcttgagc aggttttgga aatgtataag agcgttgacg aggaaaagct 2581 ccttgaaaac tataaatatt tcctcgacgg aattattccc acttgcgagg aatgcggcgt 2641 tgtaatggct tgccaccccg acgatccggg atggaagatc ttcggtcttc caagacttgc 2701 gcacagccag gaaggttacg acaagatcgt taa // LOCUS sequence165 2720 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence165 VERSION sequence165 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2720 /mol_type="genomic DNA" /organism="" /note="sequence165" misc_feature complement(2082..>2720) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010964705.1:phosphoribosylamine--glycine ligase" /note="WP_010964705.1 phosphoribosylamine--glycine ligase (Clostridium) [pid:48.6%, q_cov:98.1%, s_cov:50.0%, Eval:1.4e-52, partial hit]" /note="MGA_790" /locus_tag="LOCUS_5990" ORIGIN 1 ataagcgaac agcaatcggt atgcttcttt tcaacggaaa ttttctgaac catcgcctga 61 atgggggtga gctggttctt gccgccgaag ggcatcaaaa ctgtacatgc accgatggtg 121 gagtcgaatc tttcggaaag tccgcgcttg gagcagatgt taagatcatt tgcgattctc 181 ttatagtttt ctgcaaatcc tccctcaata acttcgtcct taacttcggg ctttgcaggg 241 gtaatgacaa tgtgcttgtc agcaccgttg gaatttaaga actcgcggga gatatcaaca 301 atttttgcac cgttccacat cataacgagt ctgggttctt ctgttacaac ggcaacaggg 361 caagcgttga ggttttcttc atttgcaagc tccaagaacc tttcaacatc cttggcttca 421 acaacaaccg ccattctctc ctgcgattcg gagatcgcaa gctcggtgcc gtcaagaccg 481 tcatatttct tgggaactgc gttcaaatca attttaaggc cgtcggccaa ttcgccgata 541 gcaacagata caccgcctgc gccgaagtcg ttgcaacgat tgattaaacg gcttgcctct 601 gcgtttctga acagacgctg gagctttctt tcttcggggg cattaccctt ctgaacttct 661 gcaccgcagg tttcaaggga tgtaagggta tgggatttcg atgagcctgt tgcgccgccg 721 caaccgtcac gacctgttgc accacccaaa agaatcacaa tgtcgcctgc atcggggcat 781 tcacgtctta cgttttctgc gggagcagct gcgataactg cgccgatctc cattctcttt 841 gcggcatagc catcgtgata gatctcatca acaatgcctg ttgcaagacc gatctggttg 901 ccataggagg aatatcctgc tgcggcagtg gtaacgatct ttctctgggg gagcttgccc 961 ttgattgttt cactgacggg ctttaagggg tcagccgcac ctgttacacg catcgcgccg 1021 taaacatagc ttctgcccga gaggggatcg cggatcgcac caccgataca ggttgccgca 1081 ccgccgaaag gttcaatttc tgtggggtgg gtgtgggtct cgttcttgaa cagcaaaagc 1141 caaggctcgg tcacgccgtc aacctcaacg tcgatcttga cggtgcaagc attaatttcg 1201 tctgactcgt caagcttgtt taaaagtccc tttttcttga gctgtttaac tgcaacagtt 1261 gcaagatcca ttaagcaaat gggctttttc gaaccaagct cctgacgaac cttgatgtat 1321 tcatcatagg tcttagccaa aagctcgtcc tcaaacttaa cgtcgtcaat aacggttaag 1381 aatgttgtat gacggcagtg gtcggaccaa tatgtatcaa tcattcgaat ctcggtgatg 1441 gtggggtcac ggtgttccga cttgaaatat tcctggcaga acgcaatatc gtcagcatcc 1501 atcgcaaggc cgtattcctt gacaaatgct tcaagacccg ctctgtcaag cgcgataaag 1561 ccctcgaggg tcttgacagt tgtgggaatg tcatatttta cattgagggt ctcgggtttt 1621 tcaagggttg cctcgcgtgc ctcaacgggg ttgatgacat atttcttaat ttctgcgatc 1681 tcattttcac tgagctcgcc ctcaagaaca tatacctttg cggttctgat taaaggacgc 1741 tcgccctggg agatgatctg aatgcactgt gccgcagagt cagctctctg gtcgaactga 1801 ccggggagat attcaactgc aaaaactgtt ccgtttgctt ccagctcatc ggtcacaatg 1861 tcaagctgag gctccgaaaa aacggtcttt tttgcatagt cgaaaagctc gggtgtgata 1921 ttttccgcat catagcggtt aatgaccctg acgttttcaa gcgcgcaaat gcccaaaagc 1981 gttttggcgt cattcaaaag agccttggct tcgtttgcaa gctcgctctt tttttcaaca 2041 taaactctat ataccatata gcatttacct cttttcgata attaaaggca ttttgcgccg 2101 atgtcacggc gatagtatgc gttttcaaag ctgattcttt cagcattggc gtatgccttg 2161 tcaagcgctt ctttaaggct gggggctgtg gcggtgacgc ccaaaactcg tccgccgctg 2221 ttgaccaatt ttccattttt aagagcggcg cctgcaacat aaacgctgtt tgaaatatcc 2281 tcggggatgg tgatctcata tcccttttca tagctaaggg gatatccctt ggatgccatt 2341 acaacgcagg cggcgtgctc gtttttaaac ttgacctcgc aatcggcaag ggtgccgttg 2401 gtggtggcct gcataactgt caaaagatca gattcaagca aaggcaaaac gacctgggtt 2461 tcggggtctc cgaaacggca gttatattca attaccttcg ggccgttagg agtgatcata 2521 agtccgaaat aaaggcatcc cttaaaggtt ctgccctctg cattcattgc atttatggtc 2581 ggaaggaaga tcttttccat acataccttt gcaatgtcct cggtatagtg ggggttgggc 2641 gcaactgttc ccataccgcc tgtattaagt cccttgtcgc cgtcaagtgc gcgcttgtgg 2701 tccattgacg aaaccatagg // LOCUS sequence166 2677 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence166 VERSION sequence166 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2677 /mol_type="genomic DNA" /organism="" /note="sequence166" CDS complement(1680..2057) /product="50S ribosomal protein L7/L12" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005782165.1" /transl_table=11 /codon_start=1 /translation="MADLKAFAEQLVNLSVKEVNELAQILKDEYGIEPAAAAVAVAAGP AAAGAAAAEEKSSFDVVLKNAGASKLAIVKLVKELTGLGLKEAKEMVDGAPSVIKEGLA KADAEGLKKQLEEAGAEVELK" /locus_tag="LOCUS_6000" /gene="rplL" /note="WP_005782165.1 50S ribosomal protein L7/L12 (Bacteroides) [pid:75.2%, q_cov:100.0%, s_cov:100.0%, Eval:7.8e-43]" /note="MGA_792" CDS complement(2095..2625) /product="50S ribosomal protein L10" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005791518.1" /transl_table=11 /codon_start=1 /translation="MRKEDKALIIEQIANTLKEYSCFYLTETAGLNAEKTSELRRACNK ADIKLMVVKNTLLRKALESLDGDYSELYPSLKESTSIMFSNTGNAPAKLIKEVLKNDKD ATLPRFKAAYVEETVYVGADQLDTLANIKSKNELIADVIALLQSPAKNVVSALTSGGTK LHGILETLSKKED" /locus_tag="LOCUS_6010" /gene="rplJ" /note="WP_005791518.1 50S ribosomal protein L10 (Bacteroides) [pid:66.7%, q_cov:98.9%, s_cov:100.0%, Eval:3.3e-58]" /note="MGA_793" ORIGIN 1 aggagtctcg atcggacaca gacgtccata atgggtatag tgcacgtctc gcacctcaaa 61 tccggcacgt tcacgtgaca gaccgccggg accgagtgcc gacatacggc gcttgtgtgt 121 catttcggca agcgggttgg tctgatccat gaactgcgaa agcgcattag tcccgaaaaa 181 cgtgttgatt accgacgaaa tcgtcttggc attgataagg tcgatcgggg tgaacacctc 241 gttgtcacgc acattcatgc gttcacgtat cgtacgcgac atgcgggcaa gtcccacacc 301 aaactggtta tacagctgct cgccgacagt acgtacacga cggttgctca aatggtcgat 361 atcatcgaca tcggttttag aattgataag ttcgatcaga tacttgatga tggcaattat 421 atcctccttg gtgaggacct tgacatccat cgaagtaccc agattcaatt tcttgttgat 481 acggtagcgt cccacctcgc cgaggtcata acgcttctcc gagaagaaca ggttggtgat 541 cacctcacgg gcactggcgt catccggtgg ctcggcgttg cggagctggc ggtagatata 601 ctggatagcc tccttctccg aattacttgt atccttctgg agtgtattga atattatgga 661 atagtcgctc gtgttgacat cctccttgtg aaggagtatt gtgctgacac ccgagtcgag 721 tatatcctgg atatgttcct cttcaagtac ggtttcacgg tcgatgacca catcattgcg 781 ttcaatcgat acaacttcgc cggtatcctc gtcgacaaag tcttcaaccc atgtcttaag 841 gacacgggcg gcgaatttcc gtcctaccgc ctttttaaga ttggttttgg ttaccttgag 901 ttcctcagcg agaccgaata tctcgatgat gtccttatca ctttcaagac ctatcgcacg 961 caacagggta gtcacaggga gcttcttctt acggtcgatg taagcataca tgacattgtt 1021 tatgtcagtg gcaaactcta tccatgaacc gcggaacggg atgatacggg ccgaatacag 1081 cttggtcccg ttggcatgtg tgctctgtcc gaagaacact ccgggcgaac ggtgcaactg 1141 tgacacaacg acacgctcgg cgccgttgat tacaaacgtc cctttctcgg tcatatatgg 1201 gatagggccg agatacacat cctgaacttc cgtcgcaaaa tcttcgtgat caggatcggt 1261 acagtaaagt ttaagttttg ctttgagggg tacactataa gtcagacctc tttcaagaca 1321 ttcgtcaata gtgtaacggg gaggatcgat atagtagtca agaaattcca gcacaaagtt 1381 gttacgggta tccgcaatgg ggaagttctc ggcaaaaacc ttataaagac cctcattatt 1441 tcttttttcc ggaggagtat caagctggag gaagtccttg aacgacttca attgcacctc 1501 aagaaagtcg gggtaaggaa gaggattctt taccgacgcg aagttaacac ggggtttatc 1561 aaatgaaact gacatctaaa ataacgttaa agggaactca aattaaaata taacacaaaa 1621 aggttaagaa tcatcggtca ggaggattct taacctaatt acctgcaact caggcaatat 1681 tatttaagtt caacttcagc gccagcttct tccaattgtt tcttgagacc ttcagcgtct 1741 gccttagcaa gaccttcttt gattacgctg ggtgcgccgt caaccatttc tttagcttcc 1801 ttcaagccaa gaccggtaag ttccttaaca agcttaacga tagcgagctt gcttgcacct 1861 gcattcttaa gcactacgtc aaaagatgac ttttcttcag cagcagctgc acctgcggct 1921 gcgggacctg cagcaactgc aacagctgca gctgcgggct caatgccata ttcgtcctta 1981 aggatctgag caagttcgtt tacttcctta actgagaggt taactaattg ttctgcaaaa 2041 gcttttaaat ctgccatttt tttatgattt tattgattat ttactaattt ggttttaatc 2101 ttcttttttt gataatgttt caagtatgcc atgaagcttg gttccgcctg atgtaagggc 2161 tgaaacaaca ttcttggcag gagactgaag aagagcgatg acatcggcga taagttcgtt 2221 cttgctcttg atgtttgcaa gagtgtcgag ctgatcagca cctacatata cagtctcttc 2281 aacgtatgca gccttgaaac ggggtagagt agcatccttg tcattcttaa gaacctcctt 2341 gatcagcttg gccggagcgt taccggtatt ggagaacatg attgaagtcg attccttaag 2401 agaaggatac aattcggaat agtcaccgtc gagtgattcg agagccttgc gcaacaaggt 2461 gttctttacg accatcagtt ttatgtcagc cttattgcag gcacggcgca actcgctggt 2521 cttctccgca ttcaatcccg cggtttcggt aaggtaaaag cagctgtact ctttaagagt 2581 attggctatc tgttctataa ttaaagcttt atcttccttt ctcattttct taatttttta 2641 aattatgcgt caatcgactt ggagtcaacc ttaatac // LOCUS sequence167 2675 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence167 VERSION sequence167 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2675 /mol_type="genomic DNA" /organism="" /note="sequence167" CDS complement(497..1162) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKTALKAFIGIMVILCFALLPLSVISAAPAETGNAFDVQNFVYF SDVDELTDFISANSGKTAAELCDDKNKLGAYEFILSGEGFIYLPGGFDGFPDDQWANGI IEDTGIYISDNRIVIIGAQGNQKYMLTCTYAESSVDGGTVLPTETYKANGIDGDVKFAT GGGASYYFWEQDGYAFSIWMIDGLEFDEYSNMIPAQRISLSGDIVINEPVEIAIEEIE" /locus_tag="LOCUS_6020" /note="MGA_795" ORIGIN 1 ccggtgttga tgatttcgtc ttcagagtag ttgtggaagg agtcgtacca gctgtgatac 61 ttgattgtaa ctcctgcgcc tgcagcaact tcagcatcgg gcaatgtgat acctgcagca 121 gccaaaattg cttctgaatc ctcggttgaa agggtcaact taacgatttc gcgcttttcc 181 gagccacagc caaccaaagc gaagatcatt aaaacaacca gaccgagagc gataagtttc 241 tttgtcatgt ctaaaaattt cctttcggta atatcagttg tacaaaacgg cgccacctct 301 ttgcaccatt tcatagctat tatatatttt aacacaatct ttaattaaag gtaaattagc 361 gtaatgtatc aatttgaatg ttgttttttg ttaatattgc catggcaacc gcggacaaac 421 accaaaatat tgcaaaaact gatctcgtga aaacataaaa actgcccacc ccgcgaggag 481 tgagcagttg gtttcattat tcaatttcct caattgcgat ttcaacaggc tcgttgatta 541 caatatctcc cgataaagaa atcctctgcg cgggaatcat attactatac tcgtcaaatt 601 ccagtccgtc gatcatccaa atgctgaatg catatccgtc ctgttcccag aaataatatg 661 acgcgccgcc gcctgttgcg aacttcacat cgccgtcgat gccgttcgcc ttatatgttt 721 ccgtgggcaa aacagttcca ccgtccacag aagactcagc ataagtacag gtgagcatat 781 acttttgatt tccctgcgca ccaatgatga caattcggtt gtcgctgatg tatattcccg 841 tatcttcaat aattccgttt gcccattggt catcggggaa accgtcaaat ccaccgggaa 901 gatatataaa tccctcaccc gacaggataa attcatatgc accaagcttg tttttgtcgt 961 cgcaaagttc tgccgcggtc tttccgctgt tggctgatat aaaatccgtc agctcgtcaa 1021 catcggaaaa ataaacgaaa ttctgcacat caaaagcgtt gccggtttcg gcaggcgcgg 1081 cggaaattac agataaaggc aataatgcaa agcaaagaat caccataata cctataaatg 1141 cttttaacgc cgtcttcttc aaaagtatca cctcctgtta gtttacataa taattatagc 1201 aaaaagcttc acttttgtcc atttacatag tatccattat ttttatatgg gctttgttca 1261 tattcaacat aaaaaactgc ccaccccgcg aggagtgagc agttgatatt gtccgagatt 1321 acggattctg cgcgatgaat tcttcaacct ttgtgttgag ttcttcaacg tagtaagtca 1381 aaggttcggt gttcttttcc ttgatctgtg cccaagtgga agcatcagag cggtgaccgt 1441 tgtcatagaa gtcggaaatg tagcttgaaa gcttgtcgcc gaagttatag gagaagatgg 1501 tagcgtcgga gttgttagcg atatcgtagc agatatccca catctcgagc atttcatctg 1561 tccagaggta ggtttcttca agctgacgtc tgtcgatgga gattacggta gggtcaagaa 1621 tcttgaatct gtcgcaagat gccaaaagtg cagcgccttc gtggttttcg ccgcccttaa 1681 taagagcata gccgttgggg ttgcagttga gataatactt gccgtcgccg ttgttatctc 1741 tgggaacggg aacgaacata agctcgcctg cggtgacgtc gccccagacg ttggacacat 1801 cttcaacagg accggtgaat acgtatggac ctctgatatg gaagaggcaa aggccttcct 1861 tcataccgcc gccttcaacg ccgtttctga gtgaccagcc attgttccac caaggatata 1921 cacactggtt ctttgccagg tcataaagca tatttgcagc tctttcgagt ctggggtcgt 1981 caacgttggt gacaaatctt gcactattgg tgtcgtagta tacgatctca gcaccggtag 2041 agttcataag gcctgtagtg aagctccagc catccaaagc atatctatct tcgtcgggat 2101 cggagaattc tacgcacatt tcatagaata cgtcccaagt ccattcatcg ttatagtaaa 2161 gagtagcggg atcatcgaag ccccattcct caacaactct tctgttatat gcacaaactt 2221 caccgaagcc gatgtcggtg cagatggaat atacattctc acccagagcg cagtagttgt 2281 atacaaagtc cttaacgccg ttccaaagag gatcgtcata gtcgatgtaa tcatttacgg 2341 gagcgaagaa gccctgcaat gtcataccgg gatatacgcc tgcaccggat tgggtgaagt 2401 cgggggaagt gcctgccaga atgaggttgg caaggtcatc gccgtaagaa ccccaggtgc 2461 attcgatcca ctgtacatca cagccatact tttcctggaa ggtccagaca ccggtgttaa 2521 ccacttcacc ttctgaatag ttgtggaatc cgtcatacca ggagaaccac ttaacgatgg 2581 agcctgatgc agcaactgtt tcagcggcgg gaagtgtgat acctgctgct gccaaaattg 2641 cttcggagtc ctcggtagaa agggtgagct taacg // LOCUS sequence168 2670 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence168 VERSION sequence168 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2670 /mol_type="genomic DNA" /organism="" /note="sequence168" CDS complement(796..984) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLYTVLSEFDIFFEDYAPDEMVDVSGRQIEYISLNKNKQITNLFS TNPAMYLNQRYMPGKHY" /locus_tag="LOCUS_6030" /note="MGA_798" CDS complement(984..1685) /product="ATP-dependent Clp protease proteolytic subunit" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392585.1" /transl_table=11 /codon_start=1 /translation="MQEETVENAVQEQSDELEKFRDVELKNSKHCIHCLSIIGQIEGHY ILPPQNKTTKYEHIMPALVAIEQDMSIEGLIIIINTVGGDVEAGLALAELISSMHTPTV SLVVGGGHSIGVPLAVSAKKSFIVKSATMTVHPVRMTGLVLGVPQTLSYFEKMQERIVR FVCDNSNISSSRFEELMMKTGELVMDVGTVLTGEDAVKEGIIDAVGGLQDAIACLYEMI ENEPSKKVQVK" /locus_tag="LOCUS_6040" /note="WP_011392585.1 ATP-dependent Clp protease proteolytic subunit (Moorella thermoacetica) [pid:58.5%, q_cov:89.7%, s_cov:81.9%, Eval:3.4e-71]" /note="MGA_799" ORIGIN 1 ataaatataa aataccttga agcgatcgga tttcatcagc cattgaacaa gcttaattgc 61 accgattccg acaagtgccg aaaccaagaa gccgacaatg cactggccaa ttccaatatt 121 gactccttca gcaatgccgt ccttaacctc aacaagacat cctcccaaaa ttgcggggat 181 tcccagaatg aaggaatagc ttatagcttc acttcttttg agtccgcaga aaagacctgc 241 ggagatagtt gagccggagc gggaaacgcc gggcaatagc gcaatcgctt ggaaaaatcc 301 gatggttacg gcatcttttg ttctgacatc ggtcgcttcg cggtcaccgc tgctgtggtc 361 agccataaac aaaatcgcag cagtatataa gaagcaaata ccttcaacaa atatgcttgc 421 atcttcacta aacgactcaa agaagtcctt gaatatgtaa aacgggatga gcacagccgt 481 tgaaattatg aacataaaca aaagcctgcg tgtcggttcc atattcttaa aggtgaatcg 541 tcccgtaaaa atgtctttaa ttaactgcag agcttccatg aacagagcaa atatctgcat 601 tctgaataca accagaacgg caataagtgt gccaagatgc aaaattgcag agaacattaa 661 cgctccctcg ccgctgttac ctgtgaagtg ctgatatagc gaaagatggc ccgaagatga 721 tacaggcaga aactcggtta ttccttgaat tattgcttga agtattgagt tgatatatga 781 catttttatc ctccgtcagt agtgtttacc cggcatatag cgttggttaa gatacatcgc 841 cgggttggtt gaaaaaaggt tcgttatttg tttattcttg ttaaggctga tatattcgat 901 ctgtcttccc gaaacatcaa ccatttcgtc gggggcgtaa tcctcaaaaa atatatcaaa 961 ctcgctgagc accgtatata gcatcactta acctgcactt tctttgaagg ctcgttctca 1021 atcatttcgt ataggcaagc gatggcatcc tgcaatccgc cgacagcgtc tataatgcct 1081 tctttaacag catcctcacc tgtcagcaca gttcccacat ccattacaag ctctcctgtt 1141 ttcatcatca gctcttcaaa gcgggatgac gaaatgtttg agttgtcgca aacaaagcgc 1201 acgatgcgct cctgcatctt ttcgaaatag gaaagtgtct gcggtacacc caagacaagc 1261 ccagtcatcc ttacagggtg gacagtcatg gttgcgcttt tgacgatgaa tgacttcttt 1321 gcactaacgg caagcggtac accgattgaa tgccctccgc cgacaacaag cgaaactgtc 1381 ggtgtatgca tagatgatat aagctcagca agggcaagcc ctgcttccac atctccgccg 1441 acggtattta taatgatgat cagtccttca atggacatat cctgctcgat tgcgacgagc 1501 gcaggcatga tgtgctcata tttggtggtc ttgttctgag gcggcaaaat gtaatgcccc 1561 tctatctgtc caatgatgct taagcagtgg atgcaatgtt tggaattttt gagctccaca 1621 tcgcgaaatt tttccagctc gtccgactgc tcctgcactg cattttcaac tgtttcttcc 1681 tgcatatatc ctccaaggct ttttagggtt attatccgca gtttcagccg cgatatacgc 1741 taaaaatgaa ggatttaagt cacttatctt caaaatgaaa acaattataa atattatata 1801 cctattaata cttatagtca aggacagaga tgggtaaaat ggcaagattt gcaagatttc 1861 attcaaaaag ttttaaaaat tttaacgatt tatactgtaa aagtgatcgt caaatacttg 1921 acaataagac aaatataaac tactatatat agtattgaat aagttaagtt tcgaagggag 1981 ttttttatat gggacttaca cttgctgaaa agatcctcaa agcgcattgc gttgacgggg 2041 agtttgttaa agggaaagaa atcggaatta aaatagatca gacccttact caggatgcga 2101 cgggaactat ggcatatctt gagtatgaag ctatgggcgt accgcgagtc agaaccgaaa 2161 agagcgtggc atatattgac cacaacactc ttcagtcggg ctttgaaaat gccgacgacc 2221 accgtttcat cggttcggtt gcgagaaagc acggcatatt cttctctcgc cccggcaacg 2281 gcatctgcca ccaggttcat cttgagcgtt tcggcaagcc cggaaaaacg ctcatcggtt 2341 ccgattcaca cacacccaca ggcggcggat tgggaatgat tgcaataggt gcaggcggac 2401 ttgacgttgc tgttgcaatg ggcggcggta catattacat cacatatccc aagatcgtta 2461 aagttgaact tttgggtaag ctctctcctt gggtatctgc taaagatgtt attttggaag 2521 ttcttcgcag aatgagcgtt aaaggcggcg tcggcaaaat tattgaatac accggcgagg 2581 gcgttaagac actttccgta cccgaaagag ccaccattac aaatatgggc gctgagcttg 2641 gtgcaacaac gagcattttc ccctctgatg // LOCUS sequence169 2663 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence169 VERSION sequence169 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2663 /mol_type="genomic DNA" /organism="" /note="sequence169" misc_feature complement(262..>2663) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_013389449.1:glycoside hydrolase N-terminal domain-containing protein" /note="WP_013389449.1 glycoside hydrolase N-terminal domain-containing protein (Bifidobacterium bifidum) [pid:39.0%, q_cov:88.9%, s_cov:40.5%, Eval:7.2e-144, partial hit]" /note="MGA_801" /locus_tag="LOCUS_6050" ORIGIN 1 aatggactgt taagccaccc ctctatttta acgtggtggc gtcaaattct tattccctga 61 ttcaatcata aaaaacgcag aaaatcaatc tgcgtttttt acatttgttt cgtgcttttt 121 ctttgtatac gccgccactt atgtcggatt ttcgaccaat tgtgcaaaag atttgacaag 181 ttatgcttac aacacagaca acagaagccg gatggctagg agaacctggc tatccggctt 241 ttgatttgac aatatgccac tttatttgtc ggtatcagac tcagttgtgt aagttttgaa 301 atagtcaatg gaaatgctgt ggtccttaac tcccgtgacg atttcatcca ttacaacaac 361 tttaattgta tgtttaccgt attcaaggtc ggtttttgca aataccaacg tatcctgagt 421 tttggtggat gtatgaacca aataatagtc cccgatctgt tctccgtcga tgtatataac 481 aacgccgtta tagtttggtt ttgcaactga gtaaagttca attcccgtac catagaaggt 541 aagttctgca gcagagcctg ctgaccacga acagttattt gttgacatat agtgatcatc 601 ttcggtgaaa agagtccagg aaccgctgta aataactctt gcatcgttac tgtcaatggt 661 ttcatttcta ccgcctactt caacggcttc atttgaagcg gcgctttcca tatcgttaac 721 actgacagag gttacaaaat atgtgtaata tatcgaatcg gcagattcca agtctgagat 781 ggcagtggta tcaatatact ctgtatttgt cacatcagag gcaacaagct tggcttccaa 841 agaatcggtg cgacgatata cattatagct ttcagcactt gcaatttcat cccaggtgat 901 cttgattttg tctgcgctat atcttacagc ctgaacattg tttggagcag taatcgtgac 961 cttgttcttg attgtatagg tctcgccttc ctttgcctca aagctgatgc ggtttttctg 1021 aacagtttta tattccactt cgtttccgtt agaatcagta attgagaaaa gatcgccaat 1081 aatcatctga acagcacatt caccgtcgtt agcagcttta acagtaactt cagttgctaa 1141 gcggttttcc cactttatat cgacctcata gtttccgcga gctacaagac cgttaacata 1201 accatcgctc caagcttcag gaatggcagg gagaatgtta atgtaaccca tgttgctctg 1261 cattaaggct tcggcaacac ctgcagtata accaaagttg ccgtcgatct ggaaaggcgg 1321 atgagtatcc caaagattat caagaatacc tgtttttatg agcgtttcga cgagcaggta 1381 catatgctct ccgtcaccga gacgtgccca agtattgatt ctttgtccca ttgcccatcc 1441 ggtagatgcg tcgactctgg aatcaagtga tacacgtgca gcttcgaacc attcaggtgt 1501 gtcaactgaa atgagatcgc cgggataaag tcccaaaaga tgagaaaggt gacggtgacc 1561 gtaagcgtct gagtttggta cacttccaag cctggtttct tcgtaccatt ccttgatctg 1621 tccgttagtt ccgatttcaa tcggttcgcg caaattggaa agaatatctc tccactcatt 1681 taatgttgct tcatcttcgc caacgatttc acctgcagtg atagtgtcgg taaacagctg 1741 ccaaataagt gactgctcat aagtgtttcc gtttgttctc ggtccgtgtt cgggcgaata 1801 tgcaggagtt gagatcagct tgccgttttc atcttcaaca aggatctggc tataaaagac 1861 agtctgctcc ttcataatag gatagatggt ttccttcagg aactcagcat ctaaagtgta 1921 ttcataatat tcccaaacgt tttgtatcat ccacggcaca cttgcaggcg accagcccca 1981 gtcaaacacc catccgggtg cagtccagcc gtaaggcgta gtctgtgtat tggcggtaaa 2041 accgttttgg gggttatctt ctgtcgattc aacaccgaag tacatatttg cagtaactct 2101 gcccggctca cgaagtccat caacataatc aatcatcgga attgcacatt cagcgagatt 2161 tgtattatat gcaggccaat agttcatctg caaatttaca tttatatggt aatccgagtt 2221 ccatgcgctt ccgtttgtgc caacccaaat gccttgcaag tttgcgggca aaatgttgtt 2281 ctcgcgagat gaggatacca aaaggtatct gccatattgg aacagcaaga cctccaagta 2341 tgctttttct gagtcactaa gtgaaccgga tttgtatgct gccaaaagct cgtcggtagt 2401 taaattcggc attttctgtc cgaggttgag gtcaactctt gcgagcatgt ttgtgaagtc 2461 cactctgtga gcatatttca aatcgtcgta gctcttcttt gcagcctttt caacatattt 2521 cttcactctt tgatcaagct ctgttttaga ctcgcctgtg cgataggtgg gatagtcaag 2581 tgcataatca gttcccatac ttaaaatgat tgttgcttcg cttacccccg aaattgccag 2641 tttatctcca tctgaattaa gct // LOCUS sequence170 2653 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence170 VERSION sequence170 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2653 /mol_type="genomic DNA" /organism="" /note="sequence170" CDS complement(1716..2651) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSLCSCTPADAPFNAGTPDTNDPIVSQDTPMPNVTFEEVEADLPE NLVMIEYEGYVSEIWDEDGLTCFKLFNYRLDGDTYRSVEYTFGIYPNEHFKTTAVNPEI KVEDHVKIYSFTYDGNKSQKYHSADIITVIPKQGTTFYALVLNVNGTNIFAEGLEINGS NNRGLFDFTIADDTKITYNYTEIEASDISAGDIIAVTSSGTVLETYPSTYLGITQVSLL TPANKVPDYDPLVNASVTAKTFTGRVNWIYTHNGRIHLGMYDDTEWYCEVILPEGYETS AAVGETVTVTVDAVATINGLTKYSSPEVTK" /locus_tag="LOCUS_6060" /note="MGA_803" ORIGIN 1 atggagaaaa cagcgataat gaggattacg gcaacaattg caacaactgc gacagcagca 61 atgatgatta tagtcgcaat gctggggccg ggcttgcctg cacgggtgtt gatgaaagga 121 ttgacaggtt cgtcggcctc gacgggagcg acatagttag ggtcacctgc aagatccaaa 181 acgatggttg taaggcttcc tgcgggaagc tcatagtcct cgctgtattt acctgcttcg 241 agccaatatt tgtttctgaa tcggttttcg gttttaagcg actgataggt tacagagcct 301 aagatctcct cacctacgtc aagagccagg tattcgttgg aatcggaaag attgacagcg 361 acaacgacca attttttgcc gtcgggcgat ttgaaggcag tcatattcga ttcaaggtct 421 tcgttgatat caacgcggat gtagccttct ttgatgtact tggagaagtg catcattatg 481 taatggttgc cgccgcgggt aagatcggca ttttcacctg catcggcaat ttcaatgaga 541 gttattcccc tatcgggtgc ccaggcaccg ttccagaaga gatatgcgtt gaggtcttca 601 tagttgagtt catcgatgat aatgtttgca aggccgaagt agtcatcggt ataccattcg 661 gtctgccaga tgggataatc ggggtatgca gcgcgaattt ttgagaagtt gttgggagaa 721 aggtcagtac cgtaaagatg gtgacccatg atttcaaggc tttcgggaca gttttcaatt 781 acaggctcca aatatccctg caaaaggtcg ccgtagccgc ccattgtttc agcgccaagc 841 aaaacgggag cgaattcgcc gaaggcttct ttaaaggctt catataccgc gatgtgagct 901 ttccaatagc agcagtagtc atcggtttct tccattccaa ggaagaatcc tgcttcttgt 961 cttgccttgc cgttttcatc aacgtggcgt tcctgaagct caatttcgtt ggaaatagag 1021 aaataatgaa cgggaatgcc tgcatcaaag aagtatttga ttgactcaac acaatgttgg 1081 gccaaggcat catacatata ctcaccattt tcatccttgg caagggtata atatgagaag 1141 ccctttgcgg aaagctcagt aaatgcaacc caaggaaggt cgcggtcata ctgtccccag 1201 ctggttacca aaactgtagg ttcgattcct cttgcaacag cagcatcata gagcttttta 1261 tatgcaggat agccgtcaac ggcattctgg tgctcatcgc cgcagaggtt gaggtcgcgc 1321 aaacgtatga tattgaattc ggtgtcgttg aagatccagt cgtatgccag atcggcattg 1381 ttatgattta aaagccagtc ggcataccaa gtgtatgatg ctccccagcc gtcaatagtc 1441 tggtgtgtcg aggacatatc gaccgttgcg ttggtgtcgg cgctgacact tacggaaaga 1501 gctccgacgg caatgagcaa tgccattaaa acgcatagga tttttgacat tttcatatta 1561 tcactccaaa agcaaataaa tcgggggtat acccctatag ctatatatta caccttttga 1621 acgtgaattg gcaatgacaa attcttattc tttgattgat atatagaaat aatttcataa 1681 aaatctccgc cgaaaagtac gacggagatt ttgacttatt ttgtaacctc cggagaggag 1741 tatttggtga gtccgttgat cgttgcaacg gcatcgacgg tgacggtgac tgtttcgccg 1801 accgcggctg aggtttcata gccttcgggg aggataactt cgcaatacca ctcggtatcg 1861 tcatacattc caaggtggat tctgccgttg tgggtatata tccagttaac tctgcctgta 1921 aaggtctttg ccgttacaga cgcattgacg agcggatcat aatcaggcac cttgtttgct 1981 ggagttaaaa gcgaaacttg ggttataccc agatatgttg aggggtatgt ttcaagaacg 2041 gttccagaag atgttacggc gataatatcg cctgcggaaa tgtctgaagc ttctatttca 2101 gtgtagttat aagtgatttt agtatcatct gcgatggtaa aatcgaaaag tcccctgttg 2161 tttgagccgt tgatctcaag gccttcggcg aagatgttgg tgccgttgac attgagcacc 2221 aaagcataga aggtcgtgcc ctgtttggga atgacggtga tgatgtcggc gctgtggtat 2281 ttctgcgatt tgttgccgtc gtatgtaaag ctgtatatct ttacatgatc ttcaaccttg 2341 atttcgggat taaccgcagt ggtcttgaaa tgctcgttcg gataaattcc aaaagtatac 2401 tcgacagacc tataggtatc accgtccaaa cggtaattga atagcttgaa gcaggtcagg 2461 ccgtcttcat cccagatttc ggaaacgtag ccttcatatt cgatcataac gagattttcg 2521 ggtaggtcag cttcaacttc ctcgaatgta acgttaggca taggagtatc ctggctgacg 2581 attgggtcat tggtgtcggg tgtgcctgca ttgaacgggg catcagcggg cgtgcaggag 2641 cagagcgaca aag // LOCUS sequence171 2647 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence171 VERSION sequence171 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2647 /mol_type="genomic DNA" /organism="" /note="sequence171" CDS complement(421..2349) /product="DNA mismatch repair endonuclease MutL" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000516465.1" /transl_table=11 /codon_start=1 /translation="MGNIHVLEKSVYELIAAGEVIERPSSVVKEMIENSVDAGASSITV EIKNGGRTYIRITDNGCGMTAEDIPLAFVRHATSKILAKDDLVSISTLGFRGEALASVC AVSKVEVMTKRREDDLGSHYVIEGGEELELDSIGCPDGTTFIIRDLFFNVPARLKFLKK DVSEGNAIANVVQKLALSHPEVAFKFIRDNKTELITSGDNKLLSVIYSVFGREFHSSCI PVDYTYNGVSVSGYVTKPLMSKANRAFQNFFVNSRYVKSVTCMVALEEAYRNQIMTGKF PGCVLTVKINPSNIDVNVHPAKIEIRFSDEKSVYDAVYFAVKNALMNFDAPTEIVYEEK KPKTLTHQEIFSKPAEPDKSVQLMFSSTRKSIDFSDIPKQETVATQNRPAVREVVSFEE PEEKNEPIKPAPVVTPIVKEPTPEISDRFKYINQSSFAKVEKPAEPEIIPEVSQKPQVK VIGELFKTYIVCECGEDMYLIDKHAAHERHNFEKIKSGAESLDMQALIAPIDVLISYEG YDAIRDNPDICKRLGFGIELLDAPKISLYGVPVLIGDEDPADLLTRFSDSLSSGKIGSG SELFDDLFHSIACKASVKANSITDKIELEELTKLIFEEDIRYCPHGRPVLIRLSKYEIE KMFKRIV" /locus_tag="LOCUS_6070" /gene="mutL" /note="WP_000516465.1 DNA mismatch repair endonuclease MutL (Bacillus cereus) [pid:32.6%, q_cov:100.0%, s_cov:100.0%, Eval:6.9e-94]" /note="MGA_805" ORIGIN 1 atatacattg cccttttctt ttgaaagttc caaaagctca tcgcggagcg tggtagatga 61 acaagattcg tcgaaggtaa tattatccac caaagaattg atatacaaac ccgttccgcc 121 gcaaacaagg ggtatcattc ccctattgcc tatatcttcg atagctttgt gggctaatga 181 aacataatca gcaactgaaa agctgttact cggttctaaa aaatcaatga ggtgatgagg 241 tactccatcc atttcttcgg gtgtaggctt tgctgtggca atggtcatac ccttgtagat 301 ctgcattgag tcagcggaaa cgacttcaca gccgatagtt ttggcaaggg caatgcttaa 361 agcggtcttg ccggaggcgg tggggccgca tataactatc agagactgat tggtcatact 421 ttacacgatc cttttaaaca ttttctcgat ttcatacttt gaaagcctaa ttaatacagg 481 tcttccgtga ggacagtatc ttatatcctc ttcaaaaatc agtttggtta gctcttcaag 541 ttcaatttta tctgtaatgc tgtttgcctt tacagatgct ttgcaagcaa tcgaatggaa 601 caaatcatca aacagctcgc tgcccgagcc gattttgcca gatgaaaggc tgtcggagaa 661 tcttgtgagt agatcagctg ggtcttcatc gccgattaaa acgggcacac cgtaaagaga 721 gattttcggt gcatccaaaa gttcaattcc aaagccgaga cgcttgcaaa tgtcggggtt 781 gtccctaatt gcatcgtagc cttcgtagga tattaaaacg tctataggag caattagcgc 841 ctgcatatct aacgattcag cgcccgattt gattttttca aagttgtgtc gctcatgagc 901 ggcgtgcttg tcgatcaaat acatatcttc gccgcattcg cagacgatat aggtcttgaa 961 caactcgcca ataaccttaa cttgaggttt ttgcgagacc tcgggaataa tttccggttc 1021 agcaggtttt tcaacctttg caaaagatga ctgatttatg tatttaaatc tatcgctgat 1081 ttcgggtgtt ggttctttaa caataggggt tacaacggga gcgggcttaa tgggttcatt 1141 cttttcttca ggttcttcaa aagatacaac ttcacgaaca gcaggtctat tctgtgttgc 1201 aacagtttct tgctttggga tgtcggaaaa gtcgatagac tttcgggttg atgagaacat 1261 cagctgaacg cttttatcgg gttctgcggg ttttgagaaa atctcttgat gtgtaagagt 1321 cttgggcttc ttttcctcat aaactatttc ggtaggagca tcaaaattca taagcgcgtt 1381 tttaacagcg aagtaaacgg cgtcgtatac cgatttttca tcgctgaaac ggatctcaat 1441 ttttgcagga tgaacgttaa catcaatatt tgacggattg attttgacag tcaaaacaca 1501 gcccgggaac ttgcctgtca ttatctggtt tcggtaagct tcttcaaggg caaccatgca 1561 ggtaacgctc ttaacgtatc ttgaattgac aaagaaattc tggaatgctc tgttagcttt 1621 tgacattaag ggctttgtta catatcccga aacggaaaca ccgttgtatg tataatcgac 1681 agggatacag gaagaatgga actctcttcc gaaaactgaa taaataaccg agagaagctt 1741 gttatcgcct gaggtaataa gctcggtttt gttatcgcga atgaatttaa aagcgacttc 1801 gggatgagaa agcgctagtt tttgaacaac atttgcaatt gcgttgcctt cgctgacatc 1861 ctttttgaga aacttcaaac gcgcaggaac attgaagaaa aggtcgcgta tgataaatgt 1921 tgttccgtca gggcaaccga tcgaatcgag ctcgagctct tctccaccct caatgacata 1981 atgtgagcca agatcatcct cgcggcgctt ggtcattacc tcgacttttg aaacagcgca 2041 aacagaggca agtgcttcac cgcggaaacc aagagttgaa atactgacaa ggtcgtcctt 2101 tgcaaggatc ttactggttg cgtggcgcac gaaagccagc ggtatgtcct cagcggtcat 2161 tccgcaaccg ttatcagtga ttcgtatata tgttctgccg ccgtttttga tttcaacagt 2221 gatgcttgaa gcacctgcat caacagagtt ttcaatcatt tccttgacga cagacgaagg 2281 tctttcaata acttcgcctg cagcgatcag ttcatataca gatttttcaa gaacatggat 2341 atttcccatt cttactccta tgtgttagat atattttatc acttcgctga caagctcacg 2401 cagttcattg tcggtaagct catcgatatt tgtctttctg agcatatcaa gagcatagct 2461 ctcgcccatt aggtcaaatg aaatttggtc ggtggatttt gatttttttg cattcatttc 2521 agcttggcgg ttcttgtctt caagtgtttc caaaagctct tttgaacgct ttaagatctt 2581 tgcaggaagt cctgcaagct ttgcaacttc aatgccgtag ctttcatcca caccgccgcg 2641 tactatc // LOCUS sequence172 2643 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence172 VERSION sequence172 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2643 /mol_type="genomic DNA" /organism="" /note="sequence172" CDS 1034..1405 /product="transcriptional repressor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860967.1" /transl_table=11 /codon_start=1 /translation="MTKQRQLIKSIIESAKGHLTAEEIYEISKQKMPNIALGTVYRNLG KLCEANEIGLISVSGRPDRYDKSVNTHGHTVCDKCGKITDFPAPVAEFKEQLEKHLGID ITAYDVSAHYICEDCKCAE" /locus_tag="LOCUS_6080" /note="WP_011860967.1 transcriptional repressor (Clostridioides difficile) [pid:40.0%, q_cov:96.7%, s_cov:93.0%, Eval:5.5e-20]" /note="MGA_808" CDS 1475..2008 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNLKGTKTEQNLMTAFAGESQARNKYTYFASVAKKEGYEQIAEIF LKTAENEKEHAKLWFKALGELGDTAKNLAAAAEGENYEWTDMYDRFAKEAEEEGFKTLA YQFRAVAAIEKTHEERYRALLSNVEMQKVFEKAEETMWECRNCGHLVMGKKAPAVCPVC AHPQSFFEVRKANY" /locus_tag="LOCUS_6090" /note="WP_015943945.1 ferritin family protein (Desulfitobacterium hafniense) [pid:75.1%, q_cov:97.7%, s_cov:44.1%, Eval:5.1e-75, partial hit]" /note="MGA_809" ORIGIN 1 cgcgcgggtg agtattgggg gaatccagat taaaggatgg cggatgatgt ttggcatctg 61 gagcatcgaa gtgccgatac cttgagagat caaaccgccg aatttgttct cgcgatagct 121 cattacggca aagccaacca tttgacagca acatcccaca gcggcagcac ctgcggcgat 181 tcccgaaaga ccgagcgaaa cgccgattgc ggcggagctg atcggaagag tgagggcaat 241 gcccattaaa acagaaacaa cgatacccat tacaacagga tggctttcaa caccgaagtt 301 gatgagcgat ccgatccatt tcataaagga tgagatcgga ggacttaaaa gaattcccac 361 aattgatccg gaaattattg ttacaagcgg tgtgatgatt atatcgacct ttgttttgcc 421 cgaaacaagc ttgccaagct cgatgccgac atctgcggcg atgaatgcac ccaacggctc 481 gccgggacct gcaagtgtca atgaaccgag agtgaagttt gaaagactta ctttacctgc 541 aaacgcaccg acaagaccgc aaacagccgc agaaacagtt accaagtccc ctgcctgata 601 tcttgcggca actgcggcac cgatgcccgc acctgtcata gccttggcaa agccggcaat 661 aaggcggata tatgcgccga tctctccgcc gaccagcatt cccacctgat ccatgattgt 721 acctatgata agcgttgcaa acaagcctcg tgccattccc gaaagaccgt caataaacag 781 atgatttaaa taatctttaa tggatttcac tttgattcct ccatctattt aagttgttga 841 tttgattata tttccttgaa ctcggccggt caagacattt tattaaaatt ctacctttta 901 aagaattaaa gcggcaaagg taaagaaaaa atatgcaatt tttacataaa atttctctta 961 tggggtattg acaagctttt atcattatgt tattatattt ttgcgaacca ttcctaattt 1021 tgaggaggcg accatgacaa aacaacgaca attgattaaa agcataatcg aatccgcaaa 1081 aggtcatctg accgccgaag agatctatga aatttcaaag caaaaaatgc cgaacatcgc 1141 actcggtact gtttaccgca atttgggcaa gctttgcgaa gcaaatgaaa tcggactaat 1201 aagcgtcagc ggacgacctg acagatacga taaatcggtg aatacacatg gacacaccgt 1261 ttgcgacaaa tgcggaaaaa tcaccgactt ccctgcccct gttgccgagt tcaaagaaca 1321 gcttgaaaag cacttgggca ttgacatcac ggcgtatgat gtgagcgcac attacatatg 1381 cgaggactgc aagtgtgcag aataggacaa cacaaggtta gatgacggcg agaccgtctt 1441 taatatgaaa aaataatttt acaggagtgt tattatgaat cttaagggta caaaaactga 1501 acagaacttg atgactgcat tcgcaggcga atctcaggca agaaacaagt atacatactt 1561 tgcttccgtt gcaaagaagg aaggatatga gcagatcgca gagatcttcc tcaagacagc 1621 tgaaaacgaa aaggaacatg ctaagctttg gttcaaggct ttgggcgaac tcggcgacac 1681 cgcaaagaac ctcgctgctg ctgcagaagg cgaaaactat gagtggaccg atatgtatga 1741 cagattcgct aaggaagctg aagaagaagg cttcaagacc ttggcatatc agttcagagc 1801 tgttgctgct atcgaaaaga ctcacgaaga aagatatcgc gcacttcttt ccaacgttga 1861 aatgcagaag gtatttgaaa aggctgagga gaccatgtgg gaatgccgca actgcggtca 1921 ccttgtaatg ggcaagaagg ctcccgctgt atgccctgtt tgtgctcatc cccagagctt 1981 ctttgaagtc agaaaagcaa actactaata tttctttgtc ataaataact tgaccccgag 2041 cttctcgaaa gagaggctcg gggtttttgc gggggagaat taattggggt aacttcatat 2101 gcttcaatct gtgtcgttgg taattatgga gatacagggg cagtgcaatg atactctatc 2161 ttgttatctc tttctttaag aagcttttca aagaatttgt agctgtcctc ctcatcacca 2221 actactggag aaaaaccttc cattttcttc acattagttt tttctgtttc ggacatagtt 2281 tggaacatta caacgccaat gcattcccaa ccttccttcg gctgaatttt cataattatg 2341 tccttatccg cgctgtgatt cgatagaccc caggagacac ggtactgatc tttttgggaa 2401 ttgtagaata ttccgcaaac gtaaaaccaa tcagaattct cagtagcttc tttaatatcg 2461 gtgttcacaa atgcaatcag tccgtttttg tcgtatacat atcccgtttc gataaatttt 2521 ccattttcga agtattgatt ttcgtaagag taggaatatt catctgaaat ttctgaaatt 2581 tctagtttcg ataggatatg atttaattta tatttctggt cgtcactttc tatagtataa 2641 aaa // LOCUS sequence173 2638 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence173 VERSION sequence173 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2638 /mol_type="genomic DNA" /organism="" /note="sequence173" CDS complement(430..1476) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGIALFCVILFLVLVIFYSGLRILEPTLFDKSGNQGNQVTVGDVG EEATPGVSTAEDETFEQWPDNTGKTIVKDGVSYFPRQDITVMLIIGVDRLGPAESSGYY RNDGAADVVSLVIFDEKNEECNILHLNRDTMVTMPVIGIGGNQAGTYYGQLTLSHTYGS GLKDSCENVEKTVSNFLGGILIDYYLSMSMDALSVLNDAVGGVTVNVTDDFSDIDPDIT MGEYTLMGDEALTFIRARKGLGDQKNISRIERQKEYMNGFIKAFKDSYNGDLEYILNTY ETVAPYLVSDCPINTFTSMIARYMDYPITEIISPEGENVLGDEYYEFHADEEKLSNLII DLFYAPKE" /locus_tag="LOCUS_6100" /note="WP_003972903.1 LCP family protein (Streptomyces) [pid:31.0%, q_cov:52.0%, s_cov:49.5%, Eval:3.0e-12, partial hit]" /note="MGA_812" CDS complement(1536..2165) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKIISMVTAFVLVLALACSVCASTFIPSISFNPTISVGSTTVVL MNGGYFGMITLGDGSTTNISPNCLIITPLSKVLESEYGVHANIRKNLLDCYNGINDGTV EVPAGESVRDIIDVSWVCDYHEDMLNQPGVTMTMSFKLGVAADEDVAVYTYDVEDKVLE PVVKAVNNGDGTVSVEFEHLCPVVFTVSSGDVVVEQPVEACVEEVE" /locus_tag="LOCUS_6110" /note="MGA_813" CDS complement(2235..2582) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MYKELENIRYKQNIIPIIAHVDRYISPFNTYNIPKRLSEMPVLVQ ANASFFLKPSTKLMAMRMLKNDQIHLLGSDCHNLSSRMPNLGAAIEKIEKHLGTQAIRR ICRYQDELLNV" /locus_tag="LOCUS_6120" /note="MGA_814" ORIGIN 1 acatgccatc aattctcctg catcgttcac aacaccgtag gcttccgcct tctcccaatg 61 atcctgatat agtgaatctg ggaaatcata ctcctccggc gtgtgaacga tctccttttc 121 cgctggtttt ttaacgatgg atacagtgca accttcatga tgaaacgggc ttatctcaag 181 gtcataatag ctgttgcttc tggtagtcag ggggatggtg gtgcctttcc atctatcttt 241 tggcaatgcg acaatttcat aattcataca ttctctctcc gttcctcaaa ttcaggtttg 301 ttgttctgct gatattgtaa catagtagct gacaataaca atcaatatct ttcgcaacca 361 tcgtctcggg cgatattacg ggaaaactgt tttacggaca cccgcccttt ggcaagggag 421 tttgtttatc tattcttttg gagcgtagaa caaatcaatg ataagattgg agagcttttc 481 ttcatcggcg tggaattcat agtattcatc gcccagaacg ttttcgcctt caggagagat 541 gatctcggtg atgggatagt ccatataccg cgctatcata ctggtaaatg tgttgatcgg 601 gcagtcggaa acaaggtaag gcgcaactgt ttcgtatgtg tttaaaatat actccaggtc 661 gccgttatag ctatccttaa acgccttgat gaaaccgttc atatattcct tctggcgctc 721 aattcgggag atgtttttct ggtcgcccaa gcctttgcgg gcacggatga aggtcagagc 781 ctcatcgccc ataagggtat attcacccat ggtgatatcg gggtcgatgt cggagaagtc 841 gtcggtaacg ttaacggtta caccgccgac agcatcgttc aaaacagaca aagcatccat 901 actcatagac aaatagtagt cgatcaaaat gccgccgagg aaatttgaaa ctgttttttc 961 aacgttttcg cagctgtcct tgagtcccga accgtaggtg tgagaaaggg tgagctgacc 1021 gtaataggtg cctgcctgat ttccgccgat gccgattaca ggcattgtga ccattgtgtc 1081 gcggttaagg tgcaaaatgt tgcattcctc gttcttctca tcgaagatca ccaacgaaac 1141 aacgtcagcc gcaccgtcgt tgcggtaata tccgctggac tcggcagggc ctaaacggtc 1201 aacaccgatg ataagcatta cggttatatc ctgacgggga aaatatgaca caccgtcctt 1261 gacgatggtt tttccggtat tgtcgggcca ctgctcaaat gtttcatcct ctgcggttga 1321 aacacccggt gtcgcctctt cgcccacatc accgaccgtt acctgattgc cctgatttcc 1381 gcttttatca aaaagagtgg gctccaagat ccggagccca ctatagaata tcacaagcac 1441 caggaacagt atgacacaga acaaagcgat acccattaag gcccttcttt gtttactcat 1501 ggcacacctt tcccttcagt ttaagggttt aagccttatt caacttcttc aacgcaagct 1561 tcaacaggct gttcaacaac aacgtcgccg gaagaaacgg tgaatactac agggcaaaga 1621 tgctcgaact caacggaaac ggtgccgtcg ccattgttta cagccttaac gacaggctcc 1681 aaaaccttgt cttcaacgtc ataagtgtaa actgcaacgt cttcgtcagc agctacgccg 1741 agcttgaagg acatagtcat ggttacgccg ggctgattga gcatatcctc gtggtaatca 1801 caaacccaag atacatcgat gatatctctt acggattcgc ctgcgggaac ttcaacagta 1861 ccgtcgttga tgccgttgta gcaatcaaga aggttctttc tgatatttgc atgaacaccg 1921 tattcgctct caagaacctt agacaaaggt gtaataatga ggcagttggg gctgatatta 1981 gtggtagaac cgtcgcccaa ggtgatcata ccgaagtatc cgccgttcat aagaactaca 2041 gttgtggaac cgacagaaat tgtggggtta aatgaaatac tgggaataaa ggtcgaagca 2101 catacagagc aagccaaagc aagcacaagt acaaatgcag ttaccattga aataatcttt 2161 ttcatcatac tcatctccaa agtaattatt tatttctgcg tcgaaccaac gcataaaacc 2221 aaaattgttg tgtgtcagac attaagcagt tcatcctgat atctgcagat acgtctgatt 2281 gcctgggttc cgagatgctt ctcaattttc tcaatcgccg cgccgaggtt tggcatacgg 2341 gaggaaagat tgtggcaatc ggagccgagc aagtgaatct gatcgttttt gagcattctc 2401 attgccatca gttttgttga gggtttaagg aagaagctcg catttgcctg aacaagcaca 2461 ggcatttcgc ttagccgctt ggggatgtta tatgtgttga aagggctgat atatctatcc 2521 acatgagcaa tgatcggaat gatgttttgc ttatatcgga tgttttccag ttctttgtac 2581 atattatccg tccatggagc tataggcatc tctattaaaa tacacctttt ttgcaaaa // LOCUS sequence174 2628 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence174 VERSION sequence174 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2628 /mol_type="genomic DNA" /organism="" /note="sequence174" CDS 324..677 /product="DRTGG domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012869442.1" /transl_table=11 /codon_start=1 /translation="MKISTIVELLDAKVLCGNDKVGDHVYPACGSDMMSDVLAFVKEQA VLLTGLVNPQVVRTAEMMDMRCIVFVRGKNPSPEILELADDCGIVVLSSAERMYTACGK LYANGLSGGSVHE" /locus_tag="LOCUS_6130" /note="WP_012869442.1 DRTGG domain-containing protein (Thermanaerovibrio acidaminovorans) [pid:48.2%, q_cov:94.0%, s_cov:91.7%, Eval:4.8e-24]" /note="MGA_816" CDS 674..1114 /product="anti-sigma regulatory factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012869443.1" /transl_table=11 /codon_start=1 /translation="MTDIFEPIAFHYDVSGDNFTSAGEASVSVKKQLRKLGISPEIIRR VSIAMYEGEINMVIHANGGDADVLVYADKIVIFLKDTGPGIKDVNLAMQEGYSTAKDNV RALGFGAGMGLPNMKRYTDRMNIETVVGQGTTVTMEVDLTAQ" /locus_tag="LOCUS_6140" /note="WP_012869443.1 anti-sigma regulatory factor (Thermanaerovibrio acidaminovorans) [pid:48.9%, q_cov:95.2%, s_cov:97.9%, Eval:4.2e-35]" /note="MGA_817" CDS 1134..2444 /product="[Fe-Fe] hydrogenase large subunit C-terminal domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583277.1" /transl_table=11 /codon_start=1 /translation="MKKHYHSVSLIRDKCKGCTTCLKRCPTEAIRIRDGHAVITPDRCI DCGECIKLCHQKAKKALFDPFDALNNYKWKIAIPAPALYGQFDNLDDLDYVLTGLLDIG FDDVYEVACAAELVSEYTRQYLKQPGIVKPVISSACPVVVRLISKRFPSLVDNVLPVLQ PAELAAQIARRETLAAHPELTSEDIGIFFISPCPAKVSYVKNPFGVEKSEIDAVLSMSD VYFRLVSAMNKIDVPKSLSKTGLIGISWAGSGGESSALFNDKYLAADGIENVIKILDEL ENEKMQDMEFIELNACNGGCVGGALTVENPYIAKARLKILRRYLPVSQNHLVADDLSAS EFEWQNELEYSPVSSLSQNMGEAMRKMREIQNLHKELPHLDCGSCGSPTCLAFAEDVVN GNAKIDDCIIKMREHISDAMSILRKLEKSPEGSEEDL" /locus_tag="LOCUS_6150" /note="WP_012583277.1 [Fe-Fe] hydrogenase large subunit C-terminal domain-containing protein (Dictyoglomus turgidum) [pid:32.0%, q_cov:97.7%, s_cov:95.7%, Eval:1.1e-68]" /note="MGA_818" ORIGIN 1 gtagctacct tctattccca gtttgcactt aaccccaagg gcgagtatac aatttctgta 61 tgtctcggta ccgcttgcta tgttaagggc gctcaggatg tttttgacaa gatcagcgag 121 atcttgggaa tcggcgcagg aggaatcacc cccgacggta agttctctct tgaagcaacc 181 cgttgcatcg gcgcttgcgg tcttgcacct gtaatgaccg ttaacagcga cgtgtacggc 241 aaactcaccg ctgatatggt tcccgaaatt cttgcaaaat atcagtaatc tgacaacact 301 aagctgatct gcggaggaaa gatatgaaaa taagcactat tgtcgagctt ctcgacgcaa 361 aggtattatg cggcaacgac aaggtcggag atcatgtata tcccgcctgc ggctccgata 421 tgatgagtga cgttttggca ttcgtcaagg aacaggccgt attgcttaca ggtcttgtta 481 acccacaggt cgtcaggacc gccgaaatga tggatatgcg ctgcatcgtt ttcgtaagag 541 gcaaaaaccc ctctcccgag atcttggagc tggctgatga ctgcggaatc gtggtcttat 601 ccagtgcaga gcgtatgtac accgcctgcg gaaagcttta tgctaacggc ctttcaggag 661 ggagcgtgca cgaatgaccg atatttttga gcctatagcg tttcattatg acgtaagcgg 721 agataatttc acctctgccg gcgaggcttc ggtcagcgtt aaaaagcagc ttcgcaagct 781 gggcatttcc cccgaaatca tcagaagagt ttccatcgcg atgtatgaag gcgagatcaa 841 tatggttatt cacgccaacg gcggtgacgc cgacgttttg gtctatgccg acaagatcgt 901 gatctttctc aaggataccg gccccggcat caaggatgta aaccttgcaa tgcaggaggg 961 atattcaacc gccaaggaca acgtacgtgc cctcggtttc ggtgcaggta tgggtcttcc 1021 caacatgaag agatataccg acagaatgaa tattgaaacg gtcgtgggac agggaaccac 1081 tgttacgatg gaggtagacc tgaccgcgca gtaaacccat ccggaggtca acaatgaaaa 1141 aacattacca ttccgtctcc ctcattcggg ataagtgcaa aggctgtaca acctgcctga 1201 agcgatgccc caccgaggca ataagaatca gagacggtca cgctgtcata acgcccgacc 1261 gctgtatcga ctgcggcgag tgcatcaagc tttgccatca aaaagcaaaa aaggcgctgt 1321 ttgatccgtt tgacgcgctg aacaattaca aatggaagat cgcaattccc gcacccgcat 1381 tatacggtca gtttgacaat ttggacgatt tagactacgt tttgacaggt cttttggaca 1441 tcggctttga cgatgtttat gaagttgcct gtgctgccga gcttgtttcc gaatacacca 1501 gacagtattt gaagcagccc ggtatcgtaa agcctgtgat ctcgtccgcc tgccccgttg 1561 tggtaaggct tatcagcaag agatttccgt ccttggttga caatgttctg cccgttttgc 1621 aacccgccga gcttgcggca cagatcgcgc gaagagaaac tttggctgcc cacccagagc 1681 tgacaagtga agatatcgga atattcttca tatctccctg ccccgcaaag gtgagctatg 1741 ttaaaaaccc cttcggcgtt gaaaagtccg agatcgacgc ggttttgtcg atgagcgatg 1801 tatacttccg cctggtttcc gccatgaaca aaattgatgt tcccaagtct ttatccaaga 1861 caggcctcat cggtatcagt tgggcgggct cgggaggaga atcgagcgct ctgtttaacg 1921 acaaatatct tgcggcggac ggaattgaaa acgtaatcaa aattttggat gaacttgaaa 1981 acgaaaagat gcaggatatg gagttcattg agctcaacgc ctgcaacgga ggatgtgtgg 2041 gcggcgcctt gacggttgaa aacccataca ttgcaaaggc aagactcaag attttaagac 2101 gttatcttcc cgtttcgcaa aaccatcttg ttgcggatga tttgtccgca agtgagtttg 2161 agtggcagaa cgagctggaa tactcccctg tttcctcact ttcccagaat atgggcgaag 2221 cgatgagaaa gatgcgcgag atccagaatc tgcacaaaga acttccccat cttgactgcg 2281 gctcctgcgg aagccccacc tgtctggcat ttgccgagga cgttgttaac ggcaacgcaa 2341 aaattgacga ctgcatcatc aagatgagag aacacataag tgatgccatg agcattttga 2401 ggaagcttga aaagagcccc gagggatcgg aggaagacct atgatggtaa acgaagcaat 2461 tgataaactc ggtttaaagg tgctttgcct ttccgatggc gaccgtgaaa tttcgggcgg 2521 ctattgcggc gaccttttaa gctgggtcat gggcagagcg gatgccgacc aagcgtggat 2581 aacgataatg tctaacgtta acattatcgc tgtttcgaca ctgatcga // LOCUS sequence175 2618 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence175 VERSION sequence175 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2618 /mol_type="genomic DNA" /organism="" /note="sequence175" CDS 329..2068 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSDRKTLCMGCMEQIDDSTACPFCGYSDSTVYNPSYLAPKTVLDG RYVVGRLISYNGESALYIGYDNISGDKVFVKEYMPDALCSRSKSGPELCVDHGSVVQYK NYMSEFVELNKSLSRLRTMSHIVAPIDMFSQNNTAYVILQYTEAITLKQYLADNAGELT WEQVKKLFPPLLTTLSCVHNSGILHRGISLETILVTDRGELKLTGFSIAAIRTINTDLA PELYTGYSAPEQYSASEWEGTWTDVYGVAAVMYRLLTGCMPTEPMARVGRDSLLEPAKI NSHVPANVSKVIMQAIRLSCETRIHTVTDFVTKLFEQPSYMDKLPAGSTQTIPIQRPGH SSRGKKKKSSNAPAIIGAVILVAIVAAVFIMLASLFLPDNSNPDLPDNTSGNSDIVTNT PVSTDTPQSSTPSISNEPITSSQPTGNAFVMPELIGKKVENVINSDAWKERLSFDVIYD YSDVYESGIIFDQDIEQGTMLYPITTVKIFVSKGYSIVQIPSYIDEFGMNMTKEEYIVL LDALNIKYEIREIQTPYDLSGYVLGVYCQENGSEVGEDINVAEGYTLFVDVSVFTPGID IVG" /locus_tag="LOCUS_6160" /note="WP_164925470.1 serine/threonine-protein kinase (Thermanaerovibrio acidaminovorans) [pid:30.7%, q_cov:46.6%, s_cov:60.2%, Eval:2.1e-33, partial hit]" /note="MGA_821" ORIGIN 1 aaccgagcga caaaaatcaa aaagataacc aactgtacca gcaacatcat tgctgtcata 61 aaaagtctgc tctcaatcag ctttaaaatc cttttcatct gttatcctcc ttatcacatt 121 atcatatact actattatac tcgcaaaatc taaagctttc aataacccat tatataccaa 181 aaagttacaa gttagttaca gccgggtgac agtttggagt tatttattga ctttgttcaa 241 tttgggtgat atgatatcat cgttataaaa ggataactat gcgtttacgc gcttttaact 301 atatcatttg aaaggaaaga tatttcgtat gagcgatcgc aagactttgt gtatgggctg 361 tatggaacag atagacgatt cgactgcatg tcccttctgc ggctatagcg actctactgt 421 atataaccca tcatatcttg ctcccaaaac tgtccttgac ggcagatatg tcgttggcag 481 acttatcagc tataacggcg aatcagcttt atacatcggc tatgacaaca tttcaggcga 541 caaagtattc gtaaaagaat atatgcccga tgctttgtgc tcaagatcta agtccggtcc 601 cgagctttgt gttgaccatg gaagtgttgt tcagtataaa aactatatgt ccgagtttgt 661 ggagttaaat aaatcccttt cccgacttcg cacgatgtcc catatcgtgg cacctatcga 721 tatgttctcc cagaacaaca ccgcatacgt aattttgcag tataccgaag caataacctt 781 aaagcagtat cttgctgaca atgcaggcga gctgacttgg gaacaggtca aaaagctctt 841 ccctccgttg ttaacaacat taagctgtgt ccacaattcg ggaattttgc accgcggcat 901 cagccttgaa accattttgg tcaccgatcg cggcgaactg aagctcacag gcttctcaat 961 tgccgcaatc agaacaatca ataccgatct tgctcccgag ctatatacag gctattccgc 1021 tcccgagcag tattctgcca gcgaatggga aggcacctgg acggacgttt acggcgttgc 1081 cgctgtaatg taccgtttgc tcacgggatg tatgcccact gagcctatgg caagagtcgg 1141 cagagattca ttgcttgagc ctgcaaagat caattctcat gttcctgcaa atgtttcaaa 1201 ggttataatg caggcaattc gcctttcctg cgagacccgt atacatacag ttacggattt 1261 cgtgaccaag ctctttgaac agcccagtta tatggataag cttcctgcag gttcaaccca 1321 gaccatcccg attcagcgcc ccggccattc ttcaagaggc aaaaagaaga agtcctcaaa 1381 cgctcccgca atcatcggtg cggtaattct ggttgcaatc gttgccgctg tattcattat 1441 gctggcatcg ttgttccttc ccgataattc aaatcccgat cttcctgata atacctcggg 1501 caactcagat attgtgacca atacacccgt atccaccgat acacctcagt catcaactcc 1561 cagcatctca aatgaaccga taacatcctc tcagccgacc ggtaacgcat ttgtaatgcc 1621 cgagcttatc ggcaaaaagg ttgaaaatgt catcaacagc gatgcttgga aggaacgcct 1681 cagcttcgat gttatctacg attactcaga tgtttatgaa agcggaatca tcttcgatca 1741 ggatattgag cagggaacaa tgctctatcc cattacgact gtcaagatat ttgtcagcaa 1801 gggatattca attgttcaaa ttccttcata tatcgatgag ttcggtatga atatgaccaa 1861 ggaagaatat attgttcttc tcgatgccct caatatcaag tatgagattc gcgagatcca 1921 gactccttat gacctttcgg gctatgtttt gggcgtatac tgccaggaaa acggatccga 1981 agtcggtgaa gacattaacg ttgccgaagg atataccttg tttgttgacg tatccgtatt 2041 tactcccgga attgatatag ttggataatc aattggaaaa tgtttggttt tctttgtatt 2101 tttcacagat tttttcatca aagacgtgtc atttttggca cgtctttgtc tgttaaatca 2161 ttgacataaa cattttgcta tgctatattt aacttgttca agacgaatat tattgtataa 2221 tgatgttgga ggatgaacat tatgagtcgt acaatcggtg tcctcacaag tggcggcgac 2281 gctcccggaa tgaatgctgc gatccgttcc gttgtcagat ctgcacttgc aagaggattt 2341 agagttatag gaatcagaag aggatatcag ggtctgatcg aaggcgatat gttcgagatg 2401 tgtgcccgcg atgtttccga tataatgcaa agaggcggca cagtactcta taccgcaaga 2461 agccccgaat ttgaaactcc tgcgggagtt gccaaagcaa aggcaaattg cgatgctgtt 2521 ggcatcgaca gtcttgtcgt aatcggcggc gatggcacat accgcggtgc gctcgagctt 2581 ttcagactcg gcgtaaagat catcggaatt cccggcac // LOCUS sequence176 2610 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence176 VERSION sequence176 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2610 /mol_type="genomic DNA" /organism="" /note="sequence176" CDS 256..1572 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRLLKLALLFVMMLCLCGCDFLTFSVEGLLSSPIIADEQTAIYQ ALIARTGKEVFFEYPRSGSYRSAFVMTDVDQESGDEALAFYSLSSSQDEDVRLSILDRD ENGDWISMFEIQGAGNTVDKVLINRVGNNTDIIVGYGTRGYEGSQVIIYRYYMGALAVI YEGNYSALELYDLDGCGEEEIIIVSKTGAQSNATVIQSADGISYFTHEAALSSNAVSIE GHAIGKLETGESVLYVDVLDESGYISTELIYLRDDTLICPTSSIAGLREYTARPLGYLS VDYDGDSDVEVPVTEPFIGYASGSRGGIQLMTKWYSYDADQLCYVKKSNAYYNITDGYV FILPNRWLNVVTASRSEDGVVTFLKYDSSAETMEDMKPIMSFTSLSAYADSSALIDDGY TELVSTDFKRYFVKTLADESEPLVLTNDEIKDNFYGIDR" /locus_tag="LOCUS_6170" /note="MGA_824" CDS 1603..2304 /product="response regulator transcription factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001142165.1" /transl_table=11 /codon_start=1 /translation="MKRILVCEDEDSIREFVVLNLKRSGYDVVDVNCGENAIKAFDEAT ERFDVVLLDIMMPGMDGFAVCKLLRERSDNIGIIMLSAKSQEMDKVSSLMMGADDYITK PFSISELIARVDAVCRRVSMTALRPEEKVTISSGPFTINMKSRVLLKNGEAIDLTQVEY QIMEYFLKNQNTALDRLSILHHIWGESYYGEEKIVDVNIRRIRMKIEDEPSNPKYILTV WGYGYKWSAEG" /locus_tag="LOCUS_6180" /note="WP_001142165.1 response regulator transcription factor (Bacillus cereus group) [pid:51.1%, q_cov:98.3%, s_cov:97.8%, Eval:2.7e-60]" /note="MGA_825" ORIGIN 1 acagcgatgt ttgcctgcgc ccgaattgca agctggtcgg ctcaccgctt tgaagagctg 61 ataaccggtc agcgcatcat ccgccctgca tacagaccca ccaagctcaa caaaaagtat 121 cttcccattg accggagata atggctgtaa aagtgtatta tatcggctta attacttgca 181 agtttatttg atttgtgata aaatgagata aggcgaactt tgccttatct catttatttt 241 tggaggtgaa agggtttgaa aagactttta aagcttgcgc ttttatttgt aatgatgctg 301 tgtctttgcg gatgcgattt tctgaccttt tccgttgagg gactgttgtc ctctcctata 361 attgcagatg agcagaccgc gatttatcag gcgcttattg cccgaacagg caaggaagtg 421 ttctttgaat atcctcgctc ggggtcatat cgctcggcgt ttgtcatgac tgacgttgac 481 caagaatcgg gcgatgaggc cttggcgttc tattctcttt catcttcgca ggatgaggat 541 gtgcgcctta gcattctcga ccgggatgaa aacggcgatt ggatcagtat gtttgagatc 601 cagggcgcgg gaaacaccgt tgacaaggtt ttgatcaacc gtgtcggcaa caacaccgac 661 atcatcgtgg gatacggcac ccgcggatat gaaggctcac aggttataat ttacagatac 721 tatatgggtg cgcttgccgt catttatgag ggcaactatt cggctttgga gctttatgac 781 cttgacggtt gcggcgaaga ggaaataatc atcgtcagca aaacgggagc acagtcgaac 841 gccactgtaa ttcagtctgc cgacggtatt tcatatttta cccacgaagc ggcgctttct 901 tcaaacgctg tttcaattga gggacacgca ataggcaagc ttgaaacagg cgaaagtgta 961 ttgtatgtgg atgttctgga tgaatcggga tatatttcaa ccgagcttat atatctgcgc 1021 gatgacaccc tcatctgccc cacaagctca attgcaggtc tgcgcgaata taccgcaagg 1081 cctttgggct atttaagtgt cgattatgac ggggactcag atgttgaagt gcccgtgact 1141 gagccgttta tcggatatgc aagcggctca aggggtggga ttcagcttat gaccaagtgg 1201 tattcatacg atgcggacca gctttgctat gttaaaaagt ccaacgcata ttataatatc 1261 accgacggct atgttttcat cctgccaaac cgctggttga atgttgtcac cgcatcaaga 1321 agcgaggacg gcgttgtgac cttcttaaaa tatgacagct cagcggaaac catggaggat 1381 atgaagccga tcatgagttt cacatctctg agtgcatatg ccgatagctc ggcgcttatt 1441 gatgacggat acaccgagct ggtttcaacc gatttcaaac ggtattttgt taagaccctg 1501 gctgacgaaa gcgaaccttt ggttttgaca aacgacgaaa ttaaagataa cttttatggc 1561 attgaccgat aagcattttt tgaaaggacg gcgaagaata taatgaagcg aattttggtt 1621 tgcgaggatg aagactccat ccgcgagttt gtggttttaa accttaaaag aagcggatat 1681 gacgtcgtgg atgtcaactg cggcgaaaat gcaattaaag catttgatga ggccaccgag 1741 cgtttcgacg tggtgctttt ggatattatg atgccgggaa tggacggctt tgcagtctgc 1801 aagcttttgc gcgagcgttc ggacaatatc ggaattatta tgctcagcgc aaagagccag 1861 gagatggaca aggtttcatc ccttatgatg ggcgcggatg attatattac aaagccattt 1921 tcaatctccg agcttattgc aagagttgat gctgtttgcc gcagagtgag catgacagcc 1981 cttcgtcccg aagaaaaggt gacgatcagc tcgggacctt ttaccatcaa tatgaagagc 2041 cgtgtgcttc ttaaaaacgg cgaagcaatc gacctgacac aggttgaata tcagataatg 2101 gaatatttcc ttaaaaatca gaacaccgct cttgaccgct tgagcatttt gcatcacatt 2161 tggggcgaga gctattacgg cgaggaaaag attgtcgatg tcaacataag aagaatccga 2221 atgaagattg aggatgagcc ttccaaccca aaatatattc tcactgtttg gggatatgga 2281 tataagtgga gtgcggaagg ataaacggga acatttgaaa ggcaggtgaa aagcgtgagg 2341 gcaaaaagca gtatcacaaa aagatgggcg ctcaataccc ttgggctttt cgcggctgtt 2401 ttggtcgttg cgggcatttt gcttttgaat ttggcacgga attactatgt atcttcagcc 2461 aagcaatacc ttacctcgaa aatggacctt gtgacctcgg ctttgtctga atataccact 2521 gaggcgggat ataagcagga agtcatatca attgtcgagc agtttgccga aaaggaaaga 2581 tatgagctta tggcggtgga tgccgagggg // LOCUS sequence177 2576 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence177 VERSION sequence177 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2576 /mol_type="genomic DNA" /organism="" /note="sequence177" CDS complement(23..238) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKHIKHPDSVKKHDKHRTPEEVKIFRPKADVISAYQTNPMSDYYI SDDGCIYNKSDENIVMGKEWVDENEK" /locus_tag="LOCUS_6190" /note="MGA_827" CDS 434..1018 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNFNIYLKSLLFLFVCWLAAFVIVMFFPLAYQKMGPIMCLAFGV CSVGATLCIYGDWCIKLGEKAWDRNDTPEDMKTKQHFGFKIGLVPTIVNYIYVVLLYLS KLGVLKFDFYPWYKTLTFYFMPLTYLVAPNEAVNIDGKVMSVNVPAAELSWGAMIMFTL LPLVFLAICWGMYYIGYNHIDVKSKIIYSKK" /locus_tag="LOCUS_6200" /note="MGA_828" CDS 1083..1820 /product="N-acetylmuramoyl-L-alanine amidase CwlD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860636.1" /transl_table=11 /codon_start=1 /translation="MLKKLWVNKVGVAIMLLCTYLLVFGFIKTATPPDNVIAVDGALNG GMPTIILDAGHGGIDSGCVSVNGAEEKDINLSIMLRLRDMLEASGFEVIVTRDADRSIH DSGVQGLGQQKLSDMQNRLKIINSCDNALFVSVHQNQFTDSRYSGAQMFYPADSAESEQ LAGILQKQFVSLLQPDNNRETKPVTDEIFLLDNANCPSVMAECGFLSNPDEAALLESEE YQAKVAFTIFTGICEYVIANYGI" /locus_tag="LOCUS_6210" /gene="cwlD" /EC_number="3.5.1.28" /note="WP_011860636.1 N-acetylmuramoyl-L-alanine amidase CwlD (Clostridioides difficile) [pid:46.1%, q_cov:78.0%, s_cov:82.1%, Eval:1.4e-41]" /note="MGA_829" ORIGIN 1 ataatctttg cgggcgcaat aattacttct cgttttcgtc tacccattct ttgcccataa 61 cgatgttttc atccgacttg ttatatatac agccgtcgtc ggagatataa taatcggaca 121 tggggttggt ctgatatgct gagataacat ccgccttagg tcggaatatc tttacttcct 181 cgggtgtgcg gtgtttgtca tgttttttaa ctgaatcagg gtgtttaata tgcttcattt 241 tatcctccgt gcgcttttgc acttgatacg aaatggttga aaatgtttca taagatacgc 301 ctcgcttatg aggcagaatt attttttgaa aattgggtgt gtaatattcg tgaaattttc 361 gggaattgtt gtcatcaagg aaaaaatgct gtataatgga tgtatatatt acttgaccga 421 ggacggaata taaatgaaaa attttaatat ctatttgaaa tcgctgttgt ttttgtttgt 481 ttgctggctg gcggcattcg ttattgtaat gttcttcccg ttggcttatc agaagatggg 541 accgattatg tgtttggcgt tcggcgtgtg ttctgtgggt gcaacgcttt gcatctatgg 601 cgactggtgc attaagctgg gcgaaaaggc ttgggacaga aatgacactc cggaagatat 661 gaagacaaag cagcactttg gatttaaaat cggacttgtt ccaacgatcg ttaattatat 721 ttatgttgtt ttgctttatc tttccaagtt aggcgttttg aagtttgact tttatccctg 781 gtataagact ttgacattct actttatgcc gctcacatat ttggttgcac cgaatgaagc 841 agttaacatc gacggcaagg tgatgtcagt taacgttccc gcggcggagc tttcttgggg 901 tgcgatgata atgttcacac ttttgcctct tgtgttcttg gcaatatgtt ggggaatgta 961 ttacatcgga tataatcaca ttgatgttaa gtccaaaata atctattcca aaaagtaagg 1021 cttgaatatt tgaaagactt gcctcataag tttgtactaa aaaacaggtg gaggcaagga 1081 atatgcttaa aaagctttgg gtaaataagg tgggcgttgc aataatgctg ttgtgcacct 1141 acttattggt atttggattt attaagaccg cgacaccccc agacaatgtc attgcggttg 1201 acggtgcgct gaacggcggg atgccaacaa tcattttgga tgcagggcat ggcggaattg 1261 actcgggatg cgtcagcgtt aacggagccg aggaaaagga tattaacctc agcattatgt 1321 taagacttcg ggatatgctt gaagcgagcg gatttgaggt tattgttaca agggatgccg 1381 acagatccat tcacgacagc ggagttcaag gcttgggtca gcagaagctt tcggatatgc 1441 agaacaggct caagattatt aactcttgcg acaatgcgtt gtttgtatcg gtgcatcaga 1501 atcagtttac cgattcgaga tatagcggcg cgcagatgtt ttatcccgcc gattcggccg 1561 agagcgaaca gcttgcggga attttgcaaa agcagtttgt ttcgcttttg cagcctgaca 1621 acaacagaga aacaaagccg gtgacggacg aaatattcct tttggataat gcaaactgtc 1681 cgagcgttat ggcggaatgc gggttccttt ctaatcccga cgaggccgcg cttttggaga 1741 gcgaggaata tcaggcaaag gttgcgttta ccatattcac gggaatttgt gagtatgtga 1801 ttgcgaatta cggtatttaa aatataaaca ggacggaaaa aattatggct aaagtcaaaa 1861 gcgtatatgt ctgccgcgaa tgcggctttg aaactccgaa atggaacgga aaatgcccta 1921 actgcggagc ttggaattcg ctcgaggaaa ccgagagtgc gcccgttaca aaggcgaacc 1981 tttccgcggc gaaatcggga attgatttga gcgacagaat tgtttccctt tcggatgccg 2041 aggcctctgc agatgaggtg agatatcaca cggggcttaa agagctggac agagttcttg 2101 gcggcggatt ggttaaaggc tcgatggtgc ttttgggcgg tgagcctggt atcggtaaat 2161 cgactttgct gttgcagatc tgtcagcact tgggtcaaaa ccatacgatc ttatatgttt 2221 cgggcgaaga gtcgataaga cagatcaagc tcagggctca gcgattgggc gttgacagcg 2281 agaatttata tctgctggct gagtcggacg cgatgtcgat atgcgaaacg gtgtcgataa 2341 ataagccgga tattgtcatc atcgactcga ttcagacgat gtcggtgcga gagataaatt 2401 caacacccgg aagcatcaca caggtcagag aatccacaaa cctgtttatg aaaacagcga 2461 aaaacgagga gatccccttc tttattgtcg gacacgtcaa caaggacggc gcaattgcag 2521 gcccgaaggt tatggagcat atcgttgatg cggtgcttta ttttgagggc gacaga // LOCUS sequence178 2569 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence178 VERSION sequence178 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2569 /mol_type="genomic DNA" /organism="" /note="sequence178" CDS complement(1134..1925) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSENYENPRKVNPIKSPAFKKYLSVSCVAILVIVAGVLLIWLAGA PRMDIPDDIYFLQLDTPADDAPVVVFETNMGTMKAVLYPNEAPAYCEYFMELVNSGYYD GTYICAIADSAYALGGTKFQDPNTTESPDSDTTQIEAEISNNLWPIKGALSSFIGTGGM WPFDKNYAGSTILFINDIDDAYMAPDALKRSYGEKLGGVFDEKGGIPNFARKYTIFGQI YYGWDVYESIMGTQVLETNQPASEIVFERVYISTYGENLPK" /locus_tag="LOCUS_6220" /note="WP_002263035.1 Cof-type HAD-IIB family hydrolase (Streptococcus mutans) [pid:26.3%, q_cov:77.9%, s_cov:42.0%, Eval:1.0e-16, partial hit]" /note="MGA_832" CDS complement(1942..2541) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNLVFNGKYSGDENTLPQREHPEGFKMFKEPDSKKFMLIANGVSL GVTVLFLVIVGVMSGKYLIADLEAGKPWLIFLGIILPSLFIIPHELIHAICMKETVYMY SYFQAGAMFVLSLEDMTKTRFVLMSLAPNILFGFVPFLVALIFPQLYWLGLFGALSIGA GAGDYINVFNALTQVPKGAKIYSSGFHSYWYQPKAD" /locus_tag="LOCUS_6230" /note="MGA_833" ORIGIN 1 atagtcggaa tcgtagatct ctgtgagaag ataatctctc gattcttcca aaatgtcttc 61 tctttcaaga atgtccatct tgtcaacaag atagaagcag gtgtcgtcct gaattacggt 121 gaactcgccg accttgcagg tggtgaaaac atagttaaca aacttctgcg aggggatcgc 181 gctgttctta gcgatgatgt attcatcagc ataggggtct tcttcaacct caatatcctc 241 ggcatcttct gctccggatg cttcttcatc tgcagtgctg tcctcttcgg tttccggctc 301 aagggtttca agatatgcat tatattctgc aatcaggtcg tccatcgctt cgcctgcttt 361 cgctctttca agatatgaat ttgcaagggc aagctgtgct tcctttcttt cggcatcaat 421 ggcatcttca acgctgtcgg caaaggtgaa ggtcataaac ttgaggcgtg catattcatc 481 ctcaagataa gctctgatgg tctcctcggt ggtaccctta acaccgccga cttcatagta 541 tgcagcgaaa acaaggtctt ccttatatgc ggtttccaaa gccttttcaa cggttgattt 601 tgcaatacca acgctttcaa actgttcttg cgaggttgcc caggtggaat ttacctgcgc 661 cttaatgagc gccttgtcgt cagccgtcat ctcaagaccc aaatctctga aaagctgttc 721 aacaacaaca tactgcttgc acatatcaag agcatattcg ttgacatatt cggatacctt 781 ctggtcgcca atagtttcgt ccaagagcga gtagccgtac atatagtaat aataatagtt 841 catatcctct tcggaaaggg tatataccgc ctcggtgtag ccttggagct gatagaagat 901 ataaagaccg ctgttgatga caatgtcgcc ggccttgacg atccatgtgg tatcgccgca 961 tccgaccaag cccaaagcca ttacgcaaac aagcatcaaa gcaactattt tcttgatgat 1021 tgacatattt tttaacattc cttccgtttg tgggaaaatt gctgaaaatc agcatactaa 1081 agcattatac aacattttcg ggagcttgtc cataggcttt ttaacaaaac cgcttatttg 1141 ggcaggtttt cgccataggt ggaaatatat actctttcaa aaacaatctc gcttgcaggc 1201 tggttggttt ccaaaacctg cgtgcccata atgctttcat aaacatccca gccgtaatat 1261 atctggccga agatggtgta ttttcttgca aagtttggaa ttccgccctt ttcatcgaac 1321 actccgccaa gcttctcacc atacgaacgc ttgagggcat cgggcgccat atatgcgtcg 1381 tcaatgtcgt tgatgaacaa aattgtcgag cctgcatagt tcttatcaaa tggccacatt 1441 ccgcctgttc cgataaagga agaaagtgca cccttaatcg gccaaaggtt gttagaaatc 1501 tccgcttcga tctgtgtggt gtccgaatcg ggggattcgg ttgtgttggg gtcctggaac 1561 ttagtgccgc ccagggcgta agccgaatct gcaatcgcac agatatatgt gccgtcataa 1621 tatcccgaat ttacaagctc catgaaatat tcgcaatatg cgggagcttc attgggatac 1681 agcaccgcct tcattgtgcc catgtttgtt tcaaagacga ctacaggggc atcgtctgcg 1741 ggagtatcaa gctgcaaaaa gtaaatatcg tcgggaatgt ccattctcgg tgcgcctgca 1801 agccaaatga gcaatacgcc tgcaacaata accaaaattg caacgcagga aacgctcaaa 1861 tactttttaa aagcagggga cttgattgga tttacttttc tcggattttc gtaattctca 1921 ctcatttaaa tgtcctttct ctcagtcggc cttaggctga taccaatagg aatggaagcc 1981 gctggaatat atcttcgcgc cctttggcac ctgtgtaagc gcgttgaaaa cgtttatgta 2041 gtcgcctgcg cctgcaccga tcgaaagtgc accgaaaagt cccaaccaat acaactgcgg 2101 gaagataagc gcaaccaaaa aaggaacaaa tccgaaaagg atattcggcg caaggctcat 2161 taaaacaaat cttgttttgg tcatatcttc aaggctcaaa acgaacatcg ctcccgcctg 2221 gaagtatgaa tacatataaa cggtttcttt catacagatc gcgtggataa gctcgtgggg 2281 aataatgaaa agggagggga gtattatgcc cagaaagata agccaaggtt tgcccgcctc 2341 aaggtctgcg atcagatatt ttcccgacat tactccgacg attaccaaaa acagaacggt 2401 tacacccaga gaaacgccgt ttgcaatcag cataaatttc ttcgagtcgg gttctttaaa 2461 cattttaaat ccctcggggt gctcgcgctg gggcagggtg ttttcgtcgc ccgaatattt 2521 tccgttaaaa accaggttca tcttgctcac ttcgctttct taataacag // LOCUS sequence179 2566 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence179 VERSION sequence179 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2566 /mol_type="genomic DNA" /organism="" /note="sequence179" CDS 277..1146 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965639.1" /transl_table=11 /codon_start=1 /translation="MADFGTNPYGFKDAVTIEAERIFDSCSDRDCLEDLEVTFSDYEST QLVNEATYAKAKCVEVTSVYFQVEPIPFNCGFFSVDLTYTFAVTIELAANAAAPVQTVV GTACFTKKVILYGSDGGTKYFTSFNNGVVNVNGCNAGSTASLPKASVAVADPILLNLCL QCVPAYSACTDITCNESITIPSRKIICVTIGLFSIISLSRTVPVMVPAFNYEVPCKDCS SPSGTTETPCELFEKIRFPSNEFFPKSLEEATACSCTCAGIANAVASGQTSGNSGQGCP ANNCKTCQ" /locus_tag="LOCUS_6240" /note="WP_010965639.1 hypothetical protein (Clostridium) [pid:28.3%, q_cov:81.7%, s_cov:85.3%, Eval:3.8e-15]" /note="MGA_835" CDS 1252..1482 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLGRVDDIEICSDSSTVKSMIVYGRPKLFGILGRDNDIIISNEQI DLIGRDVILVSVDNLSDITMNTSKESKFLFK" /locus_tag="LOCUS_6250" /note="MGA_836" CDS 1641..2369 /product="30S ribosomal protein S2" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392546.1" /transl_table=11 /codon_start=1 /translation="MAVVTMKQLLEAGVHFGHQTRRWNPKMAPYIFTERNGIYIIDLQK TVKKLDEAYAFVKEVSANGGEVLFVGTKKQAGDSVKEEATRANAHYVNARWLGGMMTNF KTIQKRIARLEQLHKMAEDGTFDLLPKKEVAQLSLEIEKLEKYLGGIKNMVKLPAALFI VDPKREKIAVAEAKKLGIPVVAIVDTNCDPDEVDYVIPGNDDAIRAVKLISGAIADAII EGRQGETSAEEVTEEAPAEE" /locus_tag="LOCUS_6260" /gene="rpsB" /note="WP_011392546.1 30S ribosomal protein S2 (Moorella thermoacetica) [pid:73.1%, q_cov:93.8%, s_cov:95.4%, Eval:5.1e-97]" /note="MGA_837" ORIGIN 1 agttaagact cccgttcgtt tcaatgtcag gtgtcggcga aaacgcggca aaagcgcttt 61 ataatgccgc acagtcgagt gatttcatct cggttgaaga attctccctt tctgccggtg 121 tatcaaagac ggttatcgaa cagctgaaat cctttggcgc attcggcgat atgcccgatt 181 ctgcgcagat gtcgctgttt taagtaacta aacgtaatcc tcctgaataa tatgtagaga 241 agttttaaac tttaatactt attcaggagg atttatatgg ctgatttcgg aacaaatccg 301 tatggcttta aagatgcggt taccattgaa gcagaacgaa tttttgatag ctgctccgac 361 cgtgattgcc ttgaggatct tgaagttaca ttctcggatt atgaatcaac acagcttgtc 421 aacgaagcga cttatgccaa agctaagtgc gttgaggtga caagtgtcta tttccaggtt 481 gagcccattc ctttcaactg cggtttcttc tcggtagacc ttacttatac ctttgcagtt 541 acgattgagc ttgccgcaaa tgctgcagca cccgttcaaa cggttgtggg cactgcttgc 601 ttcacaaaga aggttattct ttacggtagc gacggcggaa caaagtattt cacatcattt 661 aataatggtg ttgtgaatgt caacggctgt aatgcaggct caacagcaag tctgccgaag 721 gcttctgttg ctgttgctga ccccattctt ttgaacctct gcctgcagtg tgtgcccgca 781 tacagcgcct gcacagacat aacctgcaac gagtcgatta ccattccgtc aagaaagatc 841 atctgcgtaa cgatcggtct gttctcaatc atttcacttt caagaactgt tcccgtaatg 901 gttcctgcat tcaactatga agttccttgc aaggattgct catcgccctc gggtacaacg 961 gaaactcctt gcgaactgtt tgaaaagatc agattcccct caaacgaatt cttccccaag 1021 agtcttgaag aggcaactgc ttgctcctgc acctgtgcgg gaattgcaaa cgctgttgca 1081 tcaggccaga catcgggaaa ttcaggtcag ggatgccccg caaacaactg caagacctgt 1141 cagtaaatat aattttgccg cctcagtcat atcattgact gatgtgactt tatgaattac 1201 acattatctg atttgaagcg gaaggaagtt gttgaaacaa ggtcggggat gatgctgggc 1261 agggtagatg atattgaaat atgctccgac agttcaactg ttaagtcgat gatcgtttac 1321 ggcagaccga aattgttcgg aatactcggt cgggacaacg acataataat ttcaaacgag 1381 cagatagatc ttatcggcag agatgtaatt cttgtaagtg ttgacaattt gtccgatatt 1441 acaatgaata catcaaagga atccaaattt ttgtttaaat aatcatcaaa aaaagcttgc 1501 attatttgca ctaatgtgat acaatattac cgcaattcgc acgcatgggt tttgccgtgg 1561 ttcccgaagt gattttgggt gaaggcaagc taacttatgc ggaggattaa aaaatataaa 1621 aaccatagga ggttactaca atggcagtag taacaatgaa acagcttctt gaagccggtg 1681 tacactttgg tcaccagaca agaagatgga acccgaagat ggcaccttac atcttcacag 1741 aaagaaacgg tatctatatc atcgaccttc agaagaccgt taagaagctc gacgaagctt 1801 atgctttcgt taaggaagtt tctgctaacg gcggcgaagt tctcttcgta ggtaccaaga 1861 agcaggctgg cgattccgtt aaggaagaag ctaccagagc aaatgctcat tatgtaaatg 1921 caagatggct tggcggtatg atgaccaact tcaagaccat ccagaagaga attgcaagac 1981 ttgaacagct ccacaagatg gctgaagacg gaaccttcga tcttttgccc aagaaggaag 2041 ttgctcagct ttctctcgaa atcgaaaagc tcgaaaagta tctcggcggt atcaagaaca 2101 tggttaagct tcccgctgct ttgttcattg ttgaccccaa gagagaaaag atcgctgttg 2161 cagaagctaa gaagctcggt atccccgtag ttgcaatcgt tgacaccaac tgtgatcccg 2221 atgaagttga ctacgtaatc cccggcaacg atgacgctat cagagctgtt aagctcatct 2281 ccggcgctat cgctgatgct atcatcgaag gcagacaggg cgaaacctct gctgaagaag 2341 taaccgaaga agctcctgct gaagagtaat atttacatta ttcagggcag gcaacaaaac 2401 ctgccctgac ccataaacct aatcaagatt acgaaaggaa tgtttaatat tatggctaat 2461 atcactgcta aggacgttgc tgctctccgt gagagaaccg gcgttggtat gatggactgc 2521 aagaaggctc tcgttgaggc tgaaggcgat tttgaaaagg caatag // LOCUS sequence180 2545 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence180 VERSION sequence180 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2545 /mol_type="genomic DNA" /organism="" /note="sequence180" misc_feature <1..617 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_001884129.1:orotate phosphoribosyltransferase" /note="WP_001884129.1 orotate phosphoribosyltransferase (Vibrio) [pid:52.0%, q_cov:97.5%, s_cov:92.0%, Eval:5.7e-45]" /note="MGA_839" /locus_tag="LOCUS_6270" CDS 614..1687 /product="aspartate carbamoyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048210.1" /transl_table=11 /codon_start=1 /translation="MRSLIDILDFSVEEIDSLVTRAKDIIANPHIYSESCRGKKLATLF FEPSTRTRLSFEAAMYELGGEVIGFSEAGSSSAAKGESVSDTAKMISCYADIIAMRHPL EGAPLVAAKSAWIPVINAGDGGHSHPTQTLTDLLTISREKGGFDNLTVGFCGDLKYGRT VHSLIAALSRYINVRFVLISPDELKVPEYVKSDILRKNDIPYVETSSLDDAMPELDILY MTRIQRERFLDASQYERLKDSYILTPEKLETAKSDLCIMHPLPRVNEISVRVDSDPRAC YFKQALNGKYIRMALILYLLEQAKSPEKSFDENVIKGKFVCRNPRCITTCEQELEQSFR KGADGIYRCEYCEAEQK" /locus_tag="LOCUS_6280" /gene="pyrB" /EC_number="2.1.3.2" /note="WP_012048210.1 aspartate carbamoyltransferase (Clostridium botulinum) [pid:62.0%, q_cov:84.0%, s_cov:97.7%, Eval:9.2e-105]" /note="MGA_840" CDS complement(1780..2403) /product="DUF4867 family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965899.1" /transl_table=11 /codon_start=1 /translation="MKIYSVYDPEFAPYGKVLEGYDTAELVDAMLKIPFGEGVSYEPAI DSLEACAIFEELSVNAYGGMPVQLGMCWGHNTKLNCLEYHRDSEVNIGSHDFILLLALE SDIKDGKLDTACVKAFKAPAGVAVEVYATALHYAPCHVNEADGFHTAVVLPKGTNTEKP ALTPKNEEDKWLWARNKWLLAHPETSEAAQGAYVGLVGENIDIA" /locus_tag="LOCUS_6290" /note="WP_010965899.1 DUF4867 family protein (Clostridium) [pid:50.2%, q_cov:99.5%, s_cov:99.5%, Eval:5.5e-51]" /note="MGA_841" ORIGIN 1 gcgcaggcgt tttgaagttt ggcgacttca ccgccaagag cggccgcaag atcccctatt 61 tcatcaatgc aggcgatatt aagaccggcg agcagattgc aaagctcggc gagttctatg 121 ctaaggcata ccttgaaaag gttggcaaca agaaaaccgt actttacggc cccgcatata 181 agggcatttc gatcgctgta tccagcgcag ttgctttggc aaagcagggt cttgatgttc 241 ccttcttctt caaccgcaag gaagctaagg accacggcga aggcggaatc tttgtcggat 301 atgttcccaa ggcaggcgaa gaggttgtaa ttgttgaaga tgttattacc gcaggcaccg 361 caatcagaga gagcatggca aacctttcct ctttagaggg cgttaaggtg tgtgcaacat 421 ttgttatggt tgaccgcaag gaaaagggca agaccgacaa gagcgccatg ggcgaaattg 481 aggatgaatt cggcttccct gtatactccg ttgttgacgt atacgacatc attgaatatc 541 tcgaagagga cgaagcaaac cgcgaaaacg ttgaacgcat caagaactat cttgcagtta 601 atggagcttt agtatgagaa gtcttataga catccttgac ttttctgtcg aggaaattga 661 ctcgctcgtc acaagagcga aggatattat cgcaaatccc catatttaca gcgaatcctg 721 ccgcggcaaa aagcttgcaa ctcttttctt tgagccttca acaagaacaa gactcagctt 781 tgaagcggca atgtatgagc tgggcggcga ggttatcgga ttttccgagg caggaagctc 841 ctccgctgca aagggcgaaa gcgtttccga caccgcaaag atgataagct gttatgccga 901 tatcatcgcg atgcgccacc ctcttgaggg agcgcctctt gttgcggcaa aaagcgcctg 961 gattcctgtt atcaatgccg gcgacggcgg acacagccac cccacccaga ctttaacgga 1021 ccttttaacc atcagccgcg aaaagggcgg gtttgacaac ctgaccgtcg gcttctgcgg 1081 agatttgaaa tatggcagaa cagtacattc gctgattgcg gcgctgtcaa gatatataaa 1141 cgtcagattt gttctgatct cccccgacga gctgaaggtc cccgaatatg tcaagtcgga 1201 tattctgaga aaaaacgaca ttccttatgt tgaaacctcg tcgcttgatg atgcaatgcc 1261 cgagctggat attctttata tgacaagaat tcagcgggag agatttttgg atgcaagcca 1321 gtatgaacgc ttgaaggatt cctacatact cacccccgag aagcttgaaa cggcgaagtc 1381 tgacctttgc attatgcatc cgttgccgag agtaaatgag attagcgtgc gcgttgactc 1441 ggacccaaga gcttgctatt ttaagcaggc gctcaacgga aaatatatcc gtatggcttt 1501 gattctctat ttgttggagc aggcgaaatc tcccgaaaag agctttgatg aaaacgtcat 1561 caagggcaag ttcgtttgcc gtaatcccag atgcatcacc acctgcgagc aggagcttga 1621 gcaaagcttc cgcaagggtg ctgacggcat ttacagatgt gaatactgcg aagcagagca 1681 gaagtaaaga aaatatagca aacataaaac ccgccgtggt atttccacag cgggttgttt 1741 ttgtgtgtag ccttcccctc aaggggaagc cttcataact tacgcaatat caatattctc 1801 gccgacaaga ccaacatatg cgccctgagc ggcttcgctt gtttcggggt gagccaagag 1861 ccacttgttt cttgcccaga gccacttgtc ctcttcgttc ttgggggtga gggcgggctt 1921 ttcggtgttt gtgcccttgg gcaaaactac agcggtgtgg aagccgtcag cttcgttaac 1981 gtggcaggga gcatagtgca aagctgtggc atatacttca acagcaacgc ctgcaggagc 2041 cttaaatgcc ttgacgcaag cagtatcaag cttgccgtcc ttgatgtcag attccagagc 2101 caagagcaaa atgaaatcgt gtgagccgat gttgacctcg gaatctctgt ggtattcaag 2161 gcagttgagc tttgtgttat gtccccagca cataccgagc tgtacgggca ttccgccgta 2221 tgcattgaca gaaagctctt caaagatagc gcaagcttcc aaagagtcga ttgcaggctc 2281 ataagaaacg ccttcaccga aggggatctt gagcattgca tcaacaagct ctgcggtatc 2341 atagccttcg agaaccttgc cgtagggtgc gaattcggga tcgtaaacag aataaatctt 2401 catagtggtg ttcctccata aaagttgtta agtctattat agcgcatcgg ggacggtttg 2461 gctataggtt ttggaaattt ttgttgtagt ggcgaccaca tattgtcgcc actgtaattt 2521 tcggctttgc gcttgtattg gcgga // LOCUS sequence181 2519 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence181 VERSION sequence181 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2519 /mol_type="genomic DNA" /organism="" /note="sequence181" misc_feature <1..810 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011986887.1:cysteine desulfurase NifS" /note="WP_011986887.1 cysteine desulfurase NifS (Clostridium botulinum) [pid:57.9%, q_cov:97.8%, s_cov:67.0%, Eval:8.3e-86, partial hit]" /note="MGA_842" /locus_tag="LOCUS_6300" CDS 845..1273 /product="Fe-S cluster assembly scaffold protein NifU" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003438275.1" /transl_table=11 /codon_start=1 /translation="MIYSEKVMDHFANPRNVGEIIDADGVGEIGNEKCGDIMKMYLKIE GGVIVDVKFKTFGCGAAVATSSMATEMIKGATIDEALQLTNKAVVEALDGLPAAKLHCS VLAEQAIKAALWDYYSRQGIDPTPIIGELHEHCESCSI" /locus_tag="LOCUS_6310" /gene="nifU" /note="WP_003438275.1 Fe-S cluster assembly scaffold protein NifU (Clostridioides) [pid:65.7%, q_cov:95.8%, s_cov:95.9%, Eval:3.3e-47]" /note="MGA_843" CDS 1317..2291 /product="tRNA 2-thiouridine(34) synthase MnmA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965531.1" /transl_table=11 /codon_start=1 /translation="MAVKLLHDEGYEVAGVVMKMSDAHDGTVSAAQSAADALGIKLFVL DLRDEFKKTVIDFFAEEYLNGRTPSPCVRCNPNIKFKYLLKTALDNGFDRIATGHYAKV INDDGVYKLLKSDNDARDQSYMLAGLGQDVLSRIVFPLWGMAKDDVRTIAKDLGLECAS APDSEENCFVPDNDYAGYIERNYRASERGNFISPEGKPCGEHKGIIHYTVGQRKGLGIA LGRPCYVTEIDADTNEVKLGYERAMTDRVLLSNISETFPDAIKDGMSAKCKLRSTGKLL DCKVALADGGCVLTLDTPTPRVPAGQAGVLYDGNVVLGMGTIE" /locus_tag="LOCUS_6320" /gene="mnmA" /EC_number="2.8.1.13" /note="WP_010965531.1 tRNA 2-thiouridine(34) synthase MnmA (Clostridium) [pid:40.1%, q_cov:100.0%, s_cov:95.5%, Eval:2.5e-66]" /note="MGA_844" ORIGIN 1 gttgaccccg aggatattaa aaatgccatc cgcgaggata cagcgcttgt gacaatcatg 61 tatgccaaca acgagatcgg cacaattcag ccgatcaagg aaattgcagc gatctgtaag 121 gaaagaaaag taatgttcca caccgacgct gttcaggcgg ttggacacat tgccattgac 181 gttaaggact tgggcgttga tatgctctcc ctttcgggac acaagattca cgcacccaag 241 ggtgtcggcg cactttatgt gagaacaggt cttcgtattc ccaacctcat tcacggcggc 301 gcgcaggaaa gaaccaagcg cgctggaaca gaaaatgtcc cctcaattgt ggcattgggt 361 gaagcgatta cagaagctta cgaaaacctc acagaaaagc aggaaaagac caaggcaatg 421 agagataagc tcatcaatga gcttacaaaa atcaaggaaa gccgccttaa cggcgacctt 481 gaaaaccgtt tgcccggaaa tgtcaacata tcattcagag gaattgaggg tgaaagcctg 541 cttttgatgc ttgatttgga aggcatctgc gcttcaagcg gttcggcttg tacatccgga 601 tctcttgatc cctcccacgt tttgcttgca ctcggacttg accacgcaac tgctcacggt 661 tcgctccgtc tctcaatcaa cgaggaaacg acagatgaag atattgatta cattatcgaa 721 gcggtaccga gagttttggc aaagctcaga gcaatgagcc cctattggga gagaatttgc 781 aaaacagaag gcattgaagg acttatctga tagataatga tactacgaaa ggaagttaaa 841 tataatgatt tattctgaaa aggttatgga tcacttcgct aaccccagaa atgtcggcga 901 aattattgat gctgacggcg ttggtgagat cggcaacgaa aagtgcggcg acataatgaa 961 aatgtacctc aagattgagg gcggcgttat tgttgacgtt aagtttaaga cattcggctg 1021 cggcgcggca gttgctacaa gctcgatggc aaccgaaatg attaagggcg caaccattga 1081 cgaggctttg cagcttacaa acaaggctgt tgttgaggca cttgacggct tgcctgcagc 1141 aaagctccac tgctccgttt tggcagaaca ggcaattaag gctgcattgt gggattacta 1201 ttcccgccag ggcattgacc ccacacctat cataggtgag cttcatgagc actgcgaatc 1261 ctgctctatt taacaaacgc atattggtcg cgctcagcgg cggagttgac tcgtcagtgg 1321 cggtgaagct gctccatgat gagggatacg aggttgcggg cgtggttatg aagatgtctg 1381 atgctcacga cggcacagtt tcggcggcgc aaagcgcggc agatgctttg ggaattaaac 1441 tatttgttct cgatttgcgg gatgagttca aaaaaaccgt catcgacttc tttgccgagg 1501 aatatttaaa cggcagaact ccctcgccgt gtgtgaggtg caacccgaat atcaagttta 1561 aatacttgct caaaaccgcg ctggacaatg ggtttgaccg aatcgccacg gggcattatg 1621 ccaaggttat caatgatgac ggggtttata aactccttaa aagcgataat gatgcaagag 1681 atcagtcgta tatgctggca ggacttgggc aggacgtttt gagccgaatt gtgttccctc 1741 tttggggaat ggcaaaggat gacgtgcgaa caatcgccaa ggatctgggg cttgagtgcg 1801 cttcggcgcc cgacagcgag gaaaactgct ttgtgccgga taatgactat gcgggttata 1861 tcgaaagaaa ttaccgcgca agcgaaaggg gcaatttcat ttcccccgag ggcaagcctt 1921 gcggcgagca taaaggcatt atccactata ccgttgggca gagaaagggc cttggaattg 1981 cgcttggaag accttgctat gtgacggaga tagatgccga cacaaacgaa gttaagctcg 2041 gttatgagcg cgctatgacc gacagagtat tgcttagcaa tataagtgaa acattccctg 2101 atgcaataaa ggacggaatg agcgccaaat gcaagcttcg ctctacgggc aaattgcttg 2161 actgtaaagt cgctctggcc gacggcggat gcgttttgac gcttgacaca cccaccccgc 2221 gtgtgcctgc gggacaggca ggcgtgctgt atgacggaaa cgttgtgctg ggcatgggaa 2281 cgattgaata gatatttact tttaagcaag tgcttttttg tttgtttatt cgttgctctt 2341 tagtctttcg agccactcct cgggcaagac atattcttca aagccgaagt cgatcgagta 2401 tgccagatcg ttatatgacg taacatacaa ccgcacagct aagtttggct cttcttcaaa 2461 gaagccgtag accacaccgt agccatagca gttttcaagg agtccgttgg gcttcgtta // LOCUS sequence182 2519 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence182 VERSION sequence182 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2519 /mol_type="genomic DNA" /organism="" /note="sequence182" CDS complement(986..1594) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKVIALVLTFALALSLCACNLGEIVNKEISRGVIDENGYSSDYL GLRFTAPEGWVYATQSELSALMGEAVDITDQNKLFTELQLVYDMMVQDVLTGSNVIIIY ENLAVSGSEDITVEEYVEITKQGLTSVDMFTYTFNDEATVTLGDVDFTRVTVTCEYNGF TMEQAYYIAKLGSYMASISVTVTDGTSIETIEACFSALE" /locus_tag="LOCUS_6330" /note="MGA_847" misc_feature complement(1691..>2519) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010965003.1:RNA polymerase sporulation sigma factor SigG" /note="WP_010965003.1 RNA polymerase sporulation sigma factor SigG (Clostridium) [pid:61.6%, q_cov:93.5%, s_cov:100.0%, Eval:7.9e-84]" /note="MGA_848" /locus_tag="LOCUS_6340" ORIGIN 1 agtcggtcaa gagagtaatt gtcattgcat ttgcatcctt gccgagcttg cgtctgataa 61 gctcggtacc gccgagcata gttgaccact ggtcatcacc gccgaactgc aggttgcagt 121 tatagttccg gaagaggtag tagaagtcgt aagactgcat gatcatatag ttgaattcaa 181 ggaatgaaag acctttttcc attctttgct tatagcattc tgctctgagc atattgttaa 241 cagagaagca atgtccgaca tcgcgaagca attcaacata gttgaggttc aaaagccaat 301 cggcgttatt gatcatcatt gccttgcctt caccgaagtc aatgaactgt tccatctggc 361 gcttgaagca agcagcattg tggtcaatat cttctttggt gagcatcttt ctcatatcgg 421 ttctgcccga agggtcaccg atcattgtgg tgccgccgcc gatgagcgca atcggattgt 481 ttcctgccat ctgcaaacgc ttcataaggg taagagccat aaagtgacct gctgtaagcg 541 aatctgcggt gcagtcaaag ccgatgtaga atgtcgcctt accggtgttg acaagctctc 601 ttatctcctc ttcgtttgtt acctgtgcaa tcaagcctct ggcttgaagt tcttcataaa 661 ttcccattta tatttttctc ctttttgatt atttcccgaa aactgaaaag tccccgggca 721 aaagcccgag gacgatttgt taaaccgtgg taccacctca gttttccgca cataaaaatg 781 cggactcatt gggacgctgt aacgggcgct cccgcatact cctactgtga ttttcagagt 841 ataagctccg agatgtattc gccaagttcc gctcgccttt ttacaccaac caaaggctct 901 ctatgccgca tttaacaagg ttacttcttc tcttcatagc cgttttgaaa tataatatca 961 cttaattttg aaattgtcaa gaagcttatt ccaaagccga gaagcaagct tcaatagttt 1021 cgatagatgt accgtctgtg actgttacag aaattgaagc catgtatgaa cccagctttg 1081 caatgtaata tgcctgctcc attgtaaatc cgttatattc acaggttacg gtgactctgg 1141 tgaagtcaac gtcgcccaat gttacggttg cttcatcgtt aaaagtatat gtaaacatat 1201 caaccgaggt cagaccctgc ttggtgattt ctacatattc ctcgacagta atgtcttcag 1261 atccgctgac agcaagattt tcgtagataa taattacatt tgatccggta agaacgtctt 1321 gaaccatcat atcataaaca agctgaagct cggtgaagag cttgttctga tctgtaatat 1381 caacagcttc tcccataagt gcgctgagct cgctttgagt agcgtatacc caaccttcgg 1441 gagctgtgaa tctcaagcca agataatcgc tcgaatatcc gttttcatca attacacctc 1501 ttgaaatctc tttattaaca atctctccaa gattgcaggc gcaaagagaa agagcgagtg 1561 caaatgttaa aacgagtgct ataacctttt tcataaattt tcctccaaat catttaatga 1621 tttaactaaa ctatacacta atcggcactt tttgtcaata aaaaacgccc cacaatgtga 1681 ggcatttgtc ctatacttta gatttgattc ttttaagtgc cgacttttcg agtcttgaaa 1741 cctgtgcttg ggaaataccg atttccattg caacttctac ctgcgttttt ccttgataaa 1801 accgcagata aagtatgttt ttttccctct ccgaaagcat atgaattgct tcgcggatga 1861 gcagctcatc tatccacccc tcatcacttg aacggtcgct aagctggtct aacatatata 1921 gcgtatcgcc cgagttggag tatacaggct cataaattga aacaggttcg ctgattgatt 1981 caagcgcgaa tacaacatcc gcctttggca cttctaaaag cgatgctatc tgttcaaccg 2041 acggttcggc gttattaata cttgtgagct gctcctttgc ctgcattgct cgatatgcta 2101 aatctcttgt tgaacggctt acacgaatcg agttgttatc acgtaggtag cgtctgagct 2161 cgccacttat cataggtaca gcatacgttg aaaaccgcac atcaagggac aaatcaaaat 2221 tgtctatcgc tttaataagc ccaacaacac caacttgaaa caaatcatcg gcactggtac 2281 cgtttctgcc aataaacttt tgaatcacgc tcaatacaag ccgcaaattt ccttgaatca 2341 gatcttcgcg ggctttttta tcgccctgcc ttgaaagagc aagcaggcgc attttttcat 2401 cttctgtcag tactttaagt ccggatgtgt tcacacccga tatttcaact ttattatact 2461 gcataattac tccaaacaaa ttatttgaag taattattgc cttgagcatt atcagatat // LOCUS sequence183 2510 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence183 VERSION sequence183 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2510 /mol_type="genomic DNA" /organism="" /note="sequence183" misc_feature <1..999 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011948259.1:serine--tRNA ligase" /note="WP_011948259.1 serine--tRNA ligase (Clostridium botulinum) [pid:90.8%, q_cov:97.9%, s_cov:76.5%, Eval:6.4e-174]" /note="MGA_849" /locus_tag="LOCUS_6350" CDS 1125..2177 /product="endo-1,4-beta-xylanase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583995.1" /transl_table=11 /codon_start=1 /translation="MKTLKEAYKNYFDIGAAVSPHWLEEAADTLKAHFNSITCENHMKY NGIHEHQYERPPFKRPKPGEKPEMPKIEIVNRERFVHPCLELHTEGADKIYNFALANGF KLRGHTLAWHGSYPWGIFEQLTPEELETNLREHMAFVAKKYPACWCWDVVNEVADDKHG LFLRETVFKNKFGEDYLIKIYSMAREYFPDTVFVCNDYNEWVPHKRESILKIVDTLKAN GLVDAIGCQCHVSAFMTDEEFDQIKYAYEAYAKTGLRIHVTEMDVNCVSWKDPKEVTPE TLEKQADVYDKMFKLFRDYKDVIDSVTLWGVSDKHTWLNGFKNHGIKNSALLFDTEYNP TLALSRIVDF" /locus_tag="LOCUS_6360" /note="WP_012583995.1 endo-1,4-beta-xylanase (Dictyoglomus turgidum) [pid:34.4%, q_cov:99.4%, s_cov:98.8%, Eval:7.2e-46]" /note="MGA_850" ORIGIN 1 gaagaacttg gcgagaaggt caccaagatc atgatgacca ttcccaacat tatcgacccc 61 agcgttccga taggcaagga tgactcggaa aacgttgaag ttcagcgcta tggcgagcct 121 gttgtacctg atttcgatat tccttatcat accgaaataa tggaaaagct gaacggaatt 181 gatcttgact ccgcaagaag agttgcaggc aacggattct actatcttat gggcgatatt 241 gcaagacttc actccgcagt tatcgcatat gcccgcgatt ttatgatcga ccgcggtttt 301 acttatgtaa ttccccctta tatgatccgc tccaacgttg ttacaggcgt tatgagcttt 361 gccgaaatgg acgcaatgat gtataaaatt gagggcgaag acctttatct tatcggcaca 421 tccgagcact cgatgatcgg caaatttatc gaccagatcg ttcccgaaac tcagcttccc 481 atcactctca ccagctacag tccctgcttc agaaaggaaa agggcgcaca cggcttggag 541 gagcgcggtg tatacagaat ccaccagttt gaaaagcagg aaatgatcgt tgtctgcaag 601 ccggaggaat ctcccatttg gtttgataag ctctggcaga atacagttga tctgttccgt 661 tcactcgata ttcccgtaag aactcttgaa tgctgctcgg gcgacttggc agacttaaag 721 gtcaagtcgg ttgacgttga ggcatggagc cccagacaga agaagtattt cgaggttggt 781 tcttgctcca accttggcga tgctcaggca agacgcctta aaatcagagt taacggcgaa 841 aagagcaaat atttggctca tactcttaat aacaccgttg ttgcaccccc gagaatgctc 901 atcgcattcc ttgaaaacaa cctcaacgag gacggcagcg ttaatattcc tgtggctctt 961 cgtccttaca tgggcggtaa ggagaagatt ggcggataat atcaatcgaa cggaaggcac 1021 cgagcgatag cccgttcggg ccacctgttt gcactgttcc tacggaacgc gcttcgcaga 1081 cggccctcac tcccactgat ccctcacatt tacggaggaa cattatgaaa acattaaaag 1141 aagcatataa gaactacttt gacatcggcg cagcggtttc tcctcattgg ttggaggaag 1201 cggctgatac cctcaaggca catttcaact cgataacctg tgaaaaccat atgaaatata 1261 acggaattca cgagcatcag tatgaaagac cgcctttcaa acgccccaag ccgggcgaaa 1321 agccggaaat gccgaaaatt gaaatcgtca accgcgagcg ttttgttcac ccttgtcttg 1381 agcttcacac cgaaggcgcc gacaagatct ataattttgc ccttgccaac ggcttcaagc 1441 tccgcggaca cacccttgct tggcacggct catacccttg gggaatcttt gaacagttaa 1501 ctcccgagga gcttgaaaca aacctgcgcg agcatatggc ttttgttgcg aaaaaatatc 1561 ccgcctgctg gtgctgggat gttgtgaacg aagttgccga cgataaacac ggtttgttcc 1621 ttcgcgagac cgttttcaaa aacaagtttg gtgaagatta ccttatcaag atttattcca 1681 tggcaaggga atatttcccc gacaccgtgt ttgtatgcaa cgattataac gaatgggtgc 1741 cccacaagcg cgagtccatc ttgaaaatcg ttgacaccct caaggcaaac ggcttggttg 1801 atgcaatcgg ctgtcaatgc cacgtttcgg catttatgac cgacgaggaa tttgaccaga 1861 tcaaatatgc atacgaagca tatgcaaaga cgggtcttag gatccatgtt actgaaatgg 1921 atgtcaactg cgtaagctgg aaggatccca aggaggtcac acccgaaacc cttgaaaaac 1981 aggctgatgt atatgacaag atgtttaagc tcttcagaga ttataaggat gtcattgaca 2041 gcgtaactct ctggggcgta agcgataaac acacatggct caacggcttc aagaatcacg 2101 gaattaagaa cagtgcacta ttatttgaca cagaatataa tcccacttta gcactttcac 2161 gaatcgtcga tttttgaccg cttttcggtt gacttaggtc ggtttgtgtg ttaacatatt 2221 taaaataata gaattttggg aggatgttat atgctcgaaa caaatgctga tatcaagttt 2281 ggcaaagaag gcttgacctt tgacgatgtt cttttgattc ccgctgaatc aaatgtaaca 2341 cccaatatgg ttagccttaa aaccaccttg tgcaagggaa tcgaactaaa tgttccgatt 2401 atgacctctg ctatggacac agttaccgag tcgaaaatgg caattgctat cgcccgtgaa 2461 ggcggtttgg gaattattca taagaatatg accattgaaa gacaggctga // LOCUS sequence184 2510 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence184 VERSION sequence184 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2510 /mol_type="genomic DNA" /organism="" /note="sequence184" CDS complement(454..855) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIDEGHIVANQSVNHYSMPELTVEEMRSEIMGLHEYMIENFGVQM TYFRPPKGEYSELSLAVTGDCGYKTMLWSFAYADWDPDTQPEPASSLQKMIDRLHPGAI YLLHAVSETNAYVLGDFIDAAREAGYTFK" /locus_tag="LOCUS_6370" /note="WP_009897898.1 delta-lactam-biosynthetic de-N-acetylase (Clostridioides difficile) [pid:48.5%, q_cov:100.0%, s_cov:43.6%, Eval:1.5e-30, partial hit]" /note="MGA_852" CDS complement(977..1423) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKTKLLALVLSFALAAMTLTACAEIDDGRYNEGNPVTENPAITQP TDPDNLVSSAPTVSSEETTTTVSEPEPLPETSLTDVSDAIEELYVTGQWDYATLSTEGD GFGHGSHYDDANRPSGARRFNNGYSQYNATAMDQTDEKIITLTF" /locus_tag="LOCUS_6380" /note="MGA_853" ORIGIN 1 gacattttcg ccgcgcattg ttcatgattt gaggtcgatt atacagaact ttaaacgcgg 61 gtcgatcatc cttgcaaggg ttgctcccgc atttccgcag aggatgatta taatgtcata 121 gtcgggcata taggagcctc ctttggcggg gttgttggaa ggagcgaggc gtggcagaca 181 cggcgatgcg ccgaaggtgc atcggtttgt ggcgtgccgt gccgagcggt cagatgatgc 241 aaatgtttga aattcggcgg tttgcttgca aatttgcggc gatgccgcaa aagccgaatt 301 tacagcggcc gtcaagaatt ttcggtttct gcaaaagtga ttcggccgct tggaggcgtg 361 gctgacacgg cgatgcgatg aaattgcatc gcttgtggcc tgccgtgccg agcggtaaaa 421 aagcagatga ctattgccat ctgcttttgt ttgttatttg aaggtgtagc ctgcttcgcg 481 ggcggcgtca ataaagtcgc ctaaaacgta agcgttggtc tcagataccg cgtgcaacag 541 atatattgca ccggggtgaa gcctatcgat catcttttga agcgatgaag caggctccgg 601 ctgagtgtcc ggatcccaat cggcataagc aaagctccaa agcattgttt tatatccgca 661 gtcgcctgtc acagcaaggc taagctcgga atattcgccc ttgggcggac ggaaataggt 721 catttgaacg ccgaagtttt caatcatata ctcatgcaag cccataattt cggatctcat 781 ttcctcgact gtaagctcgg gcattgagta atggttgacc gattggttcg caacgatgtg 841 accctcgtca atcattcgct gcaccagctc aggctggcgc tcggcataat cctgaacgat 901 gaagaagatt gctcttacgc ccttttcctt aagggtatca agaatctgcg gagtgtagcc 961 gttttcataa ccctcgtcaa aatgtaaggg ttatgatctt ttcatcggtc tggtccatcg 1021 ccgtggcatt atactgcgaa tagccgttat tgaaccttct tgcaccgctt gggcggttgg 1081 catcgtcata atgcgagccg tgtccaaagc catcgccttc ggttgaaaga gttgcataat 1141 cccactgacc tgtgacataa agctcctcga ttgcatcgga aacatcggtc aaagaggttt 1201 cgggcaacgg ctcaggttcg gaaacagttg tggtggtctc ctcgcttgaa accgtcggag 1261 ctgaacttac aaggttatcg ggatcggtcg gctgagttat ggcggggttt tcggtaacgg 1321 ggtttccctc gttataacgt ccgtcatcaa tttcggcaca ggctgttaaa gtcatcgccg 1381 ccagggcgaa cgacaaaaca agtgccaata atttagtttt caaaactgta ttcctcccct 1441 ttcgcagatt gcgcgaaaac atatacaaat cggaataccg ctgtatcttt tttgagtgtg 1501 ccgaagttcg gcacgctaat atattgtgca agtaaaagaa aaatatcagc ggaaaaattt 1561 gttgaaattt gtcgctgata ttattataaa ctaaacattt gaaaaaatca attacaaggg 1621 tgttacaaaa aataagcctt cctcataaga ggaaggcttt agcgcatttc gtttattctc 1681 ttatcataaa ctcgcagatg gcgtagtaaa tctccgagga gccttcgaca gaatactcct 1741 tgatgaggcg gtatttgccg gggacaagct cgccgtagta gtttgtccaa tcaatgtgga 1801 agtcgtaact ctgaccagat tctaggacaa tggcctcggc ggggaatgta acaattccga 1861 tgtcgatgta gtgccactcg ccgtccttga atatctcgat cacatagctg ttgcctgttg 1921 tgatgggctt ttcgttgccg ttgagcattt taaactcggc accgtttgcg gtaagcgaac 1981 cattaacgat ttcgaaattg acgagacttt ccaaggactc aacagggtct tcaaccaata 2041 ttccttcctc aacctcgacc tcaacctcaa tttcagcttc ttcaacgatg atgccttcgt 2101 cggtatcaac gtacttgaaa tcctcatcgg tcaaggaatc ggggttagta ggatcgccgt 2161 ccaacaggat aacagcaaaa gcatataaag ctgtaggcga tacttcagga atatccggca 2221 catggcatac ggctacgcag actttttggc caaccataag agaatcagcg gtaatttccg 2281 tggcaccagg ccagtagcct gatcttatca acgtactctc actaacataa aagtatgcat 2341 tatctctgta attgggagga ttgtcgtcgt ttggtctgat cataatcttt acataaccat 2401 tatctgattc attgagctca atgatttttc cgtaaatgaa agcaacttca tcaagggcgg 2461 cagcaactat ttcacacttg tcgttgtacc atttgtcgaa tgtttccgaa // LOCUS sequence185 2508 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence185 VERSION sequence185 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2508 /mol_type="genomic DNA" /organism="" /note="sequence185" CDS complement(433..1326) /product="AAA family ATPase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_193500740.1" /transl_table=11 /codon_start=1 /translation="MQYLDSFTLPTRDREEQFLMFSHNHKLEMSCYASSLYPFGIFPEK RLNRIDFEPITVFCGSNGSGKSTLLNVIAEKLSVPRSAPFNKTPLYEEYLRFCEANLRF GSRLPKGSMIITSDDVFDYLLDIRAVNEGVDNRREDLFEEYNDFTDPKEPRFQMSSLED YDELKKRNLARSRTKSKYVSAQVKREIRTRSNGESAFLYFTDRIRENALYLLDEPENSL SASLQLELAEFIENSARFYGCQFIISSHSPFMLAMKGAAIYDLDREPAERVKWTDIENV RIYHKFFEKYRDDFGR" /locus_tag="LOCUS_6390" /note="WP_193500740.1 AAA family ATPase (Gemmiger gallinarum) [pid:50.9%, q_cov:98.7%, s_cov:97.6%, Eval:6.7e-79]" /note="MGA_856" CDS complement(1327..1935) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTLGEYLFNPCGASSLPYDKALAVKIPLNMTVLHHRDFCSALLEK YIDEPYFRLIHRLEHIEDVSLPKGFVLSAVSSEQLVSQINSCYEDIGITKDSLSAFPAE MTVVVIDKSCGKIAASGLAKTYPTANEAALEWIQTSQEYRSRGLGRYVVCELLKRLRPR VEFVTVSGRCNNPHSPERLYRRCGFRGGDIWHILTEKEK" /locus_tag="LOCUS_6400" /note="MGA_857" ORIGIN 1 cctgttgcaa caaggcggca gataacttca agaccgtgac cgaaaacggt gccgggcaga 61 acttccatag tcgcattgtc aacatcagcg ctgacataat gggtcttgat tcctgcttcc 121 ttcaaaaggt tgaagtaata tacggaagtg cgcagatttg ccttgccgat gccctcaatg 181 gtcaagccga cgctgttctc tccgggatcg aaaacgccgt ccttgccggt gcagtcatcc 241 ttgaacttga gcattacgtt gccgttgtca aggctgtaaa catccttggt tttaccctca 301 tagatcttct tcataatttt tgaactcctt taatgtcgag tttacttcac tttttcaagc 361 gaaaccttac ataaataatt taaccgcgaa agcgctgttt tgtcaatatt tttggtgcaa 421 aaagtcagcc tttcacctgc caaaatcatc gcggtatttt tcaaaaaatt tgtgataaat 481 tctaacattt tcaatatccg tccatttcac cctctccgca ggctcgcggt caaggtcata 541 tatcgccgca cctttcatcg ccagcataaa gggcgaatgg cttgaaatga taaactgaca 601 gccgtaaaag cgggcagaat tttcaataaa ctcggcaagc tcaagctgaa gcgaggcgct 661 caggctgttt tccggctcat cgagcaaata gagcgcattt tcgcggattc ggtcggtgaa 721 atataaaaat gcgctttcgc cgtttgagcg ggttcttatc tcccttttaa cctgtgcgct 781 gacatatttg gattttgtcc tgcttcttgc aaggttgcgc tttttcagct catcataatc 841 ctcaagggag ctcatttgaa accgcggttc tttggggtcg gtgaagtcgt tatattcctc 901 gaaaaggtcc tctcggcggt tatccacacc ctcgttgaca gcgcggatgt ccaaaagata 961 atcaaaaaca tcgtcgcttg tgatgatcat actgcccttc ggcaggcgtg agccgaagcg 1021 caaatttgcc tcgcaaaaac gcagatattc ctcatacagc ggggttttgt tgaatggcgc 1081 cgagcggggc accgagagct tttcggcaat gacattcaaa agcgtcgatt ttcccgagcc 1141 gtttgaaccg cagaaaacgg ttatcggctc aaagtcgata cggttaagcc tcttttcggg 1201 gaaaatgccg aagggataaa gcgaagacgc atagcacgac atttcaagct tgtggttatg 1261 ggaaaacatc aaaaactgct cttccctgtc gcgggtcggc agagtaaagg aatcgagata 1321 ttgcatttat ttctcctttt ctgtcaaaat gtgccagatg tccccgccgc gaaatccaca 1381 tctgcgatag agcctttcgg gcgaatgggg gttgttgcac cttcccgaaa cagtgacaaa 1441 ctcgaccctc gggcgaagtc ttttcaaaag ttcgcatacc acatatcttc ccagtcccct 1501 gctgcggtat tcctgcgagg tctgtatcca ttcgagggcg gcttcatttg cagtcggata 1561 tgtttttgcc aagcccgaag cggctatctt cccgcaggac ttgtcgatta caacgactgt 1621 catctctgct ggaaatgccg aaagcgaatc tttggttatg ccgatatcct cgtagcagga 1681 gttgatttga ctcaccaact gctcggacga aactgccgat aaaacaaagc ctttgggcaa 1741 agaaacatct tcaatatgct caaggcggtg aatcagccga aaataaggct cgtcgatgta 1801 tttttcaagc aaggcagagc agaaatccct gtggtgaagc actgtcatat tcagcgggat 1861 cttaacagca agcgccttgt cgtaaggaag cgaagatgcc ccgcaggggt taaaaagata 1921 ttcacccaat gtcatcaaaa agtccccctt tcggtaatta tcaaaccaag tataccttaa 1981 aactgcccat atgtaaacag cccgaatcat ataactgtcc cgaacccccc cacaaatgtt 2041 gattttcagc agagaatttg gtagaataga ttcataatac agcctgtcac aaaagcgttt 2101 tttccgccgt agtatatatc agtacccaaa cacctttttg aaatctttgg agatctgata 2161 tatgcaaaca gttatttttg ccgctctcgg cgtcggcggt gcaacaatga taggcgctgt 2221 gattggattt ttgttcaaaa acatctcgaa acggttttcc gacattgttt ggtcattcac 2281 aactggcata atgcttgccg catcggtcat cgggttggtt ttgccctcga ttgagcaggg 2341 cggccgcttt gcagttttaa ttaccgttgc cggaatattt gcgggcgcgt ggagcttaaa 2401 cctgcttgat aaaacagtgc cccacttgca aaaaatgctg ggtgcgggca caaatgaagg 2461 ccatggtgta agcgcagata aggttttgct ttttgtcgcc gctatcgc // LOCUS sequence186 2507 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence186 VERSION sequence186 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2507 /mol_type="genomic DNA" /organism="" /note="sequence186" misc_feature complement(888..>2507) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_013389627.1:discoidin domain-containing protein" /note="WP_013389627.1 discoidin domain-containing protein (Bifidobacterium bifidum) [pid:29.7%, q_cov:38.2%, s_cov:11.3%, Eval:3.4e-22, partial hit]" /note="MGA_860" /locus_tag="LOCUS_6410" ORIGIN 1 cttgaggtag ccataggcat tttctccctc gacgatcatt gaacagctct taacgcctgc 61 gtcggtgccg tcaagctggt caagaatgga tactttatat ccgtgagcct caccccagtg 121 gatatacata cgtataagca tttctgtcca gtcctgggct tcggtgccgc ccgcgcctgc 181 gtggaagttc aaaatggcgt tgttggcatc atactcgcct gtaaggagtg ttgaaagggt 241 gatcttgtcg atcttttcaa caaagccttc aagctcaagc ttaatgtcat ccaaaagcga 301 ctcgtcgtta tcttcataat acatttcaat cagcgttgca atatcatccg cctgcatatt 361 cagcttgcgg tcatcctcaa cgcggttttc aagcatcttt gtgcgttgca atatcttctg 421 cgacttgtcc atatcatccc agaagccggg ctcagccgcc ttgttgtgaa gctgttcaat 481 ttcttccttc gccgcgtcga tattcaaaac gctgtgaagc tccttgagct tgggtttata 541 ttcggaaagc tgttgtttga gctcgtcaat aagtaacata atttcctcca aatgtgagaa 601 tttgtataac tgatatatta tagcacaaag atgatgaata tgcaagtggg gagaaaggtg 661 gggcggaggc cgttgtgacc tgaaagggca cgacggaggg gacccaccgt tgggagcaaa 721 catagccgcc gtctgcgagc gcgttccgca ggaacagtgc cgcaggtggc agcggtcaat 781 tagcgagcta ctgcttgcgg gcctctccca tcgggagagg tgtcagcgaa gcggacggag 841 agggaaaaaa ctcagctccc cacttttcgt gaggagccga agcttaatta tctttccaat 901 ttgatggata caaggtcgaa gtcgcaaccg ggcaggaaga caagcttcag atctgccttg 961 ccgcagacct tttcaagatc gaaacgcttg gtaacgattt catcggttcc gccaaactca 1021 acaatctggt tgttggagcc ttcgggagtt gcaaaacgga tatgaacggt atcgttttcg 1081 ttgtgagttc tgcctgtaat ctcaattgcc gagattccct cttcaccgaa atcgaagccg 1141 ttgaattcaa cggttacgtt gtttccgatg tttgcgatca tatcttcctt gacggtgaag 1201 gtgtcgccat aaattccgtc gcggtcaagt gcggaaatcg tttcaccgat tcgggaagcc 1261 tcatcaaact tgaagccctt gaatcgaatc tgcgttttga atacaaagcg aatgctctgt 1321 gtaccggtca gcttcttatc cagcttgaag gtctgatact gatagtggtt ccatctataa 1381 ggcttctgat atacacagct gccaaacaaa ttgccatcgg cgtcggtaac atcaaacggg 1441 acgggatcgc cgttattata aatacctacg gtgagcacat ccgagcctgc cttgccgaat 1501 tcaacattgt caaactgaat atagcattcg ccccagaggg tctgaacgcc gccctcgaaa 1561 acattctgca atgtttcggt tgcactcgaa taaagcgatg cgctgacgat gtcgccgtaa 1621 ggattgaagc ccgcagggcc gaagccgtcg tttgacattt ccatttcgga aattatctcc 1681 tcataaggcg agccgttttt gcaatatgct cttaagcggt attcgccgtc gccctttgcg 1741 gtgatgattg cttcgccgtt ttccttttta atttcaacaa cgtttgtttc aatgcctgca 1801 tcggtaatcg ccttgaagcc gatgtcatcc aatgtaaagg ttgtaatctc gggataaagc 1861 ttaacagttg ccttaactgt cttgttgtcg ggggtgagct tgttcgattc aaccataagc 1921 tcgatttttc ttacgggaat ctcgcccgag ttttcggtct ttgagttttc aaaaccacag 1981 caaacctcgg ggttcttttc cgattctatt gctttaagaa ccaacttcgc atcgggaaga 2041 ccctttgagg atacaaccat ttcaacatcg cctgcatagt cctttgcggc aatcatcgca 2101 agaagcttgc cgttaaagag cttacggcag gttcccttat actggtcgta gtcggtggag 2161 tcgccgttgt cggtaccgac aagtcggcct gcgcccgaaa cggaaatttc aactctcgag 2221 cggtcattat caacagggtg gccgtcctta tcgagcattg agatctcaac aaagatcata 2281 tcctcgccgt tggctttaag ctcctgcttg ttgggaataa gagaaattgt tgcagcatcg 2341 ccgggggtat atcttgtcat ctcgcagaca gcgttgcctt cttcgtcata gccgacagcc 2401 ttgatgctgc ccttatgata aggcacctgc caacggcctg taagctcggt tccgtcaacg 2461 tggttatgct cataaatgcc catagattcg ccgtttacga acagctc // LOCUS sequence187 2505 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence187 VERSION sequence187 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2505 /mol_type="genomic DNA" /organism="" /note="sequence187" CDS 165..1676 /product="carboxylesterase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011086777.1" /transl_table=11 /codon_start=1 /translation="MLRKVKTENGWVRGIEAADPRITAFKGIPFAAPPIGENRWRAPQP CADWEGELDCSRFAPIGMQDTPGIGDNLYNREWHVDHEIPMSEDSLYLNIWTNAKSADE KLPVLVWYFGGGLQWGYTSEMEFDGERIARRGVVVVTVNYRLGVFGFLAHPELTAQQPD APTNFGSLDQQAGLKWVRRNIAAFGGDPDNITIAGQSAGGGSVMSQMTCPHNFGLFKRA IVQSALISSPYGGSHFGRPADLAAVEKNGEKFLECLGVKTIEEARKLDAFYIRNKYGEF AANNPRFFTIQDNKFSYGDPQKLFLEGKHADVDVMFGCTQDEFLSSIKANDENELKAKA VEIFGEKAQEFLSFNEAHTTDGKGNYAYVNGIEIAAKKLLEKNIENGNDKNGYFYCFDV PMPGWDNPGSFHSSELWFFFESLAKCWRPLTGKYYDLARHMCNYYCNFIKTGDPNGDDI DGTPMAKWNTYSEDAPCGMRFTPDGCVPETENKAFTRFLIDHTKK" /locus_tag="LOCUS_6420" /note="WP_011086777.1 carboxylesterase family protein (Bradyrhizobium diazoefficiens) [pid:34.0%, q_cov:93.4%, s_cov:89.5%, Eval:5.5e-56]" /note="MGA_861" ORIGIN 1 acccacgaag tgggtgtgac ggaggggacc cgcagctcac atactgctcg ctttctcctt 61 cgggcgttac acataaagat gaagactata aaaacctatt gtcatctatc cgaaaatgtt 121 gtataattga agtggaacat tataattttg gaggaggaac acttatgtta agaaaagtta 181 aaacagaaaa cggctgggtt agaggcattg aagccgcaga tccgagaatc accgctttca 241 agggcattcc ttttgctgct ccgcctatag gcgaaaacag atggcgcgca cctcagccct 301 gtgctgactg ggaaggcgag cttgattgct cccgctttgc gcctatcggt atgcaggaca 361 cccccggtat aggcgacaac ctttataacc gcgagtggca cgttgaccac gagatcccca 421 tgagtgagga cagcttatac ctcaacattt ggacaaacgc aaagagtgca gatgaaaagc 481 ttcctgtttt ggtatggtat ttcggtggcg gacttcagtg gggatacacc agcgagatgg 541 aatttgacgg cgaaagaatt gcaagacgcg gagttgttgt tgtaaccgtt aactaccgtt 601 tgggcgtttt cggattcttg gcacaccctg aactgaccgc acagcagcct gatgcaccca 661 caaacttcgg aagtcttgac cagcaggcag gactcaagtg ggtcagacgc aacattgcag 721 cattcggcgg cgaccccgac aacattacca ttgcgggaca gtcggcaggc ggcggaagcg 781 ttatgagcca gatgacctgc cctcataact tcggactttt caagcgtgca atcgttcaga 841 gtgcgcttat cagctcgcct tacggcggaa gtcatttcgg cagacctgct gatttggctg 901 cagtcgagaa gaacggcgaa aagttcctgg aatgcttggg tgttaagaca attgaagaag 961 caagaaagct cgatgcattc tatatcagaa ataaatacgg agaattcgcc gcaaataacc 1021 ccagattctt taccattcag gacaacaagt ttagctatgg cgacccccag aagctcttcc 1081 ttgaaggcaa gcacgctgat gttgacgtta tgttcggatg cacacaggat gagttcttga 1141 gttcaattaa ggctaatgat gaaaacgaac tcaaggctaa agcagttgaa attttcggcg 1201 agaaggcgca ggagttcctt tccttcaacg aagcacacac caccgacggc aagggcaact 1261 atgcttatgt caacggaatt gaaattgcgg caaagaagct tttggaaaag aacattgaaa 1321 acggaaatga caagaacggt tacttctatt gctttgatgt tccgatgccc ggatgggata 1381 accccggaag cttccattca agcgagcttt ggttcttctt tgaaagcttg gcaaagtgct 1441 ggcgtccgct gaccggaaag tattatgacc ttgcaagaca tatgtgcaac tattattgca 1501 acttcattaa gacaggtgat cccaacggtg acgacattga cggcacaccg atggcaaagt 1561 ggaataccta ttcggaagat gcaccatgtg gtatgagatt tactcccgac ggatgcgtgc 1621 ccgaaaccga gaacaaggca ttcacgagat ttttgattga tcatacaaaa aagtgatcta 1681 aatttaaaag ccacccgaag gggtggcttt tttgttgggt aattgcagga agcgagccgc 1741 atggggtttc agcagaaaag ttctgccaga aggcgtttaa tttaccgctg agagcttacc 1801 gtcatagtag acatagcctt gggagtcgac gacctcgcct gtgtcggcgc gtttaacggt 1861 gatggacaaa tcgcatttgc ggtcgccgaa ctcaaccatt ccgctggtga cgttatatgt 1921 cagcctatcg cccaaattct gaaggaattt tgaagcggta tagttatcgg tcaaatatga 1981 gcacttgcgg cggacgttga tctcaacatc gaagtcatcg ccatataaaa gggtgagctt 2041 atcaataagg tttgagtggc tgttaaggtt gtcaatttta aactgcaaat attcctcata 2101 atcagcgatc cagctttcgt tttgcgagta gtcctccata taataatgct cggtgatgta 2161 ctcgcccagc catgatgtgg ctttgcaggc gcctgtgaaa ttgaggtgat tgcggtcggc 2221 gtaaatgtct gtcgagaagt ccagcaggtt catatttagc atatttacat agtaggctct 2281 gaggtagtca tcaacaacat cgtggatgga gtttgcagac ttctgacagc ttgcatctgc 2341 agggaaaggc agatagatgc acaaaacctt gatttggttt tcgtcgcaat aatcgagaaa 2401 atcaatgaaa tagtcgtagc atacgctgtc aagctcgcgg gtctgttcct caccgatgga 2461 attatatccc actcccccgg cgtggccgac aagcatctgc gctcc // LOCUS sequence188 2490 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence188 VERSION sequence188 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2490 /mol_type="genomic DNA" /organism="" /note="sequence188" misc_feature <1..1065 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011039175.1:glycoside hydrolase family 3 protein" /note="WP_011039175.1 glycoside hydrolase family 3 protein (Xanthomonas campestris) [pid:35.7%, q_cov:83.1%, s_cov:33.7%, Eval:1.2e-40, partial hit]" /note="MGA_863" /locus_tag="LOCUS_6430" ORIGIN 1 cttaaaaacg acggtatttt gccattggat gcctacaaga tcaacaccat cggtgtagtc 61 ggccccaatg cgcagaacat cggtgccctc aacggcaact atcacggcac agcttcgcgt 121 tatgaaaccc ttcttatggg tattcaggat gcatttgacg gcagagttct cttcagtgag 181 ggatgccaca agtttgctca gaagaccgaa ggtctggctt tgccctatga cagaatcagc 241 gaggcagtaa tcgttgccga acattcggat gttgttgttt tgtgcgtcgg cttggacgaa 301 tcaatggaag gcgaagaagg cgacaccggt aacgcatatg cttccggcga taagggcgac 361 ctcagacttc ccgagccaca gaagagattg gttgatgccg ttctcgaagt cggcaagcca 421 acaattgttg ttttggcttc cggctctgct ctcaatattg aaactgacaa ggaaaacgcc 481 ctcatccagg cattctaccc cggctccgaa ggcggcaagg cagttgccga catcattttt 541 ggcaaggtta gcccctccgg caagctccct gtaacattct acaccgatat agaatgtatg 601 cccgaattca ctgactactg catgcgcgag cgcacctatc gctataacga taactccaag 661 ggcaatgtgc tttatccctt cggcttcggc ctttcatatg gcgacgtcaa ggttaagagc 721 gctaccgcat ctgtcaccga cgatgttgtc aaggcagttg taaccttgaa aaatgacggt 781 cttgcttccg gcgatgtttt gcaggtatac ttcaagtcgg aatccaagga tgctgttaag 841 aaccatgctc tttgcgcatt caagaaggta tatgttcccg cagacgaaga aaccgtaatc 901 tttatggata ttcccgttaa gaacctgacc gttgttaacg atgacggtgt aagatatctc 961 gataaatctg caaagaccac cctttacttc ggtacaagcc agcccgatga gctttccgtt 1021 aagctgggcg gcaaggcacc tgtagcagtt gaaatcaagt tataatcagt tctaagaaat 1081 taggggagcg caggacgttc cccttatttg aaattttagt ttttggaaca tttttcggag 1141 gttaattttt atggtatacg gcaaaaaccc ccttacccgc ggcgactttc ccgaccagga 1201 tgtcatccgc gtcggcgata cttactatat ggtatccacc acaatgtact tcatgcccgg 1261 cgcggtaata ttgcgctcat atgacctcat caactgggag atcatcactc atgtttatga 1321 cgagctggat gataccgaac gacagcgcct cgatggcgat aagcacgcct atgccaatgg 1381 aatgtgggca cctgtgattc gttaccacga cggcgttttc cacgttatct ttatcgcaaa 1441 cgacacccac aagacctatc acttcaccgc aaccgacatt atgggtccct ggaccaagtc 1501 atatattgag ggattctatc acgatacatc ccttttgttc gatgatgacg gcagagtata 1561 tttaatgtac ggcggccgcc acatccatct caccgagatg gagcctgacc tttcaaagcc 1621 aaaggcaggc ggagttaaca aaattgtaat tgaagacaaa cccggccgtt tcctcggcta 1681 cgagggatgc catctttata aggtcggcgg caaatattac gcattcttca ttcacgctca 1741 ccccgaccgc tggttcagaa ccgaggcttg ctttatggct gaccacattg aaggcccttg 1801 ggtaggcgcg gatgtaatcg actataacct tgaagacaac aagtgcggcg ctcccggtgt 1861 tgctcagggc ggtattgttg atactcccga cggcagatgg tttggcgtta tcttcggcga 1921 ccgcggagcg gttggaagaa ttcccaacct tgttccgatg cattttggcg aggacggttt 1981 cccaatcttc gacaccccta caattaatgt ctgcaacaca tctactcgtc ccgaccataa 2041 gtatgcaccc attttcatca gcgacagctt tgactatgag ccggacgaaa atggcaagat 2101 ccgccttaat ccctcttggg agtttaacca cattccaaag aatgactact ggacagtcaa 2161 ggactccaag tttattctca ccaccgaaaa gattgcgcca actgttgagc ttgcaagaaa 2221 cacccttacc cagcgtaccg tctggcctga gtgcgaagca attgtcaccg ttgacggaac 2281 aaatctcaac gatggcgact gtgcaggtct tgcaataatg cagcacttct atggtcttgt 2341 gggcgttgca aaggaaaacg gaaagtacta tgccgttatg cgttgccgtc agcccgattt 2401 tgagggcgag cgtgagcgcc tcgagcttga cagcccgatt ttgcaggtta aggcgaaagc 2461 gcacttcggc aatcatcccg aatatggcga // LOCUS sequence189 2484 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence189 VERSION sequence189 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2484 /mol_type="genomic DNA" /organism="" /note="sequence189" ORIGIN 1 gcaaagccga tgcggtcgat ccaccactta tagccgtttt tctgcatatc agcccagtta 61 tataaaggat ttccccaaag ctgaccgtcc aaagcatatg catcgggcgg gcatcctgca 121 acgttgatgg gttttttctc ttcatcgagc tcgaaaagct caggctcaag ccaagcttca 181 accgagtcga gggcgcaata tatcggcata tcaccgatta tttcaattcc cttggagttt 241 gcatattttt tcagctcatg ccactgcttg aagaactcat actgcaagaa aatataatat 301 ccgattcggt ctgcaaggcg ctgctttgca tcggcgattg cttcgggctt tgcaagcctt 361 aaatcgtctt cccattctct ccagggcttg ccgccgtttt ccgctttaag tgccataaac 421 aagccatagt tttcaaccca cgacttatgc ttttcgagga acttgttata gtcctcatcg 481 ggtacaaatc tcttatatgc gatattaagg acatcaaaga cggtgttata gatcataccg 541 tagttgatat actgaggatg gtcgccgaac tgaacttttt tatattccga cttcttcaaa 601 aggccgtcag cctcaagtgt ttcaaggtcg atgaaatatg gattacctgc gtgaatggag 661 caggactgat agggcgagtc gccatagcct gtcggggaaa gaggtaagat ctgccaataa 721 tgctggcctg ctttaacaag gaagtcaacg aactctcttg cgtgttttcc cattttacca 781 atgccgtatt cgcccggaag cgatgcgatt cccagcaaaa ttccgcttgt tctcattttc 841 aaatcatatc ctttcaaaat gctcaaaaac ttttgtgcat caaatagcta atgatattgt 901 accaaaaacg gctgaaaaat tcaactgttg tcaataatat ttatgctata actatactat 961 tgaaaaattg tttgaaaagt agtatactga ttctatatca ttccatttcg gaggtcgact 1021 atgcccgata tatcaaatat cgacaagaat ttttactatg acggcaagct tggcgtgagc 1081 cttagcgaaa atgaaaccgt gttccgcgtt tgggcgcccg aagctgaagc cgttaaggtt 1141 ttgctttata atgaccagca caccctctcc cctttcgctg ctgatgaaat gtcaaagagc 1201 aaaaagggcg tttgggagat ttcatatgat aggagccttg agggcacata ttacaatttc 1261 agctattgct atggcggaaa atggcaggag ggtgtggata tatatgcaaa cgcctgcggt 1321 tgcaacggcg aacgcggata tgttgcagac ttttcaaagc tttcccctga cggctgggaa 1381 aacgacagct acgttaagct tgaaagctac gcagacgcgg tgctgtatga aacacatata 1441 agagattttt ctaaaaaccc gtcaagcgga ataagcgaag aaaaccgcgg aaagtttttg 1501 gcttttaccg aggaaaacac ccgctctatc gacggagaaa agacttgtct ttctcacatt 1561 gaggacttag ggataaccca cgttcatctt ttgcctgcgt ttgattatga aggcgttaac 1621 gaggcaaacc ccacagacta caactgggga tataacccga aaaactataa catccccgaa 1681 ggatcatatt caagtgaccc ctttgatccg agtgcaagaa tcatcgagtt taaaaagatg 1741 gtaatgtcgc ttcacaataa aggtatcggc gttgttatgg atgttgtata taatcataca 1801 tttgagtcct gcgattcgtg gtttgaaatt gcatatccga aatactatca cagatttaaa 1861 caaaacggca gtttttcaaa cggctccggc tgcggaaatg aaatggcgag cgagagaaaa 1921 atgtgccgca gatatataat cgactcggtt ttgtggtggg ctaaagaata tcacattgac 1981 ggcttcagat ttgaccttat ggcgctgttg gatgttgaca ccatgaacga aattgtcgac 2041 aagctcaaag agataaaccc cagcgtaatt atttacggcg agggctggac aggcggagag 2101 tgtatgcttg caggagatga gcaggcatcg accgcaaatg cgaaaaagac acccgatatc 2161 gcatacttca acgacagcta tcgagatacc attaagggca acagctttgt tgacgaagcc 2221 aagggctacg ccgcaggaaa tattcactgc aaggcaggtg cggttgcggg acttttgggc 2281 aaggtttggt gggcaggctc gcctttgcag actgtcaact attgcgaagc ccacgatgat 2341 ttgacccttt gggataagct ttgcgtgtct gcacccggag cgcaccttga tgaccacaaa 2401 aagatggcaa gattttcgct ggcgctggta tttttggcgc agggaattcc attcatccag 2461 gcaggacagg agtttattcg aacc // LOCUS sequence190 2482 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence190 VERSION sequence190 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2482 /mol_type="genomic DNA" /organism="" /note="sequence190" CDS complement(314..952) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEYIIIGLLLICIGLLIVLLGRKPKTDVTVREDLRGIEAMLKASN ELSVNQDKALREEISGALSRGQSRQAEDTERLTQSVIKQLTAMNETTASGLEKVRLATE QRLDKLQGVVDEKLSKTLNERLESNFKQIGDSVGELYKSLGELKNLSGGVSALNRTLSN VKTRGVWGEQQLGAILEQTMTPAQYDINFIKKRGSNDRFEFAIKMPNKG" /locus_tag="LOCUS_6440" /note="WP_012868945.1 DNA recombination protein RmuC (Thermanaerovibrio acidaminovorans) [pid:36.9%, q_cov:83.0%, s_cov:39.3%, Eval:3.6e-29, partial hit]" /note="internal stop codon at [314:316](-)" /note="MGA_868" CDS complement(994..1164) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTYIIILGLGLAFLYTLRDGLLVLQNKRDALEAQKAYPTNIIHAN GEQCNQNKLSA" /locus_tag="LOCUS_6450" /note="MGA_869" CDS 1334..1888 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSSFKLIAGVAIPDTTKLKREYKQSRGRLYLTLSAEDYPAFWRES VKLLGEGVFFFVEIPDDNDQTRLYYLDNCTASVAQAILKRYGSVLYSDGVIKFGFGSHS TEDEIYMMDYQTLSIYSQNLAPYEELLEKMGYLKNKNALLAWDILSEDNAGECTCIEAD DESYVDMINNLIDVGMYPAQG" /locus_tag="LOCUS_6460" /note="MGA_870" ORIGIN 1 atgcggtaac tgtggtggga cctgtcacaa aaatgtgctg ctgtgtctga caccattcgg 61 tcagcccggg aattctcaaa acctctgcat ataaaccctc tgtgggcagg aacataactg 121 caaagtcggt ggtgtttggc acatcaatat acttcgagct gatggtcttc gcttctgttt 181 taattctcgc ttcaagctcc ttggttgcgg catcaaccgc atctctatct cccgattcag 241 ccgcaagagc aattcggtca tatatatctg ttggtagatt cgattcgatg ggcaaataag 301 taaaatctcc cgactagccc ttgttgggca tcttaattgc aaattcaaat cggtcattag 361 agccacgctt tttaataaag ttaatgtcat actgcgcggg ggtcattgtc tgctccaaaa 421 tcgcgcccaa ctgctgttcg ccccagacac ctcttgtttt aacatttgaa agggtgcggt 481 taagggcgct aactccgccc gaaaggtttt tcagctcacc cagcgattta tacagctcac 541 ccacgctgtc gccgatctgc ttgaagttcg actccagtcg ctcgttgagg gtctttgaaa 601 gcttctcgtc aacaactccc tgcaacttgt caagtcgctg ttctgttgcg agtcttacct 661 tttccaatcc cgaggcggtg gtttcgttca tcgccgtcaa ctgcttaatt accgactgtg 721 tcaatcgctc ggtatcctcc gcttggcgcg attgccctct cgataacgcg cccgagatct 781 cctcgcgcaa tgccttgtcc tgattaacgc ttagttcgtt ggatgctttg agcatcgctt 841 caatgcctct aagatcctct ctgacggtaa catccgtttt aggctttctt cccaaaagga 901 caataagcag acctatgcat atcaaaagca gtcctatgat aatgtattcc ataagttaaa 961 tctcccgtta ttttattgtc ggacggcaaa aaatcaagca gataatttat tttgattgca 1021 ttgttcgccg tttgcgtgta taatgttagt tggatatgct ttttgagcct ccaaagcgtc 1081 gcgcttgttc tgcaaaacaa gaagtccgtc acgaagagta tataaaaaag caagtccgag 1141 tccgagaatg ataatgtatg tcattatttt atcctcactt tcataataat aaaagttttg 1201 tcttttgtca atcggtggga tgtcccgcct gcatttacat tttattatat taaaagtcca 1261 aatattcgga caattaaaaa atgcttgcaa atatccgtcc aaaaaaccgt actcaaagaa 1321 aggaaaacgc catatgtcct ccttcaagct tattgccggt gttgcaatac ccgacacaac 1381 gaagctcaaa agagaatata aacagtcacg cggaagatta tatttaactc tatccgctga 1441 ggattatccc gcgttctggc gcgaaagcgt caaactgctc ggcgagggtg tattcttctt 1501 tgttgagata cccgacgaca acgaccaaac aaggctctat tatttggata actgcaccgc 1561 atcggttgca caggcgattt tgaagcgata cggctcggta ttgtattctg acggtgtcat 1621 aaaattcggc ttcggttcac attcaactga ggacgagatt tatatgatgg actaccagac 1681 tttaagcatc tattctcaga acttggcacc ctatgaagag cttcttgaaa aaatgggcta 1741 tttgaagaac aaaaacgccc tgctcgcttg ggatatcttg agcgaggaca acgcagggga 1801 atgcacctgc attgaagcgg acgacgaaag ctatgtggat atgataaaca acttgatcga 1861 cgtgggaatg tatcctgcgc agggataatt tcgcactccg tgcgaaatgt gcggataccc 1921 aacaaagtaa attttccgac ataagtcggt gaaaataaaa aataacaatt taggagtgta 1981 acaattatgg cttatattat cggcgttgat atcggtacca gcggcaccaa gaccgttctt 2041 ttcgacgaag gcggcaaggt aatcgcttca aaaaccattg aatatcccat gtatcagccc 2101 aagaacggct atgctgagca ggaccccgca gactgggcaa atgccgcagt taacaccatc 2161 aaggctgtta tggcaatcag cggcgttgac aaggacgacg ttaagggtat cggtctttcg 2221 ggacagatgc acggtcttgt aatgctcgat aaggacaatg aggttatccg tccttctatc 2281 atctggtgcg accagagaac agccaacgaa gttgaagaaa tgaatcagaa gctcggcaga 2341 gaaaagctca ttgaaatcac agctaacccc gccctcacag gctggactgc tgccaagatt 2401 ctctgggtca agaacaatga acccgaaaat tatgagcgct gccgtcacat cttgcttccc 2461 aaggactata tcagatttgt tc // LOCUS sequence191 2477 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence191 VERSION sequence191 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2477 /mol_type="genomic DNA" /organism="" /note="sequence191" CDS 213..1043 /product="prohibitin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011461868.1" /transl_table=11 /codon_start=1 /translation="MSKIFNKKTIIILLVAIVVIATVASSMTIVEAGHTGVVVTLGKVE DHVLQEGLHFKIPFIQEVVRIDNRITKLDVDTEAFSKDLQTVSTTIAINYRVDTSKSYS IYKNIGRNYESVLVIPAVNEVLKAIAAKYTAEESVTNRTLVSEGLVVGLNEKLNEIGLY VTDVNIINFDFSEAYINAIEEKQVAQQQLLKAETEKQTAITNAEAEAEATKIRAEAEAE ANRILAESITAELIEYQKIEKWNGELPVVSGGGTTPILDVSTIIADNAEVPAGE" /locus_tag="LOCUS_6470" /note="WP_011461868.1 prohibitin family protein (Desulfitobacterium) [pid:40.0%, q_cov:89.9%, s_cov:89.9%, Eval:1.7e-46]" /note="MGA_872" CDS 1046..1378 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKLESPINGRFHEVKSRIYHGVISGSISCELNGESNFVGRNSRC SVMVFERYSAFGGNRVSLSVTLYQDGDGPIHMSAIASGGSQAIFAKINTFSEESFLENI REVLAE" /locus_tag="LOCUS_6480" /note="MGA_873" CDS 1405..2148 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLLAVVLAAVMMLSLCSCAFGKAVTAYSLYSKAVKTIEEAGGF ETDCKITMSVAMFGESLDIPVNVNIKKNGEDYQLSTDMGTGAIKTTYAGGYVYVDYDSE SGVRYSLATESEAANELNAELNAYSIPKLTEELLEAVEVVKNEDGTKAISVSLTEEQAQ SMFGAAGIYEDFVFESIVLEMHFTENNELSTMDIAVDGQMIILGSELPGSIKCEYTFIN FGTAPEISLALSPDRYEDGGEYEAE" /locus_tag="LOCUS_6490" /note="MGA_874" tRNA complement(2191..2280) /product="tRNA-Ser" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0110" /note="Aragorn_11" tRNA complement(2318..2406) /product="tRNA-Ser" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0120" /note="Aragorn_12" ORIGIN 1 aattttgatc atcgccggta ttgagatcta taagcgattt ttccgcgatc ccgaataaaa 61 tgaaacaaat ttagccgatt tagacaaatg ccccattctg tggggcattt tcttattgac 121 ataagtcgtg caaaattgta ttatttatat cagtaagcag gcgtaaaacg ctaataatat 181 ataagtgata acacggaaag gaaaatgaaa aaatgagcaa aattttcaac aaaaaaacca 241 taatcattct tcttgttgca atcgttgtga tcgcaaccgt tgcaagcagt atgaccattg 301 ttgaagcggg acacacaggc gttgtcgtca ccctcggtaa ggttgaggac cacgttttgc 361 aggaaggcct tcacttcaag atccccttca ttcaggaggt tgttcgaatt gacaaccgaa 421 tcaccaagct ggatgttgac accgaagcat tctccaaaga ccttcagacc gtttccacca 481 ctattgcaat caactatcgc gttgacacct cgaagtccta cagcatttat aaaaatatcg 541 gcagaaatta tgaatccgtt cttgtaattc ccgctgtaaa tgaagtttta aaggcaattg 601 ccgccaagta taccgcagag gagtcggtca caaaccgtac ccttgtttcc gagggcttgg 661 ttgtaggtct taacgaaaaa ctcaacgaga tcggtcttta tgtaaccgat gtcaacatca 721 tcaacttcga cttctccgag gcatatatca atgcgattga agaaaagcag gttgcacagc 781 agcagctttt gaaggctgaa accgaaaagc agactgcaat cacaaatgcc gaagcagaag 841 cagaagccac caagatccgc gcagaggcag aagccgaagc aaacagaatc ttggcagaat 901 ccatcaccgc agagcttatc gaatatcaga agattgaaaa gtggaacggc gaattgcctg 961 ttgtttccgg tggaggtact acccctattc ttgatgtatc aactatcatc gctgataatg 1021 ctgaagttcc cgcaggagaa taaaaatggc taaacttgaa agccctatca atgggagatt 1081 ccacgaagtt aagtcgcgga tatatcatgg tgtaatttcg ggaagcattt cttgtgagct 1141 gaacggagaa agcaattttg tcggcaggaa ttcccgttgc agtgtgatgg ttttcgaaag 1201 atacagcgca tttggcggaa accgcgtgag cctcagtgtc accctttatc aagatggtga 1261 cggtccgatt catatgagcg cgatcgcatc gggcggaagt caggcgattt ttgcaaagat 1321 caatacattc agcgaagagt cattcttaga aaatattcgc gaagtattgg ctgaataaaa 1381 catacccgaa aggtgatttt gaaaatgaaa aaacttttgg cagtcgtgct tgcggctgta 1441 atgatgcttt ccctttgctc ctgtgcattc ggcaaggcgg taacggctta ttcattatat 1501 tcaaaggctg ttaaaacaat tgaagaagcg ggcggctttg aaaccgactg caaaatcacc 1561 atgagcgttg caatgttcgg cgaaagcctt gacattcccg tgaacgtcaa cattaaaaag 1621 aacggtgagg attatcagct ttcaaccgat atgggcacag gcgcaattaa gaccacctat 1681 gcgggtggat atgtatatgt tgactacgac tcggaaagcg gtgtcagata ctcccttgca 1741 accgaatcgg aagccgcaaa tgaactcaat gccgagctta atgcctacag cattcccaag 1801 ctgaccgaag aacttttgga agccgtcgaa gttgttaaaa atgaggacgg caccaaagca 1861 atcagcgttt ctttgacgga agagcaggca cagtctatgt tcggtgccgc aggcatttat 1921 gaggacttcg tgtttgaatc aattgttttg gagatgcact tcaccgaaaa caatgagctt 1981 tcaaccatgg atattgctgt tgacggccaa atgattattt tgggatctga gcttccggga 2041 agcatcaagt gcgaatacac attcattaac ttcggcacag ctcccgaaat cagccttgcc 2101 ctctctcccg accggtatga ggacggcgga gaatacgagg cggaataatt ataaaaagaa 2161 aagacaccct tgtgggtgtc ttttttgttt tggcggagaa agagggattt gaaccctcgc 2221 gccggtttcc cgacctactc ccttagcagg ggagcccctt caccacttgg gtatttctcc 2281 aaatagttgc cgtttggtga tataaggctg tatcgcttgg cggagagggt gggattcgaa 2341 cccacggtac gtcgccgtat cactggtttt caagaccagc tccttaaacc gctcggacac 2401 ctctccaagt gagctttaca gccttactat aatatcacat caatttgccc atgtcaagag 2461 ttttttattt attttcc // LOCUS sequence192 2472 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence192 VERSION sequence192 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2472 /mol_type="genomic DNA" /organism="" /note="sequence192" misc_feature <1..1074 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_164927193.1:PBP1A family penicillin-binding protein" /note="WP_164927193.1 PBP1A family penicillin-binding protein (Chlorobaculum tepidum) [pid:32.0%, q_cov:75.4%, s_cov:33.4%, Eval:2.3e-23, partial hit]" /note="MGA_875" /locus_tag="LOCUS_6500" CDS 1079..2197 /product="class I SAM-dependent RNA methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963546.1" /transl_table=11 /codon_start=1 /translation="MAQKLRLCCPCHFGLESVLSFEIKKIGGENLIVSDGRISFDGDPS MIARANIFLASAERVLVELGSFTAKTFDQLFEGVRALPLEQFIGKYDKFPVKGHSLKSQ LHSIPDCQAIIKKACVKRLEKVYGISRFEETGALYQIQFNILKDVVTVYIDTTGPGLHK RGYRKTSNDAPIKETLAAGIIDLAHVRSDSVVVDPMCGSGTLLIESAYKALRLAPGLRR KFVAQSWSIIPEEIWREQRSLALDSISKESQFKGYGFDIDPFAVDLSISNAKTAGVLPR IEVAQRDIVNHVPVKGAITICNPPYGERMLELKEAEELYKKMGQVLRPDRENPCYIISP HEDFETLFGKKADKKRKLYNGMLKCNLYMYFN" /locus_tag="LOCUS_6510" /note="WP_010963546.1 class I SAM-dependent RNA methyltransferase (Clostridium) [pid:45.0%, q_cov:96.5%, s_cov:96.2%, Eval:1.6e-86]" /note="MGA_876" ORIGIN 1 cagccgggtt catgcatcaa gccattggca tcatatgcct tggctgttga ccgcgacttg 61 atcacctggt cttcccagtt cttggattca cccttgctaa ttgaagatca aggttctgaa 121 aacggctacc ttgtctggcc gagaaactat tcgaccaccg gtgcatatac cacatcatgg 181 tcaagagatt ataacttcac atattccgcg cttcagcgct cacttaatac aaccgctgca 241 cagctcgtcg agcttctttc gcccagtgaa tgttttgagt ttttatacta caagctgcac 301 cttgattcgc ttacgcttta tcagaacgga cttaccgata ttgcacgttc tcctatgtcc 361 gtcggcgctt tgaccaacgg cgtttccttg caggagatta caactgcata ccagatattc 421 ggcaacggcg gaaaatatta tgattctacc tatatttcga gaatcatcga caacaacggc 481 gaggttgtat atcagcattc attcatcggt gaacaggtaa ttgacgaaag ctctgcgtat 541 gttatgaatc gaatgatgga aactgttgtt tccggttccc gcggtacggg ccgacttgca 601 cgccttgaaa attgtgagct tattgcaaaa acaggtacta cccaggactg ggctgacctt 661 tggtttgtgg gctgcactcc cgaatatgta acaggtcttt ggatcggcca tgacattccc 721 aaggaaatgg aaacctcgac cttctacggt tcctcgcaga tgtggaaaaa catcttcggc 781 gacatcgctg aaaatgagga tttgaaggag tttgaagcta catcaagcgt tgttcagcgt 841 gaatattgtg aggttaccgg tttaattgca ggaagcaact gcgccgatac cttaacaggt 901 tactataagc gcaccaacat tcctgcaacc tgttcgggtg agcatttaat tgatgacacc 961 atcattttgg acgattctgt aattgtcacc gaaggcgttg acaccctgga ttatgaaaca 1021 ttgacaggca acttgtataa ttatgtatat gaccttgtca gaacttggag ataaataaat 1081 ggctcaaaaa ctaagacttt gctgtccttg ccatttcgga ctggaaagcg tattatcatt 1141 tgagataaaa aagataggcg gcgaaaacct cattgtcagt gacggcagaa tctcctttga 1201 cggtgacccg tcgatgattg caagagctaa catcttcttg gcatctgccg agcgcgtttt 1261 ggttgagctt ggctcattta ccgccaagac ctttgaccag ctttttgagg gcgtaagagc 1321 actgcctttg gagcaattta tcggaaaata tgacaaattt cccgttaaag gccactcgct 1381 taaatctcaa cttcatagca ttcctgactg ccaggcgata attaaaaaag cctgtgttaa 1441 gcgccttgaa aaggtctatg gcataagccg ttttgaagaa acaggcgcgc tttatcagat 1501 tcagtttaac attttgaagg atgttgtaac tgtatatatt gacactacag gccccggtct 1561 gcacaaaagg ggatatcgca agacctcaaa cgatgcaccg atcaaggaaa cccttgcggc 1621 aggcataatt gaccttgcac acgtacgaag cgatagcgtt gttgttgacc cgatgtgcgg 1681 aagcggaaca cttttgatcg aatcggcata taaggctttg agattggcac cggggctaag 1741 acgcaagttc gtagcacaaa gctggagcat tattcccgag gaaatctggc gcgaacagcg 1801 atctctggca cttgattcaa tttcaaaaga atctcagttc aaaggatatg gatttgatat 1861 agatccattc gcagttgatc tttcaatatc aaatgctaaa actgcaggcg ttttgccgag 1921 aatcgaggtt gctcagaggg atattgtcaa tcatgtacct gttaagggcg cgattacgat 1981 ttgcaatccg ccttacggcg agcgaatgct tgagcttaaa gaagctgagg aattatacaa 2041 aaaaatgggt caggttttgc gacccgaccg cgaaaatcca tgctatatca tctctcccca 2101 cgaggatttt gaaaccttgt tcggcaagaa ggcagacaaa aagcgaaagc tatataacgg 2161 aatgcttaag tgcaatttat atatgtattt caactaaaaa taaaagtgcg attccaattt 2221 gggaatcgca cttttttgcg ttcagaccgc gccaacaaaa atcgcaaagc gaagttatta 2281 ttttgcgctc gctatttgca aacttaatcg gatatttcgc cataacaaat gtttccgtct 2341 gtctcggtga tagttaaatc tttaatctca aatataaaag tttctgtaaa gtgtttaaca 2401 tttacgatca cataattctc tgtatgtaca atatgccact cggtatcctt atatttttca 2461 aacaacacct ta // LOCUS sequence193 2466 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence193 VERSION sequence193 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2466 /mol_type="genomic DNA" /organism="" /note="sequence193" misc_feature <1..1236 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003357725.1:translation elongation factor 4" /note="WP_003357725.1 translation elongation factor 4 (Clostridium) [pid:63.7%, q_cov:99.3%, s_cov:67.6%, Eval:1.3e-153, partial hit]" /note="MGA_878" /locus_tag="LOCUS_6520" CDS 1259..1639 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKVLLSNKWLQFGISVFKVIYLIFIGALTVWTFLYDIRFDSEAA FYFLYIGLSVIFCVFMFISRQQFITRVMSMVLLLPVFLLILFNMAKPIIYLPCLAVSVF MFFACGSKANTKVIMGSLYLLM" /locus_tag="LOCUS_6530" /note="MGA_879" CDS 1703..2080 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLNSSVTDTSITSEYDMDRIERLNANSISPDGKYRYYILDVQDND RGKVIIVVEPNDRDINYRFFSLVEVGYTTRIAKYHTRGVTPDIEWLSGNKIRYRFGENA EWKTSTISPPTEKNYLRFLGV" /locus_tag="LOCUS_6540" /note="MGA_880" ORIGIN 1 aagcctttaa agtgccttat ttttgacagc tattatgact cttataaggg tgtaatcatt 61 tacgtcagag ttaaggaagg tacacttaaa gtcggcgaca ccattcgttt gatgtccaac 121 ggtgctgaat tccagactgt cgaagttgga tatatgggtg caacggagtt gataccttcg 181 ggtgaattga aggccggtga agttggatat atcacagcat ccatcaaaag cattaccgac 241 accaaggtcg gtgacaccgt tacaaatgca tttgcgcctt gcgatgaacc tttggcaggt 301 tataaaaatg ttcagccgat ggtatattcg ggtatttatc ctgcagacgg tgcaaagtac 361 ggcgacctgc gcgatgcact tgacaagctc aagctcaacg atgcatcgct gacatttgag 421 ccggaaacct cggttgcttt gggatttggc ttcagatgcg gattcttggg tctgttgcat 481 atggagataa ttcaagagcg acttgagcgc gaatataacc ttgaccttat tacaaccgct 541 ccctcggtta tttacagagt tacgatgaat tcgggcgagg tcaaatatat tgacaaccct 601 acccactcta ccgatccttc gttgattaca atggcggagg aaccgatgat aaatgcgcat 661 agatatgcgc cgaatgacta tgtcggaaat attatggagc tttgccagga gcgtcgcgga 721 gttttcagag atatgaaata tatcgatgac aagcgcgttg acattcacta tgagttgccg 781 ctcaacgaag taatttacga cttctttgac acactcaagt cgcgcacgag gggctatgct 841 tcatatgact atgaaatgct gggatatgcc gaaagtaagc ttgttaagct tgacttgctt 901 ttgaacggag aaattgttga cgcactttcc tttattgttc atgcagacag agcatataac 961 agaggcagac gcctttgtga gaagcttaag gtcaacattc ccagacagat gtttgaaatt 1021 ccgattcagg cggcaatcgg cggaaagatc attgcaagag aaaccgttaa ggcatatcgc 1081 aaggacgttc ttgccaagtg ctacggcggt gacataacca gaaagaagaa gcttttggaa 1141 aagcagaagg aaggcaaaaa gcgtatgcgc cagcttggta ctgtagaggt tccgcaggag 1201 gcgtttatga gtgttctgaa gcttgattcc gaataatgaa acggaggtta tgtatataat 1261 gaataaggtc ttgctttcaa acaaatggct ccaattcgga atatccgtct ttaaggtaat 1321 ttacctcata tttatcggtg cgctgacggt ttggacattc ctgtatgata tccgattcga 1381 cagcgaagcg gcgttctatt tcctatatat cggacttagc gttattttct gcgtgtttat 1441 gttcatatca aggcagcagt tcataacaag ggtaatgtcg atggtgctgt tgttgccggt 1501 gtttctttta attttgttca acatggcaaa gccgatcata tatctcccct gccttgcggt 1561 aagcgtgttt atgttctttg cctgcggcag caaagccaac acaaaggtta tcatgggaag 1621 cttgtatctt ctcatgtaaa ttgtaagact aatcggattt tcgattcttt cgacgctgtt 1681 cggcggaaac acagttgaaa cagtgcttaa ttcatctgta acagatacaa gcattacaag 1741 cgagtacgat atggatagaa ttgagcgact gaacgcaaac agcatttcgc ccgacggaaa 1801 atatcgctat tacattttgg atgttcagga caatgaccgc ggaaaggtta ttattgttgt 1861 tgagccaaat gaccgcgaca taaactatcg tttcttctcg ctggttgagg ttggatatac 1921 cacacgaatt gcaaaatatc acacaagagg cgtgacaccc gacattgagt ggctctcggg 1981 aaataagata agatacagat tcggcgagaa cgccgagtgg aagacatcta ccatttcccc 2041 gccgaccgaa aagaactatc tcaggttctt gggagtataa acaaaaagat aaaccgcact 2101 gtattttaaa atacggtgcg gttttttatg cggtgagtga ggcggcagcc cgtgtgcgcc 2161 ttagcgcaca cgccccgtgg caaaaccacg gggaagcctt tttgcccctg cggggcaaaa 2221 aggcttggct gccgcgaagg gagcggcgtc tgcaggcgaa tcgccgaagg gcgattgtgc 2281 cgcaggtgcc gcgtataaac tcatctcgac atataaaaaa gctccccaaa atcggggagc 2341 ttgatttttg attaaaggat aattgtttcg gtgccgtcaa gacctgtgag aatttcggtc 2401 ttgtcgccgg aaacgattcc gattgtaacg gtgacctgaa ccttgacgtt gtcgatcaat 2461 acattg // LOCUS sequence194 2445 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence194 VERSION sequence194 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2445 /mol_type="genomic DNA" /organism="" /note="sequence194" CDS 417..1052 /product="DUF421 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948011.1" /transl_table=11 /codon_start=1 /translation="MLTVFIRGVILYAVVIFSARLMGKRQLGELSPGELVITILISNIA TLSMEETSLPLILALTPIFTLVCIDVIISYAVLKSKKFRHLVSGTPRVIISEGKIDQQA LKELRYSVADVMCSLRGLGIFDISQVQYAVVETTGSVSVMLKAEHQPLTKQSVSKPEKS ADPPKIVISDGDVHDKKAAARIGLDHKKVFICTEDSNGKINVIPKEGK" /locus_tag="LOCUS_6550" /note="WP_011948011.1 DUF421 domain-containing protein (Clostridium botulinum) [pid:42.5%, q_cov:84.8%, s_cov:80.6%, Eval:3.6e-37]" /note="MGA_883" CDS 1049..1420 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRLVLSISIIAVIAAMGIVTIFFIQSQNEKLYGKLDLVIYKYEN NEDVSKELAELEEFAREYTKKLNYFADEEKLEELYEAVITLKTLYFDSSEEFRTECARI RLLADRIYRREIPDMGRIL" /locus_tag="LOCUS_6560" /note="MGA_884" CDS 1508..1954 /product="transcriptional regulator NrdR" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005902339.1" /transl_table=11 /codon_start=1 /translation="MKCPFCNFEDTKVIDSRPSEGKKRRRRECTQCGKRFTTYEIVEKP ILMVSKKDGSFEPFDRAKLIAGITTATKKRAISLADIEDIVDSIENKMANEMRSEISTA EIGDSVLSALKDIDLVAYVRFASVYKDFNDLDSFIHIVSELDGK" /locus_tag="LOCUS_6570" /gene="nrdR" /note="WP_005902339.1 transcriptional regulator NrdR (Fusobacterium nucleatum) [pid:51.4%, q_cov:98.0%, s_cov:98.0%, Eval:2.1e-37]" /note="MGA_885" ORIGIN 1 ctccctctcc gaaggtgtta atgaccttct tttcgttgga aaatccgcaa ccgtcggcaa 61 tatatgaaaa cacttcatcg ggcagacggt tgcgctttga aaattccctc aatggctcat 121 atatgattcg cgaaagttct ctcgatgcaa ccattccctc aagggagatt agcgcggttt 181 taactcccgc cgtttcaaag cgcataacat ttaagtcgct tgaatcgccg aaaatttcct 241 tgagccttgc aatgctcttt tcaagccttg aatatatatt ttcgttctca taatccgctt 301 tttgcatttt ttagcctatc cttcgatact ttttcatatc ttttccctat ggagcgtgat 361 tattccgcta tttgcgggaa acaatatgga taaactttaa agcgaggagc aaaaaaatgc 421 ttacggtttt cattcgcggc gtgatactat atgctgttgt aattttctcg gctcggctta 481 tgggcaaacg ccagcttggc gagctttcgc ccggcgaatt ggtgataaca atattgattt 541 caaacatcgc cacactttcg atggaagaaa catccttgcc gctgatattg gcgttgactc 601 cgattttcac acttgtctgc atcgacgtta tcatcagcta tgcggtgttg aagtcgaaaa 661 agttccgaca tttagtgtcg ggcacaccga gggtaataat ctctgaaggc aagatcgacc 721 agcaggcact caaggaactg aggtattccg tggcggatgt aatgtgttca cttcgcgggc 781 tgggaatttt cgatatttcc caggtgcagt atgctgttgt tgaaacaacg ggctcagtca 841 gcgtgatgct caaagcagag catcaacccc tgacaaagca gagcgtcagc aagccggaaa 901 aatcagccga cccgccgaaa atcgtcatca gcgacgggga tgttcacgac aaaaaagccg 961 ccgcacgaat cgggcttgac cacaaaaagg tgtttatctg tacagaggat agcaatggca 1021 aaattaacgt aattcccaag gagggcaaat gaagcgcctt gttttaagca tttcaatcat 1081 cgcggtgatc gccgcaatgg gcattgtaac catatttttc attcaaagcc agaacgaaaa 1141 gctatacggc aagctggatc tggtgatata taaatacgaa aacaatgagg atgtttcaaa 1201 ggaactcgct gagcttgagg agtttgcgcg ggaatataca aaaaagctaa attacttcgc 1261 agacgaggaa aagcttgaag agttgtatga agcggtaatc actttgaaaa cactttattt 1321 tgacagctca gaagaatttc gcaccgaatg tgccagaatc cgcctgcttg cagacagaat 1381 ttatcgccga gagatacccg atatggggcg aatactttaa aaaaagcact tgcaaaccac 1441 agcattttgt gatatagttt acctataaat acaagataaa cgtccctgaa aggatggtag 1501 acaaaaaatg aagtgcccgt tttgcaattt tgaagatacc aaagtcattg actcacgccc 1561 aagcgaaggc aaaaagcgcc gcagacgtga atgcacccag tgcggaaaga gatttacaac 1621 ctatgagatc gttgaaaagc cgatcttgat ggtatcgaaa aaggacggca gttttgagcc 1681 ctttgacaga gccaagctca ttgcgggtat taccaccgca accaaaaagc gtgccatcag 1741 tcttgcggat attgaggaca ttgttgacag cattgaaaac aaaatggcaa atgaaatgcg 1801 ctcggaaatc tccaccgccg agatcggcga ttccgttctt tcggcactca aggacatcga 1861 ccttgtggca tacgtccgct ttgcatctgt atataaggac ttcaacgacc ttgacagctt 1921 catacatatt gtaagcgagc ttgacgggaa ataaatacat aaacacaaag agagaacaaa 1981 cagcctttgc tgtactgttc tctctttttt gttgcgagat atttgcttcg caaatgcgat 2041 atattttcgt ttgcgctcaa atgcgatatg atataaatcc ttttgtgccc cgcagggcat 2101 atcgcttccg caggaaatat cgcgcgtaag catatcgcaa atcccgcaag ggatttatat 2161 cgctgtgtta tccttgaagg ataacacgtg ccggtggttt tgtttttgtg ttacagcatg 2221 ttaccaaaac agacatttta ctgatattcg tatcacattt tgtgataatt tatgcctcgg 2281 agcgcgcaaa atcctataat atgattatca aaaggtcata aaggaggatt tctgtgcgga 2341 tcaaagacat tcgtgaagat aacgacacca cccaagccac ggttgcggaa tatttgaaca 2401 tccgccagaa tacatactcg caatatgaaa cgggtcagcg ccagc // LOCUS sequence195 2443 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence195 VERSION sequence195 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2443 /mol_type="genomic DNA" /organism="" /note="sequence195" CDS complement(41..1258) /product="3-phosphoshikimate 1-carboxyvinyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964213.1" /transl_table=11 /codon_start=1 /translation="MTINFKPTKLSGSVSAVPASSEAHIKLICAAFSIGRVRNVPFTED VCATLDALKSLGLVFDTVGDNVIFRTYHPNRMPIINCGSSVKTLIYFMCLACACIGNVV ATFDGSDKLPKDAIEALLKVLGAHGITSDYNGSLPFTIKGSLNSGEFTLDTEYAEDFVT GLIIALSRNNTDSFINVVGGDYPKSGILLAADILKEAKVLTASNEDVYIIRGGQSYKLF ETTIGGDFALASNFVVANAMNSNVRVAGLDAMSAQPEKTIFEIIRRVQSSGCKGFDLNC LEIPNLVPILAVYACSLNGTTCLCNAKSRSSNSYVDTELVCDMINSVGGKATALSDRIV IDGVKNLTGGTIDCRSDHRIALASAILSTICTDDVTVLNVECVAKPYASFLDDYRRVGG NVTIIN" /locus_tag="LOCUS_6580" /gene="aroA" /EC_number="2.5.1.19" /note="WP_010964213.1 3-phosphoshikimate 1-carboxyvinyltransferase (Clostridium) [pid:27.1%, q_cov:98.5%, s_cov:97.7%, Eval:9.4e-40]" /note="MGA_887" misc_feature complement(1288..>2443) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011836754.1:DNA helicase PcrA" /note="WP_011836754.1 DNA helicase PcrA (Streptococcus sanguinis) [pid:39.7%, q_cov:99.7%, s_cov:54.1%, Eval:1.5e-76, partial hit]" /note="MGA_888" /locus_tag="LOCUS_6590" ORIGIN 1 aaattagcca tgagttgtat cctttcggta tattggaata tcagttgatt atggttacat 61 ttccgccgac acgtctgtag tcatcgagga aggacgcata gggttttgca acacattcaa 121 cgttcagaac tgtaacatca tcggtgcaga tggtggataa aattgcagaa gccaatgcga 181 ttcggtggtc ggacctgcaa tcaatagttc cgcctgtaag atttttaact ccgtcaatta 241 caattcggtc tgacaaggca gttgccttgc caccaacaga gttaatcata tcgcaaacaa 301 gctcggtatc cacataacta ttggaagagc ggctttttgc attgcataag catgtggttc 361 cattgagaga gcaggcgtat actgcaagta ttggaacgag atttggaatc tcaaggcagt 421 taaggtcaaa acctttacat cccgatgatt gtactctgcg aatgatttca aaaatcgtct 481 tctcgggctg agcagacatt gcatcaagac cggcaacgcg gacgtttgag ttcattgcat 541 ttgcaacaac aaagttggat gcaagggcaa agtcaccacc gatagtggtt tcaaacagct 601 tgtatgactg accgcctcgg atgatatata catcttcatt ggatgccgtg agcacctttg 661 cctctttcaa tatgtctgca gcaagcaaaa ttcccgactt gggataatcg ccgccgacaa 721 cattaataaa gctatcggta ttgtttctgc taagcgcaat tatcagaccc gtaacaaagt 781 cctcggcata ttcggtgtca agagtgaatt cgcccgagtt aagacttccc ttaattgtga 841 aaggaaggct tccattgtaa tcagaagtaa taccgtgagc tccgagaacc ttcaacaatg 901 cttcaattgc atctttggga agcttgtcac ttccgtcgaa agtggcgacc acattaccta 961 tgcaagcgca agcgagacac ataaagtata taagcgtttt tacggaactg ccacagttga 1021 tgattggcat tcgattggga tgatatgttc tgaagatgac attatcccct actgtatcaa 1081 aaaccaagcc cagcgacttg agagcatcaa gagttgcgca gacatcctcg gtaaagggca 1141 catttctaac cctgccgatt gaaaaagctg cacagatgag cttaatatgg gcttcactac 1201 tcgccggaac tgctgaaacg gagccggaaa gctttgtagg tttgaaattg attgtcatat 1261 cttatatcat tcctttcggt gatatgttta tatctttttg atttttgcaa agtttgccat 1321 gatttttttg gtgccaacct tgtcgaaagc aatttcaagc atggtgtcgt tggacattac 1381 tgttgctttc aatacagttc cctcgccgaa aattgcatgc gaaacgcgct cgcccattga 1441 atatgtttcg cgaggagcag acgatgcagg ctttgcaaac gcagtggtcg atgacgagcc 1501 aaatccgccc tttgcaacat ttgctgtggg tctttgcgga gcgggggcct tggaatttaa 1561 cggtgtgctt tcaaatttga gctcaatatg ttctttggga agctcggtga taaagcgcga 1621 aggacggttg aagttagtgg agccatagag catacgctgt tttgcgtgag taatgaaaag 1681 gtttcgcttt gcgcgagtta tagcaacata tgccaaacgg cgctcttctt cgacatctgc 1741 ctcggtatcg agcgaacggg aggacgggaa gatgttttcc tccatgccga tgatgaaaac 1801 attagggaat tcaagtccct ttgcagagtg tacggtcata agcataaccg catcggcgtt 1861 agggtccatt gagtcgatgt ctgtatagag agcaatctcc tccaaaaatc ccgacaaaga 1921 agggttttcg gcgttttgag aatagtttat catcgttgat ttaagctctt caatattttc 1981 aaggcgagtc tgtccctctt cgccttggag cttgagcatt gttaagtatc ctgttttgtc 2041 gagcagaata tccaaaagct ccgccagggg aatctgttcg ctcagcgctt tgagctcatc 2101 aaataccttt gccagctcag caagtcttga agcagcgcgt gaaaggatcg gataatcccc 2161 agcattgcgc ataacctgta aaggcgattc gccaagggtg tttgcaacct gttccaagtt 2221 atcgacagtt gcgtctccga ttgcacgctt aggttcgttg atgatgcgtt ttaagcgcaa 2281 aaggtcggtt tcgttgttaa ttacggacag ataagagatg atgtccttga tttccttgcg 2341 gtcatagaac ttgatgccac cgaacacacg gtatgatatt ccgcttgcaa caagtgcgcg 2401 ctccatcgcg ttggattgag cgttcatgcg gtataaaaca gcg // LOCUS sequence196 2442 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence196 VERSION sequence196 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2442 /mol_type="genomic DNA" /organism="" /note="sequence196" CDS complement(315..1808) /product="flotillin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002896230.1" /transl_table=11 /codon_start=1 /translation="MLTYIIIGAIILLAVFLFATGYLKAPPDTAYIISGLGSKKRILIG KAGFRVPFFERVDKLSLGVMQVDVKTSEAVPTNEFINVSVDGVANIKISSDPQLLERAS EALLGKNRQELVALVTQVLEGNMREIVGSVGLKEMVQDRQGVAKKITENVVPDMEKLGI EVVNFNIQNFKDGAGTIENMGIDNVEQIRKNAQIAKANAQRDIAIATSKAQQEANAVKV ESEKMIAEQNAELAVQQAEMKVRSDAKRAEADAAYSIQHEEQRKVIEIAKTNADIARRE KEAELADKDIAIKERELDAQIKKQADALKYQSQQEAEAELIRDLNLLTLKPILFIANVG EDEVADAMSNPHVQKVQQYAAEEGAEVIAVSAKVESEIAELDDEDAKEFLAELGLAESG LDKLIKASFKLLGLITFLTAGEQETRAWTIRKGTKAPQAGGKIHSDIERGFIRAEIVSY DDLMAAGSQAAAREKGQVRLEGKEYVMQDGDVTYFRFNV" /locus_tag="LOCUS_6600" /note="WP_002896230.1 flotillin family protein (Streptococcus) [pid:39.5%, q_cov:80.3%, s_cov:80.9%, Eval:2.5e-72]" /note="MGA_889" ORIGIN 1 ggcattatcc tacctatcac ggagctcatg gccctctaaa cgttattgcc tgcccaatat 61 ttcacaaaca atacaagtcc agtatactgg ttttgattct cattgtcaat aaggtcgtat 121 aaaaaagact ctaccgaagc agagcctgtt tagggggagg gtggaactca cagacgacgg 181 tgtccttctt caccgcatcg tctgtttgct tttgcacttt tatcatatca taattagtca 241 aaaagtcaat atgtcaaatg gtcgatttta tgaaaaaaga caactttttt tcaaaagctg 301 tctttgaggt ttcattatac gttgaagcgg aagtacgtga cgtcgccgtc ctgcatgacg 361 tattccttgc cttcgaggcg gacttgacct ttttcgcggg ctgcggcttg gctgcctgct 421 gccatgaggt catcgtacga tacgatctct gcgcggatga agccgcgttc gatgtcgctg 481 tggatcttgc cgcctgcctg cggtgctttg gtacctttgc ggatcgtcca agcgcgggtc 541 tcttgttcgc ctgcggtgag gaaggtgatg agtccgagga gtttgaacga tgctttgatg 601 agtttgtcga gacccgattc tgcaagtccg agttcggcga ggaattcttt ggcatcttcg 661 tcgtcgagtt cggcgatctc ggattctact tttgctgata cggcgatgac ttctgcgcct 721 tcttctgcgg catactgctg tactttttgt acgtgcggat tgctcatcgc gtcagcgact 781 tcgtcttcgc ctacgttggc aatgaagagg atcggtttga gcgtcaggag gttgaggtct 841 ctgataagct ctgcttcggc ttcctgttgt gactgatatt tcaaagcgtc tgcttgcttc 901 ttgatctgtg cgtcaagctc gcgttcctta attgcaatgt ccttgtcggc aagctctgct 961 tccttttcgc ggcgagcaat gtcggcatta gtctttgcaa tttcaatgac cttacgctgc 1021 tcttcgtgct gaatcgaata tgcggcatct gcttctgcac gcttagcatc agaacggacc 1081 ttcatttccg cctgctgaac agcaagttcc gcgttctgct ctgcaatcat cttttcagat 1141 tcgaccttaa cagcattggc ttcctgctgt gccttcgagg ttgcaatagc aatgtcacgc 1201 tgtgcgtttg ccttggcgat ctgtgcattc ttgcggatct gctcaacgtt gtcaataccc 1261 atgttttcaa tggtacctgc gccgtcctta aagttttgaa tattgaagtt tacaacctca 1321 atgcccagct tttccatatc gggaacaaca ttttcggtga tcttctttgc aacgccctgt 1381 ctgtcctgaa ccatttcttt aagtccaacg gagccgacga tctcacgcat attaccctca 1441 agtacctgag ttactaaagc gacaagctct tggcggtttt tgcccaagag cgcctctgat 1501 gctctctcca aaagctgagg atcggatgaa atcttgatgt tagcaacgcc gtcaacgctt 1561 acgttaataa attcgtttgt gggaacagct tcgcttgtct taacgtccac ctgcattaca 1621 cccaaggaca atttatctac tcgctcaaag aaaggaactc tgaagcctgc tttaccaatg 1681 agtatgcgct tcttggaacc aagacctgaa attatgtatg cagtatccgg cggtgctttt 1741 aagtaacctg ttgcaaacag aaatacagcc agaagtatga ttgcgccaat aatgatgtaa 1801 gttaacattt aagttacctc ctttaaaatg atggtttgct ttctcccggt ttgtcaaaag 1861 cgtgagttcg cgagttgtac gggaatctat acaaaaagac tcccagcgtt attcaacact 1921 gaaagtctcg ttttaatcaa tgatatagat ctaagtacga accgagcacc tgcagttgct 1981 gtcatgacga tacgtacaca ttgccggggc aatgaactac tccctttcga cacaatatac 2041 aatatcatac ataaagaagt ttgtcaatag attaacgaat gatttgtatg tttgcataat 2101 tccgtgaaat gcttttgtgc attctatgca aaaaggaaca aatcctttca atgtattgcc 2161 atattgtcac atcagtggcg agaacacttt caaaaatgcc tgaagcaggg catataatgc 2221 gcccttctta ttgatatcag caagcgttat ctcctgagat ttttccagcg tttcaaaaaa 2281 gtctatctct gcttgctcaa cgcatttcga cttatatgcc aaaacgctgt tttcaaagtg 2341 caaataaaaa cttctgaagt caaaattcac agtgcccaaa acacagactt cgctgtcggc 2401 aatcaagctc tttgcgtgca taaagcctgg tgtatactca ta // LOCUS sequence197 2430 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence197 VERSION sequence197 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2430 /mol_type="genomic DNA" /organism="" /note="sequence197" CDS complement(122..652) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MERDSLKSMLYSFARFGLYFLINIFGVIMAKVFIRSIGSFLVPRL QLHYNDELLSFFSFLIPLALFIALFADDAKRHTAYGTYNMTLVGIVMILTSAVYYIPVL VMPHIDDKATLLAIENMYFSGYWLSLIDTSIEIYALIEIIIYLIACIGTYAVARKIYVK KFDSGEYEYLYDR" /locus_tag="LOCUS_6610" /note="MGA_891" misc_feature complement(784..>2430) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_004082550.1:endo-1,4-beta-xylanase XynA" /note="WP_004082550.1 endo-1,4-beta-xylanase XynA (Thermotoga maritima) [pid:35.5%, q_cov:73.7%, s_cov:33.8%, Eval:3.4e-54, partial hit]" /note="MGA_892" /locus_tag="LOCUS_6620" ORIGIN 1 cgcataatta aacagcagaa tatgcaaaaa cccgcaggta tttcctgcgg gtttctttat 61 tgtaataaaa aagagaaggc gttgttatta gccttctctt ttgcttgttc taatcagtca 121 tttacctatc gtaaaggtat tcatattcgc cgctgtcaaa cttcttgaca tatatctttc 181 ttgcaaccgc atatgtacct atgcaagcga tcaagtagat gataatctca attagtgcat 241 atatctcaat gcttgtgtca ataaggctga gccaatagcc ggagaaatac atattctcaa 301 ttgccaaaag cgttgccttg tcgtcaatgt gaggcatcac caaaacaggg atgtaataca 361 ccgcagaggt caatatcata acgattccga caagcgtcat attatatgtg ccatatgccg 421 tgtggcgttt tgcgtcgtca gcaaacaggg ctatgaaaag cgctaatgga atcaaaaatg 481 agaaaaagct caaaagctcg tcattataat gaagctgaag cctcggaact aaaaagcttc 541 cgatcgagcg aatgaacacc tttgccatta tcacgccgaa tatgttaata agaaagtaaa 601 gtccgaatct tgcaaagcta tatagcatgc ttttaagtga atctctttcc atattttcct 661 ccatagtatc agtataaata tataatacca cttgtcagta ccatcttgca agtctttttt 721 aaaaaactcg gcaagaaata tggcataacc acacatattc cgcgtgatta tgccaattat 781 cttttaataa tataacctca ttacttcctg aattttatag aaacagggct tgggctggaa 841 gtttgtgtca aacagagtat atgtagtctt gtcgttggaa tagaatacaa atccgtccat 901 caatccgaag atggtgacag atgtgatatt tgcttttccg ccgccgtcgg tgtcaagctt 961 tctcaacatc ttgaaaatat cctcatatct cttcgactgc acctgcaggt cataatcaga 1021 aaggctgtct gccgatatgc tcatctcgga aatgtgtatc tcaatgccaa gacgggcata 1081 ttggttgata gcttcctcaa tgtttgaaat gctgggccag cttattcccc atgtgtcctg 1141 cattcccaaa ccgtcaataa gccccttgct cttaagatat tcgcacagct tatatacata 1201 tgtgcgcttt gaggacatat gggtgttgta atcgttataa aacagcttaa cgccctctgc 1261 ggcatatttt ctcgcgctgg taaatgccag ttcaacataa tcctcgccca aggtcacata 1321 ccaagggttg tcgtttccgc cgttctttgt tctgcaagca aaaatgcttc cctttgcgcc 1381 ggattcgggg tcaaccgcct cgttaacaac atcccagcaa taaataactc cggggtattt 1441 ttcctggcaa tatgtcatga cctgcttaat gtagctgtca agtcgctttg ccattgtatc 1501 ataatcgacg tattttccgt ccttctgata tccctctcta aagaaccagt cgggggtttg 1561 tgtatgccaa acaagagtgt gacccctcat ttgaattccg ttttcatagc accacttgag 1621 ggtcttgtca acgcttgaga agtcaagtgc ggggtcctgc ttgccgcttc ttgcgtttga 1681 aatgctcttt tgctgattca aaagatatga cggcttcatc agatttgtaa gtgttacgct 1741 gttggcgtga tgccatacga tcgccatata ttcttccgaa ttaacagcgg cattcgatgt 1801 gccattgccc gtaagtccga agccgaactt gaaatagtct ttacaaagct ccttcattga 1861 aggcgccgtc atcgccgcac tcaaatcata cttgctcttt gtatagtcat agtaatatgt 1921 cttaacaggc tcagcttctg actttgcttc ggttgtagtt gtcgcctcgg tggttgtggc 1981 aactgttgtt gtaacctcga caggcttttc cttgctcaaa tactttccgt tgacaaatct 2041 ttcttctccg cggaatttaa ttctcgccca gccgttatcc acccagccgg taacttcaac 2101 cagatcgccc ttatcaacgt ggctgattct ctcgccgctc tgttcaggcg ttgctcttac 2161 attcaaatcc gcagttgcat aaagtttttc gctcgcaggt gtaatcaccc agtcgggctc 2221 aggatctggt gtggttgttg cctctgttgt tgttacaggg acggttgtgg ttgcctcggt 2281 agtcgtggtc gcttctgtgg tagtaacctc ttctgtagtt gtttcttctg ttgtggttgt 2341 tgcttcagtc gtcacctcgg gtgcctgtgt agcttcgtcg cttgtgacgc tcggctcctg 2401 cgggctgtgc gcttctttgt cggcgcatcc // LOCUS sequence198 2416 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence198 VERSION sequence198 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2416 /mol_type="genomic DNA" /organism="" /note="sequence198" CDS complement(469..1740) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNRFDILEGIGYIDEELIDEACEKSVRARPSRTRLALIAAAAVMA IALVSCGIYEIVAAWSEVKTEPYDYLSIHDRIESFQALTYDTDYINALAAEYGIASEEL VVNQYHEEIRFGYYFSQVLIASKEKAVALLITDAEQFTFDFEFNGYFIHEKTKEFKIET QSVTAKGGTLEIIMYCEDGWECFGGILARSHPEEELNMFTPIFAISDGKHSGTFLYTDE YYTKLSEKAWEIYDSGKEGEVASKSQYDHNSLHDGKKKYDVKVSGLEAMIEKYAEGITY PTEKTYYVCDEGENGEFIELGYIYDDSGAMVFMNENAESTATILYATGIFYNAEKDEYR VVKQTVTTTDAAVARFHSKDGWKCIGVTAYRLVQDSFEPYGSAASVTYIENDMADSMYF AEKVWKELANNVESMELVFASTGK" /locus_tag="LOCUS_6630" /note="MGA_894" CDS complement(1737..2291) /product="sigma-70 family RNA polymerase sigma factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000840007.1" /transl_table=11 /codon_start=1 /translation="MNTKITELYFARNQQAIDETKREYGKLLSGIVSGILPQEQDVEEC LNDTYLQLWNTIPPTHPESIRAYACKIARNLALNKLKYITAMKRGSQFDVVLDELSEVI PADTDVQSQVDSRELGRLISKFLRQQPSDNRIIFIKRYWQFMPSNEIAKDLGYSRTKVN SSLHRTRARLRKFLNERGYNA" /locus_tag="LOCUS_6640" /note="WP_000840007.1 sigma-70 family RNA polymerase sigma factor (Bacillus) [pid:25.7%, q_cov:89.1%, s_cov:86.2%, Eval:2.0e-08]" /note="MGA_895" ORIGIN 1 agaactccca gcaggcctgc acctggtgcg cacaggtcag ctacaaatcg gagcaggaca 61 aaaagcacga cgaatttttg tgcaaggata tgcttgcaat ggagaagcac gtttcgggac 121 tttatgacac cagcgtgttc gaatttaatg acacccaggc aagaaacgtc ctcaaccata 181 tccagaagga agaacaggaa cacggcgaca agctttataa gtatatgtcg gcaaacggga 241 tgtacaatta acagctgagt aaacttagct tttaataaga agtttgcctt ccgcgactaa 301 agccacggat tttgctacgc aaaaccggca agcttcacat agtgcaaagt cgctcccttc 361 gggagaggtg ccgcgcgtaa gcgtgtcgga gagggctaca cggcgcgccc tcgcaaacaa 421 aaccccaccc atccttgcga tgagtggggg tgcttgcggg tgtgtgtctt attttcctgt 481 tgaagcaaag accagttcca tcgattcaac gttgtttgca agctccttcc agaccttttc 541 tgcgaaatac atactgtcgg ccatatcgtt ctcgatgtaa gtgaccgacg cagcacttcc 601 atacggctcg aaagaatctt gaaccaagcg gtaagccgtt acgccgatgc atttccagcc 661 atccttcgag tggaatctcg caactgcggc atcagtggtc gtaacggttt gtttgactac 721 gcggtactcg tccttctcgg cgttatagaa tatgcctgtt gcatagagga tagtcgctgt 781 gctctctgca ttttcgttca taaagaccat tgctccgctg tcgtcataga tatatccaag 841 ctcgatgaac tcgccgtttt cgccctcatc gcagacatag taggtctttt cggtgggata 901 ggtgatgcct tcggcatatt tttcaatcat cgcctcaagt ccgctgacct taacatcata 961 cttcttcttt ccgtcgtgaa gcgagttgtg gtcatattgg gatttgcttg ccacctctcc 1021 ttccttaccg ctgtcgtata tctcccaagc cttttcggag agctttgtat aatactcgtc 1081 ggtgtaaagg aatgtgccgg aatgtttgcc gtcgctgatt gcgaaaatgg gtgtgaacat 1141 attcagctct tcttcggggt gcgacctcgc cagaattccg ccgaaacatt cccagccgtc 1201 ctcgcagtac ataataattt caagcgttcc gccctttgcg gtgacgcttt gcgtttcaat 1261 cttaaattct ttagtctttt cgtggatgaa gtagccattg aattcaaaat caaaagtgaa 1321 ttgctcagca tcggttatta aaagcgcaac tgctttttct ttagatgcga tcaggacttg 1381 gctgaaatag taaccaaagc gaatttcctc atggtattgg ttgacgacca gctcttcgct 1441 tgcgatgccg tattctgcgg ccaaagcatt aatatagtcg gtatcatatg tgagtgcttg 1501 gaatgattct attcggtcat ggatgctcaa atagtcatat ggctccgtct tgacttcact 1561 ccacgccgca acgatctcgt atattccgca ggaaacaagt gctattgcca tgaccgccgc 1621 cgcggcaatt agagcgagtc tcgttcttga gggccttgcg cgcacgcttt tttcgcacgc 1681 ttcgtcgata agttcctcgt cgatatatcc gattccttcc aaaatgtcaa atctgttcac 1741 gcgttataac ccctttcgtt taaaaatttg cgcaaacgcg cccttgttcg gtgaagcgag 1801 gagttgacct ttgtcctcga gtagcccaaa tcctttgcaa tctcgttgct gggcataaac 1861 tgccaatacc gcttgatgaa aatgatgcgg ttgtcgcttg gctgttggcg caaaaacttg 1921 ctgatgagcc gtccgagctc gcggctgtcg acctgcgact gcacatccgt gtctgcggga 1981 ataacctcgc tcagctcgtc caaaacaacg tcaaactgcg agccgcgctt catggctgtt 2041 atgtatttaa gtttgttcag cgctaaattc cgcgcgattt tgcaggcgta tgcgcgaatg 2101 ctttcgggat gtgtcggggg aatggtgttc caaagctgta agtatgtatc gtttaagcat 2161 tcttccacat cctgctcttg gggcagtatt cccgaaacga tacccgataa aagcttgccg 2221 tattcgcgct ttgtttcatc tattgcttgc tgattgcggg caaaataaag ctcggtgatc 2281 ttggtgttca ctctatcgct ccttccttga aaagacatct ttcatctata tagacaacgt 2341 gagttggggt tttgtcgcgc atatatttaa attttattga aatttctttg caaagtcaaa 2401 tcggtgtggt ataata // LOCUS sequence199 2414 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence199 VERSION sequence199 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2414 /mol_type="genomic DNA" /organism="" /note="sequence199" CDS 108..644 /product="DNA topology modulation protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000720566.1" /transl_table=11 /codon_start=1 /translation="MQRVMIIGNCGAGKTHFSLALAQKTGLPVVHLDKLKWHGDWQALS SEEFDPLLEEELKKPRWIIDGNYNRTIEWRMEYADTVIYLDFSTLACLYGVTTRVLSNY GKTRPDMGGNCPERFDMEFMRFVFEYRKKRRKPVLEMLANAEDKQVIILKNRREVNRFL KSLPLEGKVSAYADG" /locus_tag="LOCUS_6650" /note="WP_000720566.1 DNA topology modulation protein (Bacillus) [pid:41.2%, q_cov:92.1%, s_cov:95.9%, Eval:4.4e-34]" /note="MGA_896" CDS complement(708..1868) /product="3-phosphoglycerate dehydrogenase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000490229.1" /transl_table=11 /codon_start=1 /translation="MYNILTLNKIAAIGTDNFDKAKYNVGEAVASPDAIMVRSASMLDM QFEENLVAIARAGAGVNNIPVDRCSEEGICVFNTPGANANAVKELVVAGLLLASRKVTD AIDWAKTLKGNGAEVPKQVEKGKGQFAGPEIMGKTLGIIGLGAIGVKVANTPLSLGMKV VGYDPFLSVNAALGLKPNVNVVKSLAEVYAAADYITLHLPYNAETKDTVCAESIAKMKN GVKILNFARGELVNNADIIAALEDGSVSCYVTDFPNDDVIGVKNVVAIPHLGASTPESE DNCAYMAAVELIDYIETGKITNSVNLPNCELAKTADHLVCVIHRNVPAMFSQITAVISA AGGNIENVVSKAKKDWAYTMMDVTGDVAKAFAEINNIDGVTKVRVL" /locus_tag="LOCUS_6660" /note="WP_000490229.1 3-phosphoglycerate dehydrogenase family protein (Bacillus cereus) [pid:49.9%, q_cov:100.0%, s_cov:99.7%, Eval:4.2e-106]" /note="MGA_897" misc_feature complement(1861..>2414) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011462039.1:3-phosphoserine/phosphohydroxythreonine transaminase" /note="WP_011462039.1 3-phosphoserine/phosphohydroxythreonine transaminase (Desulfitobacterium hafniense) [pid:69.9%, q_cov:99.5%, s_cov:50.6%, Eval:4.1e-70, partial hit]" /note="MGA_898" /locus_tag="LOCUS_6670" ORIGIN 1 gccggggctt cgcccgtcgg cgcacaaaag ttttagattc tgagcaaatg cagcgcgtct 61 gcgaaaaggg cggcagtccc gcaggtgcgc ggggaaagga gcacaggatg caaagagtaa 121 tgataatcgg caactgcggc gcaggcaaaa cccactttag ccttgcgctt gcgcaaaaaa 181 ccggattgcc cgttgttcac cttgataaac tcaagtggca tggcgattgg caagcgcttt 241 caagtgaaga atttgacccg cttcttgaag aggagcttaa aaaaccgcgt tggataattg 301 acggcaacta taaccgcaca atcgagtggc gaatggaata tgccgacaca gtcatatatc 361 tcgatttttc aactcttgct tgtttatatg gtgtaacgac gcgcgtgctt tcaaactacg 421 gcaagacacg ccctgatatg ggcggaaact gccccgaacg gttcgatatg gagtttatgc 481 gctttgtttt tgaatatcgc aaaaagcgcc gcaagccggt tcttgaaatg cttgcaaacg 541 ctgaggataa gcaggtaatc attctcaaaa accgccgaga ggttaatagg tttttgaaaa 601 gccttcccct tgaggggaag gtgtcggctt atgccgacgg atgaggtgga cttagggaca 661 actgagcaca aaaagacccc cgtgaggagg tcttttcttt tttattatta gagtacacga 721 acctttgtaa cgccgtcgat gttgttgatt tcggcgaaag cctttgcaac atctcctgta 781 acgtccatca ttgtgtatgc ccaatccttc ttggccttgg atacaacgtt ttcaatattt 841 ccgcctgccg cagagataac agcggtgatc tgggagaaca ttgcgggaac atttctgtgg 901 ataacgcaaa ccaagtggtc agcggtcttt gcaagctcac agttgggcag atttaccgag 961 ttggtgatct tacctgtttc aatgtagtcg atcagttcaa ctgccgccat atatgcgcag 1021 ttgtcttccg attcgggagt tgatgcgcca aggtggggaa ttgcaacaac attcttaacg 1081 ccgataacat cgtcgttggg gaagtcagtg acatagcagg aaacgcttcc gtcttcaagc 1141 gccgcaataa tatcggcatt gttgacaagc tcgcctcttg cgaagttcaa aatcttaacg 1201 ccgtttttca tctttgcgat agattcagcg catacagtgt ccttggtttc tgcattataa 1261 ggcaaatgca aggttatgta atccgctgcg gcataaacct cagccaaaga ctttacaaca 1321 tttacattgg gcttgagtcc cagtgcggca tttaccgaga ggaaggggtc atatcccacg 1381 accttcatgc ccaaagaaag cggggtgttt gcaaccttaa cgccgattgc gccgaggccg 1441 atgataccca aggtcttgcc cataatttca gggcctgcga actgtccctt gcccttttca 1501 acctgctttg gaacctcagc accgttgccc tttaaggtct tagcccagtc aatagcatcg 1561 gtgaccttac gggaagcgag caaaagtcct gcaactacaa gttccttaac ggcgttagcg 1621 tttgcaccgg gggtgttgaa tacacaaata ccctcttcgg agcaacggtc aacgggaata 1681 ttgttgacac cggcacccgc acgggcgatt gcaacgaggt tttcctcaaa ctgcatatca 1741 agcattgatg ccgagcggac cattattgca tcgggggagg cgactgcctc gcccacgtta 1801 tatttagctt tgtcaaaatt atctgtgccg atagcggcaa tcttgttaag tgttaaaata 1861 ttatacattt tcagcctcaa actttctcat gaattcgacc agcgcattaa caccctcgat 1921 gggcattgcg ttgtagatgg atgcgcgcat accgccgaca gaacggtgac ccttgatgtt 1981 gataagtcct gccttcttgg cttcggaaac aaactttgca tcaagctcct cattgcctgt 2041 aacaaaggga acattcatca aagatctgtc cttgcccata acagttgcct tgaagagctt 2101 tgaagaatcg aggaagtcat acaaaacagc agccttttca gcgttcagct ttgccatcgc 2161 ttcaagtccg cccttttcgg caacccagtc aagaacaaga cccaagatat aaataccgta 2221 tgtaggggga gtgttataca ttgatccgtt gtctgcgtga gtctgatagt tgaacatggt 2281 gggggtaatg tccattgcgt tgccgatgag gtcttcgcga atgatgacaa cagtgagtcc 2341 tgcgggaccc atgttcttct gcgcacctgc atagatcatt ccatactttg aaacatcaac 2401 aggctcggaa agaa // LOCUS sequence200 2406 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence200 VERSION sequence200 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2406 /mol_type="genomic DNA" /organism="" /note="sequence200" CDS complement(71..766) /product="ribonuclease III" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003428341.1" /transl_table=11 /codon_start=1 /translation="MNKLHEFEKIIDYKFNNIQLLFEALSHSSFANESKDGLKSNERLE FLGDSVLSIVVSEYLFSNFSDLPEGELTKTRSTLVCEKSLHSFGKTISLGDYIMLGKGE EITGGHQRPSIIADAFEAVIAAIYLDGGYDAAKRHIMRFMPADVRTAVKKAYDDYKTIL QEIVQKNPEESVEYHLVGESGPDHNKTFTIQVLLNSNVIGEGTARSKKQAEQLAAKEAL KLMGCITDD" /locus_tag="LOCUS_6680" /gene="rnc" /EC_number="3.1.26.3" /note="WP_003428341.1 ribonuclease III (Clostridioides difficile) [pid:51.8%, q_cov:96.5%, s_cov:94.5%, Eval:5.1e-59]" /note="MGA_900" CDS complement(769..1767) /product="phosphate acyltransferase PlsX" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012047867.1" /transl_table=11 /codon_start=1 /translation="MTIIIDGFGGDNAPLEVLKGSLNAKSKLGVDITVVGNEENIRKCA LDNNLDISALNIHHADTVMEVCEDPKKILKEFKNSSMAVGLQLLKDGEGDAFVSAGSTG ALVMGATFIVKRLKGIKRPALATVMPTLGAPCMIMDVGANAEVRPEILHQFAIMGSAYM KNLMGVESPRVALANIGTEPTKGRELEVETYKLLSASDLNFIGNIEARQIPLGDADLVV TDGFSGNILLKSIEGMAKFFSASLKDMFKSGPLSILGYLCLKGMVNEFRKKMDYKEHGG APLLGTAKPVFKAHGSSDAKAFYNAIRQAKTFCEKEVIKEFAAAISSGSEE" /locus_tag="LOCUS_6690" /gene="plsX" /EC_number="2.3.1.274" /note="WP_012047867.1 phosphate acyltransferase PlsX (Clostridium botulinum) [pid:46.0%, q_cov:96.7%, s_cov:96.1%, Eval:1.4e-72]" /note="MGA_901" misc_feature complement(1764..>2406) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000195254.1:methylenetetrahydrofolate--tRNA-(uracil(54)- C(5))-methyltransferase (FADH(2)-oxidizing) TrmFO" /note="WP_000195254.1 methylenetetrahydrofolate--tRNA-(uracil(54)-C(5))-methyltra nsferase (FADH(2)-oxidizing) TrmFO (Staphylococcus) [pid:60.1%, q_cov:97.2%, s_cov:47.8%, Eval:5.0e-71, partial hit]" /note="MGA_902" /locus_tag="LOCUS_6700" ORIGIN 1 gtgctgattg caaaagctgc aacggttagg gcaaccgata tggggtacaa agattgaaag 61 atttgctttc ttagtcatct gtaatacagc ccatcagctt taaggcttcc tttgcggcaa 121 gctgttcagc ttgttttttg cttcttgcag tgccctcacc aatgacattt gagttcagaa 181 gcacctgaat ggtgaaggtt ttgttgtggt cgggtcccga ttcgccgaca aggtgatatt 241 caaccgattc ctcggggttt ttctgaacaa tctcctgcag aatggtctta tagtcgtcat 301 atgccttttt gacagccgtt ctgacgtcgg caggcataaa acgcattata tggcgctttg 361 cggcatcata tccgccgtcg agataaattg cggcgattac cgcttcaaag gcatcagcaa 421 ttatcgaggg gcgctgatgg cctcctgtga tctcctcgcc tttgccgagc attatataat 481 cacccaagga aatggtcttt ccgaagctgt ggagcgattt ctcgcagaca agggtcgaac 541 gggttttggt cagctcaccc tcgggaagat cggaaaagtt ggaaaacaaa tattccgaca 601 caactatcga caaaacggag tcgcccaaaa attcaaggcg ctcattggat tttaagccat 661 ccttcgattc gttggcaaat gacgaatggg acagcgcctc gaacagaagc tgaatattgt 721 taaatttata atctattatc ttttcaaatt cgtgaagctt attcacaatt attcctccga 781 accggacgaa attgcagcgg caaattcctt gattacttcc ttttcgcaga aggtctttgc 841 ctgtctgatc gcgttataga atgccttggc atcgctggaa ccgtgagcct taaaaacagg 901 cttggctgtt cccaaaaggg gcgcaccgcc gtgctcctta tagtccatct tctttctgaa 961 ctcgttaacc atgcccttta agcaaaggta gcccaaaatt gaaagaggac cgcttttgaa 1021 catatccttt aaggatgcag agaagaactt cgccatgcct tcaattgatt tgagaaggat 1081 attgcccgag aagccgtcgg ttacgaccaa atctgcatcg cccaagggaa tctggcgggc 1141 ttcgatgtta ccgatgaagt taaggtcact tgccgaaagc agcttatatg tttcaacttc 1201 gagctctctg cccttggtgg gctcggtacc gatgtttgca agggcaactc tggggctctc 1261 aacacccata agatttttca tatatgcaga gcccataatt gcaaactggt gaagaatttc 1321 gggcctgacc tcggcatttg cgcctacgtc cataatcata cacggcgctc cgagggtagg 1381 cattacagtt gccaaagcgg gacgcttgat gcctttaagg cgcttgacga tgaatgtggc 1441 acccataaca agagcgcctg ttgagcctgc ggaaacgaaa gcatcgcctt cgccatcctt 1501 taggagctga agtcccacag ccattgagga gtttttgaat tctttgagta tcttcttggg 1561 atcctcgcag acttccatta cggtatcggc gtggtgaata tttaaagctg aaatatcaag 1621 attgttgtca agagcacatt tgcggatgtt ttcctcatta cccacaaccg tgatatcgac 1681 accaagcttt gattttgcat ttaaagatcc cttcaaaact tccaagggag cgttgtcgcc 1741 tccgaagccg tcaatgatta ttgtcatagt ttgcctccta tcacattgtc aagagcacaa 1801 agcgcgcgat ttgcaagcgc ttcatacttt tcctgcttgt ttttaattct ttcgggaagc 1861 tcgggcagta ttcccatatt gcagcccata ggctgaaaat ctgccgagtg gccgtatgcc 1921 acatacttcg aaagtgcgcc gagcattgtt tctgagggta aggtgatttc ctctttgccg 1981 agaagctttc ttgataagct cattgcggca tatattcccg aagcggctga ttcgatatat 2041 ccttcaacac ctgtcatctg acctgcaaaa tagatgcggt tatcgggaat aaagcagaaa 2101 tgctcgtcca atattccggg agaattgatg taggtgttgc ggtgcataac gccatagcgg 2161 acgaattcgg catttgccag accgggaatc agcgaaaata ctcgcttttg ctcaccgaat 2221 ttgagatttg tttggaatcc tacaaggtta tatagtgtgc cggagttatt ttccttgcga 2281 agctgaatga cagcataggg acgacggcct gttcgggggt cggttagacc cacaggcttg 2341 agaggaccga aacgcattgt gtcctctccc ctttttgcaa gcacttcaat tggcatacag 2401 ccttca // LOCUS sequence201 2403 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence201 VERSION sequence201 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2403 /mol_type="genomic DNA" /organism="" /note="sequence201" CDS 51..638 /product="manganese efflux pump MntP family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948910.1" /transl_table=11 /codon_start=1 /translation="MILDFVFIFNSALLGVGLAMDAFSVSLANGLNEPCMKKRKAFGIA GIFALFQALMPMIGWICVHTILQYFKAFEKLIPWIALGLLGFIGGKMLIEGIKNKADCE EKPGVGIAALLMQGVATSIDALSVGFTIAEYELVMALLAVVIIAAVTFVICSAGIYIGK HAGTKLAGSAGIFGGAILIFIGIEIFVTSFMK" /locus_tag="LOCUS_6710" /note="WP_011948910.1 manganese efflux pump MntP family protein (Clostridium botulinum) [pid:37.2%, q_cov:91.3%, s_cov:91.5%, Eval:6.6e-24]" /note="MGA_903" CDS complement(692..1186) /product="superoxide dismutase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964672.1" /transl_table=11 /codon_start=1 /translation="MIENNIGCYMSALRRQPNAMALIRGKGEYCDIKGTVRFYQLRSGV LTALEISGLPTLCDKCKSPVFGFHIHEGECCTGNAGDPYADTGAHFDMCENMHPYHSGD MPPIFSSCGCGFMIFLTDRFCVRDIVGRTVVVHAHPDDFHTQASGNSGEKIACGEILAS C" /locus_tag="LOCUS_6720" /note="WP_010964672.1 superoxide dismutase family protein (Clostridium) [pid:38.0%, q_cov:96.3%, s_cov:87.9%, Eval:7.6e-24]" /note="MGA_904" misc_feature complement(1262..>2403) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002262240.1:AI-2E family transporter" /note="WP_002262240.1 AI-2E family transporter (Streptococcus mutans) [pid:38.8%, q_cov:86.3%, s_cov:87.2%, Eval:8.0e-62]" /note="MGA_905" /locus_tag="LOCUS_6730" ORIGIN 1 acaagcttat aaatacagta gtataattat gccgatttgg aggaattata atgatattag 61 attttgtatt catatttaac agcgcacttt taggcgtggg acttgctatg gatgcctttt 121 cggtttcgct ggcaaacggt ttaaacgagc cgtgtatgaa aaagcgcaaa gcatttggaa 181 ttgcgggaat tttcgcgctg ttccaggctc tgatgcctat gatcggatgg atatgcgttc 241 acacgatttt gcagtatttc aaggcatttg aaaagctcat cccctggatc gcactcggtc 301 ttttgggatt catcggcgga aagatgctga ttgaaggaat taaaaacaag gctgattgcg 361 aagaaaaacc gggtgttggt attgcagctc tattgatgca gggtgttgca acatccattg 421 atgctttgtc agttggattc accattgcgg aatatgaact ggttatggca ctcttggcgg 481 tagtgatcat cgcagcggtt acatttgtaa tctgttcggc aggcatatat atcggcaagc 541 atgcaggcac aaagcttgca ggaagtgcag ggattttcgg cggtgcaatt ttgatattca 601 ttggaattga gattttcgtt acaagcttta tgaaataata gaacaagacc cgcgagtttt 661 taagctcacg ggtcattttt gttatattca gttaacagga agccaatatc tcgccacagg 721 cgatcttctc gcccgaattt ccagaggctt gagtgtgaaa atcgtcagga tgggcgtgaa 781 caacaaccgt tcttccgact atatcgcgaa cacagaagcg atcggtcaag aaaatcataa 841 aaccgcaacc gcatgatgag aatatcggcg gcatatcgcc cgaatggtat ggatgcatat 901 tttcgcacat atcaaagtgg gcacctgtat cagcataagg atcgccggcg tttcctgtgc 961 aacattcgcc ctcgtggata tggaatccaa agacagggct tttgcattta tcgcaaagtg 1021 tcggaagacc gctgatttca agggcagtta atactccgct tcgaagctga taaaaccgaa 1081 cggtgccttt gatgtcacag tactcccctt ttccgcgaat cagcgccatt gcatttggct 1141 gacggcgcag agcggacata taacatccta tattgttttc tatcataaaa agaatcctcc 1201 aaataaataa gtatcccttt atgatatgca gattttcaga aaatgttcgt actttgctta 1261 atcattttga ctttttggat ttcttcttgt tggcaggttt tgtcggctgt ttcttcacag 1321 ccttttcaac gggtttgatt tcctcaataa cggtagggat atctacaagc ggttcatccg 1381 ccaaagcaag ctcagcgggg tcagcagatt tattaacgtc gtttttaacg atgcgataga 1441 ttgccgcaac aatcggaaca ccgatcagca ttccgaatat gcccataatt ccgccgccga 1501 cggtgattgc cgccaagacc caaattccgg gaaggcccaa agatgagcct acaaccttgg 1561 gatagatgat gttgccttct aactgctgaa gaatgacaag gaatattaag aagaagagcg 1621 ccttgatggg cgaaacagtt aaaatcataa aagcgccgac aactgcaccg atatatgcac 1681 cggccacggg aatcaatgca gttaaagcga tgagcgcgcc gatcatggtc gcataaggga 1741 gctggagtat cagcataccg attatacaca aaaggcctaa aattacagct tcggtgcact 1801 gtccgacgat atacttgcgg aagcaatcat ttaagataga gagaacgtaa gtaattttgt 1861 tgtacatctt ctccttaata taatgctttg aaaccttgga gcactgtgct ataagcttgt 1921 cacgtccgat aaggaggtat acagagaaga tgatgctcaa gaatgaggtg acaattgccg 1981 agaatacaga tgaaacggtg tttatcacaa catccatcac acttccgaga cttgaagaaa 2041 gcatattgat tatctcgtca atgcggcttc tccagtcgat agattcgagg aaggcgatat 2101 tttcctcaga aagcaaatga tacttgtcaa tcaagtcgat caacttgttc atagctccgg 2161 gtatcatatc gatcaaaagc ttcatacacg aagtgaattc agggattacc aaacctgtta 2221 ccaatgcgat tatggcgagc aaggtgatat atgccgcgat catacaaatc ggtcggcggg 2281 acttcagcac tgctttcttg gtggattttg ggaaataaag ctcttcatat cggctcataa 2341 ggatgtttac aagataagca attgcaaagc cgatcagtaa aggcgcagct gcattaaaaa 2401 cag // LOCUS sequence202 2380 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence202 VERSION sequence202 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2380 /mol_type="genomic DNA" /organism="" /note="sequence202" ORIGIN 1 gcgttcccga aggcgttgaa ataatgagac ttgaaaacgt tggtgtttcc atcaccggta 61 actccaccaa ccccacaata ttccagcaac ccgttgcagg tacctataag aagtggtgcc 121 aggaaaacgg cgttaactac ttctctgttg cttccggcgg cggaaccggc agaacccttc 181 accccgacaa catggcagca ggccctgctt cctacggtat gactgatacc ttgggcagaa 241 tgcacggcga tgctcagttt gcaggttctt cttccgttcc tgctcacgtt gaaatgatgg 301 gtcttatcgg cgcaggtaac aaccccatgg ttggtatgac cgttgcatgt gcagttgcag 361 ttgaagaagc tttcaaggct taatcttttg caaatataaa taattaacag gcagagttta 421 accgatctgc ctgtttcatt ttcacaattt gtatatacct actgtttctc ggtttttgaa 481 cactgatttc ggttgacaaa ctctttttaa atgtagtaca attaatctgt ataaatattt 541 gaacagggga tgtttgaatg aaacgcatac ttagttttac tttggcactt atcatggcac 601 tgacagttct gccgatgatt gcttttgcaa ccgaggtaac tgtaaacgac gaatcgcttc 661 ccgcagttat cgatcctgct tcgactgaag cacccgcaga agtggaagtg cattatcaga 721 ccgtcacaca tgcaaacccg ctgtattaca gtgagcctgt aattacatct gtgaccgaat 781 atcactattc cactcagtat cttgccaact tcaacttcaa cttcgatgat tatcattctg 841 aagctgatgt aattgaagag atcacagagc atcttcataa cagagaaact gcgtttactg 901 tctatgtaaa ggtagacgca tattatggta caatatcaag tgatctcttc tatgccgcaa 961 tagagcatac aggcgcggct gatgaaggtg actatatcaa gtatcagtac ggcggattcg 1021 atgcaggaat tagctatgcc atatctggcg acacttatgt ccagatcgat tatactgttt 1081 cctactacgc tgacgcagca caggaagcaa ctgtcgacaa taaggtgtca acagtgcttg 1141 ctgctttaaa tgtcaacggt atgagtgatt acgagaagat aaaggcgatt tatgactaca 1201 tctgcctcaa cgttgtatat gactacgata acctcaatga tcctacatat cttttgaagc 1261 actctgcata tgccgcactc attaacggca aggctgtatg ccagggttac gcacttttgt 1321 tctatcgctt agctttggaa cttggaatcg actgccgaat tgtaacaggt cagtcggagg 1381 gacagaatca cgcttggaac atcgttaagc tgaatggaaa atattataac gttgactcca 1441 cctgggatgc tgaatacttt gacaagagag gcgtatataa ctacttcctc aagagtgatg 1501 ccgactttga tgagcacatc cgcgatgctg aacattcaag tgaatcgttc tacgccgcat 1561 atcctatgca taccgaaagc tacgacgtta accttgctgt tattgacgcg ggcacttgcg 1621 gcgctcaggg cgataacctc acttggtcac tttcaggcga cggaattctt accattgacg 1681 gcaatggcga tatgtttgaa tatggctggt ttttcgacga aaacgatgat atgtacagaa 1741 tcgacccgcc gtggttgaaa tatttcgaaa gaatcaagca gattaacatc ggtgttggtg 1801 ttgaatatat tgtcccttgg acccttgtaa actgtacaag tcttgaaaat gtattcgtcg 1861 atgatgcaaa cacatctctt tgcgacatca acggtgtatt gtacgataca caattgacaa 1921 ctctgtttgt ctaccctgaa aagagtgcaa ttaccgatta cgttatgccc gaaacaatta 1981 cttggtttga aatcggaatt caggctgata accttaaaac tattacattg cccggaaatc 2041 ttgagagtgt acaattctgg tactgcccca atctcgaaac tgtaactgtt aactctctct 2101 ttaccgagat ttatgaactt gaccagagtg taaccattcg cggatatgaa gattcagtag 2161 ccaaggaata tgcccttgca aacggaaaca catttgtttc ccttggcgag atccccagag 2221 tagtaatcga atccggaaat tgcggagata atctcacatg ggaatttgac aaccgcggca 2281 cactcaccat cagcggcgaa ggcccgacct acgattatgg ctttggagag gacaactcgg 2341 tccttctcac tccttggttt acctttaagg atagcatcaa // LOCUS sequence203 2376 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence203 VERSION sequence203 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2376 /mol_type="genomic DNA" /organism="" /note="sequence203" ORIGIN 1 agaactgcaa ggtctgtctg ggtgtcatat ccgattacgg ttgcttcata ttggtcggca 61 ttgctgtcaa cgatcataac tgtcttcgcg tcttcaataa cgtgagcatt ggtgatgatg 121 tagccgtccg agcttatgat tatgcctgtg cctgttgcgg tgctgttgcc aagtgtgcag 181 cttacgccta caacagaagg cgataccttg tcataaatgt cgggaatgct caaagcatcc 241 tcgggtgctg caagctgttc aagggtggga tattctctgt gggaaacatc gcctgcggtt 301 gtgcttgcat cgtcggcggg aacttccgaa acctcggggt cattttcgcc gggaatatca 361 acgccgggga gattttcgtg ggggtttctt ccctcgccgt cagtctcgcc gtcaacaacg 421 gtgttgtttt gctgtttatc aatattaatg tcgattccgt tgttctcaag aattgcggaa 481 tataccgaaa cggtgacaac aactacaaca aaaatgctca aaagtgcggc gacgattccc 541 aaaatcactc tgcctgcatt tgtctgcttc tttgcgggag cgtcgggggt atagacatat 601 tcatttgtat attcggtgtg agcatatgcg ggagtaggct caggttcgcg gacaggtgtg 661 ggctcgggtt gaggagcagg ctcgggtgag gaaacactct cgactacagg ttcagcatta 721 tcctcgaccg tttccgaaat gatctttgct tcaataattt cgggctgaga agcttctgcc 781 gatacagtag cctcattttc attattttca gcgccgttat ttaaaatttc aaattctgac 841 ataatagcct ccaaaaacat ggtaattgat ttaaattccg tcagtcatta taacacaaaa 901 caagttgtat tacaattttt tcagaaatgt ttctcaaggt catctaccat tatacccgtg 961 tatgtgaaaa ctgtatgaaa acaaacggaa tttttaacat catctttttt caccgtcgtc 1021 acgccttgat aaatgtgaat tagtgtggta taatactgac gaatttacat aaatttccga 1081 aaaaggaggt tagtgacata tggtatatac ggacttgctg tttctgtttg cgtttttgcc 1141 gatcgcaact gcttttataa tgattttaag cgagccttgg gaaaagaatc tggctgcagt 1201 tgccttatcg ctcatattta ttgtctgggc aagaccgata tattatgcgt tgataattct 1261 tcctgtaatc gtaacatatg tggcggctcg gctttacaat aaaacaaaaa gcggagcgat 1321 tattgtttcc gccgagatta tatctttaat attcggcggc ggctttgccc ttatttcggg 1381 cacagatgca acccttggcg gagcgatctg ctcggtcgga tttttgcttt tcacattaag 1441 gtcgtttatg tatcttaatg atgtgaagca tggtcaagac tccgaaaagg atttcacagc 1501 cttgggcgcg tatttgattt catatgaatt tatgctgatt tcgcccgtta agagttacag 1561 cgagctgagc gaacatctta aaacaagaaa gttcaagctt tcaaatttga gcttgggaat 1621 gaagaacttt gttttcgggc tttcaaaggt tgcaattttg ggtctttcgt ttgacagggt 1681 gaggcttgcg gcactcaatt cggatgcaac accttgggtc aatgcaataa tcggtctttt 1741 ggcggttatt gttgaaacat atatcctcct tgacggatat actcagatgt cggcaggact 1801 tgcctgcatt aacggcgtgc cgatggtttc gtcgggtgtc gccatccgtc cgagagcgag 1861 tcttattggt catatatcgg atgtatacgc agaccttggc gaagctgttg aaaagcactt 1921 cggcaaaagc gcaaaggcaa acattgtcgg acttgttgtt tgctcgctga tcgcaggtgc 1981 ggcaattgcc ctagaaaacg gcgcagttgc gttctttgcc cttgttttgg cggcactgat 2041 gatctcaaat gcgccctccg agcaaaagtc cggcttgttc gattttattg tcagccttgt 2101 tcttgccctc ggcggcttcc tgcttcttgc gaacggttcg gcatcgggcg ttgcaggctg 2161 gtttgcgtcg ttaaatccca acaactatga atttgacata tcatatgctt tatatgacga 2221 gctgacgagg gtgatccctt ggttggtcat cggaattgtg agcatcaccc cgttgcccga 2281 aatgtttgct tcggtattcc gcgcaagaat gtcggaaaac gaaaagtttt attcaattgc 2341 aagagcactc ggaacttgta tatgcgtttt gctgct // LOCUS sequence204 2369 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence204 VERSION sequence204 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2369 /mol_type="genomic DNA" /organism="" /note="sequence204" CDS 59..1504 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MENIKAIHLGPAKCAVDLGDGSERGEYVNQDYVLNKIGRPHRGIN LMYCYYPLDEGWPARASDAFVSTDKTNAWAYPYDDYFPYRGGLNGDKSAEVFEQIRDIR RHGQDVVFTLTADPNISDEHIIAIANDMKPFGRVLFRLNHEATGSWFSFNKRCTYQEVA DFFVRFTNIMHEHAPNVKMILCIGGVEDLSQEKIVMEEIFAEAVRATDIWSVDKYMALH WGWPHDVAEKGGHSHGYTGAGPVYDMTKASYKRFKHLCGRVEKPMVMSEFNADGDVTGP YDQCKTIRHYLDKLIEDDAKWFSGFTFYQFRDRGRLGLEWEDPNNPDVGIELPAMKEYK EIIKQDWFQPKMEQGAELTLPATLRWGGAEDAEGIAVPVHLERDPVFFELNFSENDESN LMIECNGRWFYKSPKCKFVDLMPAFFENRLDGEMDLTIKFFAPPASGENDLTIEGGDVN TYATINELPNIRIRYEAVIPYHG" /locus_tag="LOCUS_6740" /note="MGA_910" misc_feature complement(1735..>2369) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003436250.1:pyruvate kinase" /note="WP_003436250.1 pyruvate kinase (Clostridioides difficile) [pid:50.2%, q_cov:99.5%, s_cov:35.7%, Eval:7.3e-51, partial hit]" /note="MGA_911" /locus_tag="LOCUS_6750" ORIGIN 1 tatacttatg ctatgagttt aaattccacg gaattattat atgaaaggac ttacagctat 61 ggaaaacatc aaagcaatcc acttaggccc cgcaaaatgt gctgttgact taggcgacgg 121 cagcgaaaga ggcgaatatg taaatcagga ctacgttctc aacaagatcg gcagacccca 181 cagaggcatc aacttgatgt attgctatta tcctttggat gaaggctggc ctgcaagagc 241 aagcgatgct tttgtatcga ctgataaaac aaacgcatgg gcatatcctt atgatgatta 301 cttcccctat agaggtggat tgaacggcga caagagcgcc gaagtttttg agcagataag 361 agatatccgc cgtcacggtc aggatgttgt ttttaccctt accgccgacc ctaacatctc 421 cgatgagcac atcattgcta tcgctaacga catgaagccc ttcggccgag ttttgttcag 481 actcaaccac gaagcaacag gctcctggtt cagctttaac aagagatgta catatcagga 541 agttgccgat ttcttcgtaa gatttaccaa catcatgcac gagcatgctc ccaatgttaa 601 aatgatcctt tgcatcggtg gtgttgaaga cctcagccaa gaaaagatcg taatggaaga 661 gatctttgca gaggctgtca gagcaactga catctggtcg gtagataagt atatggctct 721 tcactggggc tggcctcacg atgttgcaga aaagggcgga catagccacg gttataccgg 781 cgcaggccct gtttatgata tgaccaaggc atcgtataag cgcttcaagc acctttgcgg 841 cagagttgaa aagccgatgg taatgagtga attcaacgcc gatggcgacg ttacaggtcc 901 ttatgaccag tgcaagacca tccgtcacta tcttgacaag ctcattgagg acgatgcaaa 961 gtggttctcc ggctttacct tctatcagtt ccgcgatcgc ggaagactcg gccttgagtg 1021 ggaagacccc aacaaccccg atgtcggcat tgagcttccc gcaatgaagg aatataagga 1081 gatcatcaag caggattggt tccagcctaa aatggagcag ggcgcagagc tcacactccc 1141 cgcaacatta cgctggggtg gcgcagaaga tgccgagggt attgcagttc ccgttcatct 1201 tgaaagagat cctgtattct tcgagcttaa cttctctgaa aatgacgaat ctaacctcat 1261 gatcgaatgc aacggcagat ggttctataa atctcccaag tgcaagtttg ttgaccttat 1321 gcccgcattc tttgaaaacc gtcttgacgg cgaaatggac ttgaccatta agttcttcgc 1381 tcctcccgca agcggcgaaa acgacctcac tattgagggc ggcgacgtta atacatatgc 1441 aacgatcaat gagcttccca atatcagaat cagatatgaa gctgtaattc cttaccacgg 1501 ataaatgttt agcgggatgt ccgtatcgga catcccgctg cgatataaat tccttgcggg 1561 atttgcgata tgcttacgcg cgatatttcc tgcggaagcg atatgccctg cggggcacaa 1621 agggatttat atcatatcgc actgaccttg tcagtatatc gcgtttgcgc agtaaacata 1681 tcgcttataa aacaaaaaga gagaacaaat gctgttctct ctttcttttt gtgtttactt 1741 tatcgtttca accttgatgg tatttgtgtt tccgggcaga ccgtttatct gtccgccggt 1801 taaaacaacg ttgtcgccct ttttgagctt caaaacatcc ttcgcctgat gcaatgcctg 1861 atagaacatt acctcctgcg agtcatactc ctcgctcaaa acgggaatta caccccagct 1921 caaattcagc tgacgccaag cgcgctcgtt ggtagtggtg ccgataatat cgcaaggcga 1981 acggaaacgg ctgaccattc gggcggttct tcccgaaatt gagttaacaa caatgcactt 2041 tgccccaacg tctatcgcca ttgcacaggt tgcatgggat atcgcgtcaa ggttgtttct 2101 gatcttatat tcggtggtgg cgaaccaacg gttatagtcg atgtgctttt ctgtaaattc 2161 tgcaatttcc gccatattct tcaccgcctg cgagggatat ttgcctgcgg cggtttcgcc 2221 cgagagcatg attgcacttg agccgtcata aactgcgttt gcaacgtcgg agatctccgc 2281 acgggtggga cggggattgt gtatcattga ttcgagcatt tccgttgcgg tgataacgcg 2341 cttgcccaaa agtctgcacc ttgaaatga // LOCUS sequence205 2366 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence205 VERSION sequence205 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2366 /mol_type="genomic DNA" /organism="" /note="sequence205" CDS complement(103..1038) /product="TIGR01212 family radical SAM protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009968016.1" /transl_table=11 /codon_start=1 /translation="MSKAFEYSDGSKRFHTLDWELKKLFGKKVVKIPLDLGLGCPNRDG AKGVGGCTFCSEFRSGEFSGDMRLSLAEQFDETKKLYSKWPDALYIAYFQAGTNTYAPV HKLKGLFNEALALPDVVGLSISTRPDCISDEIADMLAELSERTYLTVELGLQSAKNATL ARINRGHTYEEFLAGYNKLVSRGVKVCIHIINGLPGETKQDMLETAKQVAKLSPYEIKI HLLHIISGTKMADEFAAGEFDVMSFEDYVNTVCDQLETLPPETVVARLTGDGDRKTLIA PDWSRDKRKVLNEIDKELRRRDSRQGKNRP" /locus_tag="LOCUS_6760" /note="WP_009968016.1 TIGR01212 family radical SAM protein (Bacillus) [pid:52.8%, q_cov:97.7%, s_cov:94.7%, Eval:1.9e-87]" /note="MGA_912" CDS complement(1035..2288) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKKKKNKDKLPRPEALIAREVPAKETPAFEIGRKGDEFDRMYTK AVREKTADADRLLKDLSRESKADKFNFLDAILPFLIIVFAALTFGVVSRGDIEEMFTTS FSAQSILDGTYTSQLDKIYSETLPFGEEIAYIGSFFGFGEQEKPKPDGEELPEIPPEEE EPVVTEPIVTEPVVTTPPETVTTTVTTTEPETLVTEPATYMMITNARVNIRAEASAEGE RLGRFDEGELVEVVEIGYGGWAKIIYGDGYAYVFAEYLSPVDGVEPPEVTEETTNAESE VIPDDTEETGDDVEYEITVMYAVSTVNIRLEPSTDSAILGYFIINEPVDVIEIQPDGWA KILYNGMTAYVYSEYLDVEPVVTTVEGQEEEIVTSAESEEIIPDETSVSEDGGMTETEQ TDEEEIIDDESTAEEETE" /locus_tag="LOCUS_6770" /note="MGA_913" ORIGIN 1 cccgccgcag gcgggcgaag accgctgcgt gcagcggtca ggcggcgctg cacgaccgca 61 taagctcgcg gcaaacgtgc tataaaaaca aaaaccgccc tattaaggac ggtttttacc 121 ctgtcgggaa tctcttcttc tcaattcctt atcaatttca ttcagaactt ttcgtttatc 181 tcgactccaa tcgggtgcga tgagtgtttt tctgtcaccg tcgcccgtaa gccttgcaac 241 caccgtttcg ggcggaagcg tttcaagctg gtcgcagacc gtgttcacat aatcctcaaa 301 gctcatcaca tcaaactcgc ccgcggcaaa ttcatctgcc attttggtgc ctgaaatgat 361 atgcaaaagg tgaattttga tttcatatgg cgaaagcttt gccacctgct tggctgtttc 421 aagcatatcc tgctttgttt cgccgggcag accgttgatt atatggatgc agacctttac 481 gcctcggctg acgagtttgt tatatcccgc aaggaattct tcatatgtgt gtcctcggtt 541 gattcgcgca agtgtcgcgt ttttcgccga ttgcaagcca agttcaactg ttaggtacgt 601 cctttccgac agctccgcca gcatatctgc aatttcgtcg ctgatgcaat cgggtcgggt 661 agatatggac aatcccacaa cgtccggcag agcgagcgcc tcgttaaaca gccctttcaa 721 tttatgaaca ggggcatatg tgttggtgcc tgcctggaaa tatgcaatgt ataacgcatc 781 aggccatttg gagtagagct tttttgtttc gtcaaactgc tccgcaaggc tcagacgcat 841 atctcccgag aattcgcccg agcgaaattc cgagcaaaat gtgcatccgc caacgccttt 901 ggcgccatcg cggttggggc atccaagccc tagatccagc ggaattttta cgactttttt 961 gccgaaaagc tttttcagct cccaatcaag ggtgtgaaac cgctttgaac cgtcagaata 1021 ttcaaaagcc ttgctcattc ggtttcctct tcggctgtcg attcatcatc aatgatctct 1081 tcctcgtcgg tctgctccgt ttcggtcatc ccgccgtctt ctgaaacaga ggtttcgtcg 1141 gggattattt cctcgctttc tgccgaggtg actatttctt cctcctgtcc ctcaaccgtg 1201 gtgacaacag gttcaacgtc aaggtattcg gaatatacat atgcagtcat accgttataa 1261 agtatctttg cccagccgtc aggctgaatt tcaattacat caacaggctc gttgatgatg 1321 aaataaccca aaattgccga atcggttgaa ggctcaaggc ggatgttgac cgttgaaaca 1381 gcatacatca ccgttatttc atattcaaca tcgtcaccgg tttcttctgt atcatcggga 1441 ataacttcgc tttcggcgtt agtggtctcc tcggtaacct cgggaggttc aactccatca 1501 acaggcgaga gatattcggc aaatacatat gcgtaaccgt cgccgtaaat gatcttcgcc 1561 caaccgccgt atccgatttc gacaacttcg accaattcgc cctcgtcaaa tcggcccaaa 1621 cgctcaccct ctgcgcttgc ctctgcgcgg atattgaccc tcgcgttggt tatcatcata 1681 tatgttgcag gctcggtaac caaagtctcc ggctcggtgg tggtaacggt tgtggtcact 1741 gtttcgggcg gagttgtaac aacaggttcg gtcacaatcg gctcggtgac aacgggttct 1801 tcctcttcgg gaggaatttc gggaagctct tccccgtcgg gctttggctt ttcctgctca 1861 ccgaagccga agaaggaacc gatatatgcg atctcctcgc cgaaaggcag agtttcgctg 1921 taaattttgt caagttgcga tgtatatgtt ccgtcaagga tcgactgcgc gctgaagctt 1981 gttgtgaaca tctcttcaat atcgcctctt gatacaacgc cgaaggtcag cgccgcaaag 2041 acaataatga gaaacggcag aattgcatcc aaaaagttga atttatccgc cttcgactcg 2101 cgggagagat ctttcaaaag tctgtccgca tccgcggttt tttcgcggac agccttggta 2161 tacattctgt caaactcgtc gcccttcctg ccaatttcaa aagcgggagt ttccttcgcg 2221 ggaacttcac gcgcgatgag cgcttcggga cgcgggagtt tgtctttatt ctttttcttc 2281 tttgccaaaa cgttcatcct cctttcggca gagttgggtc gcccgatagt gggcaagaat 2341 gtgcgtttat ctgactgccg ccgcgc // LOCUS sequence206 2365 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence206 VERSION sequence206 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2365 /mol_type="genomic DNA" /organism="" /note="sequence206" misc_feature complement(679..>2365) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003437073.1:YgiQ family radical SAM protein" /note="WP_003437073.1 YgiQ family radical SAM protein (Clostridioides difficile) [pid:55.7%, q_cov:99.8%, s_cov:87.0%, Eval:3.0e-183]" /note="MGA_915" /locus_tag="LOCUS_6780" ORIGIN 1 ccgtgatgac aaacctttaa aacatcggca tcaaggtcgt atgagttgtt gacataatac 61 ttctctgcca aggcttcaat atctcctgta aacaggaatg aatgctctcc gatatcatac 121 ttgatgagga tcgaatagtt attcaagttg tcctctttat agtcggagat atacatttta 181 attctgccgt caccaaagtc gaattcgaga ttctcgcctt tatacagcct tgctccgcga 241 tttgcaaccg ccaacaaaaa acgctcatag gttttggttg tgggaacgtg ctccgcagca 301 atttcgggca tatagatctt gccgatctcg atatcagatg atattaccga tgcaagtccg 361 cccatgtggt cggagtgcgg atgtgtcgca attatatagt caaggcggtc aattcccagt 421 tcttccaagt aactgagaac aaccgggcca tattccgctt cacccgagtc gattagcatt 481 gtcgttccat cagtggcaac aataagctcg ctatctccct gaccgacgtt gatgaaatgg 541 acactcgact cccctgcctc taccgttacg gtatctgacg gtttcgctgg aagtcggatg 601 gtaattaagc ccttctcgtt gagcgcaaaa attgcaagcg ctgcgattac agctacacag 661 agaagaataa ccagtatatc atttcttttt tgctttttgg tttttcgttt tgccataatt 721 tcctccggat gagcgtcggt tgtcctgtac cgcatggctt actctgcccg aagtttttcc 781 gcgggcggag gatttttgct gttgttttct taaatattcg ttatcgggtt ttacaaggtg 841 ctccttgccg ttgccgataa ggtcgcgcct gtccgctcgt tccaaaatct caattatgcg 901 gcgctgattc ttaggcataa agtattgcaa aagagcgcgc tgtgcagatt tttcctcggg 961 agtttttgca acatatacag gctgcatagt gtatggatca aggcctgtat aaaacataca 1021 ggtggaaatc gttccgggag tgggatagaa gtcctgcacc tgctcgggat ggatattatt 1081 ttcctttaag aacaatgcaa gctcaattgc atcgttaatt gtgcttcccg gatgagatga 1141 cataaggtaa ggaacgagat actgctcttt tcctatcttg cccgtaatct cataaaactt 1201 cttctggaaa cgcttgtaag cttcaatatg aggcttgccc attttatcca aaacctgtgc 1261 tgagcaatgc tcgggggcaa ctttaagctg accgctgacg tgatatttga tcagctcggt 1321 cataaattcg tcgtccttat cctcaatcag atagtcatag cggatacctg aacggatgaa 1381 cacctttttg accttcggaa ttgcgcggag ctttcgcaga atttcgagat attccttgtg 1441 gtcaacatca aggtttgcac aaggcttggg tgccaagcac tttttgccct tgcaaagacc 1501 catttcaagc tgttttttgc aagatgtatg cctgaagttt gcggtaggtc caccaacatc 1561 gtggatatat cccttgaagt tgggcatttg tgttataagc tctgcttctt taagaataga 1621 ttcctcgctt cgtacagaaa tctttcttcc ctgatgcaaa gcgattgagc aaaagttgca 1681 aaaaccgaag caaccgcgat tgtgagtgat tgagaattga acctcttcaa ttgaaggcac 1741 gccaccctct ttttcataca tcgggtggta tgtgcgcata taaggaagtg aatacacttc 1801 gtcaagttct tcagttgtga gtgcccgcgg gggcggattt tgaaccagca tcatattgcc 1861 gtgacgttgg attattgttc tgccgtaaac ctcatcctgc tggtcatatt gaattcggca 1921 ggctttggca tacatttcct tgtttgatac aaccatctca aaggaaggac attcaactgc 1981 gccgtaaggc gtttcaaccg tgggacaaag ataacaggtg cctctgacat cgcggatatt 2041 cttgatgctt tcgcccgcat tcaagcggtt tgcaagctcg acaatgcagt tttcgctcat 2101 accgaacatc aaaatatcgg ctttggaatc aaccaaaaca gatgggcgaa cagaatcgtc 2161 ccaatagtca tagtgtgcaa atcggcgcaa agaggcttca agtccgccaa gcataatcgg 2221 tgtatcgggt gtcagcctgc gcaaaatgct tgaatatacc gatgcggctc tgtcgggtct 2281 cttgcccatt acgtttcctg cagaataggc atcgtgctca cggcggcgct ttgcaacact 2341 gtaatgcgca accatcgagt cgata // LOCUS sequence207 2359 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence207 VERSION sequence207 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2359 /mol_type="genomic DNA" /organism="" /note="sequence207" CDS complement(465..2228) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKILCYTRKPLDEAIYAPRLAYSMHLAYETPEGFAPLNHNSGVL FVKATQNPETLQLYPKSLKKPCLCALPEGGYAVAAIRVEANGEPDESSKGCVVVFRSDD LINYTELGLIKLCDDHIEDISLHFCKNCDHLVVKYKIGESITRVMLNTLTEPSNDVRPC EKLNIPEIETDIEGAEPRNFVEVPDELFCHLKKKLLTPVNTDITLDKTKVASVDELLAV GATAHYSDGSCARKRIDWCVPENLTSGTYKIKGKIHQDHFEFPLAINRADPCVYRYNGA YYFIATNDADGNHSISVRKADSIPELKDAEEHLILDSVTYPHVGGLLWAPEFHEVGGKL YIFHACTPKEFGDEESHVTAYNYSGDLTEKSSWEMPIKVQKPDGSPLYTVGITLDMTTF ESGGDTYAVWSQRQFNPCDLGAWLYIAKLDQKEPWKLTTEPVLLSMPELGWQNNHTLVD EGPFALIRDGKIYLTFSSALVDTTYCVGMFTADLGADLLDISNWHKTGYPLLSSASVEG EYGPGHNAYCIDEYGDIWNTYHARPGVNGPRSSGIRRVHIGFDGEPVLDMTEEKDVCPA LREVEITLELK" /locus_tag="LOCUS_6790" /note="WP_010964837.1 family 43 glycosylhydrolase (Clostridium) [pid:33.8%, q_cov:47.2%, s_cov:82.9%, Eval:4.4e-39, partial hit]" /note="MGA_917" ORIGIN 1 gccttcctta cgggaaacga ttgagggtgc ccaggagcaa cctgcccaag tgcacacttc 61 ggttacaggg acggttgttt catatctcca gttgaccata tcatcggtgg agtagcagac 121 cagggtgttg attgagccgt aggagttgtc gcccatgccc attttttggt cgaactcctg 181 agagtcgttg gtaccataaa cataaagtct gccgttatat tcaacagagg tggggtcggc 241 aaagaagatt gttgaggaaa cggggtttga gttggtcatt tccttgaatg cttctgtcaa 301 actgtcgcca acggaaagac ccaaatcctc ggtaggaaca atggtctttg caagggtaaa 361 atcgctcgcc tcacccgatg cacaaccgca aagcattgaa gcaacaagca taaaagcaac 421 taagagtgcg aaaaatcttg ttttcatagc gttttatctc cttattattt taattcaagg 481 gttatttcaa cttcgcgaag tgcgggacaa acatcctttt cttcggtcat atcgaggaca 541 ggctcgccat caaagccgat gtgtacacgg cggatacccg agcttctggg gccgttaacg 601 ccgggacggg catgataggt gttccagatg tcgccgtatt cgtcgatgca ataggcgtta 661 tggccggggc cgtattcccc ttcaacgctg gcggatgaaa gaagcggata acccgtttta 721 tgccagttgg aaatatctaa aaggtcggca cccaaatcag cggtgaacat accaacacag 781 taggtggtgt cgacaagcgc gctggagaag gttaaataga tcttaccgtc tcggatgagg 841 gcaaatggac cttcgtcaac aagggtgtgg ttattctgcc aaccaagctc gggcattgaa 901 agcaaaacag gctcagttgt gagtttccaa ggttcctttt ggtcaagctt tgcgatatat 961 aaccacgcac cgagatcgca ggggttaaac tgacgctgtg accaaacagc ataagtgtcg 1021 ccgcccgatt caaaggtggt catatcaagg gtgataccca cggtatataa aggcgagcca 1081 tcgggctttt gaacctttat tggcatttcc caagaggatt tttcggttaa atcaccgctg 1141 taattgtatg cggtgacatg ggactcttca tcgccgaatt cctttggagt gcaagcgtgg 1201 aagatataaa gcttgccacc tacttcatgg aattcgggtg cccagaggag accgcctacg 1261 tgcggatatg ttacgctatc aagaatgagg tgttcttcag cgtctttaag ttcgggaatg 1321 gaatccgctt ttctcacaga aatggaatgg tttccgtcgg catcgttggt ggcaatgaag 1381 taatatgcac cgttgtatcg atagacgcag gggtcagcac gattgattgc aagcgggaat 1441 tcaaagtggt cttggtgaat tttacccttg atcttatatg tacccgaggt gaggttttcg 1501 ggaacacacc agtcgatgcg cttgcgggcg cacgagccgt cggaatagtg tgcagttgcg 1561 ccgacagcga gaagctcgtc aacagaagca actttggttt tatcgagggt gatatcggtg 1621 ttaacgggag ttaagagctt ctttttaagg tgacagaaga gctcatcggg aacctcgaca 1681 aagtttctcg gttcagcacc ttcgatatct gtttcaattt cgggaatgtt cagcttttcg 1741 caaggtctta catcgtttga gggctcagtc aaggtgttga gcattacacg ggtgatgctc 1801 tctccgattt tatacttaac tacgagatgg tcacagtttt tgcaaaaatg cagggagata 1861 tcttcgatat gatcatcgca gagcttaatg agtccaagct cggtatagtt tataaggtca 1921 tccgaacgga aaacgaccac acagcccttc gaagattcat ccggctcacc gttggcctca 1981 actctgattg cggcaacagc atatccccct tcgggcagag cacaaaggca aggcttttta 2041 aggctcttgg gatatagctg gagtgtctcg ggattttgag ttgcttttac aaacaaaaca 2101 cccgaattat gatttaaagg cgcaaaacct tcgggagttt cataagccaa gtgcatactg 2161 tatgcaagcc taggggcata aatggcttcg tccaatggct tgcgggtata gcaaagaatc 2221 tttttcatat cgataacctc catatatact gattatataa taacattata acggattaca 2281 gtcaaatcat caatgactaa atctaactta taattgacgg attatgagga aacatatgct 2341 tttaacttca atttgcaaa // LOCUS sequence208 2357 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence208 VERSION sequence208 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2357 /mol_type="genomic DNA" /organism="" /note="sequence208" CDS 150..1694 /product="alpha-amylase family glycosyl hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_013399407.1" /transl_table=11 /codon_start=1 /translation="MAKQPVWLDNAIFYEIYPQSFMDTNGDGIGDFQGIISKLDYIKEL GCNALWINPCFESPFGDAGYDVSDYCKVAPRYGTNEDLKQLFNEAHKRNMHVLLDLVPG HTSVEHKWFKETLKAEQNEFTDRYIWTDSIWTTPYGMGCIRGISDRDGSCAVNFFSHQP ALNYGFYEVTESWQQPTDAPGPKATLEAMKDVMRFWLGMGCDGFRVDMAGSLVKNDPES KGTIALWQNVREFLDREYPNAAMVSEWGEPDKSLQGGFHMDFLLHFGPSHYNDLFRCDE PYFCKRGKGDAGEFVKKYLENYEKSERKGLICIPSGNHDMDRLARKCDTDEQKASFAFL LSMPGAPFIYYGDEIGMKYVENLVSVEGGYGRTGARSPMQWDNSTNAGFSSASKEMLYV PLDPDPNRPTAEKAMADKCSVYHEVKKLIEIRQAHKALQSKGDIEFISNGEKGAPLAYV RSCDDEKIFVVINPADRKASVEAPAKLGECIYVLGEAKAEGNEVVLGGCSAGFFTI" /locus_tag="LOCUS_6800" /note="WP_013399407.1 alpha-amylase family glycosyl hydrolase (Gardnerella vaginalis) [pid:46.2%, q_cov:93.4%, s_cov:92.6%, Eval:4.0e-126]" /note="MGA_918" ORIGIN 1 acaaacagtt ccgcaactgc gggtggcata ttcgcgagaa ttcaaaaatt ttcgcctatg 61 cctattgcat tttactgtgc aggtgatata agatatacat agggctttgg tccgtaaaat 121 tccaccaata tgaacaggag aaatgactta tggcaaaaca acccgtttgg cttgacaacg 181 cgatttttta tgaaatatat ccccaatcct ttatggacac aaacggcgac ggcatcggcg 241 attttcaggg aataatctcc aagcttgatt acatcaagga gcttggatgc aatgcgcttt 301 ggatcaaccc ttgctttgaa tctcccttcg gagatgcagg atatgatgtt tccgattatt 361 gcaaggtcgc acccagatac ggcaccaacg aagacctcaa acagcttttc aacgaggctc 421 acaagcgaaa tatgcacgtg cttttggatc ttgttcccgg ccatacctcg gttgagcata 481 agtggttcaa ggaaaccctc aaggcggagc aaaacgaatt caccgaccga tacatctgga 541 cagacagcat ttggacaaca ccttacggaa tgggttgcat tcgcggaatt tccgaccgcg 601 acggctcctg cgctgttaac ttcttctccc accagcctgc tcttaactac ggtttctatg 661 aagtaaccga gtcttggcag caacccaccg atgcgcccgg accgaaagcc acccttgaag 721 cgatgaagga tgtaatgcgc ttctggcttg gtatgggatg cgacggattc cgagttgata 781 tggcaggttc gctcgttaaa aacgatcccg aatcgaaggg cacgattgct ttgtggcaga 841 atgtaagaga gtttttagat agagaatatc ctaatgcggc aatggtttcc gaatggggcg 901 agccggacaa gtcgcttcag ggtggattcc atatggactt cttgttgcac ttcggcccca 961 gccactataa cgacctgttc cgctgcgatg aaccttattt ttgtaaacgc ggcaagggcg 1021 atgcaggcga atttgttaag aagtatcttg aaaactacga aaagtcggag cgcaagggct 1081 taatttgcat cccctcgggc aaccacgata tggacagact tgcaagaaaa tgcgataccg 1141 acgaacagaa ggcatccttt gcattcctct tgtcgatgcc aggtgcgccg tttatctact 1201 atggcgatga gatcggtatg aaatatgttg agaatctcgt ttccgtcgag ggcggatatg 1261 gcagaacagg cgcgcgctca ccgatgcagt gggacaattc aaccaacgcg ggcttcagct 1321 cggcatccaa ggaaatgtta tacgttcccc ttgaccccga cccgaatcga cccacagccg 1381 aaaaagcgat ggcggataag tgctcggtat atcacgaagt taagaagctg atcgaaatca 1441 gacaggcgca caaggcgctt cagtcgaagg gcgatattga gtttatttca aatggcgaaa 1501 agggtgcgcc tttggcatat gtcagaagct gtgatgacga aaagatattt gttgttatca 1561 accccgctga ccgcaaggca agtgtcgagg cgcctgctaa gttgggcgag tgcatttacg 1621 ttttgggcga ggcaaaagcc gagggaaatg aagttgtttt gggcggatgc tcggcagggt 1681 tctttacaat ttaatagtat caaaaaaact ccgtacagaa aactctgtgc ggagattttt 1741 cgtgtatgat tcccccttcg cttggcaaca cttacagtat atgaacgagg ggagatctta 1801 taaatgcaaa agagcacaag aaacattgtt ttggcatcgg cggcggttgc aggggcgtcg 1861 gcattgggca tgatgtatca cacatcggca aaaaatctgg tgaaactggc gcttgaccgc 1921 gaacagccga aaaatattca aaagggcaga gcttggctga cgggcgcccg cgacattgaa 1981 gcgttcctca aaaaagcaaa ggaaacatcg aaagcacttg agagcaaaaa cttggagcgc 2041 attgaaatta aggggcggga cggcatcaca ctcgtgggac attggcagga atgtcaaaac 2101 ccaaaaaggg tcatcattgc aatgcatggc tggcgttcgt catggtcaca ggattttgga 2161 atgatatcgg agttttgggc aaagagcaac tgtagtgtct tatatgccga acaacgggcg 2221 cagggcgaaa gcggcggaga atatatgggc ttcgggctta ttgaacgata tgactgtctt 2281 gaatgggcaa aatgggtgaa cgaaaacgta agcaatactc tgcctatata tcttgcggga 2341 gtttcaatgg gagcggc // LOCUS sequence209 2353 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence209 VERSION sequence209 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2353 /mol_type="genomic DNA" /organism="" /note="sequence209" CDS complement(252..1133) /product="oxidoreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003976313.1" /transl_table=11 /codon_start=1 /translation="MSTKSWFNKNTQNLSGKAVALFGASGGLGQELCRYILALGGRLIV IDRNPKKQRALIHTLLGEYPDGSIDGLICDLEDIDSVKQVAVILEKLDVDIIIHNAGAY SIPRRICKTGLDNVFQINFASPYYITRALLPYLEAKGGRVVVLGSIAHNYSKTDPEDTD FRTRKKASLAYGNAKRYVMFSHLELAKTHPNVHISVAHPGITFTNITAHYPKLIFAIIK HPMKLIFMRPKKAALSVVKGLFSDTPAYSWIGPRLFDVWGLPRIKKLKTCKNEEIMHIY AKSEEIYTFLCN" /locus_tag="LOCUS_6810" /note="WP_003976313.1 oxidoreductase (Streptomyces) [pid:27.4%, q_cov:87.4%, s_cov:86.5%, Eval:9.6e-22]" /note="MGA_920" CDS complement(1136..1636) /product="peptide-methionine (S)-S-oxide reductase MsrA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001831153.1" /transl_table=11 /codon_start=1 /translation="MNQHKTAYFAGGCFWCITPTFKETPGVISVLSGYSGGDEANPAYA DVKNQNTGHRETVCIEYDSEQVSFDELFEIFLNGVDPFDDGGQFIDRGHSYTLAVYYLC NEQKRIAEEGIAKLEKLSGKRVYISVEPFKSFYSAEEEHQDYYLKHPKEFAQELIDSGR VKE" /locus_tag="LOCUS_6820" /gene="msrA" /EC_number="1.8.4.11" /note="WP_001831153.1 peptide-methionine (S)-S-oxide reductase MsrA (Staphylococcus) [pid:46.5%, q_cov:93.4%, s_cov:91.8%, Eval:1.4e-36]" /note="MGA_921" CDS complement(1647..2327) /product="EFR1 family ferrodoxin" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003434727.1" /transl_table=11 /codon_start=1 /translation="MVKIYYFSGAGHSKRVAEFLAYRLDTEAQEIRQDVKASGDTLAVI VPVYCQNVPDPVARFLQKAEAKHFVLIATYGRMSYGNVIYEASKLVSGDVIAAAYLPCG HTYLGQADSPDLSGLEGIFERIEAPKAVAIPPSYKSAWADIFPNLRSRIGVKIIKNSRC TECAVCESVCPMGEISKGVTNKRCIRCLKCVCACPENALDVKYNAVLRLYLKKKPKNDK VVYL" /locus_tag="LOCUS_6830" /note="WP_003434727.1 EFR1 family ferrodoxin (Clostridioides difficile) [pid:27.0%, q_cov:89.8%, s_cov:89.6%, Eval:1.9e-10]" /note="MGA_922" ORIGIN 1 caaaactact tttttgatat tttctttgtt cattttattt tttctccttt tggggttaat 61 ctctcgcata acggctgttt tcagtcagcg ctaatatgcg ttgattatac cacctgcgga 121 caggatttgt caacgaaatt tgcataaata ttcacgtttt tgaaaagttt atgcagacgg 181 cgcagttttg ggcgtttcag cggttggaat atgtatatat ttaataataa gcgctgtgca 241 catcgccgaa gtcagttgca taaaaatgta taaatctcct cagattttgc ataaatatgc 301 ataatctcct cattcttgca agttttaagc ttttttattc tcggcagacc ccagacgtca 361 aacaatctcg gtcctatcca agagtacgcg ggcgtatcgc taaacagccc tttaaccacc 421 gacagagccg cctttttagg tcgcataaaa ataagcttca tcgggtgctt gatgattgca 481 aaaatcagct tcggatagtg cgcagtgatg tttgtaaacg taattcccgg atgggcaacg 541 gatatgtgaa cattcggatg cgtttttgca agctccagat gcgaaaacat cacataacgc 601 ttggcgttgc catatgcaag gctcgctttt ttgcgcgtgc gaaagtcggt atcctcgggg 661 tcggtctttg aatagttgtg agcgatgctt cccaacacca caactcttcc gcccttcgct 721 tcaagatatg gcaaaagcgc acgggtgatg taatatggag atgcaaaatt gatttgaaag 781 acattgtcaa gccccgtttt gcaaatgcgc cgagggatgc tgtatgcccc tgcgttgtgg 841 atgatgatgt caacatcgag cttttcaagt atgacggcga cctgcttgac cgaatcaatg 901 tcctcgaggt cgcagatcag cccatcaata gagccgtcgg gatactcgcc cagcagagta 961 tgaatcagcg cacgctgttt tttcgggttg cggtcgatga cgataagccg cccgcccagc 1021 gcaagaatat atctgcaaag ctcttgtccc aagccgccgc ttgcgccgaa aagcgcaacg 1081 gccttgcccg agaggttctg cgtatttttg ttaaaccatg attttgtgga catagttatt 1141 ccttcaccct ccccgaatcg atcagctcct gtgcgaattc cttcgggtgc ttgaggtaat 1201 aatcctggtg ctcttcctcg gcggaataaa agcttttgaa cggctcaacg ctgatgtata 1261 ccctcttgcc cgacagcttc tcgagctttg caatgccctc ttctgcaatg cgtttttgct 1321 cattgcaaag ataatagacc gccaaggtat acgagtgacc tcggtcgatg aactggcctc 1381 cgtcgtcgaa ggggtcaacg ccgttcaaaa agatttcaaa cagctcatca aagctcacct 1441 gctccgaatc atattcgatg cagacggtct ctctgtgacc ggtgttctga tttttgacat 1501 ctgcatatgc agggtttgcc tcatctccgc ccgagtatcc gctcaaaacg ctgatgactc 1561 ccggcgtttc cttgaatgtc ggggttatgc accaaaagca tccgcccgca aaatatgctg 1621 ttttatgttg gttcatttac atcaccttac aaatatacca ctttgtcgtt cttcggtttt 1681 ttcttcaaat atagtcgtaa aaccgcattg tattttacat cgagagcatt ctcggggcaa 1741 gcacaaacgc acttcaagca tcttatgcac cgcttgttcg tcacgccttt gctgatttcg 1801 cccatcgggc aaacagattc acaaacggcg cactcggtgc aacggctgtt tttgatgatc 1861 ttcacgccga tgcggcttcg taagttcgga aaaatatctg cccaagcgct tttgtatgat 1921 ggcggaatcg ccaccgcctt tggggcttcg atcctctcaa atattccctc aagaccactc 1981 aaatcgggtg agtctgcttg gccgaggtat gtatgcccgc aaggcagata cgccgccgca 2041 atcacatcgc ccgaaacaag ctttgacgcc tcataaatca cattgccata gctcattctt 2101 ccgtatgttg caatcagcac aaaatgcttt gcctcggctt tttgcaaaaa ccgcgccacc 2161 gggtcaggaa cgttctgaca atacacagga acgattaccg caagtgtgtc gcccgaagct 2221 ttgacgtctt gccttatttc ttgcgcctcg gtgtccaatc gataagccaa aaactcagca 2281 acccgttttg aatgccccgc gccggagaaa taataaatct taaccatcta tatatcctcg 2341 cattatcgca cac // LOCUS sequence210 2352 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence210 VERSION sequence210 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2352 /mol_type="genomic DNA" /organism="" /note="sequence210" CDS complement(208..693) /product="YqeG family HAD IIIA-type phosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002263504.1" /transl_table=11 /codon_start=1 /translation="MIHKPNYVFNSVADISLEFLEKEGIKALILDLDNTLTTHNNPVPD PMRLAWFEAVKKSELPMIIVSNNHYERVKPFADALGLDFVPDGRKPLTYGYNEAVKRLG LDKSSIASVGDQIFTDVIGSRLTGIKSIFVFPIEPETGFWFRVKRTLEKPLRPKRKE" /locus_tag="LOCUS_6840" /note="WP_002263504.1 YqeG family HAD IIIA-type phosphatase (Streptococcus mutans) [pid:35.8%, q_cov:93.8%, s_cov:86.3%, Eval:5.1e-25]" /note="MGA_924" CDS complement(771..944) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAEVRVGKNESLDTALKRFKRSCARDGVIAEVRKREHYEKPSVKR KKKSEAARKRKY" /locus_tag="LOCUS_6850" /note="WP_010964600.1 30S ribosomal protein S21 (Clostridium) [pid:74.4%, q_cov:75.4%, s_cov:74.1%, Eval:2.9e-13, partial hit]" /note="MGA_925" CDS complement(1067..2230) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKDWAFNRQRYWGEPIPIVYCEHCGMVAVPYEELPLRLPKVENFE PGSDGESPLAKIEDFVNCTCPKCGKPARRETDTMPQWAGSSWYYLRYCDPHNADALASK EALEYWMPVDWYNGGMEHVTRHMIYSRFWHHFLYDIGAVNTAEPYMKRTAQGLILGPDG EKMSKSKGNVVDPLDVIKLYGADVLRVYTLFMGDYEKAAPWSDNSVKGCKRFLDRVWAL QDNVLDGDTYRPEFTSKMHKMIKKVTSDIDNMKFNTAIAAMMTILNDFTALGSINRAEL RDFLIMLYPFAPHITEEMYESLGFGGYIHDAKWVAYDEALCKDNEIEIAVQIKGKLRDR VMVSAEAEQAEVLELVKSSEKIAAEIAGKTIVKEIYVKGKLVNIVAK" /locus_tag="LOCUS_6860" /note="WP_000009461.1 leucine--tRNA ligase (Bacillus cereus) [pid:48.7%, q_cov:99.7%, s_cov:48.6%, Eval:3.2e-106, partial hit]" /note="internal stop codon at [2261:2263](-)" /note="MGA_926" ORIGIN 1 gcgaaagggt tattccaaat tgctgagcat tggcctttaa ggatgatgcc aacgattcgg 61 aaacgcgaac gccttgtccg cactgatatt caaacgcatc gaggttcatc gagttaaggt 121 attttggcat atcaagcgag cttttatatg ccttggcaaa tgcttcagag cttcctgcag 181 ggccgaaaat tgcgttcatt taagatatca ctcctttcgc ttgggtcgaa gcggcttttc 241 gagggttcgc ttaacacgga accaaaagcc ggtttcaggt tcgattggga atacaaagat 301 gctttttatg cctgtaagac gtgagcctat aacgtcggta aaaatctggt cacccacaga 361 agcgattgat gatttatcca atcctaagcg tttgaccgct tcgttatagc catatgtgag 421 tggctttctg ccgtcgggga cgaaatcaag acctaaagca tcagcaaagg gcttgacgcg 481 ctcatagtga ttatttgaaa ctattatcat cggcagttcc gatttcttaa cagcctcaaa 541 ccaagcaagg cgcatggggt cgggcacggg attattgtgg gtggtgaggg tgttgtcaag 601 gtctaaaatt aaagccttta tcccctcttt ttctaaaaac tccaaggaga tatccgcaac 661 ggagttgaaa acatagttgg gtttatgaat cataaataaa tccttaaaat aaaaacaaaa 721 gcgaacagat tatactgctc gctttcactt aataattttg cattattgaa tcaatacttg 781 cgcttacgag cagcttcaga cttcttctta cgctttacgg aaggcttttc atagtgctct 841 ctcttgcgta cttcagcgat aacgccgtct cttgcgcaag atctcttaaa acgcttgagc 901 gctgtatcca acgattcgtt tttgcctaca cgaacttctg ccatttactg ttccctccct 961 ttgcataccg agcagaggta attgtgcact aagccatagt gcaactaaat acattataca 1021 cataaacacc agcaaagtca atagcaaaag tcaaaatatt tgaaatttat ttcgcaacga 1081 tattgacaag cttgccctta acgtaaatct ccttgacgat agtcttgcct gcaatttcag 1141 cagcaatctt ttcgcttgat tttaccagtt ccaaaacctc agcctgttca gcttctgcag 1201 ataccattac tctgtcgcgt agctttcctt tgatctgaac tgcgatctcg atctcgttgt 1261 ccttgcagag tgcttcgtca tatgcgaccc acttagcatc gtggatatat ccgccgaagc 1321 cgagggattc atacatctct tcggtgatat gaggagcgaa gggatagagc ataatgagga 1381 aatcgcgaag ctcggcacgg ttgatcgagc ccaaggcagt gaaatcgttc aaaattgtca 1441 tcatcgcggc gatcgcggtg ttgaacttca tattgtcgat gtcagaggtt accttcttga 1501 tcatcttgtg catcttggat gtgaattcgg gacggtaggt gtcgccatcg agaacgttgt 1561 cctgcaatgc ccagactctg tcaaggaatc tcttgcatcc cttaacggag ttatcgctcc 1621 aaggagctgc cttttcatag tcgcccataa agagagtgta aactctcaat acatcggcac 1681 catagagctt gataacatcc agcgggtcaa caacattgcc cttggacttg gacatctttt 1741 caccgtcggg acccaagatg agtccctgtg cggttctctt catataaggc tctgcggtgt 1801 tgacagcacc gatgtcatag aggaagtggt gccagaagcg ggagtagatc atatgtctgg 1861 tgacgtgttc cataccgccg ttgtaccaat caacaggcat ccagtattcg agcgcttcct 1921 ttgaagcgag agcatcagca ttgtgcggat cgcaatagcg caggtaatac caggatgaac 1981 ctgcccactg gggcatggtg tcggtctcac gtctggcggg cttgccgcac ttgggacaag 2041 tgcagtttac aaagtcttca atcttggcaa gagggctttc gccatctgag ccgggctcaa 2101 agttttcaac cttgggcaag cgcaaaggca attcctcata aggaacagca accattccgc 2161 aatgctcaca gtatacgatc gggatgggct cgccccaata tctctggcgg ttgaatgccc 2221 aatccttcat cttatactgt acgcccttct cgcctattcc ctattcggaa aggtaagcaa 2281 gcatcttttc aattgaatcc ttcttgttgg tcaggccgtt gagaacgccg gaatttacca 2341 tttcgccgtc gc // LOCUS sequence211 2352 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence211 VERSION sequence211 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2352 /mol_type="genomic DNA" /organism="" /note="sequence211" CDS 111..839 /product="SDR family oxidoreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009897780.1" /transl_table=11 /codon_start=1 /translation="MKTALVTGASRGIGAAIAFELARAGYAVAVNYATNKDAAESVIEK ISKNGGVAKGYKADISNAGEVTRLFEDVSAELGEIEVLVNNAGVAHIGLLQDMTDSEIE RLVGVDLLGAIYCSKEAVKRMVKLHKGVIINISSMWGEVGASCEAVYSTCKAGVIGLTK ALAKEVGPSGIRVNCVSPGVIATDMNAELDDETMQSLCEETPLLRIGSANDVASTVAFL ASDEASFITGQVLSVNGGII" /locus_tag="LOCUS_6870" /note="WP_009897780.1 SDR family oxidoreductase (Clostridioides difficile) [pid:48.1%, q_cov:99.6%, s_cov:98.4%, Eval:6.5e-60]" /note="MGA_929" CDS 855..1346 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEGIREQLVKKPVDSQDKLKSALVLAASLVLAIIVVFLIAVFASV MMLVGLIFAGLIMWGGWWLTGEFSVEYEYCYSNGELTVDKIINRRRRKNMCSVELRRAD AFYKNPSKLPDATVISAVGELEDVYAISYNDPTYGTAVLVFTPDERMLEAIKPYLPRII " /locus_tag="LOCUS_6880" /note="MGA_930" CDS 1343..1693 /product="holo-ACP synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002679605.1" /transl_table=11 /codon_start=1 /translation="MRVGIDSVEIDRIQKSFEINGFFEKAYSPAEREFLSAKKNPYPSA AANFAAKEAFGKAMGCGLSGFSLDEVSVLRDDKGAPYLKLSGKAKELGKLYRFTVSLTH TKTTATAIVIAY" /locus_tag="LOCUS_6890" /EC_number="2.7.8.7" /note="WP_002679605.1 holo-ACP synthase (Treponema denticola) [pid:42.7%, q_cov:96.6%, s_cov:94.3%, Eval:7.4e-17]" /note="MGA_931" ORIGIN 1 aagcccttta tcgacataat gtatgagggt gtatccgctt gggcaacgat ttttgacgac 61 tactacgttt tagcatttac tatctaccga tgaggagatg acacaaagat atgaaaacag 121 cgcttgtgac gggtgcttcg cggggaatcg gcgcggcaat tgcatttgag cttgcaaggg 181 cgggatatgc tgttgcggtg aattatgcca cgaacaagga cgccgccgaa agtgtgattg 241 aaaaaatctc caagaacggc ggagttgcca aaggatataa ggctgatatt tcaaacgcgg 301 gcgaggtcac acgacttttt gaagatgtaa gcgccgagtt gggtgagatt gaagttttgg 361 tcaacaatgc aggcgttgca catatcgggc tgttgcagga tatgacggac agcgagattg 421 agcggttggt cggcgttgat cttttgggcg cgatttactg ctcgaaagaa gctgttaaac 481 ggatggttaa gctacataag ggcgttatta ttaacatttc ctccatgtgg ggtgaggtcg 541 gtgcctcctg tgaggcggta tattccactt gtaaggcggg agttatcggt ttgacaaagg 601 cgctggcaaa agaggttgga ccttcgggaa taagagtcaa ctgtgtttcg ccgggagtta 661 ttgcaacaga tatgaacgca gagcttgacg atgaaacaat gcagtcgctt tgcgaggaaa 721 ctcccctttt gcgaatcgga agcgcaaacg acgttgcgag caccgttgca tttttggcaa 781 gcgatgaagc atcattcatc acgggacagg ttttgtcggt caacggcgga ataatataaa 841 ggagataagg aattatggaa ggaatcagag aacagctggt taaaaagcct gtggattcgc 901 aggataagct taaatcggca ttggttttgg cggcatcgct cgttttggcg ataatagtcg 961 tttttcttat tgcagttttt gcaagcgtga tgatgctggt cggtcttata ttcgcaggtt 1021 tgatcatgtg gggcggatgg tggctgacgg gcgagttcag cgttgaatat gaatattgct 1081 actcaaacgg cgagctgaca gttgacaaga tcatcaaccg cagacgcaga aagaatatgt 1141 gctcggttga gctcagacgc gctgatgctt tctataaaaa cccgtccaag cttcccgatg 1201 cgacagttat cagcgcggtt ggcgagcttg aggatgtata tgccatcagc tataacgatc 1261 ctacatacgg cacagccgtt ttggttttca cacccgatga aagaatgctt gaggcaatca 1321 agccctatct gccgaggatc atatgagagt tggaattgac agcgttgaga tcgatagaat 1381 tcaaaagagt tttgaaatta acggcttttt tgaaaaggct tactcccctg ccgaacgcga 1441 gtttttgagc gcgaagaaaa acccataccc ttcagctgcg gcaaattttg cagcaaaaga 1501 agctttcggc aaggctatgg gctgcggatt aagcggattt tcccttgatg aggtgtctgt 1561 cttgagggat gacaagggtg cgccctattt aaagctatcg ggtaaggcca aagagcttgg 1621 caagctgtat cgctttacag ttagccttac acacacgaaa acaactgcga cagcaatagt 1681 gattgcatat tgatatgaag aaatttatca gtttggcggc attttctcag gcggaagatg 1741 ccgcttttga gaaaaatctg cctgttaatg agttgatctc ccccgatggc ggagagatgg 1801 aaattgtgga tatgtgtaaa gttaaagagc tttaccctaa gcgttccata aacgggcaca 1861 aaggaacctt tggaaggttg cttttgattg tcggctccga cagatttatg ggtgcagcac 1921 agatttcaac actttccgcg cttcgttcag gcgttggaat tgcaagcgtt atatctacaa 1981 atgaggcgac gagagcactt gcaataagtg caaaggaagc gatattcact cgcgcagatt 2041 caagctctga cgggtttatt acggcaagtg aggagaatat tgcaaaaatc aaacaagagc 2101 ttgaaaaagc cactgcggtt ttggtcggat gcggtttagg aaatacgcct gatactgtga 2161 aaattcttga aaccgcagtc ttaaatgcaa attgtccgat aattattgac gcagacggaa 2221 taaacgcgct gacaagccgc atagaattgc ttaggacagc aaagacagag gtcattttga 2281 ccccgcacgt cggcgagttg gcgaggcttt gtgatgtgta tattaactac gccgcaaagc 2341 accgcgcaga gc // LOCUS sequence212 2350 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence212 VERSION sequence212 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2350 /mol_type="genomic DNA" /organism="" /note="sequence212" CDS 332..1033 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKSKAYDMIEQMGTPEKADKALCELKAYWESLLSQYSVNSPDEK LNRMVNIWNQYQCMVTFNMSRSASYFESGIGRGMGFRDSNQDILGFVHQIPDRARERII DLASTQLPDGNCYHQYQPLTKKGNSDIGSNFSDDPLWMILSTAQYIKETGDLTILDEMV PYDNDPAQAKTMMHHLKLSFERVVNNLGPHGLPLIMRADWNDCLNLNCFSYTPGESFRP PHPRTERLPNR" /locus_tag="LOCUS_6900" /note="WP_004082399.1 glycosyl transferase (Thermotoga maritima) [pid:68.8%, q_cov:94.8%, s_cov:27.2%, Eval:2.4e-88, partial hit]" /note="internal stop codon at [305:307](+)" /note="frameshifted, insertion/deletion at around 991" /note="MGA_934" CDS 1030..1938 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MMVACMFTFIIPEYIALCKIKGLDDDARVAEEAVKKMADAVMTHG YDGEWFLRAYDDFGRKVGSHENEEGKIFIEPQGFAVLSGLGKESGKDLRALESVNKYLS TERGLVLNNPAFTKYFVEYGEISTYPGGYKENAGIFCHNNAWIICAEAFVGHGERAFEY YSKIAPAYNEDISEIHKTEPYVYAQMIAGKDAKPEHFGQAKNSWLTGTAAWNFVAVSQY ILGIAPDYDGLRIDPCIPSDWDGFKASRLFRGARYNITVSNPENVCKGVKTIKCDGVRL SSNLVPAFEAGTVHEVEITLG" /locus_tag="LOCUS_6910" /note="WP_004082399.1 glycosyl transferase (Thermotoga maritima) [pid:59.9%, q_cov:100.0%, s_cov:36.9%, Eval:3.1e-108, partial hit]" /note="frameshifted, insertion/deletion at around 991" /note="MGA_935" ORIGIN 1 aagcataggc gaagttgagg tcgaaggctc tgccatttac cacaagaccg aatatcgcga 61 acgtcgtaac cattatgctg tatatgctgt taatactcct atcgacggct ttgacacaga 121 ccgcgacagc ttcttgggtc tttacaacgg atttgatcat cccgatgttg tctttgaaaa 181 tcagtcaaag aactcccgtg cgctcggctg gagccctgtt gcatctcacc gcataagcgt 241 tgaccttaaa gcaggcgaag aaaagtcgat agtattcatc ctcggctatg ttgaaaacgc 301 atattaggaa aagttccttt cctacggctc aatgaataag tctaaagcat atgatatgat 361 cgaacagatg ggcacacccg aaaaggctga caaggcgctt tgcgagctca aggcttattg 421 ggaatcgctt ctttctcagt acagtgttaa ctcacccgac gagaagctca accgcatggt 481 aaacatctgg aaccagtatc agtgcatggt aaccttcaat atgtcccgct ccgcatccta 541 ctttgaaagc ggaatcggca gaggtatggg cttcagagat tcaaaccagg atattttggg 601 ctttgtccac cagattcccg acagagctcg tgagcgaatc atcgaccttg catctacaca 661 gcttcccgac ggcaactgct accaccagta tcagccctta accaaaaagg gcaactcgga 721 tatcggctca aacttctctg atgacccgct gtggatgatc ctttcaactg cgcagtacat 781 caaggaaacg ggcgatctga ccattttgga tgaaatggtg ccatatgaca acgaccccgc 841 acaggccaag actatgatgc accacctgaa gctcagcttt gagcgtgttg taaataacct 901 tggccctcac ggtttgccgt taattatgcg tgccgactgg aatgactgcc taaatctcaa 961 ctgcttctca tatacccccg gcgagagctt cagaccacca catccaagga cggaaaggtt 1021 gccgaatcgg tgatggttgc ttgtatgttc accttcatca ttcccgaata tatcgcgctt 1081 tgcaaaatta agggtctgga tgatgatgca cgtgttgccg aagaagctgt caagaagatg 1141 gctgacgctg ttatgaccca cggctatgac ggcgagtggt tcttgcgtgc atatgatgac 1201 ttcggtcgca aggtgggctc tcacgaaaat gaagagggca agatcttcat tgaaccccag 1261 ggctttgcgg ttctttcagg cctaggcaag gaatcgggca aggatcttcg cgcccttgaa 1321 agtgtcaaca aatatctttc aaccgagcgc ggattggtgc tcaataaccc cgctttcacc 1381 aaatatttcg ttgagtacgg cgaaatttcc acctaccccg gtggatataa agaaaacgca 1441 ggcattttct gccacaacaa cgcttggatt atctgtgctg aggcatttgt cggacacggc 1501 gagcgtgcct ttgagtatta ttccaagatc gctcccgcat ataacgagga tatttcggaa 1561 attcacaaga ccgagcctta tgtatatgcc caaatgatcg ccggcaagga tgccaagccg 1621 gagcacttcg gtcaggcaaa gaacagctgg ctgacaggta ctgccgcttg gaacttcgtt 1681 gctgtatccc agtatatttt gggtattgcg cccgattacg acggcttgcg cattgatccc 1741 tgcattcctt ccgattggga cggcttcaag gcttcccgtc tgttcagagg tgcaagatat 1801 aacatcaccg tttctaaccc cgaaaatgtc tgcaagggcg ttaaaaccat caagtgcgac 1861 ggcgtaagac tttcaagcaa ccttgttccc gcatttgaag caggcaccgt tcacgaggtt 1921 gaaattacct tgggataaat tacaaactgt aatttatttc aaattaaagt cgcaaattgt 1981 tgaaaactcc cctgtttgct gccaaaaaag gcacgtagac aggggatttc tcaacttatc 2041 aacaaagttt tcaacatttt tgtgagttta caagttgtaa accccctccc tgtgggtggg 2101 ggcaatttca gcgaagctga aatcgggggg tgggcaaaaa cattgctccc gttggtcgca 2161 aggttttaac aagaacccgc tttgcggctt cttgacacgt cgccgaaggc gacaccgcta 2221 ttacaacgcg caaggataac cgctatcaca gttgaatccc atgcgcgacc tattccgcta 2281 atttatcttt acgctgtggt tgcaagatta agtctactga taatgcggaa taatctcttt 2341 ttgaaaagga // LOCUS sequence213 2348 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence213 VERSION sequence213 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2348 /mol_type="genomic DNA" /organism="" /note="sequence213" misc_feature <1..524 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_009896126.1:DNA repair protein RecN" /note="WP_009896126.1 DNA repair protein RecN (Clostridioides difficile) [pid:53.3%, q_cov:96.5%, s_cov:29.9%, Eval:6.9e-45, partial hit]" /note="MGA_936" /locus_tag="LOCUS_6920" CDS 539..1078 /product="DJ-1/PfpI family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008760842.1" /transl_table=11 /codon_start=1 /translation="MVVCFIANGFEEIEALTSVDCLRRCELDVLTVGIGSCIIRGSHGI AVVTDTDDGMFTPSEDIDMIILPGGMPGTLNLEANKCVQSTIDYCVEHNIPIAAICAAP SILGHKGLLEGKKAVCYPGFESELKGAEVADCRVVTDGNIITAKGMGAALEFSYAIIEK LISKERAELLKGAIID" /locus_tag="LOCUS_6930" /note="WP_008760842.1 DJ-1/PfpI family protein (Bacteroides thetaiotaomicron) [pid:44.1%, q_cov:98.3%, s_cov:96.2%, Eval:3.8e-33]" /note="MGA_937" CDS 1117..1884 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAEQSKNNNEFDEILSSILDKSSSDNKENNREGIITKPESYADVL MTYSTDTEAADFNDIELEESFEKTNVFASVEQENAAPKAKNKAKEKPQLQPKPVKEKKK RRPRKNYSAYGGIVLATLVVCCSIIISLFGIVVGRDFLGIDGSTNEFTIYIPEGSSVDD IANQLYSEGVIDYVDFFKAVVKISDAGTMYPGDLDITGGMSYGDIINALTQMREAKATA TVTFIEGTALYDAALKLEEAGVCDADDFIFTFN" /locus_tag="LOCUS_6940" /note="MGA_938" ORIGIN 1 caaatgagct tgagttttta aatatgcccg atgttaaaat tgaggttaaa atggaaaccg 61 gcaagctcac atccgttggt atggatactg tcgagttctt aatttccgcc aaccgcggag 121 aaactcccaa gcctttagcg aagattgctt cgggaggtga gctttcaaga attatgctgg 181 cattaaaaac cgttcttgcc gatagggacg atattcccac gctcatattc gatgaaatag 241 actcgggtgt cagcggacgt gccgcgcaga agattggaat caagcttcgt gaaatttcaa 301 gaaaaagaca ggttttgtgc gtgacccatc tggcacagat tgccattatg gcagatgacc 361 atcttttaat cgaaaagaac tcggttgatg aacgcacagc caccgaaatt aagcatttaa 421 cttttgatga gagaaaatat gaaattgccc gaattcttgg tggcgataat ataactgaaa 481 ccgtgcttaa agatgctgag gaacagcttt tgagtgcgag atagaggagg attttgaaat 541 ggttgtttgt tttattgcaa acggattcga agagatcgag gcgctgactt ctgttgattg 601 ccttcgcaga tgtgagctcg atgttttaac cgttggaatc ggttcttgca ttatacgagg 661 atctcacgga attgcagttg taacagatac cgatgacggt atgtttacgc cgagcgagga 721 tattgatatg ataattcttc ccggtggtat gcccggaaca ttgaatcttg aagcaaataa 781 atgtgttcag tcgactattg attattgcgt ggaacataat attcccatcg ctgcaatatg 841 tgcagcaccg tcaattttgg gccataaggg acttttggaa ggcaagaagg cggtttgcta 901 tcccggattt gaaagcgaac ttaaaggcgc tgaagttgca gattgcaggg tggttactga 961 tggcaatatc attactgcaa agggaatggg cgcggcactt gagttttcat atgcaataat 1021 tgaaaaactc atttcaaagg aacgcgcaga acttcttaaa ggtgcgataa tcgactgata 1081 attttgagtt aatgttaaag aaaggattgt taagttatgg cagagcaaag caagaacaat 1141 aatgaatttg acgaaatcct gtcttcaatt ttagataaat catcctctga taacaaagag 1201 aataatcgcg aaggaattat tactaagccc gaaagctatg ctgacgtttt aatgacttat 1261 tctaccgata cagaagctgc tgactttaac gacattgagt tggaagaatc ctttgaaaaa 1321 accaacgttt ttgcttctgt tgagcaggaa aatgctgcac ctaaggcaaa gaataaagct 1381 aaagaaaagc ctcagttgca acctaagcct gttaaggaga aaaagaaaag gcgtccccgc 1441 aagaattact ccgcatacgg cggaattgtt ctggcaactc ttgttgtttg ctgttcaatt 1501 attatttcgc tgtttggcat tgttgtcgga cgcgactttt tgggcattga cggctcgaca 1561 aatgaattta caatttacat acctgaaggc tccagcgttg atgatattgc aaatcagctc 1621 tatagcgagg gcgtgatcga ctatgttgat ttcttcaagg ccgttgtcaa aatcagcgat 1681 gcgggaacaa tgtaccccgg cgatttggat attacaggcg gcatgagcta tggcgacatt 1741 attaatgcac tgactcaaat gcgcgaagca aaagccacag cgaccgttac ttttattgag 1801 ggtacggccc tttatgatgc cgctctcaag cttgaagaag cgggcgtttg cgatgcggat 1861 gactttattt tcaccttcaa ctaaactgtc tatggctatg aatttgaaaa gcatgttgca 1921 tcatcaagcc tcaaattcta taaatatgag ggatatcttt tccctgatac ttatgagttt 1981 tatttaggcg actcgacata taacatcgtc aagaaaatta aacagcgcac cgctcagatt 2041 ttgagcgctg atgttattgc gagagcagct gagatgggct atactcttga cgaggtcgta 2101 acacttgcat caattgttca gcttgagtgc ggcgatgcta acgaaatgaa aaatgtttca 2161 tctgtattct taaacagact caataatcct gagcaatatc ctaagctcca atcggatacg 2221 acggtattct atatcaataa tgttattaag aagctttcaa gaattcagta tgaggaaatg 2281 tataacgcat acgacagcta tgtttgcaca ggcctgcctg tcggagcaat ttgtaacccc 2341 ggttcgga // LOCUS sequence214 2344 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence214 VERSION sequence214 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2344 /mol_type="genomic DNA" /organism="" /note="sequence214" misc_feature <1..1906 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_177221404.1:preprotein translocase subunit SecA" /note="WP_177221404.1 preprotein translocase subunit SecA (Moorella thermoacetica) [pid:54.9%, q_cov:97.6%, s_cov:69.5%, Eval:7.8e-191, partial hit]" /note="MGA_940" /locus_tag="LOCUS_6950" ORIGIN 1 aagaaccgca actctgacaa aagcgggcgt tgcaaaagcc gaggctcatt tcggcgttga 61 aaacctttcg gacaccgaaa atgtcaccct tttgcaccac attaaccagg caattaaagc 121 aaacggcgta atgcgccgcg atattgacta tgttgttaag gacggcgagg tcatcatcgt 181 cgatgaattc acaggacgat tgatgtatgg cagacgctat aacgacggtt tgcaccaggc 241 aattgaggct aaggaaaatg tcaaggttgc ccacgagtcg aagaccattg caaccatcac 301 tttccagaac tatttccgac tttacaaaaa gctctcgggc atgacaggta ctgccgccac 361 cgaggaaaac gaattcagag agatatataa cctcgacgtt gttgttgttc ccaccaaccg 421 cccgatgatc cgccttgacc agccggatgt tgtatataaa accgagaggg caaagtttaa 481 cgcagtcatc gaagagatcg tcaaggctca ccaaaagggt cagcccgtat tggttggtac 541 cgtttcgatc gaaaaatccg aattgctttc cgcaatgctt aaacgccgcg gaattcagca 601 tgaggtttta aatgccaagc accacgaacg cgaagcacag atcgttgcgc aggcaggtca 661 gtacggcgct gtaaccattg ccaccaatat ggcaggtcga ggcaccgaca ttatgttggg 721 cggtaatgcg gaattcttgg cgaaggcaca gctcattaaa gaaggcttcg gcgaggaact 781 gatgtatgac attacaggct tcggcgagac cgaagacgag cagatcattg aaggcagacg 841 tcgctataac gagcttttgg agcagtacgg cgcagagatc aaggaaaagg ccctcaaggt 901 taaagaagcc ggcggacttt acatcatcgg caccgagcgc cacgagtcaa gacgaattga 961 taaccagctc cgcggccgtt cgggtcgaca gggcgacgag ggtgaatccc gcttcttcct 1021 ctctcttgag gatgatttga tgcgactttt cggcggcgac cgaatcaata tgatgatgga 1081 aacaatgaac gtccccgaag atatgccaat tgagtcgaag atgctttcaa acgtgatcga 1141 atcttcccag aggcgagttg agggcagaaa cttcaacatc cgtaagaacg ttttgaacta 1201 tgacgacgtt atgaacgcac agcgcgagat catttacggt cagcgttcga tggttcttga 1261 cggcgaggac attaagcact atatcattaa gatgataaag gactttgttg caaacagcat 1321 tgcaacatat ctgcccggcg aggaagagga tcagtggaac tttgccgcct taaaggagca 1381 ttttgcaggc ttgttcccgc ttccgaatga ctataacttc accgcccgtg accttgacaa 1441 gctctcaaag caggatatta ttgatcagac aacagaaatg gctctggcaa gatatgagga 1501 aaaggaagcg gagctttcgg cacccatttt gcgcgagtgc gagcgagttg cgcttttgca 1561 ggtcgttgac tccaagtgga tgcagcatat tgacgatatg gcagagctta aacgtggcat 1621 ctcgcttaga tcctacagcc agcgcgaccc tgttgttgaa tatcgctttg aaggcttcaa 1681 tatgttcgat gaaatgattg tcgctatttg cgaaaacacc ataagaatcc tttataatac 1741 acacttaaag aaggaagctc cgatccagcg cgttcaggtt ttgaaggccg aggatacagg 1801 ctcggacggc tcggtatctg cgacacgcag gtcgcagaag gtcggcagaa acgacccttg 1861 tccctgcgga agcggaaaga agtataagaa gtgctgcggc cagtagtaaa ttctcgttgc 1921 actcgaattg actacaaaaa tacggctttc aagagcaccg ctcttgaatt ttgctgcgca 1981 aaaccgccgt attttaggtg cctgccgttc agcgacggag atatgcccta tagtggcggg 2041 cctgtgtgcc cgcgcgggcg accacatagg gtcgccctta tataaaatca acccaaaggt 2101 gattaaaaaa tgaaattctc aactgcattt aaaagcgctg atattctttt gcccaagtgc 2161 gaggatatgt caaaatggtc ggttgtcgcc tgcgatcaat ataccagcga gccgaaatat 2221 tgggaaagag ttgaaggact tgttgctgac agcaaaagca cccttcgcct gactctgccc 2281 gagatatatt tagagcaaga gggcgttgac gaaagaattg aaaacatcaa caagtcgata 2341 gatg // LOCUS sequence215 2339 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence215 VERSION sequence215 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2339 /mol_type="genomic DNA" /organism="" /note="sequence215" CDS 459..2081 /product="alpha-amylase family glycosyl hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010906091.1" /transl_table=11 /codon_start=1 /translation="MKRMLVFFLAILMLVCTMTGCAKPKDISGKYDLDKSRNEAIINDA GEPKELNTGNNRVFYQIFVGSFSDSNGDGVGDLRGIIERFDYLNDGDDSSGLSLGVEGI WLTPIFKSPSYHKYDITDYYEIDPQFGTMDDLKELITLCHERNVKLILDLPFNHTSTTN MWYINFINAHKADDTENEYYDFYTYADAPQAGRGFALIRGTDHYYECNFSGDMPELNFD NEAVRQAVVDIAKYYLDMGIDGFRFDAAKYIYMGEEPKNAEFWKWYMAELRAIKSDVYT VAEVWDSDSLTYPYFESTNCFNFTMSQTSGVIAQTAKAGNVNVFTSYVARYIKAIQERR AEATPVTFIANHDMDRAAGYLTLAAGQAKVAANLSLLMPGSTFIYYGEEIGLKGSRGSN NTDANRRLAMLWGDDDTVKDPEGANYDAEQSNGTVLTHLPDGNSLYNHYKKLIAIRKAN PEIVYGSFEPLHTDTKLGGFVSTLDGSSVVVIHNTSRGSVTVDLSELTDVNFAVIVEYE GVETETLEVTVLTSGGQTSVVLR" /locus_tag="LOCUS_6960" /note="WP_010906091.1 alpha-amylase family glycosyl hydrolase (Lactococcus) [pid:34.2%, q_cov:91.5%, s_cov:90.8%, Eval:2.5e-78]" /note="MGA_943" ORIGIN 1 caaaaatatg agttgccgtc aggctgatag tcaacctcat attcaacctt gatattaccg 61 atctcgcgcc acgtctgtgt gcagtcaaac ttcttacccc ttctgaaaag ggcattgtta 121 atgtttgacc actcgcagga aaaggttcct ccgcctgtaa gggtcattgt cgtgtcgcca 181 tggtccttcc aaagctcata tccatagccg tcctcttcgc cgatctcaaa gtcgtgcaat 241 atcttttgct caccttgaca tccgcaaaga acgctcgcaa tcagcagaaa gcatatcaac 301 acagtaagcg ttcttttaaa gataatcata atgttccaag acctcctttg ctgatatatt 361 atcatacttt ttccggtttg tccacctgtc ggcgctccaa aagattcttg caagcgatga 421 cttattgtgg tataattcgg ttaaagggag gattgtttat gaaacgaatg ttagtgtttt 481 ttcttgcaat acttatgctg gtgtgtacta tgacgggatg cgctaagcca aaagatataa 541 gcggaaagta tgatttggat aaatcccgca atgaagcaat aattaatgat gcaggtgagc 601 cgaaggagct taacacaggc aacaaccgcg tgttctatca gatatttgtc ggttcattct 661 ccgattccaa cggagacggt gtgggcgacc ttcgcggaat aattgaacgt tttgactatc 721 tcaacgacgg cgacgattcc tcgggactca gcctcggagt tgagggtatc tggctgactc 781 cgatctttaa gtcgccatca tatcacaaat atgacatcac cgactactat gagatcgacc 841 ctcagttcgg caccatggat gacctcaagg agcttatcac gctttgccac gaacgcaacg 901 tcaagctgat tttggatctg ccctttaacc acacctcaac cacgaatatg tggtatatta 961 attttatcaa tgcccacaag gcagatgata ccgaaaacga gtattacgat ttttatacct 1021 atgccgatgc tcctcaagcg ggcaggggat ttgccctcat ccgcggcacc gaccactatt 1081 atgaatgcaa tttctcgggt gatatgcccg agctgaattt cgacaacgag gctgtaagac 1141 aggcagttgt cgacatcgcg aaatattacc tcgatatggg tatcgacgga ttccgttttg 1201 atgccgcaaa gtatatctat atgggcgaag agccgaaaaa cgcagagttc tggaagtggt 1261 atatggcgga gcttagggct atcaagagcg atgtttatac cgttgccgag gtttgggaca 1321 gcgactcgct tacctacccc tattttgaat ccacaaactg tttcaacttc acaatgagcc 1381 agacatcggg cgtaattgcc cagaccgcca aggcgggaaa tgtcaatgta tttacatcat 1441 acgttgcccg atatattaaa gcgatccagg agcgacgcgc agaagctacc cctgttacat 1501 ttatcgcaaa ccacgatatg gaccgcgctg cgggatattt gacccttgcc gccggacagg 1561 caaaggtggc tgcaaacctc tcacttttga tgcccggctc gaccttcatc tactatggcg 1621 aggagattgg acttaaaggc tcgcgcggct cgaacaatac cgatgccaac cgccgacttg 1681 cgatgctttg gggtgacgat gacacagtca aggaccccga gggagcaaac tatgatgctg 1741 agcagtccaa cggcacagtt ttgacccatc ttcccgacgg taacagccta tataaccact 1801 ataaaaagtt gattgcaatc agaaaagcca accccgaaat cgtatatggc tcctttgagc 1861 ctttgcacac cgacaccaag cttggcggct ttgtttcaac tcttgacggc agctcggttg 1921 tggtcatcca caacacatct cgcggctctg tgacagttga tttaagtgag ctgaccgatg 1981 tgaattttgc agtgatagtt gaatatgaag gtgttgaaac agaaaccctt gaggtaacag 2041 ttttaaccag cggcggccag acaagcgtag tgctgagata aaataaaaaa ataaacggca 2101 ggagaattcc tgccgtttat tttttatgcc aatcaataga tcaaattctt ctcggtctca 2161 tgatcgaaga agtacattac ctttccgggg aaggtcaggt gaacgggatg accgttcttg 2221 agctgagcgc gctcctcatg gctgaggtta actgtgggcg ttcttgcaat aagctttgtt 2281 tcatcgtcca cattaatgtg caaatgaagc tcgctgccca tcatttcgtt taccttaac // LOCUS sequence216 2336 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence216 VERSION sequence216 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2336 /mol_type="genomic DNA" /organism="" /note="sequence216" CDS complement(796..1500) /product="ABC transporter permease subunit" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_109792089.1" /transl_table=11 /codon_start=1 /translation="MKAILKRELSAYFNSLIGYIFLTAFFAASGVLFSITSLQYGSTDM GSMFSMLFFVLLVLIPILTMRTLSEDKRQKTDQCLLTAPVSLTGLVMGKFLAAFIIYAM GVAMTFVYAVVISFMGAVSWLEVMGNIVGLLLVGMAYIAVGVFVSSMTENQVIAAVGGF ACMVALYLISSIASIIPVEWISKILTELSFSDRYLTFTYGIFDFSNVLFFISATVIFIF LTIRVLERRRWS" /locus_tag="LOCUS_6970" /note="WP_109792089.1 ABC transporter permease subunit (Minwuia thermotolerans) [pid:28.4%, q_cov:97.9%, s_cov:96.7%, Eval:1.2e-23]" /note="MGA_946" misc_feature complement(1504..>2336) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011057313.1:ABC transporter ATP-binding protein" /note="WP_011057313.1 ABC transporter ATP-binding protein (Thermosynechococcus vestitus) [pid:38.8%, q_cov:93.1%, s_cov:79.3%, Eval:2.5e-45]" /note="MGA_947" /locus_tag="LOCUS_6980" ORIGIN 1 atttccgagg tgcgtatgtt aaccgaatca acaacgtatc cgttcttgtc caaaaggtct 61 gtaagtcccg aaacatccga ctcgtttgca ccggtatagg tcaaaacggt gacggtgatg 121 gggttagcat cggttacagc catgatcgcg ccggtcaaag cctgctcggc atttgaagag 181 gaaacggcgt tgtttgaaat aaagagataa tgtgcctgcg ccgagccgta atattcaaca 241 tactggctga cataagcgga gtaatcgtcc aaaacattca agatgtccat aagggaaacg 301 attttaactc ggttatgctc gccgttttca agctcaacaa taatgtcgca ctgctcaagg 361 tcataagcat agtttgaaac aaagtctggg ttagagagaa gatccttata gcttacggag 421 atgttggggt tgtgctgttc atatctcttc aaaagctcgg cacattgcac cgcatattca 481 cttatagatc tgaattcgtc ctcagtcgcc ataacggtga tatcaaccgc aacgtcgatg 541 cctgccaaat agtcaagcgt ttcctgggaa acggaataga tgctgtcatc tgtcaggtcg 601 agggtgatgg ggaaacggtc gaagagcatt gttgcaacaa cgttgatcaa aacaactgct 661 gcaatgaaaa gtgctgtcaa accggtggca aaggagccgt atttaagctt gcgcttgtta 721 attttgccat cattgccgat aagcttcgag gttaaagatt taatattcat tttaaattct 781 cctttcccaa agccattatg accagcggcg gcgctcaagc accctgatgg tcaagaagat 841 aaagatcacg gtagcactga taaagaacaa aacgttactg aagtcaaaga taccgtaggt 901 gaatgtcaaa tatctgtcgc tgaaggaaag ctcggtcaaa atcttggata tccattcaac 961 ggggatgatt gaagcaatcg aagaaatgag gtagagcgca accatgcagg caaatccgcc 1021 cacagcggca attacctggt tttcggtcat tgaagaaacg aaaacgccga cagcgatata 1081 tgccatacca accaaaagca ggccgacgat atttcccatt acttcgagcc atgaaacggc 1141 gcccataaag gaaattacaa cggcatatac aaaggtcatt gcaacgccca tagcgtaaat 1201 gatgaatgcc gccaaaaatt tgcccattac aagtcctgta aggcttacag gcgctgtcaa 1261 aagacactgg tcggtcttct ggcgcttgtc ttccgacaaa gttctcattg tgaggatcgg 1321 aataagtacc aaaagaacga agaagagcat tgagaacata ctgcccatat cagttgagcc 1381 atactgcagg ctggtgatcg agaacaatac acccgaagcc gcaaagaatg cagttaaaaa 1441 gatatatccg atgagggagt taaaatatgc gctgagttcg cgctttaaaa tcgctttcat 1501 tgattagttt tcctcccctt cttcaatatt ttcaagctcg ttagccttgt cgttcaagaa 1561 ttcgcccaga ctttcgccca ttgtgagctt caagaagatg tcttccaaac tcagctcgct 1621 tgatttaagt cccaaaaggt accagtttct tgatgccaag cgcttaaaga ggtcgcgtct 1681 gatgtcggtg ccttctgtcg cttcaatgtt atattcccaa acgccctttt ctctttgcat 1741 atcagcaaca acggtttcaa cgccgggaat ggtctgaata atcttaatga cctcgtcctt 1801 ggggccgtca atgcgggcaa tcagcttgtg gtcagccgag agggtgtttg aaaggttgtc 1861 cgctgtgtcg tcggcaacga ttctgccctg gttgataaca acgatcctgt cgcataccgc 1921 ctgaacctcg ctcaagatat gggaggacaa aattacggta tggtttttgc ccaatttctt 1981 gataagtgtt cgaatctcga tgatctgctt ggggtcaaga cctacagtag gctcgtccaa 2041 gatcagcaca tttggattgc cgacaagcgc ctgagccaag cccacacgct ggcggtatcc 2101 ctttgaaagg tttttgatca ttcggtcata tacattttcg attttaacca gctcgcaaat 2161 ttcctttaag tgggtatttc tcggaagtgt acagcctttt aagtcataga tgaaatataa 2221 atactctctt acggtcatat cgagatataa cggaggcaat tcgggcagat atcctatctg 2281 cttctttgcg ccgatggggt cctccaaaat gtcaatgccg ttgatgagcg cttcgc // LOCUS sequence217 2335 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence217 VERSION sequence217 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2335 /mol_type="genomic DNA" /organism="" /note="sequence217" CDS 468..1394 /product="RnfABCDGE type electron transport complex subunit D" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948146.1" /transl_table=11 /codon_start=1 /translation="MASKLRLSVSPHIHTRDTVQSIMLDVIIALLPATLAGVIIFGLRS LAVIAVCIIASVLSEFIFNKIVKKDQSIGDLSAIVTGLLLALNLPANVPLWQAAIGSIF AIVVVKCFFGGMGCNLVNPAITARVFMLVAFGSMATAAFPVDSTASATPLVGMAEGTNT LSLTQLFLGNHGGAIGETCALALLIGGIYLIIRRVITWHIPVAFIGTVFLFSLCLEGFD VIAALQWILSGGLFIGAFFMATDYVTSPETSSGKIIAGVFCGIITVMIRFWGNYPEGVS FAILLMNIMDPYIGAWTAKKVFGGEDR" /locus_tag="LOCUS_6990" /note="WP_011948146.1 RnfABCDGE type electron transport complex subunit D (Clostridium botulinum) [pid:48.7%, q_cov:98.4%, s_cov:98.4%, Eval:5.9e-78]" /note="MGA_949" ORIGIN 1 agtgctgtta ccacacccaa gaatgtgatc gttcccatcg gcacatccat tcaggagctt 61 gttgatttct gcggcggctt caagtcggag ccgggcaaga tcatctatgg tggtcctatg 121 atgggcatca ccgtgcccga tacgagcgca ccaataatca agaatacaaa tgcgatcatc 181 gcattcaacg aaaaggactc tgaacccaag aagattcagc cttgtatccg ttgcggcaga 241 tgcgttaacg cctgtccctt cagcttgaat cccccgctta ttgcaaaggc gctgaacgat 301 aagaattttg acagtcttta taagcttggt gccgatatct gtatggaatg cggatgctgt 361 gcttttgttt gccccgcaaa cagacctatt gttcagaaca acaagattgc aaaggcagag 421 cttaaagaag ctcttgcgaa gaaaaaagca aaggaggcaa ataaataatg gcttcaaagc 481 ttcgtctttc ggtttcgccc catattcaca cccgtgacac agttcagagc attatgcttg 541 atgtcataat tgcccttttg cccgcaactt tggccggtgt gataatcttc gggcttcgct 601 cgctggcagt gatcgctgtc tgcattattg cctcggtgct cagtgaattt attttcaaca 661 agatagtcaa aaaggatcag tcgatcggtg acctcagcgc cattgtaaca ggcttgctct 721 tggcactcaa tcttcccgca aatgttcccc tttggcaggc ggcaatcggt tcgatcttcg 781 cgatcgttgt tgtaaagtgc ttcttcggcg gaatgggttg caaccttgtt aaccctgcaa 841 ttaccgcaag agtatttatg ctcgttgcct tcggttcaat ggcaaccgcc gctttccctg 901 ttgattccac cgcttctgcc acacctttgg taggtatggc ggaaggcacc aacacccttt 961 cgcttactca gctcttcctg ggtaaccacg gcggtgcgat cggcgaaacc tgtgctttgg 1021 cacttctcat cggcggtatt tatcttatca tccgccgagt aattacatgg catattcccg 1081 ttgccttcat cggcacggta ttcctgttca gcctttgtct tgagggcttc gacgttattg 1141 cagctctcca gtggatcttg agcggcggct tgttcatcgg tgcattcttc atggctaccg 1201 actatgttac cagccccgaa acatcctcgg gcaagatcat tgcaggtgtc ttctgcggta 1261 tcattacagt gatgatccgc ttctggggca actaccccga gggagtatcc tttgcaatac 1321 ttcttatgaa cataatggat ccttacattg gcgcttggac cgcaaagaaa gttttcggag 1381 gcgaggatcg atgaacatat ctcttaaaag tattctttcg ctcacagcta tctgtgcggc 1441 agttgcaatt ttaatggctg cgactaattt catcacatct cccattattg aagcaaatga 1501 agctgctgca gcaaacgacg ctttgctcgt tgtaatgcct aacggttcgg gctttgaagc 1561 ggttgatctt tcaacctaca cacttcccgc aaccgtcaac gaggtatata aggaagcaaa 1621 cggcggatat gttgtcaagc tgaccaccac cggttattcc tcgggtatgg tcattatggt 1681 cggtgttgac ggctcgggca ctgttacggg tgcaacctgc ctcggctcaa gcgagaccct 1741 cggatatgaa aagacctacg gcgacacgac agtcggtgca accgttgcaa caatcgactc 1801 actcgatacc gttgcaggcg caacaagaac caccgaagca tataaaaacg ctgttaagga 1861 tgccctcaac accgcagtta ttatgggcgg cggcgaggtc gatatcagaa ctcccgaaca 1921 gattttggct gagaccctca gcgctgcgct tcccgcaggc gaaggcaagt tcacctcctt 1981 cttcattcag gaagttcttt ctgtcaccga tgctgtatat cacgctgata acgatgccgg 2041 ttatgtattc gtttcgggcg aagcttatgt tggtgttgac gcttcgggta acgtagtttc 2101 cgaagttgac gaggctctca aggcttcaat cgaaagcgat gccaagatat tcttggcttc 2161 cgaggttgaa attattgacc tctcggctta tgagaatatt ccctcgcaga tagtaaatgc 2221 atataagacc cttacaggca actatgtatt tgaactcaag gctgcaggct ttggtatcaa 2281 cggcgacgag tggtatcagc cttcgggcga atatatcgaa attatgatct ctgca // LOCUS sequence218 2331 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence218 VERSION sequence218 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2331 /mol_type="genomic DNA" /organism="" /note="sequence218" CDS complement(1269..2015) /product="4-hydroxy-tetrahydrodipicolinate reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861884.1" /transl_table=11 /codon_start=1 /translation="MIRAVISGCCGKMGRVVADVIDAREDIKVIAGIDVAVKECGFTVY NKPMELPEVQDVIIDFSHPSALGDLLEYALTNGTALVLASTGYDKEQIAKIESASHSVP IFFTANMSLGINLLSELAKKATAVLGGQFDIEIVEKHHNQKIDAPSGTALMLANAINDV SDDKYNYVYDRHSVRKKRDGNEIGIHAVRGGTIVGEHEIIFAGRDEVITLSHAAYSKEV FAVGAVNAAVFMVGKDAGLYSMADLL" /locus_tag="LOCUS_7000" /gene="dapB" /EC_number="1.17.1.8" /note="WP_011861884.1 4-hydroxy-tetrahydrodipicolinate reductase (Clostridioides difficile) [pid:46.8%, q_cov:100.0%, s_cov:99.6%, Eval:2.0e-59]" /note="MGA_952" CDS complement(2065..2331) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLSNILPFETHEICRLCLEDNFTEARRLALKYLDVANKLFIDVNP VPVKEAMNLMGMGVGPCRLPLYEMREQDKVALRASLERVELVK" /locus_tag="LOCUS_7010" /note="WP_011391089.1 4-hydroxy-tetrahydrodipicolinate synthase (Rhodospirillum rubrum) [pid:48.1%, q_cov:92.0%, s_cov:27.7%, Eval:2.8e-16, partial hit]" /note="MGA_953" ORIGIN 1 gagggtatgt cctatggtat gatgatgtgt gtccagcttg ataaaaaaga cgaatttgac 61 cgcatttgga agtggtcaat gaccaatatg tatatgaccg agggcagaca cgcaggctac 121 tttgcttggt cctgtgcgcc cagcggcaaa aagaatgccg acggccctgc acccgacggc 181 gaagagttct atgcaatggc gctcttcttt gcatctcacc gttggggcga cggcgaaggc 241 atctacaact attcccggtg ggcaaaaact atcctgcgtg actgtttgca tcgcaacggc 301 gaaggcgata agcccggcgc aacaatgtgg gatttggaca acaagctaat caagtttgtg 361 cccgattgcc ggtttagtga cccctcatat catctgcctc atttttatga gcttttcgct 421 ctttgggcag atgagcgcga ccgcgctttt tggaaagatg ccgcagatgc atcccgcaaa 481 tatttgcata cagcatgcca ccccgaaacg ggtctttgct ccgattatgc tcattatgac 541 ggctcacccg ttgtgggcgt tccttggggc agacccaacc agagaagaat cgaccgcttc 601 tattccgact catatcgcac cgccgcaaac ttgggccttg actccgaatg gtataatgtt 661 gatacttggg ctgctgaaaa cgttgcacgc ttgcagaaat tctttgccca aaaccccaag 721 gcgatggaat atgctccccg aatcgacggc gaattcaccg aggaagaggt tatgcaccca 781 actgcgataa tcgcaaccct cgctcaaggc tcaattgcag ttcttaacag cgaaaatgca 841 accgacgagg aaaaatcaag agctatcgac tgcatcaaaa agtttatgga tacccccata 901 cgccaaggca aacgcagata ttacgacaac tgtctatatc tgttcgcgct tctggcgctg 961 tcgggaaatt acagaatcta ctgatagtta aaagcagacg gtttcccgtc tgctttttgt 1021 atgctaagct cttaccgctc gccacggcgg tggcatagcg cctacgtcgg cgcacgccac 1081 gccacggctc gctccctcgg cggcaaccaa gccatttgct cagcaccaaa agtggcgggt 1141 cccctccgtc acgcaccaat ttcagtttcg cattcgctca actaaaaatg gcgcacgacg 1201 gcctccgccc cgcctcccat gcacaaaaaa cagcccccta tttgtcgcca aataaggggc 1261 tttgtttatc ataataaatc cgccatactg taaagccctg cgtctttacc aaccatgaat 1321 accgccgcat tgaccgcacc caccgcaaac acctctttcg agtatgccgc gtgtgaaagg 1381 gtaatgactt cgtcacgtcc cgcgaagata atttcgtgct cgccaacgat tgttccgccg 1441 cgaactgcgt gaataccgat ctcatttccg tcgcgctttt tccttacact gtggcgatcg 1501 taaacatagt tatacttgtc gtccgacacg tcgttgatgg catttgccag catcagcgca 1561 gtgccgctgg gggcgtcgat cttctggttg tgatgctttt caacaatttc aatatcaaac 1621 tgtccgccca aaaccgctgt agcttttttt gcaagctcgc tcaaaaggtt aatgcccagc 1681 gacatattcg ccgtgaagaa aatcggtacg ctgtgggatg ccgactcgat ctttgcaatc 1741 tgttccttgt catatcccgt cgatgccagc accaaagcgg tgccgtttgt caaggcatat 1801 tccaaaaggt cgcccaaagc cgatggatga gagaagtcga tgatgacatc ctgcacttcc 1861 ggcagctcca ttggcttgtt atatactgta aagccacatt cctttacggc aacatcaatt 1921 cccgcaataa ctttaatatc ctcgcgggcg tcaatgacat cggcaacaac tctgcccatt 1981 ttgccgcagc aaccgctaat tacagctcga atcatgattt atcattcctt attgtgtgta 2041 atttattgca tatgtaaagt tagctcactt tacaagctca acgcgctcaa gcgatgctct 2101 gagtgcaact ttatcctgct cacgcatctc ataaagcggc aatctgcaag gtccaacgcc 2161 catacccatc aggttcatag cttccttaac gggaacaggg ttgacatcaa tgaagagctt 2221 attcgcaaca tcaagatatt taagagctaa acgccttgcc tcggtgaaat tatcctccag 2281 gcagagtctg cagatctcgt gggtttcaaa aggcaatatg tttgaaagca c // LOCUS sequence219 2327 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence219 VERSION sequence219 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2327 /mol_type="genomic DNA" /organism="" /note="sequence219" ORIGIN 1 gacgagccaa acgcaatcgt taagggacaa ggcgcaatcc aagctccttg ggcaggtgta 61 tatgacatca cagttgacct caacgcgatg actatcactc tcactactga aactcctgac 121 cccaatgctt cgtcaagccc gatgctcacg accgagtgga ttcacacaga atatctaccc 181 ggtgcacctg ccggcgggga tctccgtttt ggcgctgcag tggatggaaa attgatagta 241 accgacaagc ttgcaaaaat catctatgca tgggacgaaa acggacaatc aacgttctat 301 gaccttaatt cggtggttga atcggccgga acagcaataa cagcagatga cgcaggcaac 361 gtgattgtaa acacagcgtt ccccaatgct gcatcttcaa ccgactgggt aatcatacct 421 gccgatggct cagctccggt gcctgtagaa cttgaccttg gcgaagttgc tgctgcgcgt 481 tgcgaccaga ttggccgagt agtaggaaac gtgttgggcg aagaaggcgg ttacatgtgg 541 attccgacca acggcagctc acaaatcgct attgttaaga tcgtaaatgg tgttcaagac 601 atggattaca gccaggctgc aacagacggc ggtgttgcga taaatacatc agttgtagca 661 caacctctgt acaccacagt tgccgaaata gataatctta tggacgaaaa cggtgatttg 721 acaccctcat tctatttgcg cagccgctca aatccgcaat atgtgtatat gtggaatgcc 781 gatgcgacag aaatggaagc ccttgtattt gacgcagtag ccgagtcagg cgcacaggcc 841 aagaacgctt cacaagaagg tttcgaaaca ttcaaattgc aaggcacaca atattttgtt 901 ctcccgttga gttcagacgg aacgacaaac ggccgtggca cacactttgg cgtatttgac 961 caagacaaga accttgtagc cgaatacaac gaatacagca agaccgcttt gggacaagca 1021 ttcggcagct tctttgtagt tcccaatgac gattattcgg tatatatcta ccgttggatc 1081 gccggcaacg tagcagctaa atacaaattt actcttcctg ctcctcaagc acccgaaaaa 1141 gtaaatatgt atatcttcgg ttcgttcaac aactgggatc ccgcgacttc agttgaaatg 1201 actatggctt cagaaggtgt ttacacaatt gaagaccttg aactcacagg cgaccacaac 1261 ttcggtctct caacagtgca atcagccaac tgggacgaag ttaacgccag ccgttacgga 1321 tttgaagttg acaatacagt agcagttctt gacgagccaa acgcaatcgt taagggacaa 1381 ggcgcaatcc aagctccttg ggcaggtgta tatgacatca cagttgacct caacgcgatg 1441 actatcactc tcactactga aactcctgat cctaatgtca aacctgcttc tactctttat 1501 atccttggta atgtaaacgg cggtctttgg aatcctgcca atgcagttgc catgacttct 1561 tcagaagagg gtaaatttga agttcaggta acagtggacg ctaatgacag cggcagaggt 1621 acattcatct tcactgaaaa tgccggttct tgggacgaaa tcaacaaggg cgtgcgctac 1681 ggttcagaat atgacggttg tctccttgct acagacgcag caatcgaact tattaagggt 1741 tcagaagcat cttgggcaat cgctgcaggc gaatacaagt ttgttgttga tgtagtagct 1801 tgtacagtaa cagcaaccaa gatctctggt atcggtgaaa tcgaggctga atcggctgct 1861 cctgtttact acaacctcca aggtatcgaa gttgccaacc ccgaaaacgg taaagtatat 1921 atcgtgaaac gtggcaataa agttgctaag gaagtgaaat aatcctcatc gccataggcg 1981 acatgtatag aaggccgtca cccaaaaggt ggcggtcttt ttgttttgct ttgcttgaaa 2041 attgttgctt attagaattt atttaattac ttttgcgata ctgaaataaa gaaaatcaaa 2101 aactaaaaat cagattttat gaaattacgt aatctattaa ttgccggagc agtcgctgtg 2161 tcgagtattg catcggctca atctccgctc tatattttcg gctcgtttaa cgggtggaat 2221 ccagatgctt caacagaaat gagctacagc ggaggtgtgt acagtgttga taatatagaa 2281 tttggcgcag gtgggaattt tgctgtctcg actgtgaaat cgtcaaa // LOCUS sequence220 2316 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence220 VERSION sequence220 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2316 /mol_type="genomic DNA" /organism="" /note="sequence220" CDS 159..1046 /product="NAD(+)/NADH kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012546443.1" /transl_table=11 /codon_start=1 /translation="MTVFIYPNLNKDGALECTLNVCALLNELGVKIKMSSQLIDFIKLD YIEFITSNISISDCDIVISVGGDGTILKCARLCAENDKELLGINCGRLGFMATLEKEDI ALLSRLVSGDYSVEKRMVLDVIVKRSNGDTEVYNALNDAVVYHGILGKIYDFKVIADGT VVSLLRADGIIFSTPTGASAYSLSAGGPLIEPSLDCIEFTQICPHSLFARSMIFSPEKT LEVEYDAGSNTHVCLSIDGAEPIILDKSDKLYIKRSDMRVKLVDILGNSYFNAIGSKLM QPTKELRRSDKNEG" /locus_tag="LOCUS_7020" /note="WP_012546443.1 NAD(+)/NADH kinase (Thermodesulfovibrio) [pid:34.2%, q_cov:91.9%, s_cov:94.3%, Eval:5.1e-39]" /note="MGA_956" CDS 1036..1485 /product="arginine repressor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965374.1" /transl_table=11 /codon_start=1 /translation="MKDNRKNAILEIVSQFEVDTQETLQALLLERGFSVTQATVSRDIK QLSLVKIMSENGGYKYSLPPKSGDNTTKSMFESLFSHSVNSLDRAMNTIVIKCHTGMAN AVCSQLDAADYGDIVGTLAGDDTIFVLMRTEQEAIDMLNELSKLL" /locus_tag="LOCUS_7030" /note="WP_010965374.1 arginine repressor (Clostridium) [pid:38.9%, q_cov:100.0%, s_cov:98.7%, Eval:1.4e-25]" /note="MGA_957" ORIGIN 1 accaaataag ctgattcctt caccaattaa gggcggggac ggcaatattg agtatttaat 61 tttgcttgta aagtctataa actttacaca caaatctttt gatataaaat caatagttga 121 tgaggcattt gcatcagcta agtgaaaaga gtgattttgt gacggtattt atctatccaa 181 atttgaataa agacggtgct ttagagtgca ctctaaatgt atgcgcgttg ctcaatgagt 241 taggcgttaa aatcaagatg tcttcgcaac ttattgattt cattaagctt gattacattg 301 agtttatcac ttcaaatatt agcatttccg attgcgatat cgtgatctct gttggaggcg 361 acggaacaat tttgaagtgt gcacgtcttt gcgccgaaaa cgacaaagag cttttgggca 421 tcaactgtgg gcgtcttggc tttatggcga cccttgaaaa agaggatatt gctttgcttt 481 cgcgccttgt gagcggcgat tacagtgttg aaaaacgtat ggttttggat gttattgtta 541 agcgctcaaa cggcgacaca gaagtttata atgcccttaa tgatgctgtt gtatatcacg 601 ggattttggg caaaatttat gactttaagg ttattgcgga cggaaccgtt gtgtcattgc 661 ttcgcgcaga cggcataatt ttctcgacgc ctacaggtgc ttcggcatat tcgctttctg 721 ccggtggacc gcttattgag ccttcccttg attgcattga atttacacag atttgccccc 781 attcgctctt tgcaagatca atgatcttct cgcccgaaaa gacgcttgaa gttgaatatg 841 atgcaggaag caacactcat gtttgtctta gtattgacgg tgcagagccg attattttgg 901 acaagtctga taagctatac ataaaacgct cggatatgag agttaagctt gttgacattt 961 tgggcaacag ctactttaat gctatcggct caaagcttat gcagccgaca aaggaactca 1021 gaaggagtga caaaaatgaa ggataacaga aaaaatgcta tcttggagat cgttagtcaa 1081 tttgaagtcg acactcaaga aaccttgcag gcactgcttt tggaacgtgg cttttcggtt 1141 actcaggcga ctgtttctcg cgatattaag cagctctcat tggttaaaat tatgagcgaa 1201 aatggcggat ataaatattc tttgcctccg aaatctggcg ataatacaac caaatcgatg 1261 tttgaaagtc tgttcagtca ttctgtcaat tctcttgaca gggcaatgaa cacaatcgtc 1321 ataaaatgcc ataccggtat ggcaaacgct gtatgttcgc agcttgatgc tgctgattac 1381 ggcgacatcg tcggtacgct cgcaggtgat gacacaatat ttgttttaat gagaaccgag 1441 caggaagcaa ttgatatgct taacgagctt tcaaagcttc tttaatccac ttaagtaaga 1501 agggataacg tatgctaaaa gagcttcata ttgaaaatct cgctgtaatt gaaaatgcaa 1561 ctgtttcttt aggggagctt tttaatgttt ttaccggaga aacaggcgca ggtaagtcaa 1621 tactcatcgg cggaattaac gctgtgttag gccaaagaac aactaaagac atcgtgcgca 1681 caggcaaaga caaagcatat gtcagcgcag tattttgcga tatccccaag tctgttaagg 1741 aaaaatccgc ggagcttggc tttgaaattg aagacgagct gattatttcc agggaaatat 1801 cccgtgatgg cagaagcaca gctcgaatta attcacgtcc tgttaatgta tctgtgatta 1861 aagagctggg cgacctgctg ataaatatcc acggtcagca cgacaatcag gtgcttttgg 1921 atcccgatac gcatttgggc atacttgata gttatgctga actgtcagat gtaattgacg 1981 actacagagt atcgttcaag gagcttcagt cggttgcaag acatattcaa aaggtcaaac 2041 aaagcgaaca gcaaagagtt caaagagaag cttatcttaa ttccgttgtg agtgatatcg 2101 gttcacttga tattcaagaa ggcgaggatg aagcggttga agaacgcttc agatttgcag 2161 ataatgctgt aactctgtct gatgctttgc gtacagcctt gggtctgttg tcgggcgatg 2221 acgaaatatc aggtgccggt gatatgatat cacgggcata ctctgaactt gcgatatatg 2281 atgacattat aatacatttc ctaccaaaaa aacaac // LOCUS sequence221 2312 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence221 VERSION sequence221 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2312 /mol_type="genomic DNA" /organism="" /note="sequence221" CDS complement(919..1974) /product="glycoside hydrolase family 5 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964144.1" /transl_table=11 /codon_start=1 /translation="MTDTKYTPASLIADMKIGWNLGNTLDAPNGETTWHNPVTTKEMID KIKELGFNTVRVPVSWHNHVGGHPVYCIDTPWLDRVQQVVDYVIDNGMYCILNSHHDDR MFIPTYERLEYGKAYLTSLWSQLSERFKDYGQKLLFEAMNEPRELKTPYEWHLDFNVEH CHELADCINIYNQTFVNAVRSSEHQNNKERFLMVPSYDAAPLHAIPDAFVMPVDPSDRL VLSIHAYTPYNLCLNMNSDVDILTEETKKDIDWFMINIYKKFVSNNIPVVIGETNILNK NNPETRYEWCKYFFSLARQYGMMCCLWDTNGGPMKMLNRRTLTLYEDGEALLKGMFDGL KEDVKGVLELK" /locus_tag="LOCUS_7040" /note="WP_010964144.1 glycoside hydrolase family 5 protein (Clostridium) [pid:46.5%, q_cov:86.3%, s_cov:80.0%, Eval:3.5e-72]" /note="MGA_960" ORIGIN 1 tgatcataaa gtcgtcgata gatgattctt ccgactgacc aaacttgact ttatccattc 61 cgttgcccat taccaagtca tacggagtat aggcgtgaat tgaaagaata agtctgttct 121 caaccgagtc cttgggcata ctgaaatatt gattcaaagc atcataaggg cttgcggaat 181 agggcggaac agaaagatat ctgtcggtgt tgtttccgcc tgttgctctg acggtatcaa 241 caaatatctg attcagttcg tttaaaaccg ccgccgaatc acggcaggtc tgagaatttg 301 tgtcaaacca ccattcgttg ttggtgcctg caagtctggg ctcgttcatc gactcgaaaa 361 tcaggtgata gtcataatcc ttgaagcgtt cagccacctg ataccaaatg tccttaatat 421 actccccgga ggccttggcc ttctctttcg agggatagta ataatcgttg tcgtggtggg 481 agttgatgat tacatacatt ccgttgtcaa taccgtagtc aacaacctcc tgaacgcggt 541 cgagccacga cttgtcgata tttctgtttt tatcaacatg cttgccccaa gaaacgggca 601 cacggatggt gttaaagcca agctccttca gcttgtcgat catctccttt gtggtggtgg 661 gctgtcccca tgagttttcg ccgtcggggg catcaagggt gttgcccaag ttccaaccga 721 tgctcatttg tttgatcagc tcatcgggag cgggtgttgc gatgacctct tcggcaatcg 781 gagcttcggt ggttgtcaca ggcggctcgg aaacggttgt gtcctcggtc acaacagggt 841 catcgacagc tgtatctgca caagcgcaga gcatggttaa aagcattaaa acgctgagca 901 aaagtgcaat cagttttttc atttaagctc caaaactccc ttaacatctt ccttcaagcc 961 gtcaaacatt cctttcagga gtgcctcgcc atcttcatac aatgtaagcg tgcggcggtt 1021 aagcatcttc ataggtccgc cgtttgtatc ccacagacag cacatcattc catattgacg 1081 tgcaagcgag aagaaatatt tgcaccactc atatctggtt tctgggttgt ttttattcaa 1141 tatatttgtt tcgccgatta caacgggaat attgtttgaa acaaacttct tgtaaatgtt 1201 aatcataaac cagtcgatat cttttttggt ttcctcagtc agaatatcaa catccgagtt 1261 catattaagg caaagattat aaggggtgta tgcgtgaatg gacaaaacca atctgtccga 1321 cgggtcaacg ggcattacaa acgcatcggg tattgcgtgc aagggcgctg catcatatga 1381 gggcaccata aggaagcgct ctttgttgtt ttgatgttcg cttgatctta ccgcattaac 1441 aaatgtctga ttataaatat taatgcaatc agcaagctcg tggcaatgct ccacattaaa 1501 atcaaggtgc cattcatatg gcgttttaag ctctctcggc tcgttcatag cttcaaacag 1561 aagcttctga ccatagtcct taaagcgttc ggaaagctgt gaccaaaggg aggttaagta 1621 tgccttgcca tactcgagac gttcatatgt gggaataaac attctgtcat cgtggtggga 1681 gtttaaaatg caatacattc cgttgtcgat tacataatca acaacctgct gaactctatc 1741 cagccaagga gtatcaatgc aatatacagg gtgtccgccg acgtgattat gccatgaaac 1801 gggcacacga acggtgttga atcccagctc cttgatcttg tcgatcatct ctttggtggt 1861 gacgggatta tgccaggtgg tttcgccgtt gggggcatca agggtgttgc ccaaattcca 1921 gccgattttc atatctgcaa taaggctcgc aggggtatac ttcgtgtcag tcatatttat 1981 cctccaaaaa tctaaaaatg tacatttatt atcgtttctg tgtgctgatg ctaatgttta 2041 ctttaaaatt caataattat tcagccgttc cgttgaggcc gtccatgagt ccctgatata 2101 cctcttcgca ggagtcgtag atctttaagt ttgttctgtc aaacaagccg taggtctcct 2161 cgccgtaact gtcgtgtccg ttatcccacc aacagcagac cattccaagc tctttagcct 2221 tggaaacata gtatactgcc catttatatc tttcctgggg gttggccttg ttaatgcatc 2281 ccatttcggt tataacaacg ggtatgcccg ca // LOCUS sequence222 2298 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence222 VERSION sequence222 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2298 /mol_type="genomic DNA" /organism="" /note="sequence222" CDS complement(185..409) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKMIEEYRAVASALEKRSKELAEMIKNERDVFALHRLERRKYII DTERYEVLRDIRDMTEILMREEALYGEAV" /locus_tag="LOCUS_7050" /note="MGA_963" CDS 619..822 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDKKKIERINFLARKSKTVGLTELELLEQAKLRQEYRDAFKASLE VQLNNISIVEEDGSVTDLSKKN" /locus_tag="LOCUS_7060" /note="WP_002901318.1 DUF896 family protein (Streptococcus) [pid:54.2%, q_cov:88.1%, s_cov:69.4%, Eval:1.8e-10, partial hit]" /note="MGA_964" CDS 865..1866 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDLYQQSSQKQKLLILQKILMTETDENHPLSVNELIQKLKFYDIK AERKTIYDDIATLASVGMDIVVDKRGHSNVYYVGSRLFQDEELLVLADAVASSKFLTIK KSNELIKKLQSLTSKHNATNLRRSIYVGNRVKTFNESIYYSINSIHEAIHKDRNISFKY FEYDTDKKKRYRYDGKLYTVSPYYLIWENDCYYLVCGLIKHGTISSYRVDRMTDVSVTD VKRRQLSVDEDQLAKQLRATYSMFGGRTETVTLEMSSKLINVVIDRFGESVLLNLISDD TFTVRAEVQISPTFWGWLFQFGTQAKIVAPKSVADEAQIELKKILEMYQAAE" /locus_tag="LOCUS_7070" /note="MGA_965" ORIGIN 1 caactccttc gcaatatcca ccattgtttt gttttcaaag aagtattttt ccgcgtaaag 61 cctttgctta tccgtcaaaa cttctttaac tgcccgcttc aaaagctcgt ggggaattgc 121 aaggcgtctt attgctcccg acgtgccgat tgacttcagg ctttgcgcct cctcatgact 181 tatcctacac agcctcgcca tacaaagctt cctccctcat caaaatctcg gtcatatcgc 241 gaatatcccg caagacctca tatcgctcgg tatcaatgat gtattttctg cgctcaagcc 301 ggtgaagcgc aaatacatct ctttcgttct ttatcatctc ggcaagctcc ttcgagcgct 361 tttcaagcgc tgaggcaacc gccctatatt cttcaatcat ctttttcaat attttctcct 421 ttctccgcac attgtggtag ccgatatgcc ccaaaagaga acatatgttc caattccttg 481 cttttaatga taaccaattt tgcgcgaaag tcaaccaatt ttgcatatca gtctgttttt 541 ttggacacga ctattgaaat gcttgttgat aaatgttaaa atgatgctgt aaaatgtaat 601 taaaaccaag gagtttttat ggataagaag aaaatcgaaa gaatcaattt tttggcgaga 661 aaatcaaaga ccgtgggact gaccgagctt gaacttcttg agcaggcaaa gctcagacag 721 gaatatcgcg atgctttcaa agccagcctt gaagtccagc tcaacaacat ctcgatagtt 781 gaggaggacg gctccgttac cgacctttca aagaaaaact gattcgccta agcctatcat 841 caacagggga gagtgacata attaatggat ctatatcagc agtcaagcca aaagcaaaag 901 ctattgatat tacaaaaaat acttatgacc gaaacggatg agaaccaccc tttgtccgtc 961 aacgaactta ttcaaaagct gaagttttat gatattaaag cagaacgtaa gaccatttat 1021 gacgacattg caactcttgc atctgtcgga atggatatcg ttgtcgataa acgcggccac 1081 tcaaatgtat attatgtcgg ttcccgtttg ttccaggatg aagaacttct ggtccttgcc 1141 gatgccgttg caagctcaaa gttcctgacg ataaaaaaat ccaatgagct gatcaaaaag 1201 cttcagtcgc tcaccagcaa gcataatgca accaaccttc gccgcagcat ttatgtcggc 1261 aaccgagtta aaaccttcaa cgagtcgatc tattattcaa tcaactcgat tcacgaagct 1321 atacataaag accgcaacat cagctttaaa tattttgaat atgacaccga caagaaaaaa 1381 cgctatcgct atgacggcaa gctatatacc gtttcaccat attatttgat ttgggaaaac 1441 gattgttatt atctcgtttg cggacttatt aagcacggca ccatttccag ctatcgcgtt 1501 gaccgaatga ccgatgtttc cgtcaccgat gtcaaacgcc gtcagctgtc tgtggatgaa 1561 gaccagcttg caaaacagct tcgtgccaca tacagcatgt tcggcggaag aaccgaaacc 1621 gtcacccttg aaatgagttc aaagctgata aacgttgtaa ttgaccgctt cggtgaaagt 1681 gtcctcttaa acctcatttc tgatgacaca ttcaccgtcc gtgccgaggt gcaaatttcg 1741 cccaccttct ggggatggtt gttccaattc ggaactcagg caaagatcgt tgcaccgaag 1801 tctgttgcag atgaggctca aattgaactc aaaaagattt tagagatgta tcaagcagct 1861 gaatgaccgc tccgcgccac ctgctcggac ggcttcgcca cccttcgcag acggcgatcc 1921 gctcccttct tgctcgcaca acatcgcgag cccccgtcac actctacaca cccaaacgcc 1981 cttaaaaagg aggtcatatt atgccaaaac tatccaaccc caacgccgac cgcaacgccc 2041 agattcttta tgactacatc tgcaaagttc agggcaacta tgttctgacc ggccagcagg 2101 aatttcccga caaccgacgc gccgaatttg aaatgcgcta tcttcgcgag gtaaccggca 2161 agctccccgc tatccgcgga cttgactata tgggcggcga atttgaaaat gtcaaccgcc 2221 gttcccttga gtggcataaa aacggcggaa tcgtgtcaat ttgctggcat accggcatca 2281 acggttatgc ttacagag // LOCUS sequence223 2292 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence223 VERSION sequence223 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2292 /mol_type="genomic DNA" /organism="" /note="sequence223" misc_feature complement(1153..>2292) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011227893.1:ABC transporter substrate-binding protein" /note="WP_011227893.1 ABC transporter substrate-binding protein (Thermus thermophilus) [pid:25.2%, q_cov:78.9%, s_cov:63.1%, Eval:1.9e-15, partial hit]" /note="MGA_968" /locus_tag="LOCUS_7080" ORIGIN 1 aggagctgtc ctcattgaga gttgtatata cgcttataac cgtaaggtcg cgcatctcga 61 tggatgaacc cattgcaaga gcagcgtaat cgaactcaag aagctcttca tcggtttcaa 121 tactaacctt tccgtttgca aatgtttcgg catcggtcaa aagatatgca ggggcgttgc 181 cctcgcttat cttttgaata ttacccgggt catcaggctt catcattcgg tatgtaagtc 241 ccgaaacctg ataggttccg cctgcttcat aatactgaac ggtgccgacg atgcgggctt 301 cgtttccgat tgaaaggata tcaagtccct cgcccgaaag gccgtagcca tagtatacgg 361 acataccgta atacatattt gtttcggggt cataggattc aacgtatacg cttgagccgt 421 cattaacggt gattacacca ttaaatgcga ccttgatacc gttatagtcg gaaatgttac 481 agcgcagttc ctttaaggtc agctcaaccg cttcgccata atagaagtcg gggtcgggct 541 tgccggaata tacgccgagc tttaattcct ttgcctggtt tatcgcggac atacaggttg 601 aaccgtagcg gttctgtgcc gatgaatttg cgattgcaag gccgttttgc aagatctcga 661 tattcagatt tctgtattct tccatatcgg ctgtcttata ccatacccag acaaggtatc 721 tgcctcccgt tgaatcgacg ttccagttgg agtcgtccga ttcaatgatg atagaggtgg 781 catttgacag tttttctttt gtgaagttgg ccgcggcttt gccgtattct tcaatttttc 841 ccgtcgactc gggggtgttg atggcgagat atcttgcctt taacacaccc gtgtcgatta 901 cagatgaagg aacattgaag tgggtggtgt cgccgtcaat gaatgttttg acggtgacct 961 cctgtttgac agtgtcggat gccatattga gctttatttg agaagcccag tcggtttcgg 1021 tgaagcttgc gccgtctgta gcgacatcgc cgatagcatt atctgctccg cagccgacaa 1081 aagccgttaa ggcaacacac aaaagagtga gtaatgaaag tattcttaag aattgtttca 1141 ttagttttta aattatcctg cgtattcgca ttctgcaaca gcgtcttcga atgccttgag 1201 gatcatagca tcaacgtcgc cgccgtcgtc agcagtcaag cacttggaaa ggagggtgcc 1261 gacctggtca cgagctgcag aagagccgtt gaatgcagga gaggtgtagt atgcggattc 1321 ctgttcaaga cataccttag cggagagagc ggaaatgtac ttgccgccgt cagcatttgc 1381 aaggaatgca gaataagtct cgttttcagc aacggacttg agaacgggaa cgtaaccgga 1441 agccatggag aattcagcct ggaattcaac actggtggtg aggaacttaa cgaagagcca 1501 agaagctaca acttcctgag gattggactt ctggaagatg caaacgctgg gaccctggga 1561 gataaccttc ttgttatcag cgcttacctg aggaatgggg caaatgccaa cttcgaaggg 1621 ataagtgccg tcagcattag cagcaggtct ctggtaggta gcacctgcgg aggagccgat 1681 agacatatag ctcttggtgc cttcaagggt ggtgaacaaa ccggaggtgt atgcaccgta 1741 gagggtctga gtggtcaaat aacccttctg gtaccattct ctgaacttct tgatgaagtt 1801 acggttggtt tcgttgttga agaggtagtg gtcgcctgta gcggaggtgt aatcggaatc 1861 atactgctca gtcatattga tgaaccagtt ggattcggag tcgtagccga gaggaatgga 1921 atcggggtcg atttccttga tcttctggca aactgctccg agctcgtccc aagtggtggg 1981 aacggtgaga ccgttagcgt cgaagaaggt cttgttgtag taaagaactc cggtggactt 2041 ggagaagggc atggtgtaca tcataccgtc gccgaactga gcgccttcag cgtagtaacc 2101 tgcgatgaag tcgttcttct gctcatcagt aagacccaat acttcggtgg tgccgtctgc 2161 tcttgtaacg gtgatgtcgg actcgatcaa gctatcgagg gtgacaacag ccttagcaag 2221 gttgtaaaga gcagcgtggt cgggatagca gtaagcgatg ttgggctggt tgccaacggt 2281 gatctcggtg ga // LOCUS sequence224 2288 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence224 VERSION sequence224 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2288 /mol_type="genomic DNA" /organism="" /note="sequence224" CDS 1550..1690 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEPTTVFDIVMGLLDNKRYQELKIIMEQMNPADIALILDEAEEKA R" /locus_tag="LOCUS_7090" /note="MGA_970" ORIGIN 1 gatggtgacg ggatacattc tcttatagtc gtgaacacgg actgcatcgc ggagcatttt 61 ggtaacttca acgccgcggg gacctgcatg ggtatcataa atttcgttgc cgatactcca 121 cattatcata ctggggtggt tgcggtcacg tcttacccag cttgcaacgt cacgctcatg 181 ccattcgggg aagaaacgtg catagtcata atcggtcttt ttgaattccc acatatcaaa 241 cgcttcggaa tttattataa ttcccatttc gtctgcaagc tccatcagct caaccgaggg 301 agggttgtgg gatgttctga tcgagttgac acccatttcc ttgagacttt caaactggcg 361 gcgcaaagcc gttttgttta cagcagagcc taaagcgccc aaatcgtggt gcatacatac 421 gccgaaaatt ttaatattct taccgttaag gaagaaacct tcgttttcat cccaacgggt 481 ggtcttgaag ccaacatttt caacgcgctc atcaacggtt tcgccatcga cgataagctc 541 ggtggtgaga atatagcaat aagggttgtc aacatcccaa agcttaggat tttcaacatc 601 aagggtctgg gatacaacgg tgacgtcgct tgaaagcgca acattgcaag aagcctcagc 661 cttaattttt ccgcactgtg caacaagagt gtgcttaaca cttgcgttgg cgttaccctt 721 gacctctgtg tcaatttcaa ggcgccattt gccatcctcc aaaatcggaa caacgtaggt 781 gccgtcgggg atgatttcgt tttcaccctt gatggtgagc cagatgtttc ggaaaattcc 841 ggcgcccgaa taccaacggg tgttggggga tttatggtga actacgacgc gaatttcgtt 901 gtccccttct ttaaggttgg tcaaaggaac atcgaaggtg gtgtagccgt atttccattc 961 atatatcttt tcgccgttga ggaagatctc cgagtccata tatacaccct cgaagcgaag 1021 ggtataatat ttgccggaaa tgtcatgcgc ggtgaagttt ttcttatagc atccgtcgcc 1081 gtcagcatag aggcgatgtg tgtcgtgcac caaccagtca tgggggatgt caacagggcg 1141 atagtcgcag gcgttgggag tttcaccgat gttttttagt gcgaagctcc agccgccgtt 1201 aaatagagtt cttgtcattt agttacctcc ttgtgtgaaa gcagtatata aattattata 1261 atggaacatg aggcacattt caattgaata aattgacttt ttcaagaaat tttatatatg 1321 aatattatta catttttctt gacgattgcg tattgtggga gtataataaa atcaacgacg 1381 atgtcggaat aagataatga atcaggagtg agatttgtgt aagctaatat accgcgaggg 1441 tgcaaaatag tttggcttat tagggttcac aggtgtgtgc tccgataaga ttaatatttt 1501 tgtgccccca tgatctttga agttcaaaag aaagtgaggg gttttaattt tggaaccgac 1561 aaccgttttt gacattgtga tggggctttt ggataacaag cgttatcaag agctgaagat 1621 cataatggaa cagatgaatc ctgcagatat tgcattgata cttgacgaag ctgaggaaaa 1681 agcgcgctga cacttttcag gcttttgcca aaagagctgg catcggaaac ctttgcatat 1741 atcgaaacag aacagcagga gcaattaatc agcgcatttt ccgacaggga gcttcgggca 1801 gttgttaacg agcttttctt ggatgatacc gttgacttga tcgaagagat gcctgcaagc 1861 gttgtggcaa gaattcttaa aaataccgac tcggaaacaa gaaagcagat caacgagctt 1921 ttggcatatc ccgacgacag cgccggaagc ctgatgacac ttgagtatgt atatttcaat 1981 caggatacca ccgtcagcga agcatttgag cgaatcagac aggtcggcgt tgcaaaggaa 2041 acgatctata cctgctatgt caccgaaaga cggcgacttg tgggcgttgt ttctcttttg 2101 gatatgctca cggcagaaac cgacacatcc ataagagaga ttatggaccc gaatgtaatc 2161 agcgttacga ctcttgagga taaggagcac gttgctgcag catttgcaaa atatgacctt 2221 ttggcgttgc ctgttgttga tacggacaac cgccttgtgg gtattgtcac cgttgacgac 2281 gctatcga // LOCUS sequence225 2288 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence225 VERSION sequence225 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2288 /mol_type="genomic DNA" /organism="" /note="sequence225" CDS 55..762 /product="response regulator transcription factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003359320.1" /transl_table=11 /codon_start=1 /translation="MPQGKVLIIDPDKNICELLRIYLEREGYSVITSGDGEEGLLKFSA LKPDIVVLEVVLPGVDGWQICREIRKKSNIPLIYITAKSEVFDKVLGLELGADDYVTKP FDSKELVARIKAVCRRTNLAKEDNAVKEVHFDGLDLNMTRYELRIKGKLVDAPPKELEL LYHLASHPNIVFNRDQLLDEVWGFEYYGGSRTIDVHIKRLRQKLDGVSPKWILRTVWSV GYKFEVNDGETQA" /locus_tag="LOCUS_7100" /note="WP_003359320.1 response regulator transcription factor (Clostridium botulinum) [pid:53.5%, q_cov:95.7%, s_cov:97.4%, Eval:9.2e-64]" /note="MGA_972" CDS 784..1590 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRDFFDEDFPLSAKQEEEYKKRQEELEAEKAKAEETPDAFDDDYE QAYSEPIDEAFTISPEVEFAEDDEPYEMYYAGMSETEEIFETLTQDEPEAAEEVQPEEP EAVEEIVEQDPIDSAPIFSLELDEPLDDGFLPDAPIIISEEEPECEEIPEEEDDLSAEL RSLTEKLDSMERAVNAMNAPAGETDDDDEPANFSYEYDERYFAEEETTAYKHPELVKKP AVKPAAKAKKASSGDMTINLKTLAKVGAVVAGAVVAAKLLSDDKKK" /locus_tag="LOCUS_7110" /note="MGA_973" ORIGIN 1 gattttataa tataataatg atgtattact atctttatga taaggagtga tttgatgcct 61 cagggaaaag ttttaataat cgaccccgac aagaacatct gtgagctttt gcgaatctac 121 cttgagcgcg agggttacag tgttatcacc tcgggcgatg gcgaagaggg gcttctcaag 181 ttttccgccc tcaagccgga tatcgttgtg cttgaagttg tgcttcccgg agtggacggc 241 tggcagatat gccgagagat aaggaaaaaa tcaaacattc ctctcatata tataactgcc 301 aagtcggaag tattcgataa agttttggga cttgagcttg gcgccgacga ttacgtcacc 361 aagccatttg acagcaagga gcttgttgct cgaatcaagg cggtctgccg aagaacaaat 421 ctggcgaaag aggacaatgc cgttaaggaa gttcactttg acgggctcga cctgaatatg 481 accagatatg agcttagaat caagggtaag ctcgttgatg ctcccccgaa ggaattggag 541 cttttatatc accttgcatc acatcccaac attgttttca accgagatca gcttttggac 601 gaagtctggg gctttgaata ctacggcggc tcgagaacca ttgatgtaca tattaaacgt 661 ctgcgccaaa agcttgacgg agtctccccg aaatggatac tccgcacagt ctggagcgta 721 ggatataagt ttgaagttaa cgacggcgaa acgcaagcat aataccgaga aaggaacacc 781 gttatgagag atttttttga tgaagatttc cctttgagcg caaagcagga ggaagaatat 841 aaaaagcgac aggaagagct tgaagccgaa aaggcgaaag cagaggaaac tcccgacgct 901 tttgacgacg attatgaaca ggcttattcc gagccgatag atgaagcatt taccatatct 961 cccgaggttg aatttgccga ggatgacgag ccttatgaaa tgtattatgc aggcatgagc 1021 gaaacggaag aaattttcga aacgctcaca caggatgaac cggaagctgc cgaagaagtt 1081 cagcccgaag agcctgaggc tgttgaagaa attgtcgagc aggaccctat cgactcagcg 1141 cccatattct ctcttgaatt ggatgagccg ctggacgacg gtttcctgcc cgatgctccc 1201 ataatcattt ccgaggagga acccgaatgt gaggagattc ccgaagaaga ggacgatttg 1261 agcgcagagc ttcgctcgct gaccgaaaag ctggacagca tggagcgcgc agttaatgca 1321 atgaatgccc ccgcaggcga aactgacgat gacgacgaac ctgcaaactt ctcatatgaa 1381 tatgacgaga gatatttcgc cgaggaagaa acaactgcat ataagcaccc cgagctggtt 1441 aagaagcctg ccgttaagcc tgcggcaaag gcaaagaaag cctcgtcggg cgatatgacc 1501 atcaacctca aaacccttgc aaaggtcggt gcggtcgttg caggcgcagt tgttgcggca 1561 aagctcttgt ccgacgataa gaagaagtaa tattacgtat acctttattt agaaagcgaa 1621 ttttttatgg aaaaccttga aaagaattta ctcgaaaacg actccaatat tgcaaccgaa 1681 gcaacctccg agcagaacat aatccctgca gaagaaaccg acgcattgga agaagcggtg 1741 gttgctgaaa cagaagcacc catggagaat atcacagaag aattacccgc agaggaaatt 1801 gctccagaag cagagttgat tgctgaaccc gaatcggcag tttccgcaat tgaggagctt 1861 cgtgcgctgg ccgccgcaga ggcagagcag tgggactata tgccaaagcc tgttggaaag 1921 ctgaaaagac gtcagcaccc atattggcgc gcatttttca cccttctgat aatctttatt 1981 atactgttct ttgttgcggc tgaaagcgtt ttcggcaagg gctggataat caaccgcttg 2041 ggcgaacacg gtgacaacaa aatagacttc acgcttccca ttgccgagct tcccaagctt 2101 gaaacggaat actatcaggc aagcggaaaa tataccaccg agggcgttgc aaaggctgtt 2161 ttgccttcaa ttgtaaccat tgaagccttt gttgagggtt ctccccttgc cgcatattct 2221 cagggctcgg gcgtaataat gtcgagcgac ggatatatca tcaccaatgc ccacgttatt 2281 gaggaagc // LOCUS sequence226 2286 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence226 VERSION sequence226 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2286 /mol_type="genomic DNA" /organism="" /note="sequence226" misc_feature <1..1583 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012583939.1:YIP1 family protein" /note="WP_012583939.1 YIP1 family protein (Dictyoglomus turgidum) [pid:32.0%, q_cov:93.0%, s_cov:65.2%, Eval:1.2e-61, partial hit]" /note="frameshifted, insertion/deletion at around 1617" /note="MGA_975" /locus_tag="LOCUS_7120" CDS 1583..2218 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIYDMTPLQWLSHVIFHPFEGYEDMRWKKAGSLKISFVIVFFLFL AQMISARYGGFAFNMRAYSDIFNVVPILVQSVAYYATWVVANWSLCTLLDGEGNMRRIA IYTAYALVPFIVCSFISTGISYFLTLDESIWTTTISTLGLAWSGVMLVFGMKACHQYSF TKTIISMILTVVGMLLILCLLVLVMSLFQQVWLFILTIYTEILYRVRS" /locus_tag="LOCUS_7130" /note="WP_012583939.1 YIP1 family protein (Dictyoglomus turgidum) [pid:27.4%, q_cov:93.4%, s_cov:28.4%, Eval:4.0e-20, partial hit]" /note="MGA_976" ORIGIN 1 ctgaggaccc gtatacatcc tatagctaca acgcatggag tgttgcactg ccttctcaga 61 acggttacat tgttaaagac acaataaccg gtgctgacat gggccttgac cagctctccg 121 accccaacag cccgttgttt atcagcgagg acgaacccgc aactcttaca gatgccaagg 181 atttcttcct ctcgcccaac aatgaattct ttattgttga cacgggtaac aacagaattt 241 taagaactga cattaacttt aaccttattg cctgctataa gaactttaca ggcggtaagg 301 tagtagaaga aattaaggac gcagaaggca atgtaattga gtctattcct gcaacaaccc 361 ttaagagccc ctacggcatc tttgttgatg aagacgacat tatgtacatt gctgacagag 421 ataatcagcg tattatcaag tgcggattcg actgtgagat cattactgag tatgtaagac 481 ccgaaacaga gctttatgac tcggtatcct tctactgcac aaaggttttg gttgacgcag 541 ctaagaacgt ttatgttatc tgccctgcgg tcaacaaggg tgctatcatg ttcgcaccca 601 gcggctcatt catgggttat tacggtgcaa accgtgttga agttactgct gaagtaatca 661 gaaacaagct ttggagaaag ttcgcctctg aagaacagat cgcaggtatg atcaacatta 721 cccctgttga atatgcaaac ttcgacgttg accatgaagg ctttatttac acagtaaccg 781 aagttgccga tgtttcgacc gacgcagtta aaaagcttaa ccctgccggc tataacattt 841 tggaaaccac cacaaatgct gctgatattt cattcggtga ccagcagtcc atcacttatt 901 cgggcgcaac aaccgcaacc cgtttgactg acgttgctgt cggcgaaaac ggcatcatca 961 acattttgga ctatacaaca ggacgtgtgt tccaatatga taaggaatgt agcttgctgt 1021 tcatcttcgg atgtgaccag gaagcacaga acggcggttt tgacaaccct aatgctgttg 1081 aatgttatgg cgagaatatc tacgttctcg acggcagaaa caacgacgta acagtttatg 1141 aagaaacgct cttcggcgga ttggttcatg aagctgttga tatgtttaac gaaggcttgt 1201 acgaggattc gttagatctt tggcgcgaag ttcttaagcg cgacggtaac tacaacatgg 1261 catatcttgc tatcggcaga gcacttttaa accaggataa ctatgacgag gctatgaagt 1321 acttcaagct tgcttacaat gccgaagact atgacagagc gttcgaggct gaacgtcagg 1381 acctcttgag agataacttt acacttatcg ttattgttct cgttcttttg gtaattgctt 1441 ggtttgttgt taagcagctt cagaagcgcg gcattatccc taacaatctc attaaaagag 1501 gcattaagtg ggttgctgac aaaattgttg atttggttaa aaaaattatt agcaatatta 1561 ataagaaggg aggaagcaaa taatgattta tgatatgacg cctttacagt ggctttccca 1621 cgttattttc caccccttcg agggatatga agacatgaga tggaagaaag ccggttcgtt 1681 gaagatctca tttgttattg tgttcttcct cttcctggct cagatgatct cggcaagata 1741 cggtggcttc gcatttaaca tgagagctta ctccgatatc ttcaacgtag ttccgatttt 1801 ggtacagagc gttgcttact atgcaacatg ggtagtagca aactggtcgt tatgtaccct 1861 tttggacggc gaaggaaaca tgcgcagaat tgcaatttac acagcatatg cacttgttcc 1921 tttcatcgtt tgcagcttca tttcaaccgg tatctcttac ttcttaacac ttgacgaatc 1981 gatctggacg acaaccatca gcacgctcgg tttggcatgg agcggtgtta tgttggtatt 2041 cggcatgaag gcttgccacc agtattcatt cactaagaca attataagca tgattttaac 2101 agtagtaggt atgctcctca ttctctgctt gctcgttttg gtcatgtcac tcttccagca 2161 ggtatggctc tttattctta ccatctatac agagatcttg tatagagtaa gaagctaagc 2221 gagcagaaag tgagtataag atgatgaata gatttctcag attgatcgct tgcctgcttg 2281 tcatgg // LOCUS sequence227 2275 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence227 VERSION sequence227 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2275 /mol_type="genomic DNA" /organism="" /note="sequence227" CDS complement(1137..1856) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKILLFLLIVTTLIFSACADSNADKEVTDNIDSKVIDDTEVVDV QDDITSQDATLVCNKFIGPIIEIEEKDGKTYFVLYERESGEYFNFVVSQGELFDNSQLV DDFIYEDSVIVYSFSSQTTDNGDLYLAHIVIVEEPTRTFYAIVADVNPDTGRLILKGCD FNEVNSRGYYIVDVDEASIVRPYYMNLTAGDFKVGDLVMVRGRVSTLEVSPQSFDRFEE IELLVQGYDPDFVYDDF" /locus_tag="LOCUS_7140" /note="MGA_978" CDS complement(1990..2274) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFVGANSDKSYYKWSEEEFNVQAEKYAQLFEMFQDFADQGIIDMV VFWGTDDENSWLNSTPKLRRNAALIFDRPETNYAIKPAFWSIARTSFNH" /locus_tag="LOCUS_7150" /note="MGA_979" ORIGIN 1 caggaacgat ctggtcgtcg ttaccggaat atatgtcaag cttgcccttt gtcaggtgcg 61 caagctttgc aatttgtgag agatttccgc ttgcttcctt aatgccgaca atatttggat 121 gctccgccaa aactgccgca gtttcgggca ggatattgca acctgttctc gaaggaacat 181 tatataagat tatcggcttg gttgaggcat ccgcaatagc actgaagctc gcaattaagc 241 ccttctgagt agccttgtta tagtaaggag atacaaccaa catcgcatct gcaccggcct 301 cacatgcaaa ttttgtcagc tcaattgcat atgctgtgtc gttcgagcct gttcctgcaa 361 taacaggcac tctgccgtta accttgtcaa cagtaaactt aataatgtcc ttgtgctcct 421 tgtcggtaag ggtcgagcct tcacctgtag ttccggcaac aacaattgcg ctgataccgc 481 tctcgatctg ccattcaaca agtctttcat agctctcata gtcgatctca ccgttcttga 541 aaggggtgat gatcgcggtt gccgcacctg taaatacagt atttttcata atgccatgcc 601 tccgaatata taatttacaa atcgctgaaa atcaaaaaag cagcgctttt aaatgaactt 661 taaaagccac tgccgatgcc tggtagtttt aacgaaaatt ccgataaaac aaagggcaga 721 tagctctccg catttttgcg acagcgaagc gttcttggtc cgttccgcca gatcattcca 781 tcgccgaggg aatgtcttcg gcagctcttc ctttcggcgc cgtcccggca gacgttcaaa 841 tgcgcttact gataagatac tgcacctcta tctcaatgtc taatttatac cataatataa 901 ttgtgctgtc aaccggttga aaaataaatg taggattgaa caaaaaagcg agtcaagatg 961 ggtcattata gggcagaatt gcgcctgcgg cgcaattgcg aggagccaat ttcctcgcat 1021 acgactcgga aataagttcc tcgccattcg cgggtcccct ccatcaatcc cttcgggctt 1081 gacggcctgc gccccgccac aaaatacccc gcccttttta ggacggggtt atctgcttaa 1141 aaatcatcat acacaaaatc tgggtcatag ccctgaacca gaagctcgat ttcctcaaag 1201 cggtcaaacg actgtggaga aacctcaagc gtggacactc tgcctctgac cattaccagg 1261 tcgccgacct tgaaatcgcc tgcagtcaga ttcatatagt agggacggac gattgaagcc 1321 tcatcgacat caactatgta atacccgcga gaattaacct cattaaagtc acagccttta 1381 agaatgagcc tgcctgtgtc aggattaaca tctgcgacga ttgcataaaa ggttcttgtt 1441 ggttcttcaa ctattacgat atgcgcaaga tataaatcgc cgttatcggt tgtttgcgag 1501 gaaaaagaat aaacgatgac gctgtcctca tatatgaagt catcaactag ctgagaatta 1561 tcgaatagct ctccttgaga aaccacaaaa ttgaagtatt ctccgctttc acgttcatac 1621 aaaacgaaat atgtcttgcc gtctttttcc tcgatctcaa ttatgggacc tatgaattta 1681 ttgcatacca atgttgcatc ctgcgaagta atatcatctt gaacatcaac aacttcggta 1741 tcgtcaatca ctttactgtc gatattgtcg gtcacttctt tgtcggcatt gctatccgca 1801 cacgccgaaa agatgagcgt tgttacgatt aaaagaaata aaagaatttt cttcatatat 1861 ttgtcctcct atagtcatta taattcatta tacgaaaaca tgtggttatt gtcaatggag 1921 aagaatatat taatggttta tccacaaaaa atcccgccct ttaaaaggac gggatcttgc 1981 actatgtaat cagtggttaa agcttgttct tgcaatgctc cagaaagcag gcttgatcgc 2041 atagttggtt tcgggtctgt cgaaaatcaa agcagcgttt cttctgagct tgggtgtcga 2101 gttgagccag gagttttcgt cgtcagtgcc ccagaatact accatatcga tgataccctg 2161 gtcagcaaag tcctggaaca tctcaaagag ctgagcatac ttttcagcct gaacattaaa 2221 ttcctcttcg ctccacttgt agtaggactt gtcagagttt gcaccgacga acatg // LOCUS sequence228 2264 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence228 VERSION sequence228 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2264 /mol_type="genomic DNA" /organism="" /note="sequence228" CDS complement(597..1307) /product="pseudouridine synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048228.1" /transl_table=11 /codon_start=1 /translation="MEMIRLDKFISSQVPSLSRKDVKELVKKGRVTLDGKPVKAADVKF DAETACVAVDGKAVGYKKHLYIMLNKPSGVVCATRDGLSATVLELLPPELRRDGLFPAG RLDKDTEGFVLITSDGDLAHKMLAPKSHVDKEYFVRLESPLRNDAKDIIASGMTLSDGT KCMPAELEVVSSYECKIILHQGMFHQVKRMFESLDNKVIYLKRIRIGGVRLDESLKIGE VRELDENEKDRLLI" /locus_tag="LOCUS_7160" /note="WP_012048228.1 pseudouridine synthase (Clostridium botulinum) [pid:46.1%, q_cov:96.6%, s_cov:97.1%, Eval:3.3e-53]" /note="MGA_981" CDS complement(1334..1786) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFVKTVKIKSLLKILLILMAIAGVLLLAVTFVNRLTDRNKIILED IPAQIAFLESLGWETSGEPVDIREVIIPEEWNSVFEEYNDLQKQQGFDLDKYRGKQATI YTYQILNYDGAENVVANLMVFDGRLIAGDVCSAELGGFMQGLCKVN" /locus_tag="LOCUS_7170" /note="MGA_982" ORIGIN 1 ctacacgctg acgctgaccg ccggagagag ccttcggctt tctgtcgaga aggtgagaga 61 tgtcaaggat tcttgcagct tcttcaacct ttcttgcgat ctgatcctta ggagtctttc 121 tgagcttgag gccgaatgcc atgttctcaa aaacagtcat atgaggatac aaagcgtagt 181 tctggaatac cattgcgata tctctgtccg taggagcaat atcgttaacg attctgttgc 241 cgatgtaaag ttcgccgtca gtgatctctt caagacctgc gatcatacgc aaggttgtgg 301 acttaccgca accagaaggt ccaacgaaga taatgaattc cttgtcctta acttcaaggc 361 agaagtcaga aacagcaatt acaccgccgg gatatttctt ataaatgtgc ttgagtgata 421 agctagccat ttgtaggcct cccttttctt gccaaaatta tactaatcta cattagttac 481 aaaatatatt atacctgtga ggttgaaaat actcaagtga ttttttcaac aaactttccc 541 gcaagtgttt atctaaactg acggaaaagc catttaaatt gcacatttat cacttattat 601 ataagcagcc tgtccttctc gttttcgtca agctctctga cctcgccgat tttgagcgat 661 tcatccagcc gaactccgcc gatgcggatt cgttttaaat atatgacttt attatcaagt 721 gattcaaaca tccgcttgac ctgatggaac attccctgat gcaaaatgat tttacactcg 781 taagacgaaa cgacctcaag ctctgccggc atacattttg tgccgtccga aagagtcatg 841 cccgaggcaa ttatatcctt tgcatcgttt cgcaaagggc tttcaagcct tacgaaatac 901 tccttgtcca catgggattt tggcgcaagc attttgtgcg ccaaatcgcc gtcggaagtg 961 attaaaacaa atccctcagt gtccttgtca agtctgcctg ccgggaaaag cccgtcgcgg 1021 cgcaactcgg gcggcaaaag ctccaaaacg gtagcggaaa gaccgtcacg ggtggcgcag 1081 accacccccg acggtttgtt gagcataatg tataaatgct ttttatatcc gacagctttg 1141 ccatccaccg caacgcaggc agtttcagcg tcgaatttga catccgccgc cttaacaggc 1201 ttgccgtcaa gggtcactct gcccttcttc accagctctt taacatcctt gcgggaaaga 1261 gatggcactt gggaggatat gaacttgtcg agtcttatca tttccatttt ttcaatgtcc 1321 ttgtttataa gtcttagtta accttgcaaa ggccctgcat aaatccgccc agctcagcag 1381 agcaaacatc gcccgcaatc agcctgccgt caaaaaccat aaggtttgca acaacatttt 1441 cggcgccgtc ataattcaga atctgatatg tataaatagt cgcctgcttg ccgcggtatt 1501 tatccagatc aaagccctgc tgtttttgca gatcgttata ttcttcaaat accgaattcc 1561 actcctcggg aattatcacc tcgcggatat ccacaggctc gcccgaagtt tcccagccga 1621 ggctttcaag aaaagcgatc tgtgcgggaa tatcctcaag gataatcttg tttcggtcgg 1681 tcaggcggtt gacaaaagtt acagccaaca gcaaaacgcc ggcgatcgcc atgagtatga 1741 gcaaaatttt caaaagcgac tttattttaa cggtcttaac aaacatattt cttccccttt 1801 tcctttggtc ttggtgaagt atatgcttgt gcgaagggaa aaagtacagg gtgcagagca 1861 aacgaagcga ggcgtcggtc ggtctgcgcc gagtgaagcg aggctgtgac cgagcggtgc 1921 caagcggccg tcgaaaagag caattcaggt tacttttgtg tcggccgctt aaaattcggc 1981 ttttgcgaca atgtcgcaaa cttgcttgcg caagatcgcc gaattcccaa gttttgcatt 2041 agcctaacgc gcgacaagaa tccgctttgc ggattcttgt taaaattttg tgagcgtagc 2101 gaacaacatt tttgtcccca tccattgctc actatcgttc gcaatggcct cctccccgcc 2161 tcaatgcgcg aactgactgt tatacagctc gttatagaac ccgccctttg ccatcagctc 2221 ggtatgggtt ccctgttcaa taatgttgcc gtccttcatc acca // LOCUS sequence229 2244 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence229 VERSION sequence229 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2244 /mol_type="genomic DNA" /organism="" /note="sequence229" CDS 447..1796 /product="multifunctional CCA addition/repair protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011038505.1" /transl_table=11 /codon_start=1 /translation="MNCFEKDLSMAKAIAEKVAEFGGRVYFVGGYVRDRLMNIENKDID IEVHGVSPDVLESILDGLGKRMTMGQSFGIYGLKGYGLDVAMPRKEHAIGRGHRDFQVS VDPYIGTFKAAMRRDFTINALMQDVLSGEIIDHFSGLEDIKNGVIRHVSDESFAEDPLR VLRAAQFSARFNFEVAHETVLLCEAIDLGTLSKERVLGEMFKALSKADKPSHFFRALEK MNQLSHWFPELEALIGIKQDTIHHPEGDAYTHTLMVLDEAAKYRDKAGNLNGFMLSALC HDFGKSVSTEIIDGRIHSYMHEIKGLALIKTFLKRLTNESSLIQYVLNMCEHHMKPNIL AHDRSAVKSTNRMFDSVSHPRDLIYLSVCDRLGKNENDGYSEFLFERLEVYDQMMARPF VSGKDLIDSGLTPDETFSEILAYAHKLRLAGVDKPAALKQTLSYANKIKK" /locus_tag="LOCUS_7180" /EC_number="2.7.7.72; 3.1.3.-; 3.1.4.-" /note="WP_011038505.1 multifunctional CCA addition/repair protein (Xanthomonas campestris) [pid:32.4%, q_cov:92.7%, s_cov:99.8%, Eval:1.3e-40]" /note="MGA_984" ORIGIN 1 gagggcacag ggatggtctt gtcggaaacg atgtcggcaa aattgtcctc aaggtcaata 61 atgctctcgt aatatttaaa gccccaatcg ccgtttaaaa gctccattct ttgggattca 121 tagcggcagg caaagggatc ctgacctttt gcaaagggca taaaataggc gtggtcatta 181 agtgtgccga tgtgaatgct tttgggatct tcgtgataga tcatcttgct cttttgggag 241 tttggtgctg aaattgttga tatgttcatt aagttgtgcc tccaatctgt aagcggtcta 301 taatgtgatt atatccttta tatggaaggg gtgtcaatat ccaaaagtac tcaaatgttt 361 aacttttttg attatttgaa acgctcagtt tctgcttgaa gggttgtggt gtttgtgata 421 taatgaaaac aagcgaggtg aaacacatga actgttttga aaaagatctg agtatggcta 481 aagctattgc cgaaaaggtc gccgaatttg gcggaagggt atattttgtc ggcggatatg 541 ttcgtgacag actgatgaat attgaaaaca aggacataga cattgaggtt cacggtgttt 601 cgcccgatgt tcttgaaagc attcttgacg gattgggcaa acgtatgact atgggtcaga 661 gctttggaat ttatggactc aaaggctatg gccttgacgt tgctatgccg agaaaagaac 721 acgcgatcgg tcggggacac cgagattttc aagtgtctgt cgatccttat atcggcactt 781 ttaaggcggc gatgcgacgc gattttacaa taaatgcttt gatgcaggat gtgttgagcg 841 gcgagataat tgatcatttt tcggggcttg aggacattaa aaacggtgtg attcgtcacg 901 tcagtgatga gtccttcgcc gaagatcctt tgcgtgttct ccgcgcggcg cagttttccg 961 caaggtttaa ctttgaggtg gctcacgaaa cggttttgct ttgcgaagct attgatcttg 1021 gcacgctttc gaaagaaagg gtattaggcg aaatgttcaa agctctgagc aaagcggata 1081 agccttcgca ttttttccgc gccctcgaaa aaatgaatca gctttctcac tggtttcccg 1141 agcttgaagc tctaatcgga attaagcaag atacgatcca tcatccggag ggggatgcat 1201 atacccacac gctgatggtt ttggatgaag cggcaaaata ccgtgataaa gcgggaaatc 1261 tcaacggatt tatgctttcg gctctctgcc acgattttgg aaaatcagta tcaaccgaga 1321 ttatcgacgg tagaatacat tcatatatgc atgagatcaa aggtcttgcg ttaatcaaga 1381 catttctaaa acgtttgaca aacgaatctt ctctgataca atacgtttta aatatgtgcg 1441 agcatcatat gaagcctaat attctggcac acgatcgctc ggctgtcaag tctaccaaca 1501 ggatgtttga ttcagtcagc cacccgagag atcttatata tctttcagtc tgtgatcgtt 1561 tgggaaagaa tgaaaatgac ggatacagcg aatttctgtt tgagcggctt gaggtgtatg 1621 atcagatgat ggctcggccg tttgtttcgg gcaaagacct tattgattcg gggctgactc 1681 cggatgaaac cttttcggag atcttggcat atgctcataa gctccgtctt gcaggtgtag 1741 ataagcctgc cgcattgaag caaacacttt cgtatgcaaa taagataaaa aaataagcca 1801 tggttttaaa ccacggctta ttttgtttta cacatcttac ttcttcaaaa gctcaacgat 1861 ctgcttgaga agatcctcgg tggtggggtt tgcttctctt tcaaggcgag ccttttcttc 1921 ttcagccttc tttgcagctt cctcggctgc tgccttttct gcgaagtaag catcaactgc 1981 ggtcttgtcg ttaagcttga tgccctttgc cttgagcgca gccttgtctt ccttggagag 2041 cttgccgttc aaaagctttg tattttcatt cttgagggtg ttcataaact taacgatgca 2101 gaacaaaaca agagcggtca aaaggaagct gatgattgca ttgatgaatg tgccccagtc 2161 gatgtaaata gactgagtca aatcaaccgc gccgtcaacc tcaacgggca aaagcattgt 2221 cataatgccg ctgagcgaat ttgc // LOCUS sequence230 2235 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence230 VERSION sequence230 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2235 /mol_type="genomic DNA" /organism="" /note="sequence230" CDS 587..1750 /product="molecular chaperone DnaJ" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_142730484.1" /transl_table=11 /codon_start=1 /translation="MADKRDYYEVLGVSKTATDEELKKAFRKLAKQYHPDLHPDDKGAE MKFKEINEAYEVLSDKEKRARYDQFGFAGVDPNYGAGQGGADYGGYTSYGGGFNDFGDI FESFFGGGFGGASSRSNANAPRRGQDIRVSATISFMEACKGTKANIRFSHFEKCPDCGG SGAKAGTSATTCPDCNGTGTVRINQRTPLGMFQTTKTCERCGGKGKVIKDVCPGCSGQG RVKKTLTREIEIPAGIDDGQTLKVSGAGDCGFNGGASGDLNVRIVVKPDDIFEREGYDI YTEIPISYMQATLGDEITVPTIDGKVKYKVPEGTQTGTTFRLKGKGIKRLYRTERGDHY VTVKVEIPKNLTKKQAELLRTFDDSLEEKNTATTKSFFEKMKDFLNS" /locus_tag="LOCUS_7190" /gene="dnaJ" /EC_number="1.8.4.-" /note="WP_142730484.1 molecular chaperone DnaJ (Paraclostridium bifermentans) [pid:52.2%, q_cov:98.4%, s_cov:98.4%, Eval:8.1e-110]" /note="MGA_987" ORIGIN 1 aaggaagata tcgacaaggc tgttaaggaa gctgagcagt ttgccgctga ggacaagaag 61 agaagagaag atgttgatgc aagaaaccac gctgaccaga tggtatttag ctgcaagaag 121 tcccttgaag aattcggcga caaggtagag gcttccgaca aggcagattg cgaagcaaaa 181 attgcagcac ttgaagaagc actcaaggga accgatatgg aagcgatcaa ggcaaaggaa 241 aaggaacttg aatcctccat ccaggcaatc gcaaccaagg tatatcaggc tgcagccgca 301 gctcagcagc aggcacaggg tgctgacaac aacacaggct ctgcacccaa ggatgacaat 361 gtcatcgacg ctgagttcac cgacgccaac taaatccgta atttgaaaca atgcgcgtgc 421 gctcagcgcc cgcaagccgc gccccacata gggggcgcgg ctcccgccca aaaccgcccg 481 caggcggttt tgggcttgcg tgataataaa gcccaaagcg ctttattatc acgggcgggc 541 gctcggcgtc atacggcaaa ctatataatt tctaaggaaa aacattatgg ctgacaaaag 601 agattattat gaagtcctcg gtgtgagcaa gactgccacc gacgaggagc ttaaaaaagc 661 cttccgcaag cttgcaaagc aatatcaccc cgaccttcac cccgacgaca agggcgccga 721 gatgaagttc aaggaaataa acgaggcata tgaggtgctt tccgataagg aaaagcgcgc 781 tagatatgac cagttcggct ttgcgggtgt tgaccctaac tacggagcag gtcagggcgg 841 agcagattat ggcggatata caagctatgg cggaggattt aacgacttcg gcgatatttt 901 cgagagcttc ttcggcggtg gcttcggagg agcatcgtcg cgctcaaatg ccaatgcccc 961 cagaagggga caggatatcc gcgtgagcgc aaccatcagc tttatggaag cttgcaaggg 1021 cacaaaggca aatatccgct tctcccattt tgagaagtgc cctgattgcg gcggctcggg 1081 cgcaaaggca ggcacatctg ccacaacttg tcccgactgt aacggcactg gtactgtaag 1141 aatcaaccaa agaacccctt tgggtatgtt ccagaccacc aagacctgcg aacgttgcgg 1201 cggcaagggc aaggtcatca aggatgtctg ccccggatgt tcgggacagg gacgagttaa 1261 aaagaccctc accagagaga tcgaaattcc tgcaggtatc gacgacggcc agaccctcaa 1321 ggtttcgggc gcaggcgatt gtggcttcaa tggcggcgct tcgggcgatt tgaacgtgcg 1381 aattgttgtc aagcccgatg atatctttga gcgcgaggga tacgatatct ataccgaaat 1441 tccgatctcc tatatgcagg cgaccttggg agatgagata accgttccca caatcgatgg 1501 caaggttaaa tataaagttc ccgagggcac tcaaacaggc accaccttcc gccttaaagg 1561 aaagggaatc aagcggcttt accgcaccga acgcggtgac cattatgtaa ccgtcaaggt 1621 tgaaattccc aagaatttaa caaagaagca ggctgaactg ttaaggacgt ttgatgattc 1681 ccttgaggag aaaaacaccg caaccaccaa gagcttcttt gaaaagatga aagatttttt 1741 aaatagctaa aaataagacc catcgcccag gcggtgggtt tttgatattt aaaagctcgt 1801 ctgacattaa aaatttatcg taaaacgata aaaaactatt gacaaacgtt aaaatatatg 1861 ctatcctcta attgtcagca aaacccatac aaaaattgac acaacaggag gcaaacatat 1921 gaaaggttta aacaaagcag cagtaataat cacaaaggtg atcgagattg tccattgggt 1981 cgcaactggc ttggttgcgg cggcgggaat ctgtgcggcg gttgcaccca agtatcttgg 2041 tatgtttatg gatgttgaat ccctcatcgc agacccggag atgagcacat acggatttga 2101 agtgagcctt gcaaacatcg acggccagct gaatatgctt gcctttgtgc tctattccat 2161 cggtgcaact gcaattatgg tgataatggc gcttatcttc cgcaacctgc acgtcatctt 2221 cgaaaatgcc ggaaa // LOCUS sequence231 2228 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence231 VERSION sequence231 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2228 /mol_type="genomic DNA" /organism="" /note="sequence231" misc_feature <1..559 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011986795.1:flavodoxin-dependent (E)-4-hydroxy-3-methylbut-2-enyl-diphosphate synthase" /note="WP_011986795.1 flavodoxin-dependent (E)-4-hydroxy-3-methylbut-2-enyl-diphosphate synthase (Clostridium botulinum) [pid:59.2%, q_cov:98.9%, s_cov:52.7%, Eval:2.4e-57, partial hit]" /note="MGA_989" /locus_tag="LOCUS_7200" ORIGIN 1 aaggtttgac tttggcgata ttgttctgtc gctaaaatcg agtgatgtta acaaaatgat 61 ttccgcttac cgccttgttg ctgataagac cgattatccc ttgcatttgg gtgttaccga 121 agcaggaaca tataagatgg gacttattaa gtccagcatt ggaatcggat cacttttgtg 181 tgacggtatc ggcgaaacaa ttcgcgtttc gcttaccgat gatccgacaa aggaagttgc 241 cgcaggcttt gatattttga aagcgatcgg caaaggcagg ggagtaaggc ttgtttcctg 301 tcccacctgc ggaagaacga agattgattt gatttcctta gctcataagg tcgaggaagc 361 aactgcaaat attgataagg acattaccgt tgctgttatg ggctgtgttg tcaacggccc 421 gggagaagct aaagaggctg atatcggtct tgcgggcggc gacggctgtg ttgtaatttt 481 taaaaaggat aaaataatcg gcaagttttc cgagagcgat gcgcttggtg cgcttcttgc 541 cgaaattgaa aaactctgac ggaggaaaca atggcatatg aaagagtcgc tgattttttc 601 agcgcatatg acaatttaat acccccatcc atggcggacg gcgtgatcct tagaattgca 661 ttttctaagg ataattccgt tatggctgtt gaaataaagt tctcacaggt gatttcaggc 721 gatgatttaa agctttttgc ttcaaatctc aagccttgtc tgggattaac aggaatatac 781 ataagcccga aatatgacag ttcgcttttt ggcatcaatg caatgcctgc ggttattgac 841 gagcttaaaa ggcgaattcc gataaacggt tttttggata atgcagactt cgccattaac 901 ggtaatgagc tttgcataac tctaaaaaac ggcggtgaag ctttgcttaa aaaggcagga 961 attgaagaag tgctgccgaa aatcatcaat acgcagttcg gagtgttggt ttcaattaag 1021 tttgacggta accttagtgt caatgctgaa gagcacaata agcttcagca ggaagttctt 1081 aaaaagatca ctcctgttca catcgaaaag aaatctgcac ccgcggagcc gggcgaaaag 1141 ccgacctatt atgtgcagtt cgatggcgca cccattgaaa acgaagctac ccttataatg 1201 ggtaaggaaa ttgtcgatac gccgctgaca cccttgggcg atgtcgctca ggattcgggt 1261 aaggtagctg tctggggcga gatctttgat attgaaacaa agatcacacg tgacgagaaa 1321 aagatgataa tgacggtgtt tatcaccgac cttacaggat ctatcacgct caaactcatt 1381 gaaactgtca agaaggcaga agagcttctt gctgacctta aaaaagatgc ttcaattctt 1441 gcacgaggcg atgttaacta tgacaccttc gataaggaga taaacatccg tcctcgcgat 1501 atttcgctgg tcaaaaagct taaaaagacc gacgatgaac ctgttaagcg agttgagctt 1561 cattgccaca ctaatatgtc gattatggac gcaatgacgc cttctgatga aatcgtcaag 1621 cgtgccgcat catggggaat gaaagccatt gcaataaccg atcatggtgt atgccaaggc 1681 ttcccggatg ctatgtatac ctgcgataag cttcgcaagg acggcaaaga cttcaagatc 1741 atctacggcg ttgaagctta tcagattaac gacgaggtca gcataacgtt tggcgaggat 1801 aacaggcttt tgactgatga attcattgtc ttcgacgttg aaacaacagg cctttcggca 1861 gttaccgaaa agctgatcga aatatgcgca gtaagagtca aaaatcttga aattgttgat 1921 acctttgaca cttttgttga ccctgagcgt ccgattccgt caaaaataat cgaccttacg 1981 ggtatatccg atatgacagt taagggtgcg ccgaaagaag ctgaagcaat caagcaattc 2041 cttgaattct gcggcgacac cccttgcttt gttgcgcata acgcttcgtt tgatatgtct 2101 ttcatccgtt ctgcttgcga ccgcttggga atcaagtttg aaagaccgta tcttgatacc 2161 gttgcattct caagaagtat gctcccgggc atatcgaaat atactctcga ttcggttgcc 2221 aaaaatct // LOCUS sequence232 2227 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence232 VERSION sequence232 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2227 /mol_type="genomic DNA" /organism="" /note="sequence232" CDS 342..533 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKVIYILLGVLSLAGFIASAAMFVMAIRFSEWGRFMFYLFLGIV CAELLIFAIVRLVKELRK" /locus_tag="LOCUS_7210" /note="MGA_992" CDS complement(642..1181) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLSTIALAVGAVFVAAGFSLPVVFEHIEWLAEALILSDIDKEF IPFACWLFGGTTLFFGFVELIFDKQISKFCSLKSVSLALGISLLTALGLYCVLSFASCY FLTHPDNHPIRYPVSFIVGSVCFWVFLALFCMYIKLRQKEPSALGVLLDVLLGLGHLPA FGVMCIVADNIVSDWI" /locus_tag="LOCUS_7220" /note="MGA_993" CDS complement(1402..2055) /product="HAD family hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002386325.1" /transl_table=11 /codon_start=1 /translation="MKKYILFDLDGTLTESAPGIMNSARYALNHFGIPDPGSVFLRKFV GPPLFESFTQMFGLDPEQATEAITVYREYYARQGIFENEVYAGIPEALEMLKKKGFVLA VATSKPEVYARQILEHFDLSKYFTVICGIPLEDEKMTKSQVVERTLRELGVSDKSQALM VGDRDYDVKGAHTNGIECVGVLFGYGDRPELEEAGAEYIAVTPAGMGEIIASLG" /locus_tag="LOCUS_7230" /note="WP_002386325.1 HAD family hydrolase (Bacteria) [pid:46.7%, q_cov:98.2%, s_cov:94.7%, Eval:4.5e-51]" /note="MGA_994" ORIGIN 1 gcagttgtcg ccgacggtgc cctgccgaga aagacattct caatgggcca cgcatatgac 61 aagagatact atcttgaagc taagaagata gtggaataac gctcaaacag acaaactgtg 121 gaaatattgc ggtttgcgtc agcaaatgcc gctcattgag cggtaagcaa tatttatatc 181 ggcgggcgca aaagtgaagg gcaaagcaaa cttcgaccgc cgattggcca cgcatatgat 241 aagagatact atcttgaagc taagaagata gtggattaac gctcaaacag acaaactttg 301 gaaatattgc ttgtaagtcg aggggatggc ggagtgacga tatgaaaaag gttatctata 361 ttttgctggg cgtgctgtcg ctggcgggat ttatcgcaag tgcagcgatg ttcgttatgg 421 cgattcgctt cagcgagtgg ggaagattta tgttttatct cttcctcggc attgtctgcg 481 cggagctgtt gatatttgca atcgttagat tggtaaaaga gcttaggaaa taaaaaaaga 541 aaggcacccc tatgtgggtg cctttttgta ttgtagcctt ccccttgagg ggaaggtgtc 601 agcaaagctg acggatgagg tggacatcgc ccgattgagc ctcaaatcca gtcgctgaca 661 atgttgtcgg caacaatgca catcacccca aaagcaggga gatgaccaag cccgagcagg 721 acatcgagca agactcccaa tgcggaaggc tctttttgcc ttagcttgat gtacatacag 781 aacagcgcca agaacaccca gaagcacacc gaccccacaa tgaagctgac gggatagcga 841 atgggatgat tgtcgggatg tgtgaggaaa tagcacgacg caaacgacag gacgcaataa 901 agcccgaggg cggtcagcaa agaaatgccc agtgcaagcg aaaccgattt taaactgcaa 961 aactttgaga tctgcttgtc aaatatcagc tcgacaaagc caaagaaaag ggtagttccg 1021 ccgaaaagcc agcaggcgaa agggataaat tccttatcga tgtcactcag tatcagtgcc 1081 tcggcgagcc actctatgtg ttcaaacaca acgggcaacg aaaagcccgc ggcgacaaac 1141 acggcaccga ccgcaagcgc aattgttgaa agtttcttca cgtcaagccc tcctttttct 1201 gcattatact acacatatgg agtcggggca agttacgata gagttacaaa acgggcgggc 1261 acataggccc gccctcgttt ctgatataga ctataggggc atcccccctg tgtgggtgcc 1321 ttattctgta aatattggcg gggcggaggc cgtcgtgtcc cgaagggacg tgacggaggg 1381 gacccgcatc ccgttgggcg atcatcctaa cgatgcaatg atctcgccca tgcctgcagg 1441 ggtgacggcg atgtattctg cacctgcctc ttcaagctcg gggcggtcgc catagccgaa 1501 caacacaccg acacactcaa tgccgtttgt gtgtgcgcct ttaacatcat aatctctgtc 1561 gccgaccata agcgcctggg atttatcgga aacgcccagc tcacgaagcg tcctttcaac 1621 cacctgcgat ttggtcatct tttcatcctc aaggggaatt ccgcagatga ccgtaaagta 1681 tttgctcaaa tcgaaatgct cgagtatctg tctggcataa acctccggct tcgatgttgc 1741 aaccgcaagg acaaagccct tctttttcag catttcaagc gcttcgggaa tgcccgcata 1801 aacctcgttt tcaaatattc cctgacgcgc ataatattcg cggtagaccg ttattgcttc 1861 agttgcctgc tcagggtcaa ggccaaacat ctgtgtgaag gattcaaaca gcggaggccc 1921 tacgaatttg cgcagaaata ccgagcccgg gtcgggaatg ccgaaatggt taagggcata 1981 tcttgccgag ttcattattc cgggtgccga ttcggtcagc gttccgtcaa ggtcaaacaa 2041 aatgtatttt ttcatatttt ctcctttgtt taacccttcg cttcataaca actttcgcct 2101 ctgcctacat ctgctgtcag cggaaaagcg aggcttactg cgtttttcat ctcgtccgag 2161 aggatctttg ccgcttggtc ggcacattcg gcacttgctt caacgatcaa ctcgtcatgc 2221 acctgca // LOCUS sequence233 2222 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence233 VERSION sequence233 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2222 /mol_type="genomic DNA" /organism="" /note="sequence233" misc_feature <1..618 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011393967.1:DNA repair protein RadA" /note="WP_011393967.1 DNA repair protein RadA (Moorella thermoacetica) [pid:50.5%, q_cov:97.6%, s_cov:40.9%, Eval:4.0e-54, partial hit]" /note="MGA_996" /locus_tag="LOCUS_7240" misc_feature complement(776..>2222) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005810223.1:AAA family ATPase" /note="WP_005810223.1 AAA family ATPase (Desulfitobacterium hafniense) [pid:41.9%, q_cov:94.4%, s_cov:59.0%, Eval:3.9e-99, partial hit]" /note="MGA_997" /locus_tag="LOCUS_7250" ORIGIN 1 agagcggtta aaaaccgctt cggctcgaca aatgagatcg gcgtttttga aatgatggat 61 tcgggacttg aacaggttga aaacccttcc gcgatgcttc tttcgggcag acccggcggt 121 gtttcgggat gctgtgttgc ttgcacgatg gaaggttcaa gaccgatttt agcggaagtt 181 caggcgctgg tcacaaaaag cggaatgcgg gcaccgagaa tagtttcaac ggggtttgat 241 tttaaccgcg tgtggatgat cttggcggtg cttgaaaagc gaatgggata ttacttcggc 301 aatttggatg tgtatgtcaa tatcatcggg ggattgagaa tcaccgagcc tgcggcggat 361 ctgcctgttg caatggcgct gtattcatcg ttgaccgata aggcgattag cgaggatgtc 421 attgcattcg gtgagatcgg cctcggcgga gaactcagag gcgtttcaca tcttcagcag 481 agaattgaag aagcggctcg tttgggcttt acaaaggcaa ttgtcccccg ccattcaatt 541 aaaaatatgc gtcccgttga gggcattgag gtcgtgggtg tatccaacct caagcaggct 601 ttcggggcga ttaagtaaaa gctatataaa tcccttcggg atttgcgaga tattttcaat 661 gcgaaatttg cctgtggcaa gcgatatgcc ctgcggggca caaggattta tatcatatcg 721 cagataatta aaagagagaa tactacggac tgaccgtatt attctctctt tttgtctatg 781 ctgttaaaac cttggtggtg tgaagggtaa tctcgtttga atcggcggtg acggttatgc 841 ccagagtcgg agagcttgcg attgcatcgc acaggggcga ctcaattttg tgggcgatta 901 tgcggtggat ttcacgggca ccgaagtttt taatatctgc aaggcggacg atgaggtcaa 961 gtacgctgtc gtcatattca aaggatgtgc caacttttat gcaacgatct ttcagctcat 1021 caagggcaag tcgggcaatt tcggcaacgg attcggcatt tatgcgatta aacacgcaaa 1081 tgctgtcgat tcggttcatc agctcatatg aaaattgctt ggaaagcaac tcgcgggcag 1141 aaggggcgtt attcgcgtta gcaaatccaa cagcggcgtg agcttcgggg acggcgtttg 1201 aggtcaggat aataattgcg cttttaaaag aaatttttct gcctgcggaa tccataagag 1261 aaccgttatc gagtatctgc aggagcaatt gggtgacgtc gtggtgggct ttttcaaatt 1321 catcgaacag caccacgcaa aagggcttgc gtcgcacctt ttcagtcagc tcgccgcctt 1381 tgccataacc gacgtaacaa ggtggcgagc cgatcagacg ggaaacggtg tggtgttcgg 1441 aaaactcgga catatcaagg cggacaagat ttgatctgtc gcctgtgaga tattcggtaa 1501 gcgactcggc aagggcggtt ttgccaacgc ccgaagggcc tgtgaacatt aaagaggcca 1561 agggttttga attctcccga aggcctgatg atgcacgttt gagtgaggcg ataagcgatt 1621 cgatcgcaaa ggactggccg atgatttttt ggctgagttt atgtttaagc gaggcgatgt 1681 tttcgggatt tagagcatca gtcgggatac tcgcctgtaa agcgattatg ctttccacga 1741 cagaagcagt gacccgaggg atgtcaaaat cctcgcaggc gtggcgggaa agttcttcaa 1801 aataggcttc ttttgagatt ttgcctgcga tatagtcgct gaaaacgttt gaaagctgtt 1861 cgcggacacg gttagaattt gtaaagcctg agagctttac acgcgagcag gcttcgtcga 1921 tgatatctat cgccttgtcg ggaagataac ggtcgccgat atatcggtcg gatagtgtaa 1981 ctgctgactt aatggcttcg tcagcgatgg caacgccgtg gtgtgattca tattttggct 2041 tgagatggct tagcattgtt acggcttcgt ccaccgtcgg ttcattgagg cggatgatgg 2101 aaaatcggcg agagagggct ttgtcttttt caatggtctg catatattca tcataggttg 2161 tggcgccgat gacacggagt tcgcctcgtg cgagcatcgg ttttaagata tttgcagcat 2221 ct // LOCUS sequence234 2220 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence234 VERSION sequence234 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2220 /mol_type="genomic DNA" /organism="" /note="sequence234" CDS 302..1516 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKQKKNKKWMKFRHRVITVLARWILGPYTTMKLGIHPEKFKEQGD RQYLILMNHQTAFDQFFIGMSFSGPIYYIATEDIFSLGWISKLLSWAVGPIPIKKQTTD VHAVMNCIRIAREGGTIALAPEGNRTYSGKTEHMNPAIVRLAKKLALPIAIYKITGGYG VQPRWADDIRKGKMHAGVSRVIEPQEYKVMSDDELYELIAKELYVNEACVDGEYHHKNL AQYIERAMYVCPECGLSEFVSDKDTLACKNCGLSARYLPTKELEGIGKPFPFTFVGQWY EYQNRFVSKLDLAEYADKPMYSDKADLSQVIVYEHKELIKKDIGIGLYGDRIEFSGLDE DLTLMFDDISAVSVLGRNKLNIYYGDKVYQLKGNKRFNALKYVNIYYHYVNIKDGKPEE LFLGL" /locus_tag="LOCUS_7260" /note="MGA_998" ORIGIN 1 caaagagtaa aaagtctttt catcattgat cgttccttcc gtgtaaatga ttgatatttc 61 cgaatgtcgg aatatatcta taattatgat agcacacata tatacaataa gcaatgatta 121 ttagtgtaca ttttactgca ttttaatatg gcaatatgcc gatacatccg cttttgcttc 181 atactgcttt tcgcaactaa tgcggcatat tagatgtgcc caaggaaatt atcggttgac 241 taaggcagga atttgaggta tactttaact ataatgttgg tttttgttgg agttagaata 301 tatgaagcaa aagaaaaaca aaaaatggat gaaattccga catagggtta taaccgtgct 361 tgcaaggtgg atacttggac cgtataccac catgaagctc ggcattcacc ccgaaaaatt 421 caaagaacag ggcgatagac aatacctgat tttgatgaac caccagaccg cctttgatca 481 gttctttatt ggaatgtcct tcagcggacc gatctattac atcgcgacgg aagacatatt 541 ctcgttggga tggatttcaa agcttttaag ttgggcggtt ggtccgattc ctattaagaa 601 gcagaccacc gacgttcacg cggttatgaa ctgcattcgc attgcgcgcg agggcggaac 661 gattgctttg gcgcccgaag gcaaccgaac atatagcgga aagaccgaac atatgaaccc 721 cgcaattgtc aggcttgcga aaaagctggc acttcccatt gcgatttata agatcacagg 781 cggatacgga gttcagccga gatgggcaga tgacataaga aaaggcaaga tgcacgccgg 841 cgtttcgagg gtcattgagc cgcaggaata taaggtgatg agcgatgatg agctttatga 901 gcttatcgca aaggagcttt atgttaacga agcttgtgtg gatggcgagt atcatcacaa 961 aaacttggca caatatattg agcgcgcgat gtatgtttgt cccgagtgcg gactttcgga 1021 gtttgtgagc gataaagata cgcttgcctg caaaaactgc ggattaagcg cccgttatct 1081 tcccaccaag gagctggaag gcattggaaa gcctttcccc tttacattcg taggtcagtg 1141 gtatgaatat caaaaccgat ttgtttcaaa gcttgatttg gcagaatatg cggataagcc 1201 gatgtattcg gacaaagctg atctttcgca ggttatcgta tatgagcata aggagctaat 1261 aaagaaagat attggcattg gcctttacgg cgacaggatt gaattctcgg ggcttgatga 1321 ggatttgaca ctaatgtttg atgacatttc cgcggtgtcg gtcttgggca gaaacaagct 1381 caatatttac tatggcgata aggtctatca gcttaaaggc aacaagcgtt tcaacgcgct 1441 gaaatatgtg aatatatact atcactatgt gaacattaaa gacggaaagc ccgaggagct 1501 gttcttggga ctgtaaaaaa gtacatataa caaaaatacc gctcagtttt tggctgagcg 1561 gttttgtttt tttatcgttt actcttttta actatcatca agactatgag aacgacagct 1621 gtgagggaga ttattcccag aatgatgaga attggcatta cctgactgaa atcgtcggca 1681 ggaagatcat atatttcgga catttgggtg tcagcggttg tgtcatcctc gggagaggag 1741 gttaccgcag gggtatcagc aggttgattg tcagatgtgg aaacaggatc tgttccggaa 1801 gtggtggttt cggatgattg cgattcgctt gccgaggtgg tgacagacag ggcggtgtcg 1861 ccggtcttgt cagtcttttc ggtcttggta gtggtggatt cggttgtcgc ggtggtcact 1921 tcagagcctt tggcttcctt gatgacgtat ccgcagacgg tgcaaacgac tttttcgccg 1981 tctttgccgt caccgtcggg ggtgtggtcg tcaaggtcgg tgacatcggt gcaaccgtag 2041 cattcgcgcc aatgggtgtc ttcatcgtgg gaccaagatg agttgaagct gtgctcatgg 2101 gtctgctttt cgccacagac gatgcactcg ccgtcctcat agctgtgata tccataagca 2161 gaagcggtta ttgagagagc ttcaacggtg cccgcagcat cgaagaaggt ctttttgcag // LOCUS sequence235 2219 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence235 VERSION sequence235 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2219 /mol_type="genomic DNA" /organism="" /note="sequence235" ORIGIN 1 aaaaagtcga atcggagcgc aagcttgcat ctgccgagga aaatatcctt cgtttaaagg 61 atattatctc cgagcttgaa ggcagagttg aacctttgcg tatccaatcg gaaaaggcga 121 agaaatatct ggtgcttgcc gaaacaagaa aagctcttga aatttccgta tgggcaagaa 181 agctttctga actgagcgaa aaccttggtg agctcgagga caggcttttg attgccggcg 241 gtgaatatga gcacctcgaa aatgagatcg cctcgatgga ggatgagctt aacgagctta 301 ctcttaaacg ccagcaatgc tcggccgccg ctgaagaaca ccgcgaaaag atcttatctc 361 ttgaaaagca gaatgcagaa gcctctgccg acatcgcggt atataagaac aatatcatgc 421 actataacga ctcggttgcc gagatcgagc ttaaaaagcg agagctttct ttggcaggcg 481 aacagcttga aaagacaatt gccgaaaaga aagcacttat cagcgagatc gaatcaaaga 541 agtcgtctgt tgccgaaaat atcgccgata ttgagaagga gctttcacgt cttaacaccg 601 aagcggacga attttcaaag gagatctccg gctcatcgga cgaacttaac aagctctata 661 tacataaatc agagttgaaa tttgcaattg caaactccgc actcaccaag tcggatgccg 721 aaaagaccgt ttccgatgca actgcaacac ttgatgaagt caatgcgctt ttagccgatg 781 ccgaaaagga atcgaaggag atcacctcgg gaattttgga tattgaaagc agcatttcag 841 aacactcaaa ccgtttgagc ggactttcga tgctgtattc caagaaatcc gatcagctta 901 aaaagatgaa ctccgagtat accgatgctg acatcgagat cagaaatctc actcagcgcc 961 gtcagatgct tattgacctt gaaaacagta tggaaggctt cgccggaagc gtccgccaga 1021 tcgtcaaagc tggcaaatcg ggacagcttc gcggagttaa gggcacagtt gctcaaatca 1081 tctcagtatc ttcaaaatac agcgttgcaa ttgaaaccgc tttgggcgga gcattgcaga 1141 atatcgttgt cgataacgaa gaaaccgcca agcgcggaat ccgtctgctt aaagaaacgg 1201 gcgggggacg tgcaaccttc ttgcctctca catctgtcaa gggcaaccga ctcaacgaac 1261 ccaacctcga tatgcaggag ggctttatcg accttgcctg cgacctggtt gattataacg 1321 aagaataccg cggaattatc aattctctgt tgggaagaat agttgtcgcc gagaacattg 1381 accttgccac caacatcgcc aagaaatacg gctataaatt ccgtatcatc acccttgacg 1441 gtcaggtcat caatgcgggc ggctccttca cgggcggcag tgtttcccgc tctgcaggtg 1501 ttctttcaag aaagaacgag ataagcgagc ttgaatcgaa gctcgataag cttactgcag 1561 acaacgcatc tcttaaatca cgactttcaa cactctccgc cgaggttgaa aaactcggat 1621 atgacgttga aggcgaaaag gaaaccatcg cacagatgga aaacgacaag gtacgattcg 1681 atgccgagca tcgccgtttg cgtgccgcaa tcgaccagta tgaggagcgt atcgaagaga 1741 tcgagcgcgc aatgttggtt gccaaaaaac gcatcgccga agccgagctt accgccaaaa 1801 caagcgaagc cgagcttatc aagtgcgata aggacatttc aacccttgaa gccgctgtca 1861 gcgaagcgag atcaaaggga gatgaatcaa aatcccgccg tgaggagctt tccgaacagc 1921 tttccgaaaa gaggcttgtt ctggtcgaac tcgaaaagga tatcgaagcg gctcgtgatc 1981 atattgcaac cctcgagggc agtgttctcg actccaagtc ggatgcaatg aaatatgatg 2041 agcgaattgc agagctcaac gctctcatcg atgttgaaaa caccaatatc accgagcgcg 2101 aaaacaaggt cattgaagcg aaggcggctg tcgcccgact taacgatatg atcaaggacg 2161 agctcaagcg cggtatggac tatgagcagg agagcgcgaa cgttcgcatt tcccagcgc // LOCUS sequence236 2211 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence236 VERSION sequence236 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2211 /mol_type="genomic DNA" /organism="" /note="sequence236" ORIGIN 1 caagaggtcg tcgtggtcgc cgcgttcaat gatctcgccg ttttcgagca ccagaatcgc 61 gttcgcgttt ctgacggttg aaagtctgtg agcaatgaca aaggttgtgc ggtttttcat 121 cagtcgatcc atgccgtgct caatgtggcg ttcggttctg gtgtcgacag atgatgtcgc 181 ctcatcgaga atgagtatgg gcgctttcga aaccgccgca cgggcaatgt tcaaaagctg 241 acgctgaccc tgagagaggt ttgcgccgtc cgactcaagt accgtgtcat agccgttttc 301 aagtcgcata atgaacgagt gtgccgaagc ggtctttgct gcggcaataa cctcttcgtc 361 ggtggcatca agtctgccgt aacggatatt ctccattacc gttcctgtga acagatgggt 421 atcctgcaat accatcgcaa tgttttctct taaatgctcg cgcttatagt ccttaatgtt 481 cacgccgtca accaagatct cgccctcgtc aatgtcatag aatcggttga tgaggttggt 541 aattgtggtc ttgcccgcac ctgttgaacc gacaaatgcg atcttctggc ctggtcttgc 601 atacaggctg atgtttttca aaactgtctt atcggggaca tatccgaagg tgacattgtt 661 aagaactacc tcgcccttaa tttcacggtc agttgcatcc ttggtgtcgg gagtttcggg 721 atttgtgtcc ataacctcaa atacacgctc agcgcctgca agtgcggcaa agattgccga 781 ggtctgctgc gagatgttgt taatgggcat agagaactgc tttgaatagt tcgcgaaaac 841 tgtcagcgcg ccgggagtca gcttgcccaa aaccatcagc acaccgccga taccgacagt 901 cacgccatag gagatctgag aagtgttacc cataatcgga cccataatgc ttccccagaa 961 ctgagcctta aactgcttgt cgcgcatatc gttgtttaaa agctcaaatt cgctgatgca 1021 ggtgtcctcg tgattaaata ccttaacgac cttctggccc gtaacggttt cttcggtata 1081 tccgttaact gcgcccaaag ctgcctgctg tcccgaataa tatctcgagg aaagctttgc 1141 aatcatcgca ccgccctttg caaaaatggg caggaacaca actgtaatga gtgtcagcac 1201 ccagttggtt gtaatcataa atgtaaatgt acccaccaag gttacaacgc ccgaaataat 1261 cgaggtcaac gagttgttga tcatcatgtc aatattgtca atatcgtttg tgaagcggga 1321 cattacctcg cccgtgggat tctggtcaaa atatcttaca ggtaggcgct gaagcttagc 1381 aaaaagatca ttacggatct tttcaattgc acctgttgaa attcctaata tcaggcggga 1441 ctgcagatat gttgacacaa ttcccacacc gtaaatgcag gcgaatatta aaagaactgt 1501 gagaatatat gtcaaaagct cgcttttaat tgccacattg acagggcctg tgaatgtgga 1561 aagaattttg tcggcaaagc gctccatcgc actcatctca agctctttgc cggtgacaaa 1621 aactgtcagc ttgttaacaa taggtgccaa aagatatgag cctgcaagtg aagttaccgc 1681 gcttagaagc atacagaaca aaacgcccac gattctgaat ttatagggca taagatatgc 1741 cagcagacgt ttaatcgttc cctttgtatc cttaaccttc gcaccctttc caatcggacc 1801 gtgtccgggc cctcttccgt gtccgcctct tcctgcggga gccgctttat tatactgctt 1861 ctgaagctgt tcaagtgatc ttgccataaa gctttatgcc ccctttcttt ccgagtcgtt 1921 ctgagaatag taaatttcct gatatgcttc gtttgatgcc aaaagctcct catgtgtgcc 1981 aacggcgtca attctgccgt cgttcataac aacgatcata tccgcatcct taacggatgt 2041 aattctctgt gcaatgatga tcttggtgga atctgccagc tcatttctga atgcctcgcg 2101 gatctgtgct tcggtggctg tatcaaccgc gctggtggag tcatcaagaa tgagtacctt 2161 cggcttttta agcaaagcac gggcgatgca aagacgctgt ttctgtccgc c // LOCUS sequence237 2196 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence237 VERSION sequence237 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2196 /mol_type="genomic DNA" /organism="" /note="sequence237" CDS complement(892..2121) /product="aminopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003429165.1" /transl_table=11 /codon_start=1 /translation="MKKSTIRKYAKLIVRVGANVQKGQSVVISCNVDQAEFCALVVDEA YKAGAKYVTVNWSYDPITKLAYRHESVKTLSTVLKWQEDKFAWMAEELPCRIVLLSEDP DGLKGVNPAKMQKVGQKRYPIIKPYRDAMENRHQWTIAAVPGEAWAKKVFPGERKSVAI EKLWKAILETVYVTDDNDPIAEWAKVNADFDERCKVLNSYHFEKLHYTSSNGTDFTCWL MPKSKWNGGGETDLRGHFFNPNLPTIEVFTTPCKGKAEGKVVSTKPLSYQGQLIENFSI TFKDGKAVSCEAEKGQELLERMITMDEGAAMIGELALVPVDSPINNQNILYYETLFDEN ASCHIALGAGFRDCVEGFENLTKEDFDEMGVNESMIHVDFMIGAPDMSIVGYTADGKAV DIFKNGNFAI" /locus_tag="LOCUS_7270" /note="WP_003429165.1 aminopeptidase (Clostridioides difficile) [pid:43.1%, q_cov:98.5%, s_cov:98.3%, Eval:4.8e-92]" /note="MGA_1004" ORIGIN 1 ctcggtctgt gcaagctcat aaatatttcc aaggcctgcc tgaagctgtt caagcagatc 61 atttgcaagg ttgagtgcag cactcttgag ttcttcgtcg gttaaatcct catatccttc 121 aagaccgctg aagtggtcat agctgattaa tagatggtga actcttacat agttctcgct 181 gatattgctc ttgatctctt cgtcagtggg aacaagcaaa gcgccttcct tgttgtaaag 241 ctcttcatat acacggttgc ccataacctc ggtttcgatg attcttctca aaagatcttc 301 ggtaaggcct gcttcagtaa gtgcagcttc atattcctct tcggtttcga agtatgtctt 361 ttcctgtgcg aggtattctt caacagttgc ctggtcatcc tcgttgaggg ttatgtcata 421 ctggtctgca aggatctggc tccagttgct ctggagaaga taatactctg catatccctg 481 caatgtgggg aacattgcgg cgttttcttc ccagaaagca gcattgccct gtgagaagta 541 atagccatct accattgaat accaatatct gtaaatatcg agggggatat catagccgtt 601 gacagtcaag aaagtatccg aagcggaaag aagcttgttg ccctcggcat catagaagcc 661 gacttcggtt gcagctgcgt cagcagattt atcgccgtcg gtgttttcat ccttgccgca 721 agcggtgaat acacaaagcg acattacaag cgctaacata agcgccaaaa ttttcataag 781 gtttttcatt ttttcaaact ctcctattat aaaacatttt acaccattgt aatcccgtaa 841 tgtgacaaca aggtgacagc tttttaaaaa gccgaatctg cacgcaagga attatatggc 901 gaaattgccg ttcttgaaaa tatcaacagc cttgccgtct gcggtatatc caacgatgga 961 catatcggga gcgccgatca taaagtcaac gtggatcatc gactcgttta cgcccatttc 1021 atcgaaatct tccttggtga ggttttcaaa gccttcaacg caatctctga agcctgcgcc 1081 caaagcaatg tggcagcttg cgttctcatc gaagagggtt tcatagtaaa gaatgttctg 1141 gttgttgatg ggtgaatcaa caggaacaag ggcaagctcg ccgatcattg cggcgccttc 1201 gtccattgtg atcattcttt ccaaaagctc ctgacccttt tcagcctcgc aggatacagc 1261 cttgccatcc ttgaaggtga ttgagaagtt ttcaattaac tgaccctgat acgaaagcgg 1321 cttggtggat actaccttgc cttcagcctt gcccttgcag ggggtggtga aaacttcgat 1381 ggtgggaagg ttgggattga agaagtggcc acgaaggtcg gtctcaccgc cgccattcca 1441 cttggacttg ggcatcagcc agcatgtgaa atcggttcca ttggaagagg tgtaatggag 1501 cttctcgaag tgataggagt tgagaacctt gcatctttcg tcgaagtcgg catttacctt 1561 agcccactct gcgatgggat cattgtcgtc agtaacatat acggtttcaa ggatcgcctt 1621 ccagagcttt tcaattgcaa cgctcttgcg ctcgccgggg aatacctttt tagcccaagc 1681 ttcgccggga acagccgcaa ttgtccactg gtggcggttt tccattgcat ctctataggg 1741 cttgatgatg ggatatctct tctgtcccac cttctgcatc tttgcggggt taacgccctt 1801 gagtccgtcg gggtcttcag aaagcaaaac gattctgcag ggaagttctt ctgccatcca 1861 agcgaattta tcttcctgcc acttcaaaac ggttgagagg gtcttgacag attcgtggcg 1921 ataagcaagc tttgtgatgg gatcatagct ccagttgacg gtgacatact tggcacctgc 1981 cttgtatgct tcatcgacaa ccaaagcgca gaattcagcc tggtcaacat tgcaggagat 2041 gactaccgac tggcctttct gaacgttagc gccgactctt acgatgagct tggcgtattt 2101 tcttatagtt gattttttca taaatatacc tacaaaagtt ttgtaattat cataacttaa 2161 atattataga acagcgcaca aattatttca acacaa // LOCUS sequence238 2192 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence238 VERSION sequence238 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2192 /mol_type="genomic DNA" /organism="" /note="sequence238" misc_feature <1..1599 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011107211.1:glycoside hydrolase family 127 protein" /note="WP_011107211.1 glycoside hydrolase family 127 protein (Bacteroides thetaiotaomicron) [pid:25.9%, q_cov:57.7%, s_cov:35.7%, Eval:4.6e-16, partial hit]" /note="MGA_1005" /locus_tag="LOCUS_7280" misc_feature complement(1652..>2192) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005814522.1:DUF4956 domain-containing protein" /note="WP_005814522.1 DUF4956 domain-containing protein (Desulfitobacterium) [pid:37.7%, q_cov:86.0%, s_cov:66.4%, Eval:1.8e-27, partial hit]" /note="MGA_1006" /locus_tag="LOCUS_7290" ORIGIN 1 atcagctctg agcttaattg gaatgattcg ggcgttaaac tgacacaggt ttcaacactc 61 cccgacggcg atacttcacg attcaccgtt aacaccgcaa acggcgatgg agttaaattt 121 gccctcaatt tgagagtacc cgaatgggtt gcatatgaac ctgtggtaac cgtcaacggt 181 gaagctcagt caaatgtaat taacgactgt catatccgca ttgaacgagt ttggcggaac 241 ggcgacagcc ttgaaattaa gctcccgatg gctgttaagg catacggatt gcccgacgat 301 gacaccgttt tcggatttaa atacggccct gttgtactca gcgcagagtt gggacaggaa 361 gagatggata agcgcactgc ctgcggtgtc agcgtgacgc ttcccgcaag caagatcgtc 421 ggcggcgctc aagctttgcc caaggatggc aaacgcgcag ttttgggcac cgagaccctc 481 tcgatcgaga acaccaccgt tgcagactat attgcaaata tcggcgaaaa cctcgtccga 541 attgacgacg gcgacgacct tcgcttcaag cttttgggaa ccgatacaga ccttgtcttc 601 actccccatt atcgtcagca ctctcatcgc tacggaattt attggtactt tgtcggtaac 661 gatatttccg aagaggacgc aagcgcaaga attttggcgc aaaagaccga gggcagaaca 721 aaccaggtta aaattgacgt taccaaggcg ggctacggcc agtatgaatt cgatgctttg 781 caccagttgg gcgactgggg aagtgtatac tcgaagggta catcaaacga ccgagagctg 841 ggaggtatga cttcaagatg tgcgaaggaa aaccagacct tcagctatcg catggcgatg 901 gacaaaacaa agagcaactt tgttgttatg aagcttgcaa aaatcgataa cggcaaaacc 961 ttgaagatat ccgttttgga cgaagttatt tataacgaag ttttgaacta ctcaggtgat 1021 gaggatattt acgaggtttg ggtcaagatt cccgatgagt tggttgcaca ggcgactacg 1081 gtttctgttg tcgagggcga cggaagcgtt aaggaatatg atacccttcg aatcggattc 1141 tcgggtgccg agggcgaaat atccgcccga cttgttgaag agctttacat tgccaccgga 1201 tattcccaca acgcatatat tgacgagatt tcctgcgagg tttcggatat tacatttgat 1261 gaaaaggaaa atgcatttgt gctccttgct cccaaggcac taaccgcgga tagattgaac 1321 gtcaagcttg cggatgcata cggtttgctt tatgttgacg gcaagctggt caacgatgcc 1381 aatccgataa agatcggtat tgttgacggt gaggtgcata ttctcaaagt atatgccgag 1441 gaccacgaaa caagcgatga gtttaagctt atcatcaagc agggaaaagg cggaaagata 1501 ccccaaaaag caaagctccc tcttattatt gcgggagcag cggcaatcgg cggaatcatc 1561 gcggcaattg caattaagaa taagaaaaag agaaaataga taagcaaaaa agagcagacc 1621 cccaaaaagg tctgctcttg aatttttgtg cttatgcctt gggagaatag tcaaattctc 1681 tcagggtgag gataacgtca aggttgccgt ttcttgttct tatcttatca ataaattcgc 1741 ggcggttaac gctttcgggg agattgatga taaatctgag ttcatacaaa gagccgaagt 1801 cggttgaacg aacctccttg aggttatatt catcggcata ttcatccaaa atatcgtcga 1861 atgcgccttc aaagttgaga tcctcgggaa tggtgatctt taaaagcata tttgttgcct 1921 tggggattcc aaagcgagtg atgctcaaaa ccagcattac agcacacatt acaattgtgg 1981 tgataaccgc aacgccgtaa tatcccgagc cgcaggcaac gccgatcacg attgcaaaga 2041 acaaaggaac aatgtccttg gtgtccttgg gatagcttct gattcgaagc agcgcaacag 2101 caccgcccaa ggaaaccgca gttacaacgc tggtgttaat gatcattgtg acgccggtca 2161 taagagggca aagcaaaaca attgccatgg gg // LOCUS sequence239 2190 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence239 VERSION sequence239 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2190 /mol_type="genomic DNA" /organism="" /note="sequence239" tRNA complement(494..570) /product="tRNA-Pro" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0130" /note="Aragorn_13" CDS complement(730..2178) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRFIALAFVLVMIFTLVGCGGEKREIVKLTLSTEDSEAILAAAG ITLPDVEEAKGANSTIIWFSWYDGFHNYDEAEIVNTGFWTFSEKYGGEIEWIETDYFER NDDLANLILAGTSPDFAPAGSSSTATFPMNCIKGMYQPVNDYIDYTTPLWSGMADAAEY FSLGDTVFAFVTDVTFRHIVPYNRRVIDEWGFDDPAELYANDEWTWEVFYDMCMDFSDP DEDRYALDGYSFNDALVQQATGTKIIGKDENGHFYSNIDDPMLEVANNLLYDLVKNGCT YHEGTNYWAGRNDHLAGAGLKEGLCLFYIATVDEFTGTVEEISAVWGDVTEGELMFVPL PRYENGDGNYYLTSIPTGYMLCTGASNPDGVALLASCERFKIIDPTVVSIDRKQLKETY LWTDEMLDMYDHCYELAQETVQMYYNGNLTDSLNSVYNSLRDGVARSNPPATWAQLKEQ YTDSLEYYLEEQNAIIDDYIASMG" /locus_tag="LOCUS_7300" /note="MGA_1007" ORIGIN 1 gaggcttata tttgtccgtc aaacgcttgt ccacactgct gacggcgatg ttatacagca 61 cacaacaaaa gctcgaaaag accgaattgt accacttcca gaggaggcaa tacaaattct 121 tgaacgaata aaagccagtg acagccaaag tggttttttg ttcacttcta aaaacggaaa 181 accaatcacc ttgcgcaact ataataggct ttacacgaag ttctttaatg aacggaaaaa 241 ggaacacccc gatttggttt acctctctcc gcataagctc cgacattcct atgctacata 301 tttgatttat tgcggggcag atgttgaaac tgtaaagaat ttactcggtc ataaggacat 361 cgctaccaca cagagatata ttcattcaag ccttgaacag atgagaacag cgacagaaaa 421 cctcagcttt aacatcggct aagagtatac aaaaagaaaa acagagcctc ttttgagact 481 ctgtttcata ttatggtctg agtgacggga cttgaaccca cggcctctac caccccaagg 541 tagcgctcta ccaagctgag ctacacccag attcacaaca ttaatattgt atcacatgtt 601 ttaagaaaat gcaagtgttt ttttgcaact tttttcaatt tttcaaaaaa tttttccacc 661 cgctccgcct ttgtgacaga gcgggtgaag tttaatctgc taacgtcgaa ttatcagcat 721 tttttgaatt tatcccatcg aagcaatgta atcatcaatg attgcattct gctcttcaag 781 gtaatattca agggaatcgg tatactgttc cttaagctgt gcccatgttg cagggggatt 841 ggatcttgca acaccgtcac ggagcgagtt gtagacgctg ttgaggctgt cggtcaagtt 901 gccgttatag tacatctgaa cggtttcctg tgcaagctca tagcagtggt catacatatc 961 gagcatttca tctgtccaga gatatgtttc cttgagctgc ttgcggtcga ttgaaacaac 1021 agtagggtca atgatcttaa atctctcgca ggatgccaaa agggcaacac cgtcagggtt 1081 tgaagcaccg gtgcaaagca tatatcctgt ggggatagat gtcagatagt aattgccgtc 1141 gccgttttca tatctgggca acggaacaaa cataagctcg ccttcggtaa cgtcgcccca 1201 aactgcagaa atttcttcaa cagtaccggt gaactcatca acagttgcaa tatagaataa 1261 gcaaagtcct tccttcaagc ctgcacctgc aaggtggtcg tttctgccag cccagtagtt 1321 ggtaccttca tgatatgtac agccgttctt taccaggtca tacaaaaggt tgtttgcaac 1381 ttcaagcatc ggatcgtcga tgtttgaata gaagtggccg ttttcatcct tgccgatgat 1441 cttggtgcct gttgcctgct gaacaagagc atcgttgaaa gagtatccgt ccaaagcata 1501 tctgtcttca tcggggtcag agaagtccat gcacatatca tagaacactt cccatgtcca 1561 ttcgtcgttt gcgtaaagct cagcgggatc atcaaagccc cattcgtcga ttactcgtct 1621 gttatagggt acgatgtgtc tgaaggttac gtcggtaacg aatgcgaaaa cggtatcgcc 1681 aagtgagaaa tactcagcag catctgccat gccggaccaa aggggagtag tatagtcgat 1741 ataatcattg acgggctgat acataccctt gatgcagttc atggggaagg ttgccgttga 1801 actggagcct gcaggagcaa agtctggtga tgtacctgca aggatcaagt tagcaaggtc 1861 gtcgtttctt tcaaagtagt cagtttcgat ccattcaatc tcaccgccat acttttcaga 1921 gaaggtccag aaacctgtgt taacaatttc cgcttcgtca tagttgtgga atccgtcata 1981 ccagctgaac cagatgattg tggagttggc acctttggct tcttcaacgt caggcagggt 2041 aatacctgca gccgccaaaa tagcctcgga gtcttcggtt gaaagcgtca gcttaacgat 2101 ttcacgcttt tcgccgccac agccaacgag cgtaaagatc ataacaagca cgaacgcaag 2161 tgcaataaat cttttcatag tatcctccaa // LOCUS sequence240 2190 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence240 VERSION sequence240 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2190 /mol_type="genomic DNA" /organism="" /note="sequence240" CDS complement(57..386) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLFILLVNFYRRFISPLKPPCCRYYPTCSAYALEAFKKHGAIK GLILAIWRLLRCNPWSGGGVDYVPDKFHLYTLKSEHKRKSTQTKEKTEFEINCPKDRAF DTEED" /locus_tag="LOCUS_7310" /note="WP_003701741.1 membrane protein insertion efficiency factor YidD (Ligilactobacillus salivarius) [pid:56.0%, q_cov:68.8%, s_cov:86.2%, Eval:4.4e-22, partial hit]" /note="MGA_1008" CDS complement(383..718) /product="ribonuclease P protein component" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003429302.1" /transl_table=11 /codon_start=1 /translation="MLYTQVLKDPKVFTKLYRKGRFCACKAVVAYFMPNRLPFTRFAVS ASKKIGNAVERNRAKRILRELYRQNEMKMPIGYDIVFVAREDIKDKKTPELEYFIPRLT KEMSREK" /locus_tag="LOCUS_7320" /gene="rnpA" /EC_number="3.1.26.5" /note="WP_003429302.1 ribonuclease P protein component (Clostridioides) [pid:39.8%, q_cov:91.9%, s_cov:90.4%, Eval:3.2e-15]" /note="MGA_1009" CDS complement(787..930) /product="50S ribosomal protein L34" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003568442.1" /transl_table=11 /codon_start=1 /translation="MAQIKRTYQPKKIHRKKEHGFFKRMATKNGRKVLARRRAMGRAKL TY" /locus_tag="LOCUS_7330" /gene="rpmH" /note="WP_003568442.1 50S ribosomal protein L34 (Lacticaseibacillus) [pid:73.8%, q_cov:89.4%, s_cov:91.3%, Eval:2.1e-11]" /note="MGA_1010" ORIGIN 1 accagccagc aaagccacat tagcttaccg aagggccacg cgataatttg ccacatttaa 61 tcttcctccg tatcgaatgc ccgatccttc gggcagttga tttcaaattc tgttttttct 121 tttgtttggg tgctctttct tttatgctcc gactttaggg tgtataggtg gaatttgtcc 181 ggaacatagt caactccgcc gccgctccag gggttgcagc gcaaaagccg ccagattgca 241 agaatcagac ctttaattgc gccgtgcttt ttaaatgcct caagggcata tgccgagcag 301 gtgggataat atctgcagca gggaggtttt aagggagaaa taaatctccg atagaaattt 361 acaagcaaga tgaacagttt tttcactttt ccctgctcat ttcttttgtg agccgcggaa 421 tgaaatattc cagctctggg gtctttttgt ccttaatatc ctctcgggcg acaaaaacaa 481 tgtcatatcc gatcggcatt ttcatttcgt tttgccgata aagctcccga aggattcttt 541 ttgcacggtt acgctcgacc gcattgccga tctttttcga tgcactgacg gcaaatcggg 601 taaaaggcag tctgttgggc ataaaatatg ccacaacagc cttgcaggcg caaaagcgcc 661 ccttgcgata taactttgta aaaactttgg ggtcttttaa aacctgcgta taaagcaaga 721 caatcacctt tcaaagaaat ctcttactaa aaataaagac cacaactcgc tgtggtcttt 781 gaggcattag taagtgagct tagctcttcc cattgcacgt ctgcgagcca aaaccttacg 841 gccgttcttg gttgccattc tcttgaagaa gccgtgctcc ttctttctgt ggatcttctt 901 aggctgatat gttctcttga tctgtgccat gtttatcttt cctccttgtc cataaaatcg 961 gtatgggcaa aatttgcacc ttgaacccga atcaattaaa aacagggttc ttcggtagat 1021 acccttgcaa tttagtatta tataataatt gcaaactaaa agtcaatagg cttttaaaag 1081 atttaattaa aaaaccctct taaatcgttt attccggcat acagctttgt ggaaatgacc 1141 aaaatatagt atactattta taatatattt tccttgaaaa attccacact ttgtagtata 1201 attatattaa caatgcaaag atgggaaaat atctgtcttt tgccgcgaaa accgaatttt 1261 taaatgaggg aaaaattgaa aatcaagaaa ggattttgaa aatatatgaa ctctttcaac 1321 gaactttttg agagtgtaaa acgcgcttgt caagccgatc ccaaggtcag cgacatcgga 1381 tatcagagat ggatcgcaaa gatcgaagca attaaacttg aaggcggaaa agcatatttg 1441 caggctgaaa acgattttca gcgtcgaact gttgaagact actatatgga cgttttgaaa 1501 cgcgcctttg aacaggtttt aggcttccct gttgaagttg agcttttact taaagaggac 1561 aacaaaggcg acggttacca tgagatcgag cgcagaatgg ctgaccttat gaacagccac 1621 cgcagaagcg attatgacct gacctttgaa aacttcatca agggaaaatc aaacgagctt 1681 gcatatgctt attgcattgc agtttcgggt aaaaacaacc ttaacaaaaa tgtttcaatg 1741 tcggtgttta acccgctgtt catctatggc gactcgggtc tcggaaaaac ccaccttttg 1801 cgcgctattg aaaacgaagt aagacgcaat catcccgaga tgaatgtgat ctacaccaca 1861 ggtgagcagt tcaccaacga gatcatccag gctgttgccg aaaaggacac catttccttc 1921 cacgaaaaat accgcaactg cgatttcctt ttggtggacg atattcagtt tattgcaggc 1981 aaggaaatga cccaggaaga attcttccac accttcaact ccctttatga aaaaggcaag 2041 cagattgtct taacatcgga tatttccccc aaccgcatca acaagctgga ggacagaatt 2101 aaaacccgct ttactttggg tgtacaagct gacgttcagg cgcccgacta tgaaaccaga 2161 atggcaagcg tcaagcgcaa ggcagagcgt // LOCUS sequence241 2167 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence241 VERSION sequence241 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2167 /mol_type="genomic DNA" /organism="" /note="sequence241" CDS complement(947..1303) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFTAILSRDAEWASKMGERILNQSIPLGRYVALKLFESPQKLLRH LKTHGCGTVIMSIDHMDDLDYARDISETGARLILLTDSNDIAIKAYSVCPDYCALKHPD AEDFERISSIIFCA" /locus_tag="LOCUS_7340" /note="MGA_1013" ORIGIN 1 tcggacatga gcacaacgat aggcattttg tcaacgcctg cctggaagga tccgccatca 61 acggtcacat cgttgacact tgaaagaatg tcgcctgcca tgtccatacc gtactggatg 121 taggtaccgc cggagatgct ctgggtcttg acgcttactg cgttgccgtt gccgccaaga 181 aggttttcgc ctgttgaaat tgatgcgctg taagaatatg ttacctggtt gttgccgccg 241 ggtctgccgg gacggtttcc gccgccctgc tgggtcttgg tccagttgaa ggtgataaaa 301 tcgtcgcctt cgttttcaac tgagtatctg tccaagggca ggaaaacagt tccgctggtg 361 gaatagagca cgatgccgac acggttgtgt ctgttgtttg ccaaaagggt cttaattgca 421 tcgttagccg cttcgatcat tgttgcggcg cggctgttgt ttgctgcatc gtcagacgag 481 atgttgttaa acatcgagcc tgaaatatcc aaaacgaaga ttgtgtcggt gggggtataa 541 gcatagcctg ttattgactt tgtggatgcc aaagcggaca gcgcaacgat gaagttgttt 601 tcatcgctca aagtcagctt tgcagcatca gtcgcattca agcttgcagt cagttcgctc 661 aaatcggttt catcaaatac cgatttatcg acccaaatgc cgcctgcgtt ctcggttccc 721 aaattgtcac caaagaactc tttccaaccg ttaattgtcg ataagtctga tacagttgaa 781 attgcctcgg gaaccgccgc gtgaaggaag ttgaatcccg gaactgcaga caaagccatt 841 gccaaagcag ttgctacagc agtcagtctt ttaatcaaac cgtttcctct catatttgtt 901 tgcctcctaa tatgtaaaag ataaagatgt tttcaagttt tcaactttat gcgcagaaga 961 ttattgatga tattcgctca aagtcttcag cgtcgggatg tttcagcgcg cagtagtcgg 1021 gacagaccga atatgcttta attgcaatgt cgtttgagtc ggtcagaaga atcagccgcg 1081 cacccgtttc gcttatgtcc ctggcgtaat ccaagtcgtc catatggtct atgctcatta 1141 ttactgttcc gcatccgtgg gttttaagat gtcggagcag tttttgtgga gactcgaaca 1201 gtttcaaagc aacatatcgc ccaagcggta tggattggtt gagtattcgc tcgcccattt 1261 tgcttgccca ttcagcgtcg cgtgataaga tcgccgtgaa cataatctca ccctttcggt 1321 aaaaaacttt aacatggttt ccatattttt catgttaaat atatcacaaa tttttctttg 1381 aaacgaaaac attgcttaaa acgcaatttt tttgcgcgaa atgcaaaaaa ctcgttttta 1441 atcttgaatt cccaaaacta tgggagtata atttatacta tccggtatac cattttaaat 1501 tatatattat atttgacata ttaacttcta atttagggag atgttttaaa atgagagtcg 1561 cgatatgcga tgatttggcc gaggaaagaa aaatcattaa aaactatcta agacgccttg 1621 ataccgaaga gcacctggag cttgagatat atgagtttga caggggcgaa gccttgcttg 1681 actatatgaa aaagggcaaa aacctgcctg attttctctt cttggatata tatatgggtt 1741 cctgcgacgg aatatcggta atgagagagc tgagaaattc cggatatgag ggaagcgttg 1801 tattttgcac cacatctgtt gaacacgccg ttgagtcata taagctcaaa gcggacggat 1861 atctggtgaa gccatataat tatgaggact tccttgaagc catctggcgt tgccgcagac 1921 attttgaaaa gagcaaaaag gtgctgaaat ttgtttcgga aagacttgac tacgctattc 1981 cctatcagga tgttttatat attgaaaccg aggcgcgcac ctgtgctgtt cacaccaaaa 2041 aggatacctt taatacatat aaaaaaatcg gcgaattcga gactgagctc tcaggcgaga 2101 actccttcat taaaatcggc agaagctact tggtgaatat gaacgctgtt aaaaagcttg 2161 ataacga // LOCUS sequence242 2167 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence242 VERSION sequence242 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2167 /mol_type="genomic DNA" /organism="" /note="sequence242" CDS complement(83..616) /product="nitroreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005902348.1" /transl_table=11 /codon_start=1 /translation="MIKNEALEVLTTRRSVKGYLDKPVSKEQLEAILAAGINAPTGRNL QAPKIVAVTDPETVKYLSKLNAAVMGASGDPFYGAPCVFVVLADKNIRTAIYDGCCVMA NLLNAAHAVGLGACWIHRAKEVFDSPEGKELLKKWGIEGDYEGIGNCILGYPSGNFPAP KAHKADYVVYVGEN" /locus_tag="LOCUS_7350" /note="WP_005902348.1 nitroreductase (Fusobacterium nucleatum) [pid:44.5%, q_cov:96.6%, s_cov:98.9%, Eval:7.7e-39]" /note="MGA_1016" misc_feature complement(1013..>2167) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011861612.1:NFACT RNA binding domain-containing protein" /note="WP_011861612.1 NFACT RNA binding domain-containing protein (Clostridioides difficile) [pid:34.4%, q_cov:99.7%, s_cov:65.1%, Eval:2.6e-60, partial hit]" /note="internal stop codon at [1013:1015](-)" /note="MGA_1017" /locus_tag="LOCUS_7360" ORIGIN 1 agcgcgcaga caagcggtgt aatattatat atcgctatcg ccgcaacgag ataccacagc 61 gttttttcaa atcgctcgcc catcagtttt cacctacgta tacaacatag tcggccttat 121 gcgccttggg tgcggggaag ttgcccgagg gataacccaa aatgcagttg ccgatgccct 181 cataatcgcc ttcgataccc cattttttca aaagttcctt gccctcgggt gaatcgaaaa 241 cctctttggc acggtggatc cagcaagcac ccaagccaac cgcgtgagcg gcgttcaaaa 301 gatttgccat tacgcaacag ccgtcatata tcgcagttct tatgttttta tcagccaaaa 361 cgacaaaaac gcagggtgcg ccatagaatg ggtcacccga tgctcccata acggcggcgt 421 taagcttgga gaggtatttc accgtttcgg ggtcggtgac agcgacgatc ttcggggcct 481 gcagatttct gcccgtggga gcattgattc ctgcggcaag gatcgcttca agctgttcct 541 ttgaaacagg cttgtcaaga tatcccttga cagagcgtct tgttgtcaat acttccaaag 601 cttcgttttt aatcataatt tatttctcct ttctcaacgc ttcgaccgtt tcggcatcag 661 gtgtgacata tagggttttg ttatttgtaa atattaccat gcccggtttt gcgccggcgg 721 gctttttaac gaactttgca aaggtataat cgaccggaac cagcgaggaa tttcgggcag 781 atgagttata tgccgcaatt aatgccgctt cgtcgatcgt ttcctcgggc ggagtggtac 841 cctcacattt tataataacg tgggaacccg taaaatcgtg ggtgtgaagc caaatgtccg 901 acttctcggc aattttaaga gttaaggtat cattctggcg gttgttgcgt ccaaccagaa 961 ttgtatagcc atcgctcgat gtatattcaa tgggcgggag cgccttcggt ggctattgtt 1021 tgtttttcgg ctgtttaaga tagccgctct gccaaagctc gaggcggatt tccgagaggt 1081 cgctctctgt tgatgcgcgc gagagcgaat cgaacaccga gtcgatatat ttaatttctt 1141 cctcacccga tgatatcagc tcgcggagct ttttgtcggc agtgtccgcc ttgcgatatt 1201 cggtgtaata cttctgagca ttttgggcag gtgtaagcct cgggtcgagc ttgattttaa 1261 tttcggggca ggcttcatca tagaaattct ccaaaattgc ctcacggtcg cccttttgga 1321 ttcgatatag gttcgccatt atgaggtcgc ccataaggcg aagctcatcg cggttctgac 1381 agtccaaaag ctcttgcttt tgcgacgcca cacggcgctt gatgcgttcg gtaaggctca 1441 ctatcatttt aaagagatcg tctgcacgct ggcggttctg attgatcaca tcccgctcaa 1501 aatagaagtt atcgagcaat tcgcagggcg attcaaactc gcgggtggac ataagatttc 1561 catattgaga aatggcggtg aagcaaaagt cggtcatctt gccgcttttg tccttcaaaa 1621 gaacgtattt gttttcgccc tcaagaatct gccgtgcggt gtttttaaga tagaacgcca 1681 agcggtcccg ctcgtcggca ttgagttcgg aaactgttct gtcctcaccg cgggcgcagt 1741 aatgcacagc ctcgcgggca aaaacaggcg aaattccctc aagggtcttt aaaatcgcct 1801 tagacaattc ctgcgcaggg tttttctcaa gatttaagaa aaattcatcc acatccaaat 1861 tcaaaaggct caaacgctca tctctcggcg gaagagtata gttcattccg ggcaaaactc 1921 tgcgcacact tgacatatcg tcgctgacgc gcttgattgc atcaataatt ctttggtcct 1981 tgccgattaa gatgatgttt gagcatctgc ccataatctc gcaggcgaga gttaaggtga 2041 cgcggtcgcc aagctcgtcg gtagcttcaa aatcgaaata taaaatacgc tcaaagccat 2101 cctgacgtat tgaaaccagc ttgcccgatg acagatgctt acgcataagc atacagaaca 2161 tcggcgg // LOCUS sequence243 2146 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence243 VERSION sequence243 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2146 /mol_type="genomic DNA" /organism="" /note="sequence243" CDS 837..1538 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLTISIVAILMAMALTVSVFAVDMKYIDPSTPCYTYTVNGDIT ELTATVTILDFVYDEASWKDGAIQDGAGWNDWCGQFIVVTAPDGTVHYHDWGGASVTWG ADFDGDGVAETEGNNWGSTTWLAEVAAGQTVDFVVPVYGVGTVVEFFVNSWDIYLGVQY TLEVSGDTEAPVVEETPAVEEESAVEETPAVEDTPAVEEPKEEEPADTGLALAVVPAVL AMAVAVISKRK" /locus_tag="LOCUS_7370" /note="MGA_1019" ORIGIN 1 atagaggtca ctatttcctt aaccccggcg aagttggaat gagctattca aacaaccata 61 ctcacttgca taaattcaaa ggtgaatatt acataatctc tcactcccta atattaaagg 121 acagtatgaa aattgcaggc ggattcagaa gcttgatggc agacaacatt gaagttaacg 181 aaaagaaact cgagatcgag cttatcggta catcgactga aggcgcaaag cagattgagc 241 ctcttaaccc ctattacgca cattgcggaa cagaagccag catctctgca gatatcggat 301 atgttgattc ggacggagaa cttaacaatg tcagcgctgt cagcaagacc gcaggctctt 361 ggttatatat taaaggcgcg aaatttaaag acacagccaa gtttatggca tcggttaagg 421 gcaagggcag aattgaaatt cgcattgatt ctaaggacgg tgatgttgca gcggcaattg 481 agtttgattg cgatgagctg acaacggttt ataccaacaa tgttaatgtc cccaacggag 541 aacatggatt ctatattgta ttctccgacg agaacatcgt attggatgct tgggaatttg 601 cgaagtaaaa acagcaatct tcataatatt ttcgtatatc acctctttat acccctcggg 661 aattctcgag gggtataacc ctttgtccgg aaaatgcaca caagcttagt aaattgtgca 721 catttcaaga ttttgaaacc tttcgatttt tggtataatt aactcgtgac tattcagcaa 781 ttcaaaatgt ttgcttgctg aataatcgca aaaatactta tttggaggat atttaaatga 841 aaaagctcac aatttcaatt gtagcaattt tgatggcaat ggcattgact gtttctgttt 901 tcgctgtcga tatgaagtat atcgacccct caactccctg ttacacctac accgtaaacg 961 gtgacatcac cgagcttaca gcaaccgtca ccattttgga cttcgtttat gacgaagcaa 1021 gctggaaaga cggcgctatt caggacggtg cgggatggaa cgactggtgc ggccagttta 1081 tcgttgttac tgctcccgac ggaaccgttc attatcatga ctggggcgga gcttccgtaa 1141 cctggggtgc cgactttgac ggcgacggcg ttgctgaaac cgaaggaaac aactggggaa 1201 gcacaacttg gctcgctgaa gttgctgcag gtcagaccgt tgactttgtc gttcccgtat 1261 atggcgtagg cacagttgtt gaattcttcg ttaatagctg ggatatatac cttggcgttc 1321 agtatactct tgaagtttcc ggcgacaccg aggctcctgt tgttgaagaa actcctgcag 1381 ttgaagaaga gtccgccgtt gaagagactc ccgctgtaga ggatacccct gctgttgaag 1441 agcccaagga agaagaaccc gctgataccg gtcttgcttt ggcagttgtt cccgctgtat 1501 tggctatggc agttgctgta atcagcaaga gaaaataata aatagttttt tcttcattag 1561 aataacttcc ataaagtacc cctcggaaat tcccgagggg tgcttttttt gctgataaca 1621 tgacataaaa aagttcccca gcggttttgc ttggggagct tttatgttag tgctttgaaa 1681 gtgcgttgcg atattgggtg ggtgtctggt taattcgcga tttgaactga cgcataaagt 1741 gaagatcgca tttatatccg cagagctgtg caatttgatt tacgggcaga tctgtggtgg 1801 aaagaaggta tttcgcgtgc tcaattcggc tttgaattac atcatccatc gcactgacac 1861 cgaaggtctt tttatataga tgctggaaat atgatttgct catagccaac tcgtgggaaa 1921 gccaatcaat atcccaatcg ttatatggct tgttatatat ttttgagcgt ataattgcca 1981 gcttgtcata atgggaactg acctttttgt aatcatccga atgaacagcc tcgctgagtt 2041 tgaggaagaa tagcttcaaa tatagatcac aagagtaggt cctgaatgtg ttggaggagt 2101 aatgctcgta tgacatactt ttaatcagca ttgacagacc gttgat // LOCUS sequence244 2137 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence244 VERSION sequence244 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2137 /mol_type="genomic DNA" /organism="" /note="sequence244" ORIGIN 1 agcttgtcgg cggtggtata gtcggttgaa acggtttcgg ggttgttgtt gatgataatt 61 gcctcgtaac cggagttctt gatggttgca acagcgtgaa cggtggagta atcaaactca 121 acgccctgtc cgatacgaat ggggcctgca cccaaaacaa cgatcttttt cttgtcggtc 181 aatctggatg cattatctcc gctgtaggat gagtagaaat aagggatata tgcgcctgtg 241 tggcaggtgt caaccattct gaatacaggg aagattccgt tttccttgcg gatattatat 301 acatccatct cggtattctt ccacatacgg gcgatatact tgtcgctgaa gcccatcttc 361 tttgcggcga tgagggtttc aacgtccaag gggttcttct ttaaggtttc ttccatgtcg 421 ataatatttc ttatcgcttc aaggaagtaa ggtgtgatct ttgtaatatc gtggatcttc 481 tcaacgctta cgccgtgata taaaagctcg gcgattgcaa aaatattgtc agagcggaat 541 tccttgatat aatcaagcaa ttcttcaacg ctcatattgt caaacttggg gtgataaatg 601 tggtttgcac cgatttcaag tgaacggatg cccttaagca gagcttcttc aaggtttgca 661 ccgattccca ttacctcgcc ggttgccttc atctgtgtgc ccaaggtgtt gggagcagag 721 gtaaacttat caaaggggaa tctggggagc tttgcaatta catagtcaag cctgggctca 781 aatgccgcgt tggtgtttgc aatcttgatc tcctcaaggc tcataccgac tgcaatcttc 841 gcggtaactc gcgcaatggg gtaaccggaa gccttggatg caagcgcgga agaacgggaa 901 actctggggt ttacctcaat gagataatac tcgctggtgt gagggttaag tgcaaactga 961 acgttgcatc cgccttcaat cttcagctcc ttaatgagct tgattgcgga gtcgttgagc 1021 atcttttcgt cctctttgct cagcgtcata atcggagcaa caacgagcga gtcacctgta 1081 tggacaccga cagggtcgat attttccatt ccgcagatgg tgattgcgtg gtcaagcgag 1141 tcgcgcatta cctcaaactc aatttccgta tatcccttaa cgctcttttc aatcaatacc 1201 tggtgaacag gggagagctt gaaagcgttg ttgccaatgt cgataagctc ggcttcgttg 1261 tttgcaaaac cgccgcctgt tccgcccaag gtgaatgcag ggcgcaaaac aacggggtaa 1321 ccgattcttt cggcggctgc cttagcctct tcaatgctgt atgtgatttc ggagggaatg 1381 gtgggctcac cgatagattg gcaaagctct ttgaaaagct ctctgtcctc agcgcgctcg 1441 atactctcgc tggaggtgcc caaaagctca actccgcatt cgcgcaaaac gcccttcttt 1501 tcaagctgca tagcaaggtt taagcctgtc tgtccgccga taccgggcaa aattgcatcg 1561 ggacgctcat agcgcaggat ctttgcaaca tattcaagtg tcaaaggctc catatatacc 1621 ttatcggcaa taacggtgtc ggtcataatt gttgcggggt ttgagttgca caaaacaacc 1681 tcatagccct cttctttaag ggcaaggcaa gcctgtgtgc ctgcatagtc aaactcagcg 1741 gcctgtccga ttacgatagg gccagagccg atgatgagaa ttttcttcaa gtctgttctt 1801 tttgccataa aagcatcctc cttatatatc aatgctcaaa ttaaatcaaa ggttgttata 1861 tacaatttcg ccgttgtgaa ctgtcaaaag gcatttgccc gacagcgcca ttccctcaaa 1921 gggtgtcgcc ttgccgaggg ataggaactc gctcgggtca accttaaagc cctgctctaa 1981 atcccaaagg gtgaagtcgt tattaaaggg gattccgaat ctcactcgcg gattgattgc 2041 cataagctta accatatctt caagggttat tattcccttc ttaaccaggt gcgtatacat 2101 taccgcgacg gctgtttcaa gtcccacaac gccgaat // LOCUS sequence245 2136 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence245 VERSION sequence245 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2136 /mol_type="genomic DNA" /organism="" /note="sequence245" ORIGIN 1 ggcgcaccgc actatatcgc gttggttgta tatatgcccg aggaaacagg caacgaagcc 61 aaccacgatt cggattacga tgcacctgta atcaccctgg cgtaagcctt gaggcaacac 121 agatgtcaag cgagagcgac tccttcggca agacatatga cgagagcgca tcatttgcag 181 aaaagcctct cagcgtgtcg gtttcaatgc cgattgcaaa gaaggttgca actgaaacag 241 atgctagcac aggtgaaact gtaaccaaga tcgctgaaga agtaattatc gagagcgaaa 301 gcaacggcat tattgcgaaa attcctgcag acgttgttgt tgcagacggt gcaactgagc 361 tgaagctcac agttaaggaa atggatgaaa caagctcaca ggcaaacatt agccttgaag 421 acggcgaggt taagaattcg ctcgaaattg acatcgacgg cgttgctgat aacaacacca 481 cacccattca tatcaccctt gagggactaa tggacagggg gctcaacacc accagcgttt 541 cgatgtatca cgttgaaaac ggccagaccg ttgcaatgac cttggttaac tcccccgcag 601 atttggatac tcacaacgag ttctattatg atcccgcaac gggcaacgtt actgtttgcg 661 ttgcgacatt ctctgagtat gtcgctgtta caaatgactt taacctttgg aaaggcggat 721 ttgactactc ttggtataac accaccgata aagaattcac attgaatacc gccgatcagc 781 ttgcaggctt cggcagtatc gttgatggca ccgcagaagg aatcgccgca gactcctttg 841 agggcaagac agttaagctt ggcggtgaca ttgacctcag cggtggcgtt tccctcaacc 901 ccatcggttg cggatatgtt tccggtgtcg gcaactccaa cggtgtaacc ggcagagcct 961 ttatgggtac atttgacggc cagggccaca ccatctatgg tctttaccag aacggttggg 1021 atttgggatt gtcatattgc aacctgggcg gcggtttgtt cgcttctgtt gcggatgcaa 1081 ctatcaagaa cctgactatc agcggcgcaa acgttgttat ggaatgcgtt gaaatgggct 1141 ttgttgcagg tcttgcacag ggcaactgca ccttcgataa cattgacatt tataactcca 1201 agatcgccaa ctatcagcgc gcaacaggcg caatagtcgg tgaggtgagt gcatataacg 1261 gcggcggtac ttgcacattt aaagacatca acatcggttc ggacgttgtt gtcggctccc 1321 tttggggcga cttcgactgc cctgtcggcg gtgtaatcgg cgcaagatgg gatgatgcaa 1381 atgtgaccag cgttgtaatg gacactgtca acgttgcttg cagacttgat gtttataacg 1441 acgttacatc gagctatcag tggtatgctt accgcagagc gggtatgctg atcggcaata 1501 ccgatatggc tgacggtcac accgcaaccg caaacttctt gacttgcgaa gacgttgttg 1561 tatactatgg cgactgggtg aactatcact actgcgagtt taacaaccac aactcaagct 1621 ggcccttcgt tagagttgag gcgggcgaaa actgctcggc attttctaac cccagatggg 1681 gcgtgccgaa tgatataaac ggcgtcaagg taactcctga gcatcacaaa gtgcaggatt 1741 ataccattca ccaagaaggc gatgattgct acgttttgct tcccttcaac cagctttacg 1801 gcggcggaca gggtgtttac ggacagactg cacacgcagg tgtgacagca agcaattatg 1861 cttacacaat ccagtacatc aacgacaata aggttttggc tgaaactttt gttgagtcaa 1921 atgctactga ttttacattg acggatgacc ccaattatgg cgccgctaag aaggcagcag 1981 aagattgggt tataggccaa ggctacaacg ttgagtttgg cggatgggaa aatgcaggtt 2041 ccaccaaggt taccgcggtt cctgcaggca atacggaaag catcaagctg ttcccctatt 2101 tcaacagccc tcatactgca agattcgttg accaga // LOCUS sequence246 2132 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence246 VERSION sequence246 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2132 /mol_type="genomic DNA" /organism="" /note="sequence246" CDS complement(1720..2055) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTEIGLVPNLIGCCECVTYSAQNMQFDLKYGKLYCENCCGARDLR NFEVLDPTLLHAVRHIALTDMERLFSFKLSDEYMPLLANITERYVRIQLDKRFQTLDFY KILTNGN" /locus_tag="LOCUS_7380" /note="MGA_1026" ORIGIN 1 ctcttgcttc gcgtttggca aggtccactt ccctatcctt tttctcaatc agctcgtttt 61 tctctttaac aagtcgatct ctgagttctt cagtttcgcg gcgatatttt tctgcaagtt 121 ttgtgtgttc ctcaagctgc tgtctcgtcg cttcaaggtt atcaattacc ttttcaaagc 181 ggcgagattc accagaaagc atattttccg catttttaat aatatcatcg ggtaatccta 241 aacgcgatga tatagcaaat gcgttggatt taccgggcga gccgataatc agtcgatatg 301 tgggctggag cgtcttaaca tcgaactcgc aggaggcatt ttcaacgccg tcttgttcta 361 atgcatagag tttcagctct tgatagtgag ttgttgtaac caactttgcc ccaaggctct 421 gaatcttttc gattattgcc acagccaatg ctgcaccttc aacagggtcc gttcccgaac 481 caagctcgtc aatcaaaaca agcgatttgt aatcaacggt gtcaagaatc tcaataactt 541 tgttcatatg agatgagaag gttgaaagac tctgctcaat tgattgctga tcgccgatat 601 cgactaaaat cttatcaaaa actgtaattt tactgccatc tgataccgga atcataagtc 661 cgcacatagt cataagggtc agcaagccga cagtcttcaa aattactgtc ttaccgcccg 721 tattagggcc tgtaatgata agagaatcgt atgcgttacc taatgcgaaa tcaatgggaa 781 cgaccttgtt gcggtcgatg agcgggtgtc ttgctttttt gagaattatc tcgccgtcat 841 cggaaatttc gggaatagtt cccgccattt ttgctcccaa attggctttt gcaaaatata 901 ggtcgagttt gacagctgcc tcaaagtcgg aaataagctg atcggaaaac atggctactt 961 ctgcggataa ttccttgatt atgcgctcaa tctcgtcctg ttctttgcat ttgagcactc 1021 ttatctcgtt gtttgcttca acaaccgcca tcggttcaat gaagaatgtc tggccggatg 1081 ctgatgtatc atgaacaaga cccgcaacgt tgtttttatg ctctgatttt acaggcaaaa 1141 catatctacc gtcgcggatg gttacaaggc tttcctggag ataggtctgt gtatcggaag 1201 atttgatcat tttatcgaga gtttctctga tcttggcgcc ctgcaaaatg atttttcttc 1261 ttattgatgc aagctccggg ctggcggagt cggctaactc ttcttcattc aaaacagcgt 1321 tgttgatttt atcatacaac cgtctgtttt caaaaagaca ttcaaacaga taatcaagct 1381 taaattcttc ctcaaactgt cttctccagg atatgagcat ttctgtttgt gaaagcattc 1441 ttgcggtatc catcagctca cgcaatgtta aagatgcccc gttttgagct cgctttgcaa 1501 tcgttgcggc gtctgcgaag ttgattgacc ccggtgtgcc gaatcgcaca gtctggttgt 1561 atgcatcaaa ggtttttaat gcttcggttt taacattctc aagatcagtt gacgggacga 1621 tttcgccggc aattttacgg gaaaaatcgt tatggcactc ccccactaac atctcaagaa 1681 ttttatgtaa ttcaagtgta atatagtgat cattcataat tagttaccat tagttagaat 1741 tttgtaaaaa tcaagtgttt ggaagcgctt gtcaagctga attctgacat agcgctcggt 1801 tatgtttgcc aaaagcggca tatattcatc cgaaagctta aagctgaaca gacgttccat 1861 atcggtcaac gcaatatgtc ttacagcgtg caaaagtgtg ggatctaaaa cctcaaagtt 1921 tcttaaatct cttgcgccac agcaattttc gcagtataac tttccgtact taaggtcaaa 1981 ttgcatattc tgtgctgaat aggttacaca ttcacagcaa ccgataaggt ttggcaccaa 2041 gccgatctcg gtcataaggc gcatttcaaa tatgcatttt aaaatctcat tgcttttctt 2101 accttccgaa aggaagtgta aacagttcaa aa // LOCUS sequence247 2128 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence247 VERSION sequence247 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2128 /mol_type="genomic DNA" /organism="" /note="sequence247" CDS 216..425 /product="DUF3006 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963615.1" /transl_table=11 /codon_start=1 /translation="MLIIDRFEDGFAVCENGDKLDRISISLIDPDAREGDVINIGEDGL YHLDREETDKRKANILKLLNNLWE" /locus_tag="LOCUS_7390" /note="WP_010963615.1 DUF3006 domain-containing protein (Clostridium) [pid:44.8%, q_cov:95.7%, s_cov:90.5%, Eval:6.2e-08]" /note="MGA_1028" CDS 433..1308 /product="MurR/RpiR family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003358959.1" /transl_table=11 /codon_start=1 /translation="MNGDLFAYLNEWMPKISKGHKKIAQYILAHYDKAAFMTAAKLGET VGISESTVVRFASELGFDGYPGLQKVLQEAMRNKLTAVQRIEVSSLDQLGDGEVFKRVL LHDIEHIRHTLEETAMDQFNSAVDHIVKSKHVYVMGVRSSSALASFMAYYFKLMLPEVT LVQTGSRSELYEQILRIGEGDVMIGISFPRYSKQTVHAITYAHNNGAKSIAITDSLESP IAANADNVLVARSDMVSFVDSLVAPLSLINARSVAVSIKNKEMVSSNFSMLEKIWEEYD VYEKNGETSR" /locus_tag="LOCUS_7400" /note="WP_003358959.1 MurR/RpiR family transcriptional regulator (Clostridium) [pid:55.7%, q_cov:96.2%, s_cov:94.6%, Eval:1.1e-83]" /note="MGA_1029" ORIGIN 1 agctcaactt cttcgaccta tgaatttctc aatgctgtta cacctgattt ctgtgttatt 61 gagtgtggtg acaacagctt caaccatcca aattcacagg tagtaatgcg cttgttggag 121 tataccgaga acatttacag aacggatatt cagggaacgg ttgtgttcgt taccgatggc 181 accgaccttg aattcacata tgaggattta aactgatgct gataattgac aggtttgaag 241 acggctttgc ggtgtgtgaa aacggcgata agcttgatag gatctctatt tcgcttattg 301 accccgacgc ccgcgaaggc gatgtaatta atatcggtga ggacggttta tatcatcttg 361 accgcgaaga aactgacaaa agaaaagcaa atatcctgaa attactaaac aatttgtggg 421 agtgacatta aagtgaacgg tgacctgttt gcatatttaa acgaatggat gcccaaaatt 481 tctaaagggc ataaaaagat tgctcaatat atccttgctc attatgacaa agccgcattt 541 atgactgcgg caaagcttgg cgaaacggtt ggcataagcg aatctacagt ggtacgcttt 601 gcttccgagc ttggttttga cggctatccc ggcttgcaga aggttttgca ggaagcaatg 661 cgaaacaaac ttaccgctgt acagcgaatt gaagtttcat cgctcgacca gctcggtgac 721 ggcgaggttt tcaagcgcgt attgcttcac gatattgagc acatccgcca tacacttgaa 781 gaaactgcaa tggaccagtt caacagcgca gttgatcata ttgtcaaatc aaagcacgtt 841 tatgtgatgg gtgttcgaag ctcatctgct ttagcgtctt ttatggcgta ttactttaag 901 ctgatgcttc ccgaagtaac attggttcaa acaggcagtc gaagcgaatt gtatgaacag 961 atcttgcgca tcggagaagg agacgttatg attggaattt ccttccccag atattcaaag 1021 cagaccgttc acgcaattac atacgctcac aataacggcg caaagtcgat tgcaattacc 1081 gactctttgg aatctcccat tgctgcgaat gccgataatg ttctggttgc acgtagcgat 1141 atggtttcct ttgtcgactc tttggttgct cctttaagct taattaacgc gcgtagtgtt 1201 gctgtatcca tcaaaaacaa ggaaatggta tcctctaact tctcgatgct tgagaagatc 1261 tgggaagaat atgacgttta tgaaaagaac ggagaaacct cgagatgacg ggcgatgtaa 1321 ttattgtcgg cggcggtgct gcagggcttt ttgccgcttg tgagcttgca aagcactggc 1381 ttgatgttat tgttattgag ccgaactcaa agcttggccg aaagctccgc atcacaggca 1441 agggcagatg caatgtcacc aacaattgcg acattgatac aataattaaa aatattcctc 1501 gcaatcctcg gtttttatat agcgcattga atcagctttc acctgccgat gttatggaat 1561 ggtttgagtc ccgcagagta ccgcttaaaa ccgaaagggg agcgcgtgta tttcctgtaa 1621 gcgatgatgc aaacgacatt gccgaagcgc ttgtgcgaga atgcaagaag ctacatgtta 1681 agttcatcaa agataaagtg accgatatta tatatgaaga cagcgagatc aaaggcgttg 1741 agtgtgtaaa gggtatttac tttgcagata ctgtaattct tgccacgggt ggtttatctt 1801 atcccgcaac aggctcaaca ggcgacggtt acctctttgc cgaaaagctt ggccataccg 1861 tgaccgaact ttcgccatca cttgtgccga ttgtctgcga tgaaagcttt gtttgcgaac 1921 tgacaaagct ttcgcttaaa aatgtgactc tctcgcttta cgatgcgaag aaaaaatcac 1981 cgctgttttc cgaaattggt gagataagct ttatgcctta cggcgttgca gggccgctta 2041 gcttgtcggc ttcctgtttg atgtcgccga aattgcttga ggaaaggcga tataagcttg 2101 taattgacct taaaccggga cttactcc // LOCUS sequence248 2112 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence248 VERSION sequence248 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2112 /mol_type="genomic DNA" /organism="" /note="sequence248" ORIGIN 1 cataacctcg ggcttgtgaa tgattgttct tgcaaaggag ataagctggc gctgacctgc 61 ggagaagttg tttccgcgct cgcgaacctc ttcgtccaaa ccgttttcaa gcttatccaa 121 gatcttgtct gcatttacat atctgcaagc ttccatgatc tctttatcgc taaagctatc 181 ttctcgcaaa acaatatttg atcttatcgt tcccgagaag aggaaaacgt cctgaagcat 241 ctgtccgaag tgctttctaa gcgatgcaat ctttatattc ttaatgttaa ttccgtcaat 301 cagaatctcg ccctgctgaa tgtcatagtt tcggcagatg agcgacaaaa tggtggtctt 361 gcccgagcct gttgagccga caaatgcaac cgtctgaccg gcattcacct tgaaggatac 421 atctttaagc acccattcgc cctcgttgta tgcaaaccaa acgttcttga attcaatatc 481 tcctttgacc tcgtcaagct caattgcatc gggcgagtca acaatttccg gcttaatgtc 541 gaaaattgtg aatatctttt cgcttgatgc cattgccgac tggagccagt tgaacatttc 601 cgccaagttc tgaatggggt taaagaactt tgatatgtac aaatagaatg taacaacagt 661 tccacttgaa agggtctgac ccaaaaattc aacatctctt atatatccgc gtccgcccaa 721 ataaagcagg cacaaaacgc tggaaatata aagcatataa acgatcgggc ggaaaatgcc 781 gaaggtgaag atctgctcgc gcttggatct tccaagtctc aggtttttct cgtcaaactc 841 cgctttcttt tgttcctcac ggttaaagac ctgaatgatc ttcatacccg aaaggtgttc 901 cgaaaggaag gtattgatgt ccgttgtgcc gtccttaacc ttgcggaatg cttttcttga 961 gaactttctg aagatgatgg tgaaaagcag aatgaacgga acaaagcaga gcaccatcag 1021 cgtcagctga tagttaactg tcagcattgc aaccaaaaca cccacaatta caaagctgtt 1081 cttaacaagg ttaacaataa tgtttgtgaa catcattgaa attgcgttgg tgtcgttagt 1141 aactcttgtt accagcttgc cgacggggat gttgttaagc tgcgcatggg aaaggttttc 1201 aatgtgagtg aaaaggtcct gacggatatt tgaaaggatc ttctgacctg tcttttgcaa 1261 aacaactgcc tgaacatatg agcagataag ggaaacgata agtattcctg catagataag 1321 cacatatgaa taaagcaccg aaagctcaaa gtcgtcttta atcatctctt caaccttgcc 1381 gaccagggca ggggagataa catcatacgc aattgagaac atcattacca gcaaaacaat 1441 tccaaattgt aacttgaaag gctttgcata ttcgatcaga cgcttgatga tctccgagtc 1501 cttcatgttt cggtcaaagc cgattgcttc ctttttgtcc ttgatcatgg cataagccac 1561 aacaaaaata actgttaaaa cgccgacgat cgcgcccact gtcaaaagag gataaaattc 1621 atgcatatca gtgtgcctcc ttgtcggtat tcttttcaag gtcatcaagt ctttgcaact 1681 cgaccattgt tctatattcg ggacaattct cataaagctc attgtgcgcg ccgaccgcca 1741 cgaccttgcc gtcatcaata aagatgatct tgtccatgtt ttcaatcgtt gtaattctgt 1801 gggcgatgag tatggtcgtc ttgccctttc tcacatcgcg cagatttgaa agaattgcct 1861 tttcggtctt aacgtcaact gccgaaacgg agtcgtccaa aataagaatg gatgcgtcct 1921 tcataattgc acgtgcaatg gatatacgct gcttctgtcc gcccgaaacg gtcacgccgc 1981 gttcgcccaa aacggtttca tatccttctg caaactcgga aatattcgtg tgaacatccg 2041 acatctttgc tgcgttttca acgtcctcgt gagttccgcc gtcggtggca aatgcaatgt 2101 ttgcttcaat cg // LOCUS sequence249 2103 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence249 VERSION sequence249 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2103 /mol_type="genomic DNA" /organism="" /note="sequence249" CDS complement(339..1040) /product="tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex dimerization subunit type 1 TsaB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860649.1" /transl_table=11 /codon_start=1 /translation="MTVLGIDTSGKTASCAILRDGVLLGETTLYTKLTHSQVTLPLVQK LIDDCGLTLDDIDLVAVSDGPGSYTGLRIGISAVKGICFAGKSCVGVSTLEALAYNCLC AKATVFSVLAARPGIVYFGGYRSDGETLENIIPDGVYNLDELKSISEEIEGDIIIVGDC VSDVKQKLFTDNANVRMASIPDRLQKASGVCLCALAHEDKWGTAQSLNARYLQITKAEK DLKEGNLKHDK" /locus_tag="LOCUS_7410" /gene="tsaB" /EC_number="2.3.1.234" /note="WP_011860649.1 tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex dimerization subunit type 1 TsaB (Clostridioides difficile) [pid:31.7%, q_cov:97.0%, s_cov:96.2%, Eval:4.9e-25]" /note="MGA_1034" CDS complement(1021..1464) /product="tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex ATPase subunit type 1 TsaE" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000049642.1" /transl_table=11 /codon_start=1 /translation="MTISFITNSADETVSLGERIGALLEAGDIIAFRGGLGAGKTTITH GLAKGLGINAHVSSPTFALVNEYRGKVNLCHFDMYRIDGALDLESIGFYDYLDGENVLC IEWSENIESELPDGVITITIRRIDDETREITVDGDERFDSLGN" /locus_tag="LOCUS_7420" /gene="tsaE" /note="WP_000049642.1 tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex ATPase subunit type 1 TsaE (Bacilli) [pid:44.3%, q_cov:89.1%, s_cov:82.2%, Eval:4.7e-26]" /note="MGA_1035" CDS complement(1477..1965) /product="cytidine/deoxycytidylate deaminase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966160.1" /transl_table=11 /codon_start=1 /translation="MERRDKANYYLDIADAVSERSTCLRKRYGAVIVNNDQIISTGYVG APRGRQNCSDLGFCIRNELNVPRGERYELCRSVHAEMNAIINASREQMIGATLYLCGRE MDTGEYVKNTSCCSMCKRVVINAGIERVVIRDDDNNYRTILTINWIMDDESVAGTLGY" /locus_tag="LOCUS_7430" /note="WP_010966160.1 cytidine/deoxycytidylate deaminase family protein (Clostridium) [pid:63.0%, q_cov:100.0%, s_cov:100.0%, Eval:2.7e-58]" /note="MGA_1036" ORIGIN 1 cgtccgccca agcaaagcgc gttggcatcg ttatgcagac gggtatactt agcggagaag 61 gtgtccgagc aagtgcaagc gcggatgcct ttgattttgt tcgcggcgat tgaaattccg 121 attcctgttc cgcagatgag tatcgccttg tcgcaggtgc cgtcaacaac cttgcggcag 181 acgcgctcag cggcatcggg atagtcgatc gcttcgcccg gacctacacc gtagtcgata 241 tattcaattc cctgctcctc aaggtgcttg attatttcca gcttgagggt ggtacctgca 301 tggtcgtttc cgattcctat cataataata tcctccaatt atttatcatg tttaaggttg 361 ccttctttaa ggtccttttc agcttttgta atttgcaaat agcgcgcgtt gagcgactgc 421 gcggttcccc atttatcctc atgagccaaa gcacaaagac aaacgcctga tgctttttgc 481 aggcggtcgg gtatagatgc catacgcacg tttgcattat ctgtaaagag cttttgcttt 541 acatcagata cacaatcgcc gacaatgatg atgtctccct ctatttcctc ggaaatggat 601 ttgagctcat cgaggttata tacaccgtcg ggaatgatgt tttcaagggt ttcgccatca 661 gaacggtatc cgccgaaata gacgattccg ggacgagccg caagaaccga aaagactgtt 721 gctttagcac agaggcagtt atatgccaac gcttcaagag ttgatacgcc aacacagctt 781 ttgcccgcaa agcaaattcc ctttacagcg gaaatgccga ttcgaagacc tgtatatgag 841 ccgggaccgt ccgatacagc cacaagatca atatcatcga gagttaagcc acagtcgtca 901 atcagctttt gcaccaaagg aagcgttacc tgtgagtggg tcagctttgt atataatgtt 961 gtttcaccga gaagaacgcc gtcgcgcagt atcgcgcagg aagcggtctt tcccgaggta 1021 tcaattccca agactgtcaa atcgttcatc tccgtcaact gttatttctc ttgtttcgtc 1081 gtcgatacgg cgaatggtta ttgttattac accgtcgggc agctccgact cgatgttttc 1141 gctccattcg atgcataaga cattttcgcc gtcaagataa tcatagaatc cgatggattc 1201 aaggtctaaa gctccgtcaa tgcgatacat atcgaaatgg cagaggttga ccttgccgcg 1261 atattcgttt acaagagcaa aggtgggcga gctgacatgg gcattaatgc ccaaaccctt 1321 tgcaagaccg tgggtgatgg tggtctttcc cgcacccaag ccgccgcgaa aggcgattat 1381 atcccccgcc tcaaggagcg caccgattct ttcaccgagc gaaacggttt cgtcggcgga 1441 atttgttata aatgaaatag tcacgtttat ccttctttaa tatcccaatg ttcctgcaac 1501 cgattcgtca tccattatcc agttgatggt gagaatcgtg cgatagttgt tatcgtcatc 1561 tcttatgaca acgcgctcga tgcccgcgtt aattacaacg cgcttgcaca ttgaacagca 1621 ggaggtgttt ttaacatatt cgccggtatc catttctctg ccgcaaaggt agagtgtggc 1681 gccgatcatc tgctcgcggg aagcgttgat gattgcgttc atttcagcgt ggacactgcg 1741 gcaaagctca tatctttcgc cacgtggaac gttgagctcg tttcttatgc agaatcccag 1801 gtcggaacaa ttctgtctgc ctctgggggc accgacatag cccgttgaaa tgatctggtc 1861 gttatttacg attactgcgc cgtagcgttt tcttaaacac gtgcttctct cggatactgc 1921 gtctgcgatg tcaaggtagt agttggcttt atctctgcgc tccatggtat gacctccgaa 1981 attaaaatct gttatatatg aattttagca caaaacttta agcattgcaa caatatattc 2041 ataaaaagaa agtagctccc gtcttgtagg acaggagccg agggggatat tatatgattt 2101 gaa // LOCUS sequence250 2099 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence250 VERSION sequence250 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2099 /mol_type="genomic DNA" /organism="" /note="sequence250" CDS complement(641..1456) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKQIFNAKTVAEAKALAVSEFGVAEERIVFNILEEPKKGLFGMKG EAKVEAEYEMTKPEVAAQYIKHVMVAMGFECPEIAISDIEGGACLDISGEGAEGIIGRR GEVIDSLQYLASLVCNKSDKDYFRISTDCDGFRARRKVQLEELAKKMVSKAKRTGKTVA LEPMNPYERRIIHAAVSEIEGATSRSTGEEPYRKVLISSTEKRPYNRDGKSDGKRGGRG RNDRKGGRKPREEFKARSLDISSSFEKDYKKPKPEDEMIGSGLYSKIEF" /locus_tag="LOCUS_7440" /note="WP_011462331.1 protein jag (Desulfitobacterium) [pid:43.7%, q_cov:71.6%, s_cov:92.5%, Eval:4.8e-33, partial hit]" /note="MGA_1039" CDS complement(1618..2097) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNTMLYVMPLFSFWIAFSFPAGLGIYWIFSSVLSLAQTVFLNLYM TPARVDKMLEKENKKKNRKPSIYQMALEQQKAQLAATNGGAMPEKTALDEVTEDMKLSR AERKELERLRINEARRAMEERYGKISEDEETKVAPEEENEILEAARRRMAEKYGD" /locus_tag="LOCUS_7450" /note="MGA_1040" ORIGIN 1 cctacccaaa gacagtgagg ataatactcg ggagtgataa aagttattgt tgcctttgcg 61 ctttcatttg ggtttacttt atcaacatca atatagtgat gaagacctgt tgttgtgtaa 121 tcatcggtaa cgcgatgacc ggggcggtat ccgttaaaca caggaccttt tcttgttccg 181 ttaaagcaaa ttattgcctc aacatcaggc tccctgtcaa tcaccgtctt tgattttcta 241 aagttaaaaa gagacattga tattctccct taattatttt gtaagattgt tgtataatct 301 gcagtacgtt tcggttgata ttcggcacac gagcctctgc tacaacagga gggtggtgag 361 ggaaagggcg tccagagggg acaaccgtag gagggaaccg caaggctttc acaaatctgt 421 gacctcctcg gcaaatcatt aatgcttgtc ggttccctcc taaaggtttc ccctttggtt 481 ggaaacttca aggcacaaat gaattgcgct tcgcgcatga atagcagatg cagatatctg 541 cgtgaataga tgcaacaagt tgcatcatga atagtcgaaa ccagtttcga cattgcctta 601 cggcaaaaag cggcaaccca gccggattgc cgccaaaaaa tcagaattcg atctttgagt 661 aaagtccgga accgatcatt tcatcttcag gcttcggctt cttataatcc ttctcaaagg 721 aagaagatat atcaaggctt cttgccttga attcctcacg gggcttgcgt ccgcccttgc 781 ggtcgtttct gcctcttccg ccgcgcttgc cgtcagactt gccgtcgcgg ttataggggc 841 gcttctcggt ggaggaaatg agcacctttc tataaggctc ttcgcctgtt gaacggcttg 901 ttgcgccttc aatttcagaa actgctgcgt gaataattct tctctcataa gggttcatag 961 gctccaaagc aacagttttt cctgttctct ttgcctttga aaccatcttc tttgcgagtt 1021 cttcaagctg aacctttctt cttgctctga aaccgtcgca atcggtggaa attctgaaat 1081 agtccttatc agacttgttg catacaagtg atgccaaata ctggagcgag tcaataacct 1141 cgccgcgtct gccaatgatg ccttctgcgc cttcgccgct gatatcaagg caagctccgc 1201 cttcaatatc gctgattgcg atctcggggc actcaaatcc cattgcaacc ataacatgct 1261 tgatgtactg agccgcaact tcgggcttgg tcatttcata ctctgcttcg acttttgcct 1321 cgcccttcat tccgaaaaga cccttcttgg gttcttcgag aatgttaaag acaattctct 1381 cttcggcaac gccgaattcg cttacagcca gagcctttgc ctctgcaact gtttttgcat 1441 taaaaatctg cttcacgtta attctccttt atcaaacagg gtgaaatttt gtactccata 1501 gcattctttg aaaatttttc gctcgtcggt tgcacgtttc ggtgcaacaa ggggctgttt 1561 tttaactata tatggagggc aaatttttcc ctgagtttat ttggttgctt attaaaatca 1621 gtcgccgtac ttttcagcca tgcgtctgcg agccgcctcg aggatctcat tttcctcttc 1681 gggagcgacc ttggtttctt cgtcttcgct tatcttgccg tatctttctt ccattgctct 1741 gcgagcttca ttgatgcgca agcgctcaag ctcttttctt tcagcgcgtg aaagcttcat 1801 atcttcggta acttcgtcca aagcggtctt ttcgggcata gctccgccgt tggttgcagc 1861 aagctgagcc ttctgctgtt caagtgccat ctgatagatc gagggcttgc gatttttctt 1921 cttgttttcc ttttcaagca tcttgtcaac tcttgcggga gtcatataaa gattgaggaa 1981 aacagtctgt gcaagcgaaa gaacgctgga gaagatccag tatataccaa gacctgcagg 2041 gaagctgaat gcgatccaga atgagaacaa aggcataaca taaagcattg tattcatgc // LOCUS sequence251 2097 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence251 VERSION sequence251 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2097 /mol_type="genomic DNA" /organism="" /note="sequence251" misc_feature complement(1367..>2097) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002681885.1:DMT family transporter" /note="WP_002681885.1 DMT family transporter (Treponema denticola) [pid:57.8%, q_cov:92.1%, s_cov:64.3%, Eval:1.1e-62, partial hit]" /note="MGA_1042" /locus_tag="LOCUS_7460" ORIGIN 1 atgtcagttc atcgaactga taaactctga cgtaatcaac gtatactgcc gcgggcaggt 61 cggatttatt tatctcccct gcccaggagc cgacttcaag agtcagcttc aaatatcccg 121 gctgattgca aactccaccg tcggaggatt cccacatcaa ctcgccgtcg atataccact 181 tgtagccctc gggagtccag cacatggcgt aggtgtggaa tccctcatag agttctttgc 241 gatattcggc aacgccgttt gatttgtggt gctcgccgta accgtcccaa tgcaaagcgt 301 ggttgatgcc ataggtcttg gcgttgaatg cctccataat gtcgatctcg gtgccgtcaa 361 caccatcgtt gccgacgctg ccaacatttc cgcacatcat ccaaaaagct gaccagaagc 421 cgggaacctt ttgaacatcc attgaacatt caaagtagcc atatgcctgc tcgaacaagc 481 ctttggtgcg aatcgcgcca gatttgcaga tgccctccga ttcatcgaag gaaacggaga 541 gaacaagctt gtcgtttgca acattagcct gcgaggggtc ccatttgccc ttgcggtcgg 601 agcgttccca cttgggacag tattcccagt tgtcaaagtt aagggtgttg ccggagaatt 661 catccaagaa ggtcagggtc attgttttgc cgttgataat ttccttttcg ccaacgctga 721 gcgctctttt gccggtcaca ggttcttcct ccttcggggg ttcataattt tcggttaaat 781 actttccgct gatgaaatac aagccatctt caaactcgat ttttgcccag ccgttgtccg 841 cccatgcgat tatatgcacc agctcgcctt cgtcaacatg gccaactcgc gaatactgcg 901 ggccggggcc tttgcgaaca tttagggctt gggtcacata aagcgattca tcagcaggtg 961 tttcgctcca agcaagagcg gtggcagctt cggtggttgt ggtgataacg gtggttgtgg 1021 cttcggtggt tgattccgtt gtagcttcgg ttacggcaga ttcagacgtg gtttcttcgg 1081 ttgtagtcgc ttcggtggtc gattcggtag ttgattcggt tgtcgcctcg gtttcggagt 1141 tgtcagtgct gtaataatcc acaggcggtt caacatagtc ctttgcgggg tcattgcacg 1201 cgcaaagaga caaagctaaa gcaagagcca aaatcaatgc ggtgagtttt ttcattattc 1261 attctcccta tgtcaattga ttgaaaaatc actttcaaat tttaatattc ttatgattat 1321 attataataa aacccgtcat ctgtcaagac gacgggtcgg gaacactcac tcccctgcaa 1381 gggtatctct gacgattata acggtggcaa ttatcattat cgccagcgcg acatagaagt 1441 taagcgcggg gcgctcgccc aaaagaagca tactgaatgc aacgcccaaa aacggtgcga 1501 cggcataata tgcgctggtt ttggcggcac cgatatgctt ttgcgcgagg atatagaaat 1561 tgatgctcag gccataggat acaaagccca gaagcattgc aaacacgata agcataaggc 1621 tcggcaatcg ctcaccaact gcaaatgcga caccgaggct tccgagtcct gagaagatgc 1681 ctttaatcat tgttatttga accgagcttt tgcttgaaag cttacgggtg cagttgtttt 1741 caatgcccca gcaaagacaa gctccgagaa cataaagcga gccgaggctg aatttgaagc 1801 tgccctgccc ttcaaacgac agaattgcgc ttgaaagaac taccaatgcg attgcaaatg 1861 aaagtcgctt tgaaacagct tctttgaaga taaacgcagt gatgagggtg gtggcgacaa 1921 tctcaaaatt gttcaaaagc gaaactgaag ccgagtgact gtttataatt ccgagcatca 1981 agagtatcgg cgcggcaatg tccaaaacga tcatcgcgac ggtatatggc aattctgctt 2041 tggtgagcgg gtctttgata atatttttgc ccgcagcctt gccgataagg caataag // LOCUS sequence252 2095 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence252 VERSION sequence252 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2095 /mol_type="genomic DNA" /organism="" /note="sequence252" CDS 855..1379 /product="hypoxanthine phosphoribosyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000892185.1" /transl_table=11 /codon_start=1 /translation="MEFQHKVETMIAKEEIAVKVRELGEKITADYTGKEVMLIGVMKGS FVFLADLVRNIDLPVTIDFISAKSYGGTVSTGVVNVKMDTELELEGKDVLLVEDILDTG RTLSGLKVTLRSKGARDVKIAAFLDKPSRRVIDIKADYSCFTIEDRFVIGYGLDYNEMY RNLDFIGEVIL" /locus_tag="LOCUS_7470" /gene="hpt" /EC_number="2.4.2.8" /note="WP_000892185.1 hypoxanthine phosphoribosyltransferase (Streptococcus pneumoniae) [pid:48.8%, q_cov:93.7%, s_cov:91.1%, Eval:7.6e-44]" /note="MGA_1044" ORIGIN 1 cctgtgtaca cgcgacgaga tcgaagcata tttaactgct cagggtcaat catttgtcac 61 cgactcaacc aacctcgtgc ccgattgttc ccgaaatata ctccgtcttg aggtcatccc 121 caagcttatg gagatcaacc cgggactgta cagatcctac tccgcatttt tgcaaacggc 181 gggggagtcg aaagcttatt tagacgatca tatcgaaagt gaatttaata aaaatcttga 241 cggtaatgtt ctttatctgt caaatattcc cgagggcgct cttcgttcgg gcgctttgtc 301 gctatatttg aaaaatcaag aaataatgcc aacctatgat cgcatctcgc tgattttaaa 361 aaatcttgaa acatgcgagc gcatcaacat tcaaaaaggc gtttatgttg actacttttc 421 gggtagaata accataaccc gcgaatcgga atcaaatgat ccacagccga tctataccga 481 tttgcgcgaa aatttggttt tcggcacgaa aaaaatcaat atcacgaata tttcacatca 541 agacatatct tctcttaaca aatccgattt aaaatggtgt atggacttaa acaaagtcca 601 tggaaaagtc accgtcagaa gctatatcgg aaatgagaag ataaagcttt tgggtcggga 661 tatcacccag accgttaaaa agctttttgc atcctatgcc cccgcgggcg aaagaaaaaa 721 ccttgttgtc atcgcagacg atgagggcgc gatcttcgcc gaagggtttg gcatagccga 781 ccgtgttaaa tgcgacagcg aaacaaacgc tggcgtatgt atagatattt tatgacatca 841 aaggagactt ttttatggaa tttcagcata aagtcgaaac aatgatcgcc aaagaggaga 901 tcgctgtaaa ggtgcgtgag ctcggcgaaa agatcaccgc tgactacaca ggcaaagaag 961 taatgcttat cggcgtaatg aagggctcgt ttgtctttct tgccgacctt gtcagaaaca 1021 tcgacctgcc cgtaaccatt gattttatca gcgcaaagag ctatggcgga actgtatcca 1081 caggcgttgt aaacgtcaag atggataccg agcttgagct tgagggcaag gatgttttgc 1141 tggtagagga tattcttgat acaggcagaa ctttgagcgg actgaaggta actcttcgtt 1201 ccaaaggcgc acgcgatgtt aaaattgccg catttttgga caagccctcc cgccgtgtga 1261 tcgacatcaa ggctgattac agctgtttca ccattgagga cagatttgtt atcggttacg 1321 gccttgacta taatgaaatg tatcgcaatc tcgactttat cggtgaagta atcctttaaa 1381 gatacccaat agcaacgaaa cgaggtaaac ccattttgaa tcagaaacca ccaatccaaa 1441 aaccgaaggg aacgctggtg ctcttccttt taacggcagt aattatcatt gtaatgattt 1501 ttgccctaaa gggaattgta agttctgcta acgccccttc atattccgag atcatcggct 1561 attttgaaaa ccttcaggtc agcgagttca agtttaattt gggctccggc gagctggaat 1621 ataagctcga tggtgaagag gaattccgtc gatatgaagt cccgaacgtt tcagtattct 1681 ataatgagct gttcggcgaa ggaaatatat tcggcgaggg aagcaactac cgcgtcgcat 1741 atgacgaagc gcacgaaaca cccttaaagt ataacttcat tccagcttcc gactcctcat 1801 tctggctgaa cttaattccc acgctgatta tggtcggcgc gctaatcttc ctcattgttt 1861 caatgaccag agttatggga gcaatgggca aagcaaacaa tgtcggcaag gcgaatgtta 1921 aggtcgatgt tgacgcaaag aataaggtca cctttaagga cgttgcaggt gcagacgaag 1981 aaaaggccga gctgcaggaa atcgttgagc ttttgaaggc tcccaagaaa taccaggata 2041 tcggcgcaaa gattcccaag ggcgttttgc tcgttggccc tcccggtaca ggtaa // LOCUS sequence253 2089 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence253 VERSION sequence253 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2089 /mol_type="genomic DNA" /organism="" /note="sequence253" misc_feature <1..780 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011393762.1:sodium:solute symporter" /note="WP_011393762.1 sodium:solute symporter (Moorella thermoacetica) [pid:35.1%, q_cov:88.0%, s_cov:44.2%, Eval:8.4e-32, partial hit]" /note="MGA_1046" /locus_tag="LOCUS_7480" CDS 1028..1390 /product="putative DNA-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003393779.1" /transl_table=11 /codon_start=1 /translation="MAKDLKFAALLDIYGGVLTDKQRDVLDLYYNEDLSLSEIAANDEI SRQGVRDSIKRGEETLLELDEKIGVVALLEQYNALLEHVKAKCDDIIADCKSYTTTKSV IEKLENIKSDIDNNRR" /locus_tag="LOCUS_7490" /note="WP_003393779.1 putative DNA-binding protein (Clostridium botulinum) [pid:36.4%, q_cov:98.3%, s_cov:99.1%, Eval:2.5e-12]" /note="MGA_1047" ORIGIN 1 ccacagatgg ttcagaagtt ctatgcaatc aagtcggaaa agagtgtata tacaggtacg 61 atcatttcaa ccttctttgc ggcagttgtt gccggcggat gctatttcct tggcggcttc 121 ggcagacttt tctccacccc tgaaattgtt gcacagaacg gttacgattc tatcgtcccc 181 gaaatgctct cgaatttggg cgatgttatg atcggtctgg tcattgtttt ggttctttcc 241 gcttcgatgt ccacactttc ttctcttgtt ctcacatcca gctcgagctt gacgcttgac 301 tttattgcac ctatgagcaa aaaaggaatg accgaaaaga aaaagctttt aattatgaga 361 attttccttg cggtattcat tattatttct gttattcttg caatcgtgca gtataagacg 421 caggcaacct tcatcgctca gatgatgggt ctgtcctggg gcgcattggc cggtgcattc 481 ttagctcctt tgctctacgg tttatattgg aagcgaacaa ccaaggcagc ttgctgggtc 541 tgcttcatta caggtcctgt aataatggtt ttgaacacct ttgttcccgc actcttcccc 601 acattcctca agagccccat caactgcggc gcattcacaa tgattttggg actcattatt 661 gttcccgtta tcagtttgtt gaccaagaag cctgatgaaa agatggttga tgacatcttt 721 tcttgctatg aagaaaaggt tttggtaaat gccagcgagt cgctgggcaa tgcagagtaa 781 aattgaatga ttgatagggg cacccacata ggggtgcccc tttttgagtt ataagaagaa 841 tttgaccatc cctcatcaga gggcgcctat atgcttgcca cttctcaatt tccgaaaatt 901 tcgtgaaaat tcgcgcaacc cccttgacaa attataaggg gtgtattata atgtttgctg 961 taaagttttt taactttaca ctaaaatcaa gattttgtgt cttaactgaa aggaaacggg 1021 tgatattgtg gctaaggatc tgaaatttgc agctctttta gatatttacg gcggtgttct 1081 gaccgacaaa caaagagatg ttctggacct ctattataat gaggacctct ccctttcgga 1141 aattgcggcc aacgatgaaa tttcccgtca gggcgtgcgc gattcgataa agcgcggcga 1201 ggagaccctt ttggagctgg acgaaaagat cggcgttgtt gcccttttgg agcagtataa 1261 tgccctttta gagcatgtca aagccaagtg cgacgatatt attgccgact gcaaatcata 1321 tacaacaacc aagagcgtaa ttgaaaagct cgaaaatata aaatcggata tcgacaacaa 1381 ccgtcgataa gcgaaaggaa aaagtagatg gcgtttgaag gattgagcga aaagcttggc 1441 gcggtattta aaaagctcaa atctcgcggc agactttcag aagcggatgt taaagcctca 1501 atgcgtgagg ttcgaatggc gcttttggaa gcggacgtca gcttcaaggt cgttaaggac 1561 tttgttgcca aggtcaccga gagatgtgtc ggcgctgatg ttttggaaag ccttacccct 1621 gctcagcagg ttattaaaat tgtaaatgaa gagctcatcg cgctgatggg cgaatcaaac 1681 tcaaagatca attttccaag caagcctccg tgtgtcatca tgatgtgcgg acttcagggt 1741 agcggtaaaa ccacccacgc cgcaaagctt gcgaaatatt tcaagggtat ggataagcgt 1801 ccccttttgg tcggatgtga catctaccgt cctgctgcta tcgaccagct caagatcgtc 1861 ggtgagcgcg caggtgtgcc cgtctttgaa atgggacaga tcgacccgag aaagatcgtt 1921 cgtgaagcgt taaagcacgc tcgcgactac ggcaacgaca ttgtcctttt ggataccgcc 1981 ggccgacttc acattgatga agagctgatg caggagctta aagacattaa ggatattgcc 2041 cagccccacg agataatcct cgttgtggac gcaatgaccg gtcaggacg // LOCUS sequence254 2084 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence254 VERSION sequence254 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2084 /mol_type="genomic DNA" /organism="" /note="sequence254" CDS complement(344..1573) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKRLFVIALAVAMLLGLLCGCAANGGKMKQGLEYINNPSTYDEWL NNAKIESLTSLGNTNRLKDVIERAKNGEELTIAYIGGSITEGDHLDTCYAARSYRYFCE SFAKKGEEQITFVNAGISGTPSNLGALRFESEVLAYDPNIVFIEFAVNDGNDNETKDAF ECLIRACLDYETKPAVVLLFSRMEEGWTSQDWKKEIGAHYDVPMISYADGITYMFDNNV IQWSDFSHDYAHPHAEGNALVNEFISYFYDEVDRLPAQGEAEPAMPERMYAGFYQNAHL IQRVNDYKPTEKGSWRNSSSGFHYDKGWTKTYDDTNDPLVIEFTGKNAYVLYPTSGNQT FGTLVANIYFNGELVATKEFDEYVDGGWMCPSVGKLYRSPTVGEYRIEFSVPAGQERTD VQVLAVGYTD" /locus_tag="LOCUS_7500" /note="WP_011986990.1 SGNH/GDSL hydrolase family protein (Clostridium botulinum) [pid:31.3%, q_cov:42.5%, s_cov:52.7%, Eval:9.3e-19, partial hit]" /note="MGA_1050" ORIGIN 1 aaaaccgaaa agggcaactg ctgtcatacc cacactgacg gcagttgtca gacctgtacc 61 cagctttgaa atcaatctct cgctgacaag tgcggaaata atggtgcaaa aagatatgag 121 catcgccaaa acgcctgcat atgaaacagg aacgcccaag ccctcataca tactcggcca 181 cgccgagccc aaaagtccgt ccggcagacc aaggctgata aacgatatat aaattattgc 241 aatgagcaga tgtatcatat gaaatctcct ttaaaacata aaacagcggt ttcatattat 301 caaaacaaag ggaggctgtc aagcctccct ttgaaaaata ttcttagtct gtatatccaa 361 ctgccaaaac ctgaacgtcg gttctctcct gacctgcagg aacgctgaat tcaatgcgat 421 attcccctac agtaggtgaa cggtaaagct ttccgacgct gggacacatc cagccaccgt 481 ctacatattc gtcaaactcc ttggttgcaa ccaattcgcc gttgaagtaa atatttgcga 541 ccagagttcc gaatgtctgg ttgcccgatg tgggatacaa aacgtatgcg tttttgccgg 601 tgaactcaat taccaacggg tcgttggtgt catcataagt ctttgtccag cccttgtcat 661 aatggaatcc ggagcttgaa tttctccagg agcccttttc tgtcggctta tagtcattca 721 ctctctgaat caaatgtgca ttctgataga atcccgcata cattctttcg ggcattgcag 781 gctctgcctc gccctgtgca ggcaggcggt caacctcatc atagaaatat gagataaact 841 cattgaccaa tgcattgcct tcagcgtggg gatgagcgta atcgtgtgaa aaatcgctcc 901 actgaatgac attgttgtca aacatatatg tgatgccgtc agcataggag atcatcggaa 961 catcataatg tgcaccgatc tcctttttcc aatcctggct ggtccagccc tcttccattc 1021 ttgagaagag caaaactacc gcaggcttcg tttcataatc aaggcatgcc cttatcaagc 1081 actcaaaagc gtccttggtt tcgttatcgt ttccgtcatt gacggcaaac tcaataaata 1141 cgatgttcgg atcatatgcc aaaacttccg attcaaatct gagtgcgccc aaatttgaag 1201 gtgtgccgct gatgcctgcg ttgacaaagg tgatctgttc ctcgcccttt ttggcgaagc 1261 tttcgcagaa atatctgtaa gatcttgcgg catagcaggt gtcaaggtgg tcgccctctg 1321 tgatggagcc gccgatgtat gcaatggtca gttcttcacc attctttgct ctttcaatta 1381 catccttgag tcggtttgtg tttcccaagc tggtcagcga ttcaattttt gcattgttga 1441 gccactcatc ataggttgaa gggttattga tgtattcaag tccttgtttc atttttcctc 1501 cgttagctgc acatccgcac aaaagcccca aaagcattgc aacggcaagc gcgatcacaa 1561 ataatctctt cataataatg ttcctcacta agtaaaaaac ggctatcctt tcggacagcc 1621 gtttgtttta tattcggtta cagcccgttt tatcagttga caattacctt ttcggtttcc 1681 ttatcaaaga tgtggattct gttagcatcc aaagcgcact tgataatgtc ctgaggtctt 1741 gcggtagagc ggttggaaac tcttgcagta aggttgatac cttcgcaagt gaggtagagg 1801 taggtttcag cacccatcat ttcggttacg ttaacggttg cttcgatgat accggtctta 1861 gcggtagaga tgtacatctc ttcatcatgg atgcactcgg gacgaacacc gacgataact 1921 tccttgttga ggtaaggagc caaaacttct tcatgggcct tagattcggg aagttcaata 1981 tagaactttc ttcctctggt ttccttggtg tcttcagaac cgaactcaac gttatacttg 2041 ccatcgatct tcaaaagctt agcatcgatg aagttcatct gagg // LOCUS sequence255 2081 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence255 VERSION sequence255 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2081 /mol_type="genomic DNA" /organism="" /note="sequence255" misc_feature complement(351..>2081) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002288533.1:asparagine synthase (glutamine-hydrolyzing)" /note="WP_002288533.1 asparagine synthase (glutamine-hydrolyzing) (Enterococcus) [pid:53.5%, q_cov:99.8%, s_cov:92.6%, Eval:5.7e-177]" /note="MGA_1053" /locus_tag="LOCUS_7510" ORIGIN 1 gcaagatgtg cagttgctaa cccacctgtt atgattatgg acgaagcaac ttcaagtatt 61 gatactcaca cagaaaaact tgttcaagaa ggtatggatg ctttaatgaa aggtagaaca 121 gtttttgtaa ttgctcaccg tctttcaacc ctttcaaacg ccgatgcact tattgttttg 181 gataagggca gattggctga aatgggtaca cacgacgagc ttatgcgcaa caagagcgta 241 tactataatc ttgtaatggc tcagcgccag actactaaga tgaaaaaggt tgataaagcc 301 gcaatggcat aaagaaaaac cccacggaaa ttccgtggga ttttttgatg ttatccaaag 361 tatacgtcat accaaacaag gaaggtatat acagtccata tctttctgga gtagtcatac 421 ttttcagcct tgtggtcatc caataaagca acgagcttgt cggtgttaaa gaacttctta 481 gcattgttgc tttcaaatgc ggctcttacc ttattgtagt attcgtcctc tctcagccaa 541 acacgaatcg ggacagggaa gcccagcttc ttcttgttgg cagtaagggg aggacaggcg 601 ctgagagcgg cttttctcat tgcaaacttt gtgttttcct tggtgatacg gtagcgcttg 661 ggaattcttt ctgccaacgc cataacgtgc ttatcaagga agggaacacg aagttccagc 721 gagtttgcca tactcatttt gtctgccttg agaagaatat ctccggtcat ccaaaggttg 781 aggtcaagat actgcatctt tgtaacattg tccttgtctt taaccttgtc ataaaacggc 841 ttggtaattt ccatcgccat aggcgcatca gtcttaattg ataaaagctc cttgcgctcc 901 ttttcggaga agatatatgc attgccgatg aagcgttctt caaggtcctt gcttcggcgg 961 ataaggaagt taagtccgcg ttttgcaggc agcttcgatg caacagcacc gactgctttt 1021 cttatgggct tgggaatggc attataaaat gccatatcgt ccggttcttt atagatattg 1081 tatccgccga aaatctcatc agcaccttcg ccgcttaata caaccttaac tctttcactt 1141 gcaagcttgc atacaaagta tagagcaact gcggctgggt cagccaaagg ctcatccata 1201 tgatactgaa tgagagggaa gttgccccaa tactcttcgg gggtgatgac ctttgaaatg 1261 ttttccttgc cgatatactt ggagaattcc ttggcataac caatctcatt gtatttttca 1321 tcctcgccaa agcctacagt aaaggtttta tccacatttg caaccgcggc aacatagctg 1381 gagtcaacac cgcttgaaag gaagcttccg acctcaacgt cagcgatctt gtgtgcttca 1441 acagagtttt tgaatgtttc gctgattttt tcaacccact catccagatt aggcttttcg 1501 tcagcattaa agttaatgtc ccaatatctt tgagttgtca gcttgccgtc cttatatgta 1561 aaataatgtg caggcaaaag cttgaaaacg cccttgaaga atgtttcggc acagggggaa 1621 tattggaatg tgaggtagtt ttcaagtgct gtttcgttca gctctttctt gaaatcgggg 1681 tgatgcaaaa agctctttat ttccgaacca tacataaacg tgccgttcaa atttgcataa 1741 tacatcggct tgataccgaa gaaatctcgt gctccgaaaa gctccttctt gtttttgtcc 1801 cagatgacaa atgcaaacat acctctgagt ttatttaaaa ggttcttgcc ccactgctca 1861 tagccgtgca aaagaacttc cgagtcaacg tgggtttcaa aggtgtgccc tgcgctgata 1921 agttcttcac gaagctcctg atagttatat atctcgccat tgaaggttaa aacaaggctt 1981 ttgtcctcat tgaacaaagg ctggtgtccc atcgaaaggt caattatcga caagcgtctg 2041 aatcccatcg cgatgtcatc atcaagatat aagccttcag a // LOCUS sequence256 2077 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence256 VERSION sequence256 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2077 /mol_type="genomic DNA" /organism="" /note="sequence256" misc_feature <1..654 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000476500.1:serine O-acetyltransferase" /note="WP_000476500.1 serine O-acetyltransferase (Bacillales) [pid:55.7%, q_cov:93.5%, s_cov:91.9%, Eval:4.4e-62]" /note="MGA_1054" /locus_tag="LOCUS_7520" ORIGIN 1 aagaacatta acaacatcaa gcacaggata aatgaggacg tcgcatccgt tcgcgaacgc 61 gaccctgccg caagaagcac cgccgaaatt cttttgacat attcgggatt gcacgctgtt 121 ttgcttcacc gcgtggcgca taagctgcac caaaacaagt attatgtcac agcgcgaatc 181 atttcacagc tgggcaaatt cttcacaggc attgaaattc acccgggtgc caccatcggc 241 aaaggacttt tcattgacca cggcacaggc gttgtaatcg gcgagaccgc agaaattggc 301 gacaactgta ttttatatca gggcgtgacc cttggcggta ccggcaaggg caaaggcaag 361 cgccacccga cgcttggcaa caacgttatg gtcggatgcg gagcaaaggt tttgggaccg 421 ttcaaaatcg gtgacaatgt taaaattgcc gcgaactctg ttgttttgca cgaaattccc 481 gaaaactgca cagcggtcgg cgcacctgca cgagttgtca gacgggacgg cgttaaggtg 541 acacaagacc ttgaccacgt tcacattccc gaccctgttg cgcaggaact ttgccgccag 601 caggttagaa ttgaccagct tgagcgggag cttaacgcgc ttaaaaacaa gtaaacaaat 661 cagccgaaag gaattttaaa atatgaagct atataattca gcaaccagaa acaaagaaga 721 ttttgtcacc catacccccg gcaaggttga gatgtatacc tgcggaccta ccgtttatca 781 ctatgcccac atcggcaacc tgcgctcata cattatggaa gacgtgctgg aaaaatatct 841 gcgatatgac ggatatgctg tcaacagagt tatgaacatc accgatgtgg gacacttgac 901 ctccgacggc gacgagggcg acgacaagat gcttaaaggc gctaagcgtg agcacaagac 961 cgttatggag attgcaaagt tttataccga tgcattcttt gcggatgccg caaagctcaa 1021 cattaaaaca cccgacaagg tcgttcccgc aacaagctat gtgggcgagt tcatcaaggt 1081 catcaagggc ttgattgaaa agggatatgc atatgaagca ggcgggaaca tttattttga 1141 cacctccaag cttaataaat attacatttt caacgacttc accgaggaag atttggacgt 1201 cggtgttcgc gagggcgttg aagcggacaa caacaagaaa aacaaggcag acttcgtttt 1261 gtggttcaca aagtctaagt ttgacgacca ggagctgaag tggaactctc cttggggctt 1321 gggttacccc ggctggcata ttgaatgctc ctgcatttca atgaaaaaca actgtgagta 1381 tcttgacctt cactgcggcg gaattgacaa cgcattcccc caccacacca acgagatcgc 1441 gcagagcgag gcatacctcg gccacgagtg gtgcaaaaac tggttccacg ttcaccatct 1501 taacaccgaa ggcggaaaga tgagtaaatc caagggcgaa tttttaaccg tttcgctcct 1561 cgaatccaaa ggatatgacc ccattgttta ccgcttcttc tgcttgcagt cccactatcg 1621 caaatcgctg gtgttctcat atgataacct tgacaatgcg aaggttgcat atgataagct 1681 gattgcaaaa attgcatccc ttatgcccgc aacaggcgag gttgataaag aagcatttga 1741 tgccctcaag aaaaacttca ccgatgctat ggataacgac cttaatacat cgctgggcgt 1801 tactgctttg tatgatgttt tgaaggctga tgtcaacacc gcaacaaagc tcgcacttat 1861 tgcagatttc gacaaggtac tctctgtcaa tctgattgaa aacgcggcca agcaggcaaa 1921 gcccgccgag gaagagcttc ccgaagaaat tttggcattg gcagaacagc gcaaagcggc 1981 aagaaaagaa aagaacttcg ctcttgcgga cgaactgaga gataagatta ttgcccttgg 2041 ctataccgtt gaggaaacaa ggcagggcac tgttatt // LOCUS sequence257 2076 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence257 VERSION sequence257 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2076 /mol_type="genomic DNA" /organism="" /note="sequence257" CDS 302..1735 /product="Asp-tRNA(Asn)/Glu-tRNA(Gln) amidotransferase subunit GatB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048223.1" /transl_table=11 /codon_start=1 /translation="MIRGYEVVVGLEVHAELNTKTKIYCGCKNSFGLEVNTQVCPICMG MPGTLPTLNEKVVEYAIKMGHALNCGINRICKQDRKNYFYPDLPKSYQISQADIPLCHD GYLDVIIGEDVKRIGIERIHIEEDAGKLLHSDKFDGSLVDFNRCGVPLIEIVSKPDMRG SNEAKAYLETIRSILRYIDISDCKMQEGSIRCDVNVSVHKPGEPFGTRCEMKNVNSFSA AVRGIDYEANRQIDIIEAGGVVTQETRRWDDVKGESVSMRSKEDAQDYRYFPEPDLLTI VVPEEKVTYLKDTLPELPNAKIMRYVNDYGIAFNDAAMIVDVPEKAKFFDECTALNCKS PKLLSNWILGEISKFMNEGTQIEDTKLTAEKLVAIVNYISDGKISTAAGKTVFDVILNE DKAVDAVIEEKGLSQVSDVSALEAIADEVLAANEKSVTDYNNGKTNALGYLVGQCMKAS KGKANPGIMKEIILKKITK" /locus_tag="LOCUS_7530" /gene="gatB" /note="WP_012048223.1 Asp-tRNA(Asn)/Glu-tRNA(Gln) amidotransferase subunit GatB (Clostridium botulinum) [pid:50.4%, q_cov:99.2%, s_cov:99.4%, Eval:9.9e-140]" /note="MGA_1057" ORIGIN 1 gttgatgtta ttattactcc tactgctcct gcagaagcat tcaagatcgg tgaaaaaacc 61 agcgatcctt tggaaatgta tgcttccgac atctgcaccg ttaccgttaa cattgctgga 121 cttcctgctg taagcgttcc ttgtggatac tctgaatcgg gacttccgta cggtatgcag 181 atcatcggca agaagttcga tgagcagaca attctgaatg tggcatttac tcaccagaag 241 ctctttggcg gcttcaagaa gcccgagctt taatcacctt gaggagagga cactaactga 301 tatgataaga ggatatgaag ttgtagtcgg tctggaagtc catgccgagc tcaacactaa 361 gacaaaaata tattgcggct gtaaaaactc cttcggtctt gaggttaata cccaggtttg 421 tcccatttgc atgggtatgc ccggcacatt gccaaccctc aacgaaaagg tagttgaata 481 tgccattaag atgggtcatg cccttaactg cggcatcaac cgcatctgca agcaggacag 541 aaagaattat ttctatcccg accttcccaa gtcctaccag atctcacagg cagatattcc 601 gctttgccac gacggctatt tggatgtaat catcggtgaa gatgtcaagc gcatcggcat 661 tgagagaatc catattgaag aggacgcagg caagcttttg cactctgaca agtttgacgg 721 ctcgcttgtt gacttcaacc gttgcggtgt tccgctgatt gaaattgttt ccaagcccga 781 tatgcgcggt tccaacgaag ctaaggcata tcttgaaaca attcgctcaa ttcttcgcta 841 tatcgacatc tccgactgta agatgcagga gggctccatc agatgcgacg ttaacgtatc 901 tgtacacaag cccggagagc ccttcggcac aagatgcgaa atgaagaatg ttaacagctt 961 ctccgccgca gtaagaggca ttgattacga agctaaccgc cagatcgaca ttattgaagc 1021 aggcggtgtt gtaacccagg aaacaagacg ttgggacgat gtgaagggcg aaagcgtttc 1081 gatgcgttct aaagaagatg ctcaggatta cagatatttc cccgagcccg atcttttgac 1141 aattgttgtt cccgaagaaa aggttactta tcttaaagac acattgcctg agcttcccaa 1201 cgcgaaaatt atgcgctacg ttaacgacta tggcattgcc ttcaacgacg ctgcaatgat 1261 cgttgatgtt cccgaaaagg caaagttctt tgatgaatgc accgctctta actgcaaatc 1321 tcccaagctt ctttcaaact ggatcttagg cgagatttca aagtttatga acgaaggcac 1381 acagatcgag gacaccaagc tgaccgctga aaaacttgtt gcaatcgtta actatatcag 1441 tgacggcaag atttccactg cggcaggcaa gactgtattt gacgttatac tcaacgaaga 1501 caaggctgtt gatgctgtta ttgaagagaa gggactctcc caggtctccg atgtttcagc 1561 acttgaagct atcgctgacg aagttttggc ggcaaacgaa aagtctgtta ccgactataa 1621 taacggcaag accaatgctt tgggttacct tgtcggacaa tgcatgaagg cttccaaggg 1681 caaggcaaac cccggaataa tgaaggaaat cattcttaaa aagattacca agtaaatatt 1741 catcaagcgc tcgatacatt cgggcgcttt tcttttttcg ataaagcaat cagaatcatc 1801 gcaagcatac aaacaagtgg aacaatactt tttgactgcg aaaagctgac ttttacaaaa 1861 gcctcaagtg catatcgttt aatcaataga tcgattatat aagcataaaa atacgtaagc 1921 gataatcgag ccaaaagtat cgcgaagaac ggcttcattg aaaatctgtt tccgattatt 1981 gcgcaaagct gcattattac gcatattccg ccgaaggata aatacacgct agccgcttta 2041 aaactgatgg ttttatactc tgatatgttt gttata // LOCUS sequence258 2067 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence258 VERSION sequence258 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2067 /mol_type="genomic DNA" /organism="" /note="sequence258" CDS complement(66..1475) /product="aminopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011391671.1" /transl_table=11 /codon_start=1 /translation="MSEKEKSAGKALQEKLFTQKKNGVLKLSNEEIVAVDNFCEGYKKY LDNGKTEREAVSAAIALAEEKGFVPFDTKKKYSAGDKVYYNNRGKSIILCVFGTDDLEN GVKIAAAHVDAPRLDLKQHPVYETTELCLLKTHYYGGIRKYQWVTIPLALHGVIFTADG TCVNVNIGEDENDPVFCITDLLPHLAQEQSKRSLADGIRGEELNVLIGSRPFKDDEVSE KVKLNVLSILNEKYGIVEDDFLSAELEVVPAFKAKDVGLDRGLVGAYGQDDRVCAYTAL EAILDVDCPKTTCITILTDKEEIGSMGNTGLQSAYLKHFIYHIAEMAGTNAPTVLAKSE CLSADVCAAVDPTFPEVCEPKNAAYITYGVGMCKYTGSRGKSGSSDASAEFVSRVRQIF DSNGVIWQTSELGRVDLGGGGTVAAYIANLDVDVVDVGVPVLCMHAPYELTSKLDVYMA YKGFASFFMAD" /locus_tag="LOCUS_7540" /EC_number="3.4.11.-" /note="WP_011391671.1 aminopeptidase (Moorella thermoacetica) [pid:48.8%, q_cov:99.1%, s_cov:99.4%, Eval:3.3e-132]" /note="MGA_1058" CDS complement(1492..2052) /product="lytic transglycosylase domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005816766.1" /transl_table=11 /codon_start=1 /translation="MLKRILASFALVVFVVTLLGVLFVYMPYVAKRDTYHRYYSDEVER YSQEFGIDDDFVYAVIKVESNFDPSAISDVGAIGLMQIIEDSFDWVAGKLGEREIMRFE DMYTPEYSIKYGCFMLSYLYNKYKSYELTAAAYHSGMTTVDNWLSEGVVDATNPDVDSF IGDNTRHYVKKIMRAFEKYSNLE" /locus_tag="LOCUS_7550" /note="WP_005816766.1 lytic transglycosylase domain-containing protein (Desulfitobacterium) [pid:30.4%, q_cov:91.9%, s_cov:85.4%, Eval:1.8e-20]" /note="MGA_1059" ORIGIN 1 catagtgcta agaacaaaaa aagagccaac aaaatgtcag ctcttttaat atattgattt 61 aatgtttagt cagccatgaa gaaggatgca aagcccttat atgccatata aacgtcaagc 121 tttgaggtca attcataagg agcatgcatg cacaaaacgg gaacgccgac atcgacaaca 181 tctacatcga gatttgcaat atatgcagca acagttccgc cgccaccaag gtcaactctg 241 ccaagctcgg aggtctgcca aattacgccg ttcgagtcga aaatctgtct tacacgggat 301 acaaactctg cgcttgcatc agaactaccg ctcttgccgc gtgaacctgt atatttgcac 361 ataccaacac cgtaggtgat gtatgcagca ttcttgggtt cacaaacttc ggggaaagtg 421 ggatccacag cagcacaaac gtctgcagac aagcattcgg atttagccaa aactgtagga 481 gcattggtgc ctgccatttc agcgatatga tagataaagt gcttgagata tgcgctctgc 541 aagccggtat tgcccatgct accgatctct tccttgtcag tgagaatggt gatgcaggtg 601 gtcttggggc aatcaacgtc gagaatagcc tctaacgctg tgtaagcaca aactctgtca 661 tcctgaccgt atgcaccaac caagcctctg tcaagaccta cgtctttagc cttgaatgca 721 ggaacaactt caagctctgc tgaaaggaaa tcgtcctcaa caatgccata tttctcattg 781 agaatagaca aaacattaag ctttaccttt tcggaaacct cgtcatcctt gaaaggacgt 841 gagccaatga gaacgttaag ttcttcgcct cggataccgt cagcaagact tctcttggac 901 tgttcctgag caaggtgagg caaaagatca gtgatgcaga atacgggatc gttttcatct 961 tcgccgatat tgacgtttac gcaggtgccg tcagcggtga aaataacgcc gtgaagagcc 1021 aaaggaatgg ttacccactg atactttctg ataccaccat agtaatgagt tttcaaaagg 1081 caaagctcgg tggtttcata tacagggtgc tgtttgaggt caagtctggg agcatcaacg 1141 tgcgcagcag cgatcttaac accgttttcg aggtcatcag tgccgaatac gcaaagaatg 1201 atcgactttc cgcgattgtt gtaataaact ttgtcccccg ctgaatactt tttcttggtg 1261 tcaaagggta caaagccctt ttcttcggca agagcgatgg cagcacttac tgcttctctt 1321 tcagtcttgc cgttatcgag atacttcttg tatccttcgc agaagttatc aacagcaacg 1381 atctcttcat tgctcagctt gagcactccg tttttcttct gggtgaagag cttttcctgc 1441 aaagccttac cagcagattt ttctttttct gacatttaaa tcgtcctttc tttattctaa 1501 atttgagtat ttttcaaaag cccgcattat ctttttaaca taatggcggg tattatctcc 1561 gataaagctg tcaacatcgg ggttggtggc atcaacaacg ccctcgctta accagttgtc 1621 aaccgttgtc attcccgagt gataagccgc agcagtcagt tcatagcttt tatatttgtt 1681 atatagatat gagagcataa aacaaccgta cttaatgctg tattcagggg tgtacatatc 1741 ctcaaagcgc attatttcac gctcaccgag ctttcctgca acccagtcga acgagtcctc 1801 aatgatctgc ataagtccaa ttgcaccgac atccgaaatt gcagacgggt caaagttgga 1861 ttcaactttg atgacagcat atacgaaatc atcatcaatt ccgaactctt ggctgtaacg 1921 ctcaacttca tcggaataat aacggtgata tgtatctctc tttgcgacgt acggcatata 1981 gacaaacaga acacccaata aagtgacaac gaaaacaacg agcgcaaatg aagcaagaat 2041 tcttttaagc atcaaaacgc tccttta // LOCUS sequence259 2062 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence259 VERSION sequence259 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2062 /mol_type="genomic DNA" /organism="" /note="sequence259" misc_feature <1..589 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011986645.1:FAD-binding protein" /note="WP_011986645.1 FAD-binding protein (Clostridium botulinum) [pid:50.0%, q_cov:99.5%, s_cov:54.3%, Eval:1.5e-52, partial hit]" /note="MGA_1060" /locus_tag="LOCUS_7560" CDS 610..1629 /product="phenylalanine--tRNA ligase subunit alpha" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003436795.1" /transl_table=11 /codon_start=1 /translation="MKQLLEKIELAAKAELEKIQDSAELENLRIKYLGKKGELTAVLKQ MATLSAEERPVIGQLANKIRGDIEEAISARGAELKKAMAEKKLKEEKIDVTLPGKLQTV GKLHPLNAVMKEIEEIFIGMGFDIAEGPEVEYDYYNFEALNIPKDHPARDTQDTFYITD NILLRTQTSSVQIHVMENRKPPIRIISPGRVYRSDAVDATHSPIFHQIEGLVVDKGITM ANLVGTLDMLMKRLYGDDCKIRLRPHHFPFTEPSAEVDVLCFNCGGKGCSMCKNEGYVE LLGAGMVHPKVLENCGIDPNEYSGFAFGLGLERVVMRKYGINDMRMLYENDLRFLGQF" /locus_tag="LOCUS_7570" /gene="pheS" /EC_number="6.1.1.20" /note="WP_003436795.1 phenylalanine--tRNA ligase subunit alpha (Clostridioides difficile) [pid:61.7%, q_cov:97.1%, s_cov:97.1%, Eval:2.0e-122]" /note="MGA_1061" ORIGIN 1 cggtgcaaat tctttggtgc gtcgctcgct cttccccgat cacaagatcc gtcaatacat 61 cgccattcaa aattggtata atgaccgatc acaaaaaccg ttttattcct gcatcttcga 121 taagaaaacc accgactgtt gctcctggag catctcgaaa gacggctcaa tgctctatgg 181 cggagccttc ccgatccttg acggaaaatc ccgcttcaaa actcagctcg agcgtgcaaa 241 ggcctgcggc ttcgagtttg gtgatcattt ctataccgaa gcttgcttag ttaaccgtcc 301 caagcgtgtc ggcgagattt ttgaaggcga aaacggtgta tttcttgtcg gtgaggccgg 361 cggattcatc agtccaagct ctcttgaagg tatcagttgg gcgatgcgaa caggggaacg 421 tctggcaaaa agcttcaatt cccccaaccc cgaaaaagcc taccgcaagg cggttcgccc 481 gctaaaattc aagctttggc tgaaaatgat gaagtgcccc tttatgtatg acccgctgtt 541 gcgcaatatc gtaatggcgt caaaaataaa atcaattaac gttaaataaa tgaaaggata 601 tgacaaaaaa tgaagcagtt actcgaaaag atcgagcttg ccgcaaaggc cgagcttgag 661 aaaattcagg attccgccga gcttgaaaat ttgcgaatca agtatctcgg caaaaagggc 721 gagctcaccg ctgtgctcaa gcagatggca accctcagcg ctgaagaacg ccccgtgatc 781 ggtcagcttg caaacaaaat tcgcggcgat attgaagaag cgatctctgc ccgcggtgcc 841 gagcttaaaa aggctatggc tgaaaagaag ctcaaggaag aaaaaatcga cgtcaccctt 901 cccggcaagc tccagactgt cggcaagctc caccccttga atgcagttat gaaggagatc 961 gaggagatct tcatcggtat gggattcgac atcgctgaag gtcccgaggt tgagtatgac 1021 tactataact tcgaagctct caacattccc aaggatcacc ccgcacgtga cactcaggat 1081 acattctaca tcaccgacaa tattctcttg cgtacccaga cttccagcgt tcagatccac 1141 gttatggaaa accgcaagcc ccccatccgc atcatctccc ccggcagagt ataccgctcc 1201 gacgctgttg acgccaccca ctctcccatc ttccaccaga tcgaaggctt ggttgttgac 1261 aagggcatca ccatggcaaa ccttgttggc actcttgata tgcttatgaa gcgtctttac 1321 ggcgacgatt gcaagattcg tcttcgtccc caccacttcc ccttcaccga gccttctgca 1381 gaagttgacg ttttgtgctt caactgcggc ggcaagggct gttcaatgtg caaaaacgaa 1441 ggctatgttg agcttttggg cgcaggaatg gttcacccca aggttttgga aaactgcgga 1501 atcgacccca acgaatattc cggctttgca ttcggtctcg gtcttgaaag agttgtaatg 1561 cgtaagtacg gcatcaacga tatgcgtatg ctctatgaaa acgacctgcg cttcctcggc 1621 cagttctaag ggaaaggagt aacttattat ggatttatca atgaaatggc ttcgcgacta 1681 tgttaaggtt gacgagccga taaagaaatt ctgctatgat atgaccatga ccggttcaaa 1741 ggtcgagggt tatgaaattg aagccgaatg tatcaccaac tgtgtcgtcg gcaaaatttt 1801 gaagattgaa aagcatcccg atgccgacaa gctcgttgtt tgccgggtca atgtcggtga 1861 tcgcgacatt cagatcgtta ccgccgcaac caactgcttc gaaggtgctt tggttcccgt 1921 tgcgctcgat ggctccaccc ttgcaggcgg catcaagatc aaaaagggca agctccgcgg 1981 agttgtatct gagggtatgt tctgctctgt tgccgagctt ggcgtaactg ttcacgactt 2041 cccttatgcc attgaggacg gc // LOCUS sequence260 2059 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence260 VERSION sequence260 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2059 /mol_type="genomic DNA" /organism="" /note="sequence260" CDS complement(17..817) /product="pyrroline-5-carboxylate reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009898446.1" /transl_table=11 /codon_start=1 /translation="MTKKIAVIGGGNMGGAIVYGMLGAGYKTVTVADRNEAILEKVRAW GANATDDNLEAVKDADIIILAVKPNIASAVADEIKEKISQNAIIVSICAGKTVASLKEM FEHEKVVRVMPNTPVTVGEGMCAVCESDDVSAEEFDYINTIFASFGKALVLPESLIDTV IGVSGSGPAYAFMFIDGMVKSGVANGLDYETAKIMAAQTVLGAAKMVLESDLTPDQLKV NVCSPGGTTIEAVKSFEEDDLYGIIDKAMAACIAKSKKMSEVKN" /locus_tag="LOCUS_7580" /gene="proC" /EC_number="1.5.1.2" /note="WP_009898446.1 pyrroline-5-carboxylate reductase (Clostridioides difficile) [pid:47.0%, q_cov:98.1%, s_cov:99.6%, Eval:5.3e-61]" /note="MGA_1063" ORIGIN 1 atttgaaaac gtggtgtcaa tttttaactt cgctcatttt cttcgacttt gcaatgcaag 61 ctgccatcgc cttgtcgatg atgccgtaaa ggtcatcttc ttcaaacgat ttcactgctt 121 caatagtggt accgccgggg gagcagacgt tgaccttgag ttggtcgggt gttaaatcgc 181 tttcaagcac cattttagcc gcacccaaaa ccgtctgtgc agccataatt tttgcggttt 241 cataatccag cccgtttgca acgcccgatt taaccattcc gtcgatgaac ataaatgcat 301 acgcagggcc ggagccggaa actccgatga ccgtatctat aaggctttcg ggaagcacca 361 gcgctttgcc gaatgatgca aaaattgtat tgatataatc aaattcttcc gcgctgacat 421 catcgctttc gcacactgcg cacattccct cgccgacagt gacgggtgtg ttgggcatga 481 cccttacgac cttttcgtgt tcaaacattt ccttgagcga tgcgactgtc ttgcccgcac 541 agatcgacac gattattgca ttttgtgata ttttttcctt gatctcatcc gcaaccgcgc 601 ttgcgatatt cggcttcacc gcaagtatga ttatatctgc atccttaacc gcttcaaggt 661 tgtcatctgt tgcatttgcg ccccatgcac gcaccttttc aagtatcgct tcgttccgat 721 ccgcgacggt gacggtttta tatcccgcgc cgagcatacc gtatacgata gccccgccca 781 tatttccgcc gccgattacg gcaatttttt tggtcatata tatcaatacc tttcgtcaaa 841 aaatatcctt atacttcatc agtttagcac ataaaaacca ctgtgtaaag cgccaattat 901 ttttttctgt ttttttaagt gaatatttaa aaaagaattg attttcttac ctgaatttag 961 taaaataatt ttgaatggat cttccattta ttattaaccc gaaaggatta aaacatatgg 1021 aactttatat ggataagacc aaatcatttg aagaaagagc caaagatctt gtttcaaaga 1081 tgacactgat ggaaaagtgc gaacagctca aatacggcgc acctgcaatc gagcgtttgg 1141 gcgtacccgc ctataactgg tggaatgagg gacttcacgg tgttgcccgc gcaggcgttg 1201 caacaatgtt cccacaggct atcggacttg ccgcatcctt tgacaccgag cttttgcggg 1261 aagttgcaaa tgtgatctct gttgaagcaa gagcaaaata taatgagtat tccgcacacg 1321 gtgatcgcga tatttacaag ggcttgaccc tttggagccc caatatcaac atcttccgtg 1381 atccccgttg gggacgtggc cacgaaacct atggtgagga cccctacttg acttctcgcc 1441 tcggttgtgc atttgtcaac ggcttgcagg gcagcggtga ttatcttaga accgccgctt 1501 gcgctaagca ctttgctgtt cactcgggcc ccgagggatt aagacatgag ttcaacgcaa 1561 ttgcagatgc aaaggacctt gaagaaacat atcttcccgc attcgaagcg ctcgtaaagg 1621 aagccaaggt tgaatctgtt atgggtgcat ataaccgcac caacggtgag ccttgctgtg 1681 gttcggaata tctttacggc aagctcaaag aatggggatt cgacggctac tttgtttccg 1741 actgctgggc aattgccgac ttccacaccc gtcaccacgt taccgctacc gccacagaat 1801 ctgttgcact cgccctcaag aacggctgcg atgtcaactg cggcagtaca tatattcacc 1861 tttataaggc atatgaagaa ggcctcgtaa ccgaggaaga gatcacgtgc gcttgtgagc 1921 acttgttcag aacaagattc cgtctcggta tgttcgacga aactgatttc gacagcctca 1981 gctatatgga tgttgagacc cgcgagcacc tcgatatcag ccgcaaggcc gctgaatccg 2041 cttgcgtact tcttaaaaa // LOCUS sequence261 2054 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence261 VERSION sequence261 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2054 /mol_type="genomic DNA" /organism="" /note="sequence261" ORIGIN 1 atatgagctt ttggatgaat accttgaata taagtatttc atgcctgaaa ttaaaaaggt 61 tcattcaatt aaggataaca accgcggttt catatttgtt gaccttgaaa caaatgccgg 121 aagaaagacc atttgcatcc gcgactggta ttcaaacttc cgacttctga ccgatactta 181 tttatatgca cacgatgtcg acggaaacaa atacttctgt cctgatgtca ccaagctcga 241 caagaagagt cttgccgcac ttgaattgtt catctaacag tttccttttt tggaaagggg 301 tgaaagccaa tgaatttaaa aatttctgct ccggcgggta tagacataaa cgattttctg 361 ttttctttgc cctttaacct taacggcgaa agggaacttg caaacggaca tctttgcgta 421 acccgcgaac agatattcgt atatgtagat aacgagctca gcgcatcata tatgatcgac 481 gacttcgagg aatacgcctg cgaacagctt gttggctgtt caatgatggt cggccgtatt 541 gaagatgtcg ataaaatgcg tatatgctcc tttacacagg acaacttcat cgcatttgct 601 gaggtctgca agctgatcaa ccattactta accaccggag attttatcga taacagcgac 661 atcgatgagc ctaagtgcca taagtgcggt cttcctctgg atggctatgc cgagtgtcct 721 tattgctcat cgaagattca gatattctcg aagcttttta agcgtctgtt gccatataaa 781 aagcagtttg cgcttgcgat catgtgtacg attcttggtg aggtaacagc aattatctct 841 ccttatatca accgaatttt ggttgacgat tatgtaattc ctcaaaattc atcaaattgg 901 agcggcttcg gaattctttg cctttcaatg gtcgttattc tattgataaa tacggcactt 961 gaatggttga atatgaagtg cagttactat gtatcgctca acctgagcca ggatttgcga 1021 aaggatgtat tcaacaagac acttcatctt tcgatgtctt ctatatccaa gaagaccgcc 1081 ggcgagctca ttaaccgtgt atccaacgac gccaataaga ttcaaagctt cttgaccgat 1141 aacggtaagc acgcaatcgt tcgaattctt acacttgtaa ttacatcggt gattatgttt 1201 gtaatgaact ggcgcttggc attaatggca attgtgccga tcccgttggt tgttttgctg 1261 gtaaaaaagc tttacggcat cattcactca cacttcagcc gcgtatggag atataacaac 1321 ttctattccc gtcttttgca cgataccttg aacggcatcc gcgttgttaa gacctgcgga 1381 actgaagacg ctgaaattga gaagtataga gttgcttcaa agcgttgggc gggtgctgct 1441 tccgatgctg aagtaacatg gaacctcatt tggccgatta caaacttcct gcttacatcg 1501 ggacattacc ttgttctgta ctttggctca atgatgatcc tttcaaggat tccttcattc 1561 ggaacaatgt ctttgggcga attgattcag ttcaccactt atgtttcaat gctctataat 1621 ccgcttcgct ggcttatgca gcttcccaga tcctttgccg acttctctgt atctgccaca 1681 aaggtatttg aaattttgga agagcagaca gatgtcagag ataccgaaaa ctgcgttgac 1741 cttgatatca atggcgatat cgaattcgat cacgtatact ttggatataa ggtatataat 1801 cctgtactta aagacatcac ctgtaaaatt gatcagggca agatgatcgg tattgtcgga 1861 cactccggtg tcggtaaatc aacaatgata aaccttattt tgcgtctgta tgatgcaaca 1921 caaggttctg tgaagatcga cggagttgac attaagaata tatcccagga aagcttgcgc 1981 tctcaggttg gtgttgtatt gcaggaaact tacctctttg agggaagtat tcttgacaat 2041 attgcatatg caaa // LOCUS sequence262 2052 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence262 VERSION sequence262 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2052 /mol_type="genomic DNA" /organism="" /note="sequence262" CDS 321..974 /product="HD domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393194.1" /transl_table=11 /codon_start=1 /translation="MTYNEIRNNHEIIAYINKGNQNLDVMGYTDHSRAHCVLVLERAAK LLKAFDYSEHDIELVKIAGFMHDIGNAINRKHHAEYGALLANELLRDTEMPIEDRVTIV SAIGNHDESTGGAKDPISAALIIADKSDVRRNRVRHADLNFDIHDRVNYAVIESRLEID KENGIICLDLDIDESICSMYDYYEIFLGRMVMCRRAAEFFKCKFILKANGRKVL" /locus_tag="LOCUS_7590" /note="WP_011393194.1 HD domain-containing protein (Moorella thermoacetica) [pid:47.2%, q_cov:100.0%, s_cov:98.6%, Eval:3.1e-52]" /note="MGA_1068" CDS 1000..1833 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFYDSCPGVIRSLDAIENALKTEGNHFIDRLDGDKLIACAVINKN IVVMLCVHPDYRKRGIGSALFNECEDYARSLGCDHIQLFGFDDYITPGAPIYEGNWEFF VKRGYEHTWGDGECVDMMMELKDFHHTENKLGDTINGITYRRAVIADRDRVQECLMDAA DYFAPYYMDDALYDPENCEFPLIALDGDLVVGALLVGAEIEGDDLGTVGCTATRHSHRG RGVATNMVKLGTRWLKEQGLKNGYLGFTYTDIIPMYGNSGYSVSMKYFMGKKNLK" /locus_tag="LOCUS_7600" /note="MGA_1069" ORIGIN 1 ccggaccgtc ggttgtcggt tttgttgccg atgctgtcgg cggcaacctt aaacccggct 61 tggctgcggc aatggttttc ccaatcgtta ttttcgtcgg aatttccctt ttaaaatcaa 121 agaaggcgga ttaacaccgc tcctctgtga atagccttcc ccgtgagggg aaggtgtcag 181 cggatgctga cggatgaggt ggacgcgaac tgccgaattc tcaatcttcg tgtaaccaca 241 cgtgcgggtc ccctccattt gtcacctttg gcgacaaatg gcctccgccc cgctttaacc 301 aatctccaag gaggtctacc atgacttaca acgaaatcag aaacaaccac gaaataattg 361 catacatcaa caaaggcaac caaaacctcg atgtcatggg ctataccgac cattcgagag 421 cccattgcgt gcttgttttg gagcgtgccg caaagctttt aaaggcattt gattacagcg 481 aacacgatat cgagcttgtg aaaattgcag gctttatgca cgatatcggc aatgcaatca 541 accgtaagca ccacgctgaa tacggcgccc tcttggcaaa tgaactcctg cgtgatactg 601 aaatgcccat tgaggataga gtcacgatcg tttccgcaat cggaaaccac gatgaatcaa 661 caggcggtgc caaggacccc atttccgccg ctctaattat tgccgacaag tcggatgtta 721 gacgcaaccg cgttcgccac gccgacctca acttcgatat ccacgaccgc gttaattacg 781 ccgttatcga atcccgcctg gaaatcgaca aggaaaacgg catcatctgc cttgacctcg 841 atatcgacga gagcatctgc tcaatgtatg actactatga gatcttcctc ggcagaatgg 901 taatgtgccg cagagctgcc gagttcttca aatgcaaatt catattgaaa gccaacggca 961 gaaaggtgct ttaagattat gattgataaa atcatctagt tgttctatga ttcctgtccc 1021 ggcgtcatac gaagtcttga tgcaattgaa aacgccctaa agacggaggg caaccatttc 1081 atcgatcgct tagatggcga caagctcatt gcctgtgctg tgataaacaa aaacatcgtc 1141 gtgatgcttt gcgttcatcc cgactatcgc aagcggggaa tcggctcagc acttttcaac 1201 gagtgtgagg actatgcccg ttcgcttgga tgcgaccaca ttcagctctt tggttttgat 1261 gattacatca cccccggcgc accgatttat gaaggcaact gggaattctt tgtcaagcgc 1321 ggatatgaac acacctgggg cgacggcgaa tgtgttgata tgatgatgga actcaaggac 1381 ttccatcata cagagaataa gcttggagat acaattaacg gcatcaccta ccgcagagct 1441 gttattgctg accgcgaccg tgttcaggag tgccttatgg atgctgctga ctatttcgcg 1501 ccatattata tggatgacgc cctttacgac cccgaaaact gcgaatttcc gctcatcgcc 1561 ctcgatggtg acttggttgt cggagcgctt ttggtgggag ctgaaatcga aggcgatgac 1621 ctcggcacag ttggttgcac cgccacccgc cacagtcacc gtggcagggg agttgccacc 1681 aatatggtta agctcggcac tcgctggctt aaagagcaag gtctcaaaaa cggctacctc 1741 ggtttcactt ataccgacat tatcccgatg tatggtaata gcggttacag tgtaagtatg 1801 aaatacttta tgggcaagaa aaacttgaaa taatacatat aggacggtaa taaaaaatgc 1861 ttaaaagaac ctgcaagcaa tgcggaaaag agtttattct gactgaccag gaaattagat 1921 ttttcaaatc aaaaaacttg aatttgccca aacgctgcaa agactgccgc gccgctaaca 1981 agcaggcaaa ggttgaaact gcacctgtag ctgaaatcaa aaagcccgca accgcgccca 2041 agggcaaaag ta // LOCUS sequence263 2049 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence263 VERSION sequence263 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2049 /mol_type="genomic DNA" /organism="" /note="sequence263" CDS complement(742..1824) /product="aspartate-semialdehyde dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963351.1" /transl_table=11 /codon_start=1 /translation="MKQYKVGIICATGMLGQRFAVLLENHPWFKVTTLAASPRSAGKKY KDAVKKWLIEEKPMPESMADIVVMDATADIEKIAAQVDFVFCAVDMKKDEIKALEEAYA KLECPVVSNNSANRFTDDVPMVVPEINPEHIEVIEAQRKRLGTKRGFIAVKSNCSIQSY VPALHPLRKYGIKNVLACTYQAISGAGKTFETWPEMVDNLIPFIGGEEEKSEKEPLKVW GTLEDGKIKVATEPNITTQCLRVPVSDGHTAAVFVSFENKPSKEEILAAWKDFAGVPQE LELPSAPKQFLNYFEEDNRPQAKLDRNLENGMAVSIGRLREDSQYDYKFVCLSHNTLRG AAGGGVLMAELLAAKGYFDR" /locus_tag="LOCUS_7610" /gene="asd" /EC_number="1.2.1.11" /note="WP_010963351.1 aspartate-semialdehyde dehydrogenase (Clostridium) [pid:62.0%, q_cov:99.2%, s_cov:98.9%, Eval:1.4e-129]" /note="MGA_1072" ORIGIN 1 attacgccct tgccgcccaa cgacataata ggaacgatct gatcgtcatt tcccgaataa 61 accgccaagt catcgccgca catatccaaa acctttgcaa ccagcgaaag atttccgctt 121 gcttcctttg tcgcaacgat ctgcgggtgc ttactcagct ccctatatgt ttccgccgcg 181 atagaaaatc ccgtgcgtga ggggacgtta tatacaattg cgggcaggct gacatcctca 241 agcagcttct catagtgctt gatcagcccg tgctgagaag ttttgttgta ataaggtgtc 301 accaacagca aaccgtcggc gcctgcttct tcggcggcct ttgttgtacc tttgccataa 361 agcgtgtcgt tcgagcctgt ggagcatata atcggcacgc gcttgttgac ccgcttaaca 421 gcaaattcca tcagcttgcg gtgctcatct cccgaaagag tggcattttc gcctgtggtg 481 gcaacagcaa caattgcgtc ggtgcccttt gcgatctgcc agtcgataag ctcgccgtat 541 ttttcaaagt ttatacttcc gtcctcgtga aacggcgtta ctaaagcaac agccgcaccg 601 ctgaaaataa gttttttcat tcaaaataca ccctttcgca ttatttttta atatccaact 661 atataatagc aaaaaatcta aaaaaactca atgacttttg gggtacgatt tggttacgat 721 tcggaaacaa ttattcaact tttatctgtc aaaatagccc tttgctgcca aaagctcagc 781 cattaaaaca ccgccgcctg cggcacctct aagggtgttg tggctgaggc atacaaactt 841 atagtcatac tggctgtctt ctctgagtct gccgatagat acagccatac cgttttcaag 901 gttgcggtca agcttagcct gaggacggtt atcctcttca aagtagttaa ggaattgctt 961 gggagcagag ggaagctcaa gctcctgagg aacacctgca aagtccttcc aagccgccaa 1021 aatttcttcc ttcgagggct tattttcaaa gcttacgaat acagctgcgg tgtgaccgtc 1081 tgaaacggga acgcgcaggc actgtgttgt gatgttaggc tcggttgcaa ccttgatctt 1141 gccgtcctca agagtgcccc aaactttgag gggttccttt tcagacttct cttcttcgcc 1201 gccgatgaag ggaatgaggt tatcaaccat ttcgggccag gtttcaaaag tcttgcctgc 1261 gccggaaatt gcctgatatg tacaagccaa aacgttctta atgccgtatt tgcgcaacgg 1321 atgcaaagcg ggaacatagc tttgaatcga gcagttggac ttaaccgcaa taaatccgcg 1381 ctttgtgcca aggcgctttc tttgcgcctc aataacctcg atatgctcgg ggttgatttc 1441 gggaactacc atgggaacgt cgtcggtaaa tctgtttgcg gagttgtttg aaacaacggg 1501 gcactcaagc ttggcatatg cttcttcgag cgccttaatt tcatcctttt tcatatcaac 1561 cgcgcagaat acgaagtcaa cctgtgcagc aatcttttca atgtcagctg ttgcgtccat 1621 tacaacaata tcagccatag actcgggcat aggcttttct tcgataagcc atttctttac 1681 tgcgtcctta tatttctttc ctgcggaacg gggggaagct gctaaagttg taaccttgaa 1741 ccaggggtgg ttttcaagga gaactgcaaa acgctgtcct aacatacctg ttgcacagat 1801 aatacctact ttgtactgtt tcatttttaa tttccagcct ttctcttgtt taaatgttat 1861 aaaaaaaacc gactttacgc cggtcatcaa acaaaaatag ttttatttga cgatagctct 1921 ccatcttatg atgacaattg tacgcctgtt tgacggacaa ccagaattcc gtgcttcagc 1981 acacgcaacc ttcggcaata tcccctttca taatgacaac aggctgaact gttagcgtca 2041 ttactactg // LOCUS sequence264 2045 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence264 VERSION sequence264 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2045 /mol_type="genomic DNA" /organism="" /note="sequence264" CDS complement(76..729) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTDVAVGDNGIINILDYTTGRVFQYDKECNLLFIFGCDQEAQRGG FDNPNAVECHGEYIYVLDGRNNDITVYEETLFGEYVHEAVRMFNEGLYEDSLDLWNEVV KRDGNYNMAYTAIGRALLNQDKYEEAMKYFKVAFEDIDYYRAFEADRQDMLRDNFTLIV VLLVALVVVVIVISQLQKKGKIPKNLIKLGLGWVGKKLLVLWEKLIKLIKGGKK" /locus_tag="LOCUS_7620" /note="MGA_1075" CDS complement(754..1737) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTSMNIKKMLCVLVAVILSVTTLATAVFAEDPYTAYNYNAWSVAI PSQNGYIVCDTITGTEIGLDQLSDPNSPLFISETEPNKLSDAKDFFLSPNNEFFIVDTG NNRIIHTDFNFKLIGCYKTFTGSKLTEEVTDEVTGETTTQPVLGLKSPYGIFVDEDDIM YISDRDNQRVIKCGLDCEIITEYTRPDTQLYDSVSFYCTKVLVDAAKNVYVICPAVNKG AIMFSPSGAFVGYYGANRVEVTAEVIRNKLWRKFASEEQRASLVISTPVEYANFDIDHE GFIYTVTEVADVSTDAVKKLNPAGYNILEATTNAANMTFGDQQSIT" /locus_tag="LOCUS_7630" /note="WP_012583939.1 YIP1 family protein (Dictyoglomus turgidum) [pid:30.6%, q_cov:91.7%, s_cov:38.3%, Eval:1.2e-28, partial hit]" /note="internal stop codon at [754:756](-)" /note="MGA_1076" ORIGIN 1 tgagatcctc atatccctca aaggggtgga agatgacatg cttgagccat tgcacgggcg 61 tcatatcata aatcattact tcttacctcc tttaataagt tttatgagct tttcccaaag 121 aacgagaagc tttttgccga cccagccaag accgagctta attagattct tgggaatctt 181 gcccttcttc tggagctgag aaataactat aactacaacg acgagtgcga cgagcaaaac 241 aacgatgagt gtgaagttat ctctgagcat atcctgacgg tcagcttcaa atgctctgta 301 atagtcgatg tcttcaaaag caaccttgaa gtacttcatt gcttcctcat atttatcctg 361 gttgaggagt gcgcgtccga tagcggtata agccatgtta tagttaccgt cacgcttaac 421 tacttcgttc caaaggtcga gggagtcttc atataagcct tcgttgaaca ttctaactgc 481 ttcgtgaaca tattcgccga agagggtctc ctcatatacg gtgatgtcgt tgttacgtcc 541 gtccaaaaca tagatgtatt cgccgtggca ttcaacagcg ttggggttat cgaaaccgcc 601 gcgctgagct tcctggtcac atccgaagat gaagagcagg ttgcattcct tgtcatactg 661 gaatacacgt ccggtggtgt agtcaagaat gttgatgatt ccgttgtcgc cgacagcaac 721 gtcggtcaaa cgagttgcat atgtggtgac ggactatgta atggactgct ggtcaccgaa 781 tgtcatgttt gcggcattgg tggtagcttc caaaatgtta tagccggcag ggttgagctt 841 tttaacggcg tcggtcgaaa cgtcagcaac ttcggttacg gtatagataa agccttcgtg 901 gtcgatatcg aagtttgcat attcaacagg agttgaaatt acgagggacg ctctctgctc 961 ttcagaagca aactttctcc aaagcttgtt tctgataact tcagcagtta cttcaacacg 1021 gtttgcgccg tagtatccga cgaatgcgcc ggagggcgag aacatgatcg cacccttgtt 1081 aactgcaggg cagataacgt atacgttttt ggcggcgtca accaaaacct ttgtacaata 1141 gaaggataca gagtcataaa gctgagtatc gggtcttgta tattcggtga tgatctcaca 1201 gtcaaggccg cacttgatta ctctctggtt atctctgtcg gagatgtaca taatgtcatc 1261 ttcatcaaca aagatgccgt agggcgactt gaggccgaga acaggctgtg ttgtggtctc 1321 acctgtaact tcgtcggtaa cctcttcagt cagctttgaa ccggtaaagg tcttgtaaca 1381 accgataagt ttgaagttaa agtctgtgtg gataattctg ttgtttcctg tatcaacaat 1441 gaagaattca ttgttggggg aaaggaagaa gtctttagca tccgaaagct tattaggctc 1501 tgtttcgctt atgaacagag ggctattagg atcggaaagc tgatcaagtc cgatctcggt 1561 accggtaatc gtatcgcaaa cgatgtaacc gttctgagag ggaattgcaa cgctccaagc 1621 gttgtagtta tatgctgtgt acggatcttc tgcgaacact gcagttgcca atgtggtaac 1681 cgacagaatt acagcgacca gcacacaaag catcttttta atattcatac tcgtcaccgc 1741 ttttcacctt tcatttaata attgaattaa catgggttta gtccttcata cctgagttag 1801 ccatggtttc cataacgtta ctctgagcaa tgaggaatat gacaagcgga ggaatcatga 1861 gtacaaccgc ggatgcatag atgataccct gacgggcaat accggatgca gcgatctgtg 1921 acatgatggt gggaagagtc ttgaggtctt cctgatatac gagcgcgccg ccctgtacgt 1981 tccatgcagc ctggaatacg aagatgataa gggttgcgat agcaggcttc tggttgggaa 2041 ttaca // LOCUS sequence265 2034 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence265 VERSION sequence265 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2034 /mol_type="genomic DNA" /organism="" /note="sequence265" CDS 212..1540 /product="MATE family efflux transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009902958.1" /transl_table=11 /codon_start=1 /translation="MEIKLSDRFSYKKLLRFTLPSIVMMIFSSIYGVVDGFFVSNFVGK TPFAAVNFIYPFIMVLGAFGFMFGTGGSALIAKTMGQGNKEKANSLFSLFVYISTATGV VIGALGFIFVGPVAKALGAEGELLENCIIYGRIILAAMPAFMLQFEFQSFFITAEKPQL GLVSTVASGVTNMVLDALFIALFHWGLVGAALATAMSQVVGGVIPLIYFSCRNTSLLRL GKTEFDVKALLKACTNGSSELMGNISMSLVSMLYNAQLMTYAGENGVAAYGVLMYVNMI FLSLFIGYSVGTAPIIGYHFGAQNHAELKSLLKKSLVIIGISSVAMLAMGEILAKPLSL IFVSYDPTLLDMTLRGFAIYSFSFLFAGIAIFGSSFFTALNDGLTSAIISFLRTLVFQI AAVIILPIIWELDGIWASIVVAELMAALMTVLFIIGKRNKYHY" /locus_tag="LOCUS_7640" /note="WP_009902958.1 MATE family efflux transporter (Clostridioides difficile) [pid:60.2%, q_cov:99.5%, s_cov:99.8%, Eval:3.6e-157]" /note="MGA_1078" ORIGIN 1 ataacagaaa atctatcgta tttcaatata tcttttgcac tctttttaaa caaaaatgtg 61 aaaattacac aaatttcgta aaattctgca aatccatctt taaggtttac aaactacttg 121 catttatttt attttcgtat ataataatag ttgaacggcg gctgttaaaa tcaaacgccc 181 atctttatat acttttgaaa gcgagatgcg tatggaaatt aagctttccg accgtttttc 241 atataaaaag ctgttaaggt tcaccttgcc gtcaattgta atgatgatct tttcatccat 301 ttacggcgtt gtggatggct tttttgtttc aaactttgtc ggcaaaacgc ccttcgcggc 361 agtcaacttc atatatccct ttataatggt cttgggtgcc ttcggcttta tgttcggcac 421 gggcggaagt gccttaattg caaagaccat gggccagggc aacaaagaaa aagcaaacag 481 cctgttttct ttgtttgtat atatttcaac tgcgaccggt gttgttatcg gcgctttggg 541 tttcatcttc gtcggacctg ttgcgaaagc gcttggcgcc gaaggggagc ttctggaaaa 601 ctgcatcatt tatggcagaa taattttggc ggcaatgccc gcatttatgc ttcagtttga 661 attccaaagc ttctttataa ccgcagaaaa gccccagctc ggcctcgtgt cgaccgtcgc 721 atccggcgtg acgaatatgg ttttggatgc cttgtttatc gccctattcc attgggggct 781 ggttggcgcg gcccttgcga cagcaatgag tcaagttgtt ggcggagtca ttccgctaat 841 atatttctcg tgcaggaaca caagtcttct tcgcttgggc aaaaccgagt ttgacgtcaa 901 agccctactt aaagcctgca ccaacggttc cagcgaactt atgggcaaca tttcaatgtc 961 actggtaagt atgctttata acgcacagct tatgacatat gcaggtgaga atggcgttgc 1021 ggcatacgga gttttgatgt atgtcaatat gatcttcctt tcgctcttca tcggctattc 1081 tgtcggcacg gcacccataa tcggctatca cttcggtgcg cagaatcacg cagagctgaa 1141 aagtcttttg aaaaagagcc tcgtcataat cggaatcagc tcggttgcga tgcttgcaat 1201 gggcgaaatt ctggcaaaac ccctttcgct catatttgtc agctatgatc ccacgctttt 1261 ggatatgacg cttcggggat ttgcgatata ttcgttttca ttcctctttg cgggaattgc 1321 aattttcggt tcgtcattct tcaccgcgct taacgacggt ttgacatcgg caataatctc 1381 gtttttaaga acacttgtct tccagatcgc cgcggtaata attctgccga taatttggga 1441 gcttgacgga atatgggcat caatcgtggt tgccgagctt atggcggcgc tgatgacggt 1501 gctgttcata atcggaaaga gaaataaata tcactactga ggacgtgaga aaatgagcaa 1561 aattaaagct gtgcttttgg atattgacaa caccattctc gattttcacg agggtgcgcg 1621 ttctgcgatg ctttcagcgg caaatgaatg gggaatcatc tttcccgaga actattttga 1681 aacattcctc acgatcaaca atgccctttg gcatcgaatt gagcagggtg acttgacccg 1741 cgaggagctt ttcaaaatcc gctggccgtc gatatttgaa gcacttggta ttgatgcaaa 1801 cggtatcgaa tttgagaaag acttccgagc aaacttaatg tatgcggccg agcctgtcac 1861 aggcgctaag gatatgctcg attatctgta tggaaaatac cctatctatg ccgcgacaaa 1921 ttcgctatat gctcagcagg tgaccagact tcagaaggcc ggctttattg aatatttcag 1981 cggaatgttc gtgtctgaga agatcggcgc gcaaaagcca tcgcaggtgt ttta // LOCUS sequence266 2032 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence266 VERSION sequence266 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2032 /mol_type="genomic DNA" /organism="" /note="sequence266" ORIGIN 1 atggacacta tcgaaaatac ctacgttttc aagtggttct atgatatcga cctcaccaga 61 ttcggctgat tttaagttaa tataagcaaa tacattttgt cagatattct gacccgcatt 121 tttaggagaa attattatga tgttatgttc aaggtgcaaa aagcgccctg ctgctgtatt 181 tatcacaacg atgaacggca acgaaaagaa aaacgaaggc ttgtgctttg cctgcgcaaa 241 ggagcttggc attacgcagg ttgacgatta tttgaagcag atgggcattt ccgaggaaga 301 gctggaagcg atgagcgaac agcttatgag tgagcttgac ggcgattcat ttgagatggg 361 cggaaacgaa acgatgccta atttcttgac aaatctgttg ggcaaattcg gaggaaacaa 421 cgcttctcag ccttccaata atgctgatgc tcccaagtcg gataaaaaat ccgacaaaaa 481 agcaaacaag gaaaaggaac tgaagtttct gacaacatat tgcaccaact taaccgagcg 541 tgccgcacag ggtaagcttg ataatatcat cggccgtgac cgagaaatcg gcagagcggt 601 tcagattctt tcacgcagac agaaaaacaa cccgtgcttt atcggcgaac ctggcgtcgg 661 aaaaaccgct attgccgaag gtatcgctca aaagatcgtt gcaggggatg taccctttaa 721 tcttaagaac aaacagctat atcttttgga cttaactgcg cttgttgcag gtacacagtt 781 ccgcggtcag tttgaaagcc gaattaaagg tcttatcgaa gaggtcaagc gagagggaaa 841 tgtcattctt ttcattgacg aagtgcataa ccttgtcggt accggcgatt cagaaggcac 901 aatgaatgcc gcaaatatcc tgaagcctgc gctttcaaga ggcgagcttc tggtcatcgg 961 cgccaccacc tttaaggaat accgcaagta tattgaaaag gattccgccc ttgagcgccg 1021 attccagccg ataactgtca ccgagcctac ggtcgatgac actgttgaag tattgttcgg 1081 cattagaaag tattatgaag gatatcatca cgttaaaatt tccgatgcag cgctcagaat 1141 gtgcgctgtt ctgtcggaaa gatatattaa tgaccgtttc ctgcccgaca aggcaatcga 1201 ccttttggac gaaagctgtg cttgtgctgc gatcagaagc cccgaaattg caaaggcatc 1261 tgctttgaga tcaaagcttg aagaccagtg cataggtctt tccgaacttg aatctgcaga 1321 agaacccgat tatgagagca ttgcaaaact aaaggctgaa atctccaaaa ctgaggcaga 1381 gctggcatct gctgaggcgg aagctgataa ggtctgtgta tccgaagagg atctttctaa 1441 ggttattgag ctttggacgg gcattcctgc aaataagatc gttgagtcgg aatacgaaaa 1501 gatccgttcg cttcacgcgg cactttcaaa aagaattatc ggtcagcctg aagcggttga 1561 gcttgtctgc aatgcagtta agcgctcgcg tgttcagctt tcatctcgcc gcagacccgc 1621 atccttcata tttgtaggtc caacaggtgt cggcaagact gaacttgcaa aaactttggc 1681 agcagagctg tttgatgcaa cagagccgct catcaaaatt gatatgtcag aatatatgga 1741 aaagcatacg gtttcacgtc ttatcggctc gcctcccggc tatattggat atgacgaagc 1801 ggggcagttg actgaaaagg tccgccgaaa gccatattct gttgttctgt ttgacgaaat 1861 tgagaaagcg cacaaggatg ttatgaacat tctcttgcag attcttgacg agggcagggt 1921 aaatgatgcg cagggcagaa gcgtatcatt tgaaaacaca gttattatta tgacctctaa 1981 tgcgggttca acagaccaat cgggcggaat tggatttgat aagtcagtcg ca // LOCUS sequence267 2005 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence267 VERSION sequence267 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2005 /mol_type="genomic DNA" /organism="" /note="sequence267" CDS 149..532 /product="desulfoferrodoxin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004453642.1" /transl_table=11 /codon_start=1 /translation="MCENSRFYICEHCGNIVGMIHSSGVNPVCCGQKMTKLEAGTVEAS REKHIPVVSVDGNTVKVVVGSVAHPMTEEHSITWVYLQTDRGGQRKCLNAGEAPEVTFA LADEKPVAVYAYCNLHGLWKADI" /locus_tag="LOCUS_7650" /note="WP_004453642.1 desulfoferrodoxin family protein (Clostridioides difficile) [pid:57.8%, q_cov:100.0%, s_cov:100.0%, Eval:2.2e-40]" /note="MGA_1081" CDS 567..725 /product="rubredoxin" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003688501.1" /transl_table=11 /codon_start=1 /translation="MKYVCNVCGWVYDEELGAPDMGIAPGTKWEDLPDDFECALCGVDK DNFSPEE" /locus_tag="LOCUS_7660" /note="WP_003688501.1 rubredoxin (Neisseria) [pid:63.8%, q_cov:90.4%, s_cov:83.9%, Eval:7.0e-15]" /note="MGA_1082" CDS 791..1543 /product="ZIP family metal transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011144264.1" /transl_table=11 /codon_start=1 /translation="MKLVLLTALGVGGATVIGALLGFVFKKLSHKFSDIVLSFAAGVML AAAVLGLVLPSLEYGRKYGLIVTVAGIFAGALCLNLIDKLVPHLHKMVGPDIESHENSS LDKVLLFVTAIAIHNLPEGIAAGVGFGSGDVSQALIIAGGIALQNIPEGMVIIGPMLAA GVKPRTTFWLAMITGLVEVVGTLIGYFAVSISSAILPFALAFAGGTMLYVISDEMIPET HAHGSERGATYSLLAGFCVMLITDVLLG" /locus_tag="LOCUS_7670" /note="WP_011144264.1 ZIP family metal transporter (Gloeobacter violaceus) [pid:40.2%, q_cov:97.2%, s_cov:95.8%, Eval:7.8e-48]" /note="MGA_1083" ORIGIN 1 aatgcttgaa aagagcgtaa acctgacata tacagaagca acagtcaaaa ttctctcggc 61 acttaatgcc gaaaacgaag ctcagctcga ggctttggca gacgagctgt gcaaataaca 121 aatatttaaa tttttggagg taattattat gtgtgaaaac tcaagattct acatttgtga 181 gcattgcggg aatattgtgg gaatgatcca ttcgagcggc gttaaccctg tttgctgcgg 241 tcagaagatg actaagcttg aagcaggcac cgttgaggcg agccgtgaga agcatattcc 301 cgttgtatcg gtggatggaa acaccgttaa ggtcgttgtc ggttcagttg ctcaccccat 361 gaccgaagaa cacagtatca cctgggtata tctgcagacc gacagaggcg gacagagaaa 421 gtgtctgaat gcaggggaag ctcccgaagt gacctttgct ttggcagacg aaaagcctgt 481 ggctgtatat gcttactgca atcttcacgg attgtggaag gctgatatat aaacaaaaat 541 caacaaaata ttaggaggaa ataattatga aatatgtatg caatgtatgc ggatgggttt 601 atgacgaaga attgggtgct cccgatatgg gcatcgctcc cggcacaaag tgggaagatc 661 ttcccgatga ttttgaatgc gctctttgcg gcgtagataa agataacttc agccctgaag 721 aataatttgc tttttcgctc ccgtgctgag ttttcggcgc gggagcattt ctttaaagga 781 gcattagttt atgaaacttg tattgctaac agctttgggt gtcggcggag caacggtgat 841 cggcgcactt ttaggctttg ttttcaaaaa actatcccat aagttttccg atattgttct 901 gtcctttgct gcgggagtaa tgcttgcggc ggcggtattg gggctggtat tgccctcgct 961 tgaatatggc aggaaatatg gacttatcgt tacggtcgcg ggtatatttg caggcgccct 1021 ctgcttaaat ttaatagaca agctggtgcc ccatttgcac aagatggtgg gacctgacat 1081 cgaatcgcac gagaattcat cccttgataa agttctgttg tttgtgacgg ctattgccat 1141 acataacctg cccgagggca ttgccgcagg tgtcggcttc ggttcgggag atgtttcaca 1201 ggcgctgata attgcaggcg gcatcgccct gcagaatatc cccgagggaa tggtaataat 1261 cggtccgatg ctggcggcag gtgtgaaacc gaggacaacc ttttggcttg caatgattac 1321 agggctggtc gaggtggtcg gaacgcttat cggctatttt gcagtcagca tatcaagcgc 1381 aattctgcca tttgctttgg catttgcggg aggcacgatg ctatatgtca tcagcgacga 1441 gatgattccc gagacccatg ctcacggaag cgagcgcgga gcaacatatt cgttgctggc 1501 gggcttttgc gtaatgctca taaccgatgt tttgcttgga taaccgaccc ccttgggccg 1561 gttttttcat cttgagtcat agggacaaat atggtataat tgttttaata ttaatggatc 1621 aggaggcaca ctgatgtatt gtttgcagaa tcgctggaaa tttgaaggca aaaaacttgt 1681 atattacggt ctgagaagcg ggaaaaatat gcttaaaaac gaaattcttc tttcgcgcag 1741 gcaggcggat attattgcat ctttgccttg cgagcttggc gacgaggaaa agttggcttt 1801 gaaaaagctt ttggatgtct gcgtggttga aaaagaccgg cttcgcccga tccctcagtc 1861 tatagatgaa gcgagatttt gcaataattg ctgtgccaat gattttatca tccccgggtt 1921 ggagtttgac agtgacggac tttgccctat gtgtcaaacc gctgacgatg tccgcgactt 1981 gaaaagtgtg gtgcctttgg ttgat // LOCUS sequence268 2001 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence268 VERSION sequence268 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2001 /mol_type="genomic DNA" /organism="" /note="sequence268" CDS complement(880..1356) /product="sigma-70 family RNA polymerase sigma factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459411.1" /transl_table=11 /codon_start=1 /translation="MNNQEYERLVKLHIDSVYRVALNGCQNPHDAEDIVQSTFMKLLER KDSFNDDDHARRWLIRVCVNECKNLWRSPWRSRTTSLEDIFQEPIFSSPEKSELYYAVN ELPAKYRTLVYLYYFEGYTVKEIAAIMSISETAVQTRLYRARAHLKDRLKEAWQ" /locus_tag="LOCUS_7680" /note="WP_011459411.1 sigma-70 family RNA polymerase sigma factor (Desulfitobacterium hafniense) [pid:41.3%, q_cov:87.3%, s_cov:78.6%, Eval:3.7e-25]" /note="MGA_1086" ORIGIN 1 agaacatatt gtcgatcgac tcggcgattg ccttgatttc ttcgacagtg agtgtattct 61 cctcgacata ggagtagtca ccttcttgat caaacagtga tgcccaagaa atcatcatta 121 ccttatattt ttctccgaca aacagatatt gtctatacaa acagcggtct tccttgagca 181 tatcgtaata gtagatgtca actctgccgt catccgtctg ttcgtgatat agttcaccat 241 cgtgggcgat cacaagatca gattcgttat aaagctcctg cagataaatc catataccct 301 ttgtccagaa atcttgatca attccctctt ttctgaattt tcctccgcga tagttataat 361 ctgcatttga gctcaatgtt gctccaggtt cttgctcgcg ttcttccaaa gtaattccct 421 ctatgctata aagttcaaag tcctcgggaa cggcaatctt ttctgggtcg atgatgttcg 481 gaatatcaaa gagaaaatct tcaaccggat atggagtgag ataatgctta tactcttcct 541 taacctcatg gccgacgata attccgttgc cgtcatcgcc tgcaagaact ccgtctgtgc 601 cgtcgatgtg tccgtaaatc gggtcataga aagtatcatg gaccgcgttg ccgaacataa 661 cgtccctact gaaatcgacc ttatatgtcg caacagtgac aagtgtcgcc gccaaaacca 721 atgtgagtgc cgccgcaatt attacaacct ttttaacaac tttgggtctt gccttatttt 781 cattattcgc tgtcatattt aacacctttc cgactaaagc agacggcgcc ttaatttcgc 841 tgaaagtatc cttgaaatac tccctgtttc gttcatcatt cattgccatg cctcctttaa 901 tctgtctttt aaatgcgctc ttgcgcggta aagtcttgtt tgaacagcgg tttcggagat 961 ggacataatc gccgcaatct ccttaacggt gtaaccctca aagtagtaca gataaacaag 1021 cgtgcggtac tttgccggaa gctcgttcac tgcataatac agctcgctct tctcggggga 1081 tgagaatatc ggttcttgaa aaatatcttc aagcgaggtc gtgcgactgc gccagggcga 1141 gcgccaaaga tttttgcatt cattgacaca gaccctaatc agccagcgcc ttgcgtggtc 1201 atcatcgtta aagctgtcct tgcgctccaa tagcttcata aacgtgcttt gcacgatatc 1261 ctcggcatcg tgagggtttt ggcaaccgtt aagtgcaacc ctataaacgc tgtcgatatg 1321 gagcttgacc aagcgttcat attcttgatt gttcaaactg tcttcaccac tttcgaaagg 1381 cctttcacca tatgaacgga tttaaaggcg ggaatatcac aaggggaaaa ttattttttt 1441 gaggggagcg gagcgccgtc tgcgagcgcg ttacgcagga acagtgccgc aggtggcgcg 1501 gagcggtggg gcaagcatcc gacctgcaaa tcctctccca ttgggagagg tggcacgcgc 1561 agcgtgaagg agagggcaac aaacaaggcg cgaggcaaag ccccacgccc gagtgtatat 1621 tatttttcca aagtgccgtt tgaaagcgcc ttgagatatg cgttgatgaa accgtcaagc 1681 tcgccgtcca taactgcgcc gacatttccg ttttcatggc ctgttctgtg gtccttgaca 1741 agggtatagg gcatgaaaac atatgaacgg atctggctac cccatgcgat ctccttttgt 1801 acgcccttga tatcctcaat tttggaaaga tgctcacgct ctttaatttc aacgagcttt 1861 gcaatcagca tcttcattgc atagtccttg ttctgaacct ggctgcgctg ggtctggcaa 1921 gcggttacga tgcctgtagg gatatgagtg atacgaacag cagaggatgt tttgttaata 1981 tgctgtccgc ctgcgcccga t // LOCUS sequence269 1997 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence269 VERSION sequence269 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1997 /mol_type="genomic DNA" /organism="" /note="sequence269" CDS complement(185..1939) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSVTQTIINNMLKNGILEDYSYETFRTPEYSSSGFASPDDIILND EQQAAYDGIFKLICEGKPAGALLHGVTGSGKTAVFIKLIDSVIKSGKGAMLLVPEISLT PQLVGKFKTMFGDTVAVIHSSLSLGQRLDEFKRIKRGDAKIVIGTRSAVFAPLKNISLI IMDEEGESSYKSEASPRYHARDVAIHRAGIHNSVLLMASATPSLESYYFAKSGRYSLFE LKKRFNNSSLPQVVVADMATEAEFGNSGFFCSDLIRSVGEAVKDGKQAILLLNRRGYNT TITCHSCHEPVKCPNCSIPLTYHKANGKLMCHYCGYSAMFNSTCPDCGSKLVKASGLGT QLLEEELEHAFPNARILRLDADTTYSRYAYEQKFKAFENGEYDIMVGTQMIAKGLDFPN VTVVGVISLDNSLFAGDYRSYERTFSLLTQVVGRGGRGEHKAVAYIQTFVPDHHIITLA SDQDYVGFFEQEVALRKELIYPPFCDICAVYFTSPIELDALRASSAFLDMMKQRLGNVK DKFPLRVLGPARSRQGRINNRYKYVLTLKCRNSKVFRSFISELLIAASKDKRFSNVRVY ADINGDIN" /locus_tag="LOCUS_7690" /note="WP_003232079.1 primosomal protein N' (Bacillus) [pid:41.5%, q_cov:98.1%, s_cov:70.4%, Eval:1.7e-131, partial hit]" /note="MGA_1089" ORIGIN 1 aattccaacc tggggcgcgg caagaccgac gccgtcatca tcgtacattg tatccttcat 61 atcgtcaagc aactgccaaa gtcttaagtt aaacctatcg acaggcttac aaaccttcaa 121 aagaatgggg tcgccatcct tgacaatttt tctaatagcc ataagtattt acttcctttc 181 aaaatcagtt gatatcgccg ttaatgtcag cataaactct aacatttgaa aatcttttat 241 ctttggatgc tgctattagt agctctgaaa taaagcttct gaacactttt gagttgcggc 301 atttaagcgt taaaacatat ttatatcggt tatttatccg tccctgtctc gaccttgcag 361 ggccgagaac acggagcggg aatttatctt taacgttacc aagtctttgc ttcatcatat 421 ccaaaaaagc gctggaagcg cgaagtgcat caagctcaat tggcgaggtg aaatacacag 481 cgcaaatatc gcaaaaaggc ggatatatca gctcttttct cagagcaact tcctgttcaa 541 agaaacctac gtagtcctga tcggatgcca gagtgattat atgatgatcg ggaacaaagg 601 tttgaatata tgcaacagct ttgtgctctc ctctgccgcc tcttccaacc acctgtgtta 661 gcagagagaa tgtgcgctca tagcttctat aatcacctgc aaagagcgag ttatcaaggc 721 tgatgactcc cacaactgtt acattgggaa aatcaagacc ctttgcaatc atctgggtgc 781 cgaccataat gtcatattcg ccgttttcaa aggctttaaa tttttgctca taagcatacc 841 gagaatatgt ggtatcagca tccaaacgca aaattcttgc gtttggaaaa gcgtgctcaa 901 gctcttcttc gagaagctgt gtacccaagc cggaagcttt aacaagttta cttccgcaat 961 cgggacaagt ggagttgaac atcgcagagt atccgcaata gtggcacatc agcttgccgt 1021 tggctttgtg atatgtcaaa ggaattgaac agttgggaca cttcacaggc tcgtggcaac 1081 tgtggcaggt gatggtcgtg ttgtatccgc ggcgatttaa aagcaaaatt gcctgtttgc 1141 cgtccttaac tgcttcaccg acacttctta ttaaatcaga acagaagaag cccgagttcc 1201 cgaattccgc ttcggttgcc atatctgcaa caacaacttg cggaagcgaa gaattgttga 1261 accttttttt gagttcaaaa aggctgtatc tgccggactt ggcaaagtag tatgattcaa 1321 gagagggcgt tgcggaagcc atcaaaagaa ccgaattgtg gatacccgct ctatgaatcg 1381 caacatcgcg agcgtgataa cgtggcgagg cttcgctttt atatgaggac tccccttctt 1441 cgtccataat aatcagagaa atatttttga gcggtgcaaa aactgcgctt cgggtaccga 1501 ttacgatttt ggcatcgccg cgcttgatgc gcttgaattc atctaaacgc tgacctaacg 1561 ataaactcga gtgaatcacc gcgacggtat cgccaaacat tgttttgaac ttaccaacaa 1621 gctgtggagt cagcgaaatt tcaggcacaa gaagcattgc acctttgccg gatttgataa 1681 ctgagtcaat cagctttata aatacagctg ttttgccact tcctgtaact ccgtgaagca 1741 gcgcacctgc aggcttgcct tcgcagatca gtttaaaaat gccgtcatat gccgcttgct 1801 gttcgtcgtt gagtataata tcatcaggag aagcgaaacc gcttgacgaa tactcaggtg 1861 tgcggaatgt ttcgtaggaa tagtcctcca aaatcccgtt tttgagcata ttgttaatga 1921 tcgtctgggt gacgctcaaa atatagcaag tttccttgat agatgcactt tcgttttcct 1981 aaagaaactc gataaca // LOCUS sequence270 1996 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence270 VERSION sequence270 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1996 /mol_type="genomic DNA" /organism="" /note="sequence270" misc_feature complement(561..>1996) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012584062.1:endo-1,4-beta-xylanase" /note="WP_012584062.1 endo-1,4-beta-xylanase (Dictyoglomus turgidum) [pid:38.7%, q_cov:71.7%, s_cov:31.1%, Eval:2.7e-60, partial hit]" /note="MGA_1091" /locus_tag="LOCUS_7700" ORIGIN 1 tgcttcgaga gcagcttcat aaacgcctgc acaaggaaca acgtaatcgt cataaccggt 61 agccttgatg gttacgtcag agatctcata cttgatggtg gtcttgtcac cgataactgc 121 ctgagtctgg ccaatggtac cgtcaagaat ctggatacca tactggtaag aaccgccgtc 181 agcagtggta atagtcttcc aagcttcgcc ggtgtaaaca acagtcttgg tttcgccgag 241 accgatctga ttctcaacac ctgtagcgtc cttcaaaggg gtccaaacag cgtagttagg 301 ggtatcctgt gcccaaacct ggggctggat gtgaatgtag gatgtatcaa cagcacagac 361 ggaaactgtc ataacagcaa cgagcgcaac tgccaatacg attgacataa ttctcttcat 421 aatgttttcc tcctaaaaaa tagtggtatt aaaccattta aagtttagca catgaaaata 481 ttaaagtcaa tatataacaa aacaaactgt catatacaca agaatatagc tagttttttg 541 tgcaaattaa catattttag ttattcaagc accaaagaca ggacttccca gtatgtcgat 601 ttgaaaccat tattgcgatc aattaagaat gggtgattta cacggcctgc agggctgttg 661 ttaagccaag agtgatcatc gttgatgccc cagaatacaa ctgtgtcaat aatgccttct 721 tcggataatt ccatgaaaag cttgaatgct tcaacgtagg ttttgttata ctgcttcata 781 aagctgtcat tcagatcaac tttaagggaa ttatcattcc aaacgaaaca gctcatatcc 841 atttcggtta tctcaatagt gaaaccgggg ttatactttc tcagttcggc taacttttca 901 agatttcttc ttaatgtgtt tatgtcggtg ttatatgcaa tatgcatctg cagaccgaca 961 ccgtcaacct gaatgccgtc ctgaagcatt gatttaacga ggttatatac tccgtttacc 1021 tttgcagagc tccattcaag gttataatcg ttgataatca gctttgcatt tgggtcagcc 1081 tttgaagcgc aaatgaacgc ctgctcgatg tagtcatact tatcgccgtc gccgtcgtaa 1141 tcccctacta tctgcagcca cttggagtca cgcagagttc cgtcatcgtt aaacacttca 1201 tttacaacat cccaagtgtc gattttaccg gcatagcggg aaacgatcgt ggtaacatgt 1261 tcatcaattc gatccataag ctgttttgcg gttgcctttg ttccgcttgt gcccgattta 1321 tagaagaacc aatcgggaca ttggctatgc catacaagag tgtgtccgcg aagagcaaca 1381 ccgtattttt cgccaaactc aacaaactta tcaacgtttg agaagttata tttattctcg 1441 ctggggtgca tagcatcagg cttggattca ttctcaagag tgaaaatgtt gaactgtttc 1501 atcatcgaaa caaaatcatt actgttcttg ttgttgaaat accaagtgtt gacagcagca 1561 cctaccttga agtggtcagt aaacgcttca tagagtgaag gggcgttatc atcatatgta 1621 tgcttggctt tttgcatagt gttgagctca gactttttgt attcatagtc agagccatac 1681 atttcagcag caaggccttc ggcaacaccg tcgttattcc aatcctgaga agtatatgca 1741 ggaatatact cgccgactgt aatggtgacg atatattcaa agtcgattac acctgcatca 1801 gcgctgaagg catagggatt taaaattaca gcatggacgc tgtcatcaag atcgcaggaa 1861 agcaatgctg ttcctttttc gaaatctgcg gtggtttctg cgccgttgtc accgcgtgaa 1921 ttccaatgga gctcacattt aggcgatgca ctgttccaac atttatcggt gttagatgca 1981 gtaattttga tctcaa // LOCUS sequence271 1966 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence271 VERSION sequence271 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1966 /mol_type="genomic DNA" /organism="" /note="sequence271" CDS complement(338..1642) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTNLQLFELISDIDSSYIIAAARPVRRYNMSKWTKIGGVAACLCL IIAGIFAVSSSFSDRIPLPIDPEQTTASTDILNGEVTLGDDTVNSLPVLSIDENSLFGG GMGFEGLMYRDISEVQNGNPWNEETQLETLPVYKNLGYSYHGVQNYLESDEMVARVKET AKLLGIEITDWDFGIVFSQIGENEFLDETTYAEGANADIKIRAFANGDVFINYEKAREL PDSINFTRESTTHEDGLIALEYLSGEYAEFMNYTETECTTINGDYNIYGEQQKRDYIIY EGSGDYAEDIVNYNLNYTEFVPEFGGEQGELDTGNLGDVRRYDHLVCAEKVGDYPLISA DEAEELLFSGIYLTSVPHDIVETDIVAKVELVYTKGVTSQYFMPVYKFYIPLSGRENGH NFDRSNGLITFGIYYVPAISGEYIADMPTSAGRFN" /locus_tag="LOCUS_7710" /note="MGA_1092" ORIGIN 1 ccccgaagcg atggcgtcaa gtcaaaaaaa taaaccccgc cccacacaat gggacgaagt 61 cactcgcggt accacccaaa ttcgccgaaa acagtttcag cctcataagc cttaacgcgg 121 caaacgtcac ggttttccgt gaagctcagg ggtagcaccc gacaagatca tttcatgctt 181 acaccaaccg catgatctct ataaatgcct tttgttcggt cattcccgtc aacgcttgtt 241 aataaaatta ttataatctc ggatatctga tttgtcaagg gtttgagtgc gaatataaat 301 gcaaaaaggc agggtttcct gccttgtctg cattatgcta attgaatctt cctgcactgg 361 tgggcatatc ggcgatatac tcgcccgata tcgccggaac gtaatagatt ccgaaggtta 421 taagcccgtt gctccggtcg aagttgtgac cgttttccct gcctgaaagc gggatataga 481 acttatatac aggcatgaaa tattgcgatg tgacgccctt tgtgtaaaca agctcaacct 541 ttgccacgat gtctgtttca acaatgtcgt ggggcacaga tgtcaaatat ataccgctga 601 acagaagctc ttctgcttcg tctgctgata taagcggata gtcgccgacc ttttcagcac 661 atacgagatg gtcatatctt ctgacatctc cgagatttcc cgtgtcaagt tcgccttgct 721 caccgccgaa ttcgggaaca aactcggtat agttcaggtt atagttgaca atatcttctg 781 cataatctcc cgaaccttca tatatgatgt aatcccgctt ttgctgttcg ccgtatatgt 841 tataatctcc gttaatggta gtgcactcgg tttcagtgta attcataaac tcggcgtatt 901 ccccactcag atattcaagc gcaataagcc catcctcatg ggtggtgctt tcgcgggtga 961 agttgatgct atctggcagt tcgcgtgctt tttcatagtt aatgaacacg tcgccgttag 1021 caaaggcacg aattttgatg tcggcgtttg cgccttctgc ataagttgtt tcatcaagga 1081 attcattctc tccgatctgc gagaatacta ttccgaagtc ccaatcggtt atttcaatgc 1141 ctaaaagctt agcggtctct ttgactcttg ctaccatttc atcgctctca agataatttt 1201 gcacgccgtg gtagctgtag ccgaggtttt tataaacggg tagagtctca agctgagttt 1261 cctcattcca agggttgccg ttttgaacct cacttatgtc gcgatacata agcccctcaa 1321 agcccattcc accgccgaat aggctgttct catctattga gagaacaggc aaactgttga 1381 cagtgtcatc gccaagggtc acttcgccgt tcagaatgtc cgttgaagcg gttgtctgct 1441 ccggatcaat cggcaaagga atcctgtcgg aaaagcttga tgataccgca aatattcctg 1501 cgattatcaa gcataagcaa gccgccaccc ctcctatttt tgtccatttg gacatattat 1561 atctgcggac aggtcttgct gctgcgatga tatagctcga gtcgatatcg gatataagtt 1621 caaatagctg taaatttgtc atacggtgaa gcccctttcc tcgagatatt ttttgagttt 1681 ggcacgggtg cgcataagaa tcgacgaaac gtttccctgc gacatcccta tatcctcggc 1741 gatgtccata acgctgtcgg cataccaata cctgcggatg aagatgttac gcttttgctc 1801 gctgagttca ctcaaaaagc tgtttatggc gcgcacaagt tcctgtttat ccagctctcc 1861 ctccacgttt tcgtttcccg aaacgatctc gctcagctca tccaaaaccg catcggctga 1921 gttgccgccc cgtttttcac ggtgaagatg cttatagcga ttgagc // LOCUS sequence272 1965 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence272 VERSION sequence272 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1965 /mol_type="genomic DNA" /organism="" /note="sequence272" CDS 360..1157 /product="dihydroorotate dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010905897.1" /transl_table=11 /codon_start=1 /translation="MGTFSFKGTTKDPRFGNPTPRIAECTNGMINAVGLQNPGVEKVIS EELPKLAKCFNKKVMANVSGFSVEDYAYTCACLDKCEQVGWLEVNVSCPNVHGGGMSFG TSPEAAAEVVKAVKAVTTKPVIIKLSPNVTDIVAIAKACEEAGADGISLINTLLGMRIN LRTRKPIIANKMGGFSGPAIFPVAVRMVYQVAHAVNIPVIGMGGVSCAEDVIEMMLAGA TAVEIGAQNLVDPFVCKKIIEELPSVMDKYGIENLSDIIGGVK" /locus_tag="LOCUS_7720" /EC_number="1.3.1.14" /note="WP_010905897.1 dihydroorotate dehydrogenase (Lactococcus) [pid:55.3%, q_cov:100.0%, s_cov:85.5%, Eval:2.4e-82]" /note="MGA_1095" CDS 1160..1858 /product="orotidine-5'-phosphate decarboxylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000083510.1" /transl_table=11 /codon_start=1 /translation="MGKDVIIACDFSSAEQVFAFLDKFTGRKPFVKIGMELFYAEGPSI VREIKARGHKIFLDLKLHDIPNTVKKSMNVLSRLDVDLCNLHAAGTVNMMKAAIEGLTR PDGTRPLLIAVTQLTSTDQESMENDLLIHEPIDKVVMHYAHNAKLAGLDGVVCSPLEAE KVHEVCGKEFLTVTPGVRFADGDIGDQKRVMTPAPAKLIGSDYIVVGRPITAAPDPVAA YERCCREFIG" /locus_tag="LOCUS_7730" /gene="pyrF" /EC_number="4.1.1.23" /note="WP_000083510.1 orotidine-5'-phosphate decarboxylase (Bacillus) [pid:54.5%, q_cov:100.0%, s_cov:98.7%, Eval:7.3e-66]" /note="MGA_1096" ORIGIN 1 aagcgttgga acaaagggct ttgtgacaga cgttatgaag gaccttgaat atacacactt 61 ctatacctgc ggacccgaac cgatgctgaa agcggtatat aaatcttcta acacatcggg 121 acagctcagc tttgaagaga gaatgggctg tggcttcggc gcttgcatgg gttgctcctg 181 caagaccttg acaggcaaca agagaatctg caaggaaggc cccgtaatgc ggaaggagga 241 gatcatatgg gaagactgag tgtagacctt ttgggaatca accttgataa ccccattatc 301 ccgcgagcgg aacctttgga tacggatatg aattcgcaaa cctttatgac attaacattt 361 tgggaacgtt ttcctttaag ggtaccacaa aagaccccag attcggaaat ccaacccctc 421 gaattgccga atgtacaaac ggaatgataa atgccgtagg tttgcagaac cccggcgttg 481 aaaaggtcat ctccgaagaa ctgcctaagc tcgcaaagtg ctttaataaa aaagtcatgg 541 caaacgtcag cggattttcc gttgaggatt atgcatatac ctgcgcttgt cttgataagt 601 gcgagcaggt tggatggcta gaagtcaatg tgagctgtcc gaatgttcac ggcggcggaa 661 tgagcttcgg cacaagtccc gaagcggcgg ccgaggtcgt taaagcagtt aaggcggtta 721 ccaccaagcc tgtaattatt aagctcagcc cgaatgtcac cgacattgtg gcgattgcaa 781 aggcatgcga agaagcaggc gccgacggca taagcttgat caataccctt ttgggtatgc 841 gaatcaacct tcgcacccgc aagccgataa ttgcaaacaa aatgggcgga ttttccggcc 901 ctgcgatctt ccctgttgcc gttagaatgg tatatcaggt ggcgcacgca gttaacattc 961 ccgtaatcgg aatgggcggc gtaagctgtg cggaagacgt tattgaaatg atgcttgcag 1021 gcgcaactgc cgttgagatc ggtgcacaga atctggttga tccctttgta tgcaagaaga 1081 taattgagga attgccctcc gttatggata aatatggaat tgaaaattta agcgacatta 1141 ttggaggagt taaataatta tgggtaaaga cgtaatcatc gcctgcgatt tttcaagtgc 1201 tgagcaggta ttcgcatttt tggacaagtt cacaggcaga aagcctttcg ttaagatcgg 1261 tatggagctt ttctatgcag aaggcccctc tatcgtcaga gaaattaagg caagaggaca 1321 caagatcttt ttggacctca agcttcatga cattcccaac accgttaaga agtcgatgaa 1381 tgttctttcg cgcttggacg ttgacctttg caacttacac gcagcgggca cagttaatat 1441 gatgaaggcg gcaattgaag gcctgaccag acccgacggc acaagacccc ttttgattgc 1501 agttacacag ctcacctcca ccgatcagga gagcatggaa aatgacctgc tcattcacga 1561 gcctatcgac aaggttgtaa tgcattatgc acacaacgca aagcttgcag gacttgacgg 1621 cgttgtttgc tcaccccttg aggctgaaaa ggtacacgag gtttgcggca aagaattcct 1681 caccgttact cccggtgtga gatttgctga cggcgacatc ggcgaccaga agagagttat 1741 gactcccgca ccggctaagc tcattggctc cgactatatc gttgtcggca gacccattac 1801 cgcagctccc gaccccgtag cagcctacga gagatgctgc cgcgagttca tcggctgata 1861 attgtaaaca aatattcact ttattcaaaa acaacagcgc cgtaacttga cacggcaacc 1921 atgaaagaga ggattactaa aatggctgac atacagaagc ttata // LOCUS sequence273 1959 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence273 VERSION sequence273 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1959 /mol_type="genomic DNA" /organism="" /note="sequence273" misc_feature <1..821 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010964978.1:replication-associated recombination protein A" /note="WP_010964978.1 replication-associated recombination protein A (Clostridium) [pid:45.4%, q_cov:98.9%, s_cov:67.0%, Eval:1.6e-65, partial hit]" /note="MGA_1097" /locus_tag="LOCUS_7740" CDS 835..1617 /product="TIGR00282 family metallophosphoesterase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392597.1" /transl_table=11 /codon_start=1 /translation="MSNQFKILALGDVVGPFAVKYISEKLWAFRRENNINMVVCNAENA ASGNGLDPFGADKLISAGCDVLTGGNHIFRKREIRPYLESSEVLVRPANYPIGTPGNGY TIVDIDGFKVLVINVMGTIYLEALACPFSTVDRILEREAGRYDLAILDIHAEATSEKIA LGRYFDGRINVVFGTHTHVATADTAVLPKGTGYVTDLGMSGPNDGVLGVRADIIIEKLR MKLPVKFELAEGDIEVNGVIFTLDTVSGKTLDVERVKF" /locus_tag="LOCUS_7750" /note="WP_011392597.1 TIGR00282 family metallophosphoesterase (Moorella thermoacetica) [pid:45.9%, q_cov:97.7%, s_cov:97.7%, Eval:1.3e-61]" /note="MGA_1098" ORIGIN 1 acgccataat ctcccgttct gcggtttttg aatttcgtcc tgtttcaaga gaagaaatta 61 tccgcgctct ttcgcgtact ctcgatatgc tcaactcgga agaaaacgct tcggtgaaat 121 gctccgagga agccttcgat gctcttgccg gctccggtgc cggtgatgtc cgtcggagta 181 tggggctgct tgaaaatgca ttttatctcg cggtttcggg agataacgag ataacggctg 241 accttatacg cggcttcact cccacggtgc tgggaagctt tgaccgggct ggcgatgtac 301 actatgatct tttgtcgtgc cttcaaaagt ccataagagg aagcgacccg gatgctgctg 361 cgttttatct tgcaaagctt cttgagggcg gtgatatgga gtctgcctgc agacggcttc 421 aggtgatcgc aagcgaggat attgggcttg catatccgat ggctgctgta atcactcgct 481 cctgtgtgga aagtgccagg gaattgggac ttccggaagc ccggatcccg ctcgtcaacg 541 cggcgataat gcttgcaacc gctccgaaat ccaacagtgc atatgaagca cttgcaaagg 601 caaatgccga catttcggcg ggccgcggtc aggaggtccc aaagcatctg cgcagtccga 661 attttgtggg atacaagtat cctcattcgt acccggatca ctgggtggca cagcaatatc 721 ttcctgatga gcttgaaggc cgacgttatt atgagtacgg agaaaacaag acagaacagg 781 cggcaaagca atattgggat aagatcaaga attcaaaata gtgggaggcg cgaagtgagc 841 aatcaattca aaatccttgc gctcggcgat gttgtcgggc cgtttgcggt gaaatatata 901 agtgagaagc tttgggcttt ccgccgtgaa aacaatataa atatggtggt ctgcaatgca 961 gaaaatgctg cctccggaaa cggtcttgat cccttcggcg cagataagct tatttcggca 1021 ggctgcgatg tgctgaccgg aggaaaccat attttcagaa agcgtgaaat acgtccttat 1081 cttgaatcca gcgaggtact tgtccgacct gccaactatc cgataggcac acccggcaac 1141 ggatatacca tagtggatat tgatggattc aaggtgcttg ttataaacgt gatgggaacg 1201 atatatcttg aggcactcgc ctgccctttt tcaacagttg accgtatact tgagcgtgaa 1261 gcgggacggt atgatcttgc gattcttgat attcatgccg aggccacaag cgaaaaaatc 1321 gcccttggac gttattttga cggaaggata aatgtggttt tcggaactca cactcacgtt 1381 gccactgccg atactgcggt gttgccaaag ggaaccggat atgttaccga tctcggaatg 1441 tccggtccaa atgacggagt tctcggtgtc cgcgccgaca tcattattga aaagctccgc 1501 atgaagcttc cggtgaagtt cgagctggca gaaggtgaca tcgaggtgaa cggcgtgata 1561 tttactttgg atacggtgag cggcaagacg cttgacgttg aacgagtgaa gttttgatgg 1621 tgtatagact gtctgttatt tgactttaca tgaatgtaga accaacagaa aaatccgccc 1681 gcatcagaat gatgcgggtg gatttttgtt atagagggtt cttttaaatc acttcttgtt 1741 cttcttatcc ttcgccgact tggcaactat gccggaaagg gcgatcagag caattacgtt 1801 ggggagaacc ataaggtagt tgaagaagtc tgtcagttcc caaacaaggt cattcgatgc 1861 caatgttccg aggaatatga aagcaaccgc gattacagaa taaactaaaa tcgcaacctt 1921 gttattttta aagagcgact gaacgttgat tttgccgaa // LOCUS sequence274 1956 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence274 VERSION sequence274 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1956 /mol_type="genomic DNA" /organism="" /note="sequence274" misc_feature complement(1010..>1956) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010890803.1:RICIN domain-containing protein" /note="WP_010890803.1 RICIN domain-containing protein (Clostridium) [pid:27.3%, q_cov:76.4%, s_cov:39.9%, Eval:4.9e-11, partial hit]" /note="MGA_1101" /locus_tag="LOCUS_7760" ORIGIN 1 tgtcggggtc gagcggatcg gttgaagtca tatagcacat ggtgcacttt tcagagatag 61 gtgcctgcaa agaactgtcg gtcattgttc tgtcgaacca gttggagcaa taggttaaaa 121 cgtatgtacc gttaatatag tttaactcat ttgcctcgaa gtggtagggt gcatcaattg 181 atatgatgtc acttgcaaag gatatcatat cgtcgccgag ttttgcaaag cggcagttac 241 ctgtgtaaag tcccgattcg ctgccttcgg tgggatcacc gccgccgaaa gcgatccagc 301 caactccgtt atcatcaatt acaacaccgg ggtcgaagca ccaatacaca cggttttccc 361 taaggtcagg atggtttcca tcaacaaggg gtttgcccaa gggatctgtc caaggacccg 421 ttggagaggt tgcggtcaat acgccgacgc cggctgcact gtttgcaaag tagagataaa 481 agtgagttag tccgtcagct tcttctcttg caacgataga cggtgcccag gaatatcctg 541 tccatgtggc gatatcgcca acaggaatta cctgttcaaa ctgccagttt accatatcgg 601 cagacgagta gcagacaagt gagtcaattg agccgtagtc attatcccct actccgccgt 661 tttcgtcata ttcagcggtg tcattggtgc catatacata cactctgccg ttatattcaa 721 cagatgtggg gtcggcaaag aagatatttg atgagatcgg atttgcctcg cctgcttttt 781 tatatgcggt ggtgacggtg tttccgacag acaagcccaa atcggtagat tttgttaagt 841 cttgggaaat tgtgaaatca aactcatttg catcatctga accgtcgccg aaaagaacgt 901 gatacaaaag atagatagcg tcgtttttgt taatttcgct gtcgccgtca aaatcgcagt 961 tctggttcaa gggatacttg tcagcggtga acagtacagc atagagaagt tatatcgcat 1021 cgttcttatc aacaacgccg tcggcattaa catcgccggc taaaacactt ccgtcaccat 1081 caggcaaagg atatgaagca gtaccgccgt gcgagggagt atctataccg ttgtcaattt 1141 caaggacgat ggtggtaagg cttcctgcgg gaattgataa gccgtcggca aattcgccga 1201 tatctttcat atattcccct gttgatttaa gggattgata tacgcttgaa ccgatgattt 1261 cgccttcgtt aagaacgatg tttaaggtgt cagcattttc ggtgttgttt gcggcaacca 1321 ccacaagagt cttgccgtcc ggagatttaa atgcgcccac agaggatttt aacccttcgc 1381 ttacatcaac tctttgatat ccgttcttga tgaacttgga aaaatgagtc attatgtagt 1441 gggcgggacg tcttgtaatg gtggcttcat gtacccacca tgattcccaa gtccagtcgg 1501 tgatttcaag caagcagttt ccgtcatcag ccggccaaac accgttccaa tataagtatg 1561 cgttaagatt ttcgtttacc agctcatcca gaattacctt tccaaggtag aaatagtcgt 1621 tgcaatacca ttcggtctgc caaagacggt aatcggagaa gttatcatat agcttctgga 1681 agtttcgctc ggttaaagtt gtgccataaa ggtggtggcc gacaatttca aggctttcgg 1741 ggcagttttc aattacgggg tcaagataac ccttgaggaa atatgtatcg gcagccattg 1801 tttcagcgcc aagcaacaaa ggcgcattat cgccgaaggc ttctttaaat gcttcatata 1861 cggcgatgtg ggctttccaa tatgcacaat ggtcgtcgtt ttcttccatt ccgaagaaga 1921 atcctgcagt gtcgcgggcg ttgccctgct cgtcaa // LOCUS sequence275 1955 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence275 VERSION sequence275 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1955 /mol_type="genomic DNA" /organism="" /note="sequence275" CDS 618..1469 /product="rod shape-determining protein MreC" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001135485.1" /transl_table=11 /codon_start=1 /translation="MKEFFSSKKFIVIICIAALMIGIMIYAAVSSSTLVSSALGTVFSP LQKFSQSISQSVTGAMDMLFNAKEYYEENRRLKEEIAELTGQMVDYIETKEENEHFREM LGLAETNPGIEFSEPCEVIGRTANDVFGSFFIDKGEMDGIEYYDPVVTSGGLVGFVTRV EYTYALVTPILSNEISLGVYCVQTGETGVIEGVYDYALEGSVRMVYIPLDCEMQTGDIL VTSGYSGLVPKGLVVGTAGELKAASNGLSKTCPVSMNVDIDSLKTVYVITDFDGKGSAY EE" /locus_tag="LOCUS_7770" /gene="mreC" /note="WP_001135485.1 rod shape-determining protein MreC (Bacillus cereus) [pid:28.2%, q_cov:95.4%, s_cov:96.1%, Eval:1.4e-19]" /note="MGA_1103" ORIGIN 1 aaaacatcat gatcgactcg gttgagatca gagatgcttt gagcgagcct ttgtcccaca 61 ttattgaagc aatcaaggtc acccttgaaa gaactcctcc ggagctttcc gctgacatca 121 tcgacgcagg catcaccctt gcgggcggcg gtgcacagtt aagaggactt gaccgcctca 181 tctttgaaga aacaggcatt cctgtacata ttgcagagaa tcctttggat tgcgttgttg 241 acggaacagg caagctcctt gaaaatattg aagagcttca cgatgttctt gacttcttcg 301 actattgatt ttttgacccc tgccgccgaa ggcaacaaaa cttgcagcta aaaggcgacc 361 gttttggttg ccttttgtgt ttttatatcc gcctgtcctc ttgaatagag gcgggcctgt 421 gtgcccgccc gtcaaggcgc cgttctcgtg tgggcgacca cgcagggtcg ccccttccaa 481 tgaaaaatga atggcgaata attaaggtgt acgcctaacg gcggacggct ccgccaaatc 541 acctcatccg tcggcatacg ccgacacctt cccctcaagg ggaaggctac gcccatcaga 601 aaggagttgg caatcgcttg aaagagttct tctcatcgaa aaagttcata gtaataatct 661 gcattgccgc ccttatgatc ggtattatga tctatgccgc ggtttcgtca tcgacgctgg 721 tttcctcagc gctgggaact gttttttcac ccttgcaaaa gttttctcag tcgatctctc 781 aaagcgttac cggcgcgatg gatatgcttt tcaacgccaa ggaatattat gaggaaaacc 841 gcaggctcaa agaggaaatc gccgagctta caggacagat ggtcgattac attgaaacca 901 aagaggaaaa cgagcatttc cgcgagatgc ttgggcttgc agaaactaac cccggcattg 961 aattttccga gccttgcgaa gtcatcggcc gaacagccaa cgatgttttc ggctcattct 1021 tcattgacaa gggcgagatg gacggaattg aatattatga ccctgttgtg acctcgggcg 1081 gacttgtcgg atttgtcaca agagttgaat atacatatgc acttgtgacc cccattctct 1141 caaacgagat atcgctgggc gtatattgcg ttcagacggg cgaaacaggc gtaattgagg 1201 gcgtatatga ctatgccctt gaaggttctg tccgtatggt atacatcccc ctcgactgcg 1261 aaatgcagac gggtgacatt ttggtgacct cgggctattc ggggcttgtg ccaaagggtc 1321 ttgttgtcgg aacggcgggt gagcttaaag cggcatcaaa cggactttca aaaacctgtc 1381 ccgtttcaat gaatgtggat atcgactcgc tcaaaacggt atatgtcatc accgattttg 1441 acggaaaggg ctctgcttat gaagaataaa cgtgcccgca gaaagcccct gccttatggg 1501 cttaaaacga ctttaaaatg gctttcatat ctcgctttgg gtctcgggct gtttcttttt 1561 tcaacttcgg gaagcccgtc ggggtctaaa gccgttttgc ttttgccctt tgctttggcg 1621 gttgcggtat atgaggacga aattccctct gccgccgcag gcgcattttt cggacttttg 1681 gtcgatattt cccttgataa gcttttggga tttaccgcgc tttatctttg catcatctgc 1741 ggagtggtct cggcgctgtt tcgtcagttt ttaagaaaaa atatctttaa ctacctccta 1801 tgcatagtca tcgcaggggg gatatatcta tatttggact attacttctt ctatgccatc 1861 tggcaggaag agggatataa gctggcattt gaaaaaatgc ttttgccctc tgcaatcaag 1921 acacttttga tttcaccgct tatctttgcg gcgga // LOCUS sequence276 1954 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence276 VERSION sequence276 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1954 /mol_type="genomic DNA" /organism="" /note="sequence276" CDS complement(835..1572) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLTDQLNILKDTVDDFFDGTYDSFESLNMNEHLNETLCFVGVSEY KLGRALPNAVSIGVSPLYTTFTVTALGKRNMSASELVSYVDGSVIPAVRLSILNIRAIN RKSCVYSKEHGRYSLSFEVETFCEQTSSFTTSLNVFFNGTYYGFFSDWSISQGYKTYKL GTIYAGSVSGISRKEPNELTVSGELIASEGKEAYSSVAQFLGTVVTVSVDGILFPNLLL KEVKYEKNGESAKLIARLCEVSG" /locus_tag="LOCUS_7780" /note="MGA_1106" ORIGIN 1 cacccacata tcccagatca cttatgacaa gctgatccaa aagatcggcg ccgggatatc 61 ccaagacggt aaagaagtca taggtaacac cgcgttttga aaagtcgatc cgctttttaa 121 gaccaagttc cgggtccatt atccagtcgc ggtcaaaagg gatctccttt ttgcggataa 181 tgtttcttga aacggcgaag ctatcaatgg tgttaaatgc gtttgcttcg cctgttatct 241 ccgactcgct gattgcagat atgagatttg aataatcgtt tcctgttccc tttgaaagca 301 atgatgttga tgctatactt acgattcccg catcatatgg gcggctgatc cttacggtat 361 tggaaccgcg gatatatgga tataagccgt aagcacgaat ggaatagcaa acgactgcat 421 cccaaatgct tgttccgtca taatagttga catatctcac ctcgggggtg ttcgcttcat 481 agctgatgtt tggacaaata attgccgaat ttgccagcga atcgagggtg acatcaggaa 541 caaggcctgc tgtcggctga tttcttgaaa gcgcatcggt atagcccttt gagcgaagtt 601 ttaaaatctg tttgccgtcc ttgtttataa actgtgcaag agctggatat ccgtaatgga 661 taccctttcc gccaagggtc aaactcacag atattatctc cgacggagta atgctcgtag 721 cataccactg gccttcaagc aaggtatatg gagtgtagcg ttccttttca aagcgcatac 781 ttatgcaatc atcaagcaca tatgtgcccg aggttgatgt tacaataagc gacattatcc 841 gctcacctca cataaccttg caatgagctt ggcagattcg ccgttctttt catatttgac 901 ttcctttaaa agcagattcg ggaagagtat tccgtcgaca gaaacggtca caactgtgcc 961 caaaaactgc gccacagaag aatatgcttc cttgccttca gaagcaatca gttcaccgct 1021 gacagtaagc tcgtttggct ctttccttga aattccgctg acagagccgg cgtaaatcgt 1081 tccaagctta tatgttttat atccttggga aatcgaccag tcgctgaaaa agccataata 1141 agtaccgtta aagaaaacgt ttaaagatgt ggtgaaggac gaagtctgct cgcagaaggt 1201 ttcaacctcg aagctcaggg aatatcttcc gtgctcctta gaataaacac aagacttgcg 1261 attgatggct cttatattga gaattgaaag acgaacagca ggaattacag agccgtctac 1321 atagctcacc agttcgcttg cagacatatt tcttttgccg agagcggtta cggtgaatgt 1381 tgtataaagc ggtgagacgc cgatgcttac tgcattcggc aaagctctgc caagcttata 1441 ttccgaaacc ccaacaaagc acaaggtttc gttaaggtgc tcgttcatat tcagcgattc 1501 aaaggaatcg taggtgccgt caaaaaagtc atcaaccgtg tctttaagga tgttaagctg 1561 atctgtaagc acacttatcc gaccgtcctt tcaaagacga agccgttgtc gcacataaga 1621 tcacggggga cagcagcaaa ggcgttatac atcagcgttt gcgcctgcga aacgttttcg 1681 tcatcactta cctttgtgaa taccgagccc gactgggttg aaagagttct tgaggttgcc 1741 gcacaaagca cggtataatc gaaaaagacc tttgcggcgc aagcgtttgt taaaagcaat 1801 gattcttcct cggtttttgc ttctcttaaa agaagccgct ccacatatga cttcgcagag 1861 agaacaagac ccaaatatct gggcgtttct tcgtcggtca gaccgctgag aagcttgaac 1921 tgatcaagta ttgaattttg attgagtgta aaca // LOCUS sequence277 1951 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence277 VERSION sequence277 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1951 /mol_type="genomic DNA" /organism="" /note="sequence277" CDS complement(1357..1869) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKRSSDPMPFKLAVFMLAIGILLGSIFTFGMQYWNENIPREECR VVKTQFLSYDEIWHAKPTVSLVKIAIDCTDGNRYFIDGVSINEGLRDQLSSLSKNDDIT LLIHPDSNTIVEFSNGKTVLLNFDETIGKLEGESTGFLFLGLFMYLCALVGLYYTVYHM IRRKAKR" /locus_tag="LOCUS_7790" /note="MGA_1109" ORIGIN 1 gcggcagaga tcttctgata cttgaggttc aggccgaact caacgtctgc catatagccg 61 tctgcgcgga atgcggagag gagcttggtc ttgacgccgt cgcccacgct ctccaggtgg 121 tcaacgatga gagcctcgtc ctgaatgtag taggtgaagt tgtcgaggga tgcaagggcg 181 aaggcctttg caatgttgta gttgagaact gtgtcggcgt tcttgttgtc ggtcttggac 241 ataaccgtct caaactgagt cttgacggcc tcgcgctgag ccaggtagtt gtcgaagatg 301 ccgtcggtct cggcgttgac tgttctgccc tttacgtagt agttgtaaag tgcggcgtag 361 gcaccggtgc cgtcctcgca catataaacg tggaagtcct cggtggtgag acccgcattg 421 gcggcgagag cagcgccctt gagagcggtg ccgtcctgaa cgtagatgtt gaagaagacg 481 ttgtcgccct tgagctcctt gatctttgcg accatggtct cgaactcggt gttggtgaag 541 cctgtgctct ggttgttcgc ggcgtcaaag cccgcgttgt ggaaatgctc gagcttgtcg 601 ataccgctgt aggtcttgcc gcgctcgatg atggcgtagg tctcgtagcc gttctcaatg 661 cattcgagtg ccgaaagaac gggagggatg gtggcaagtg cgaagatgat gttataaacc 721 gtgtcgccct ctgcgggagt tgtgggagtg ggatcgggtg cgccgcttcc ctcgggctcg 781 ggggtggtgg tgtctgtggg atcggtggtg ttattgctgt cggtttcgct tccgccgcag 841 gcaaccataa agagcattac gaatgcaagt gccagcgcca gaattcttgt gaacgctttc 901 attttgaagc ctcctgtatt tttttcggtg gcgttgtata acgtcggact cattataaca 961 caaaagtcga agcttgtcaa tacaatcgcc ctcgtatatt aaagacggat ttttttgcat 1021 ttcgttacac cttttgggga gatttttgaa aaaattcaat aaatttcggg agatcggcaa 1081 aaaatccgcc gcaaggcgtg tatatcatca attccgaagg aattgcatat catcaacacg 1141 aagtgttgta tatcatcaat tccgaaggaa ttgtatatca tcaatgcgaa gcattgcata 1201 tcatcaagcc gcaggtaaga tgcacgctgg cgcgtgatga gatacagccc caaaggggct 1261 gatgatatgc caagcctgcg gcttggataa aaaaattcga caagctgaag cttgccgaat 1321 ttttgggttc gtcttgacag aaaagatgcc gcagcattat cgctttgctt ttcttcggat 1381 catatgatat accgtataat aaagtccgac taaagcgcaa agatacataa aaagccccaa 1441 gaaaagaaat ccggtggatt ccccctcaag cttgccgatc gtttcatcaa aattcaataa 1501 aacggttttg ccgtttgaaa attcgacaat agtgttgctg tcagggtgaa tcaaaagcgt 1561 aatatcatca ttttttgaca gcgatgatag ctgatcacga agtccttcat tgatggacac 1621 accatcgata aaatatctgt ttccgtctgt gcaatcgatc gcaattttta caaggcttac 1681 ggttggcttg gcgtgccata tttcatcata cgaaagaaac tgcgttttaa ccactctgca 1741 ctcttctcgc ggtatatttt cattccaata ttgcatgcca aaagtaaata tgcttccaag 1801 caggatgcca attgcaagca taaacacagc aagcttaaac ggcattggat ctgatgatcg 1861 ctttttcata tcgccaccgc ctttctaaga ttattatagc atactttgga gcaggttgca 1921 agaggttgag aactattcgc gtcccaatca c // LOCUS sequence278 1940 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence278 VERSION sequence278 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1940 /mol_type="genomic DNA" /organism="" /note="sequence278" CDS complement(543..716) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKISIGRLISLIGILVLSIGLICNAFEIVSITAFRIIVLIGIIA EVVALIIILKKS" /locus_tag="LOCUS_7800" /note="MGA_1111" ORIGIN 1 atatctctca cagcgctata ccgctccctt gcccgaagtt aaggcaattt taaatgatat 61 cggaacggaa gaactcggcc atatggagat gatctgtgcg atagtttatc agcttacccg 121 aaatctcact cccgcccaga tcaaggcgtc gggcttcgac acctactttg tcgaccacac 181 aaccggtcta tatcccattg cggcatcggg cacacccttc tcggcggaga tcttccagtc 241 cacaggcgat gccattgccg acctgacgga agaccttgcg gcagagcaga aagccagaaa 301 gacctatgat aacatccttc gtctggtcga tgaccccgat gtgcgcgatg taatcaagtt 361 cctgcgcgag cgcgaaattg tccacttcca gcgcttcggc gaagctcttc gcaaagtcac 421 cgacaccctc gactcaaaga acttctacgc cttcaatccc agctttgata aataagcaaa 481 aaagcagatg agttaattct catctgcttt ttatgttacg tattaggatt tgtatattag 541 aattaacttt tctttaaaat gataataagc gcaaccactt ctgcaattat tccgataagg 601 acaataatac gaaatgcagt aatagataca atttcaaaag cattgcaaat cagcccaatg 661 gacaaaacca atattccgat aagagaaata agacgaccga tactgatctt tttcattttc 721 acacctcaac agcaaagaca aatttattag ttgtcattat accacacctc gcagaagaat 781 gaaagtacat attcaaaaaa tgtacaactg ttaattcggc attttcactc ctttcgcatt 841 ccgtttaata ttttcatatc tgcattgaca atatgggcac gtatttggta atataaactt 901 aacaaaaggg cgttgcgccc tgcgcgaaat gaggaacgat tatgacagaa ttagagttaa 961 aacagcttct ttcggatatg tcactcaccg agaagatcga ccagcttgtt cagcttcacg 1021 gcggattcta cggcgatgtt aagctcatca ccggccccgg ccacgatttt aaaatgcgcc 1081 ccgaccagca ttggcaggtc ggctcaattt taggtgagat cggctgggag catttaagag 1141 aacttcaaga cggttttatg gctcatcagc cccataaaat ccccgcaatt tttatggctg 1201 acgttattca cggacttcgc accgttttcc ctgcacccat cggacagggc gcgggatttg 1261 accccgattt gacacgcgaa atggccgctg ccgccgcaaa ggaggcatca agcgagggct 1321 tgcacgtaac attttctccg atggttgacc ttagccgcga tgcccgctgg ggcagatgta 1381 tggaaggcac aggcgaggac ccgtggctga atgcgcgctt tgccgaagcc gccgtcaagg 1441 gctatcaggg tgacggaatc ggcaacgaag gcaacatcgg tgcttgcgtc aagcactttg 1501 ccgcatacgg tgctgccacc gcaggcagag attattcggg cgttgagctt tcaaccagaa 1561 ctttaatgga tgactatctg ccctcatacg aagcggctgt taaagcgggt gttgcccttg 1621 taatgaccgc gtttaacacc attgacagaa tcccttgctc aacaaacaag tggcttatgc 1681 gtaaagtttt gcgcgaaaag atgggctttg aaggtgtctt aatttccgac tacggagcaa 1741 tcggcgaaac tgttgcccac acatcatctc ttaacaaggc tgatgccacc aagaaggcga 1801 tccgcgcagg tgtggatatt gatatgatga ccgactgcta tttcggaaat cttgaaaagc 1861 ttgtcgaaag cggtgaggtt gctgaatcgc tcatcgatga agccgtaatg cgaatcttaa 1921 agcttaaaaa cgacctcggc // LOCUS sequence279 1935 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence279 VERSION sequence279 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1935 /mol_type="genomic DNA" /organism="" /note="sequence279" CDS complement(6..266) /product="YdbC family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986552.1" /transl_table=11 /codon_start=1 /translation="MAELKYEIKEHLGVLSENAKGWTKELNLVSWNDYAPKYDIREWSP DHTRMGKGVTLSAEEFENLKHLINGEPVDLGGDDVDEDEIL" /locus_tag="LOCUS_7810" /note="WP_011986552.1 YdbC family protein (Clostridium botulinum) [pid:60.9%, q_cov:80.2%, s_cov:94.5%, Eval:9.1e-23]" /note="MGA_1113" CDS complement(285..1745) /product="oligosaccharide flippase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000091276.1" /transl_table=11 /codon_start=1 /translation="MSDSRSSYKKLFSNTLIFALGSFGSKLLVLILVPLYTACLSPDQY VTVDLISQTANILIPIITLSAADAALLFALETKDEAQHAKIYSSLLSVVLCGFAFLAVL YPIYSKFAYLDGYALLLLIYVCTASLKQLNSTFVRALEKVKLFAFDGILTTLAMLLLNI LFLIVFKWSTVGYLLAIILSDLLSSVFLFFAAKLWRFISFKKPDFALLKDMLRYSAPLI PTTLLWLVTSISDRFIITYFHGEYLNGINSIAYKIPTILTTIFTMFSQAWNMSAITENE SSERASFYTNVFSLNQSFMYVLSAGILLLNRPITHIWVDAAYYEAYRYSPLLTMATIFT CFNVFLGSAYIACKKTKRSFYTSLAAGIINIVLNFVLIPNYGIYGAAIATFVAYFAVFF YRLYDARSLIHFDFSMAKVLINTAMLASMAVLNQIEGPWTYGVLTGVFLIILIINFKEL WKCVMFIIQKKLLNKLPIVQKISDKINK" /locus_tag="LOCUS_7820" /note="WP_000091276.1 oligosaccharide flippase family protein (Streptococcus pneumoniae) [pid:27.3%, q_cov:92.8%, s_cov:96.6%, Eval:8.2e-57]" /note="MGA_1114" ORIGIN 1 ttcaattaaa gaatctcatc ctcatcgacg tcatcgccgc cgaggtcaac gggctcgccg 61 ttgatgaggt gcttgaggtt ttcaaattcc tctgcgctca gggtgacacc cttacccatt 121 cttgtgtgat cgggactcca ttcacggatg tcatacttgg gagcgtagtc gttccagctc 181 acaagattaa gctcctttgt ccagcctttt gcattctccg aaagaacgcc caaatgttcc 241 ttaatttcat acttgagttc tgccattgct ttctttcctt tctgttactt gttgatttta 301 tctgaaattt tctgaacgat aggtaattta ttcaaaagct tcttctggat gataaacatt 361 acacacttcc aaagctcttt gaaattgatt atgagaatta tgaggaatac tcccgtcaaa 421 acgccgtatg tccaagggcc ttcgatctga ttgagcacag ccattgatgc aagcatggcg 481 gtattgatca aaaccttcgc cattgaaaag tcgaagtgaa tgaggcttcg ggcatcgtac 541 aggcgataga agaatacagc aaaatatgcc acaaatgttg caattgcggc gccgtaaatg 601 ccgtagttgg gaatcagaac aaagttcaaa acgatgttta ttatgcctgc tgcaagggaa 661 gtatagaagc ttcgcttggt tttcttgcag gcgatatatg cagagcccaa gaaaacattg 721 aagcaggtga aaattgtcgc catggtgaga aggggggagt atctatatgc ttcataatat 781 gccgcatcca cccatatatg ggttatggga cggttgagca ggaggattcc tgcagagagc 841 acatacataa acgactggtt gagggagaaa acatttgtat aaaagcttgc tctctcgctc 901 gattcgtttt cggttatcgc cgacatattc caggcttggg agaacattgt gaatatggtc 961 gtcaaaattg tcggaatctt atatgcgatc gagttgatgc cgtttaaata ttctccgtga 1021 aaataggtga tgatgaatcg gtcggaaatg cttgtcacaa gccacaaaag agttgtggga 1081 ataagcggtg ccgaatagcg gagcatatct ttgagcaacg cgaagtctgg ctttttaaag 1141 ctgataaatc gccaaagctt cgccgcaaag aacaaaaaca cacttgagag caggtcggaa 1201 aggattattg caagaagata tcccacggtg ctccacttga acacgatcag gaacaaaatg 1261 ttcaaaagga gcattgcaag ggtcgtaagt attccgtcga atgcaaaaag cttgaccttt 1321 tcaagggcac ggacaaatgt ggaattgagc tgtttaaggg aagctgtgca tacatatatt 1381 aatagtagca gagcatagcc gtcgagataa gcaaactttg aatatatggg atacaaaacc 1441 gctaaaaagg caaatccgca aagaacaaca ctcaaaagcg aggagtatat ttttgcgtgc 1501 tgtgcttcat cttttgtttc aagtgcaaag agcagggcgg catccgcagc agagagtgtg 1561 attattggta ttaggatgtt tgccgtctgg gagatcaggt cgaccgtgac gtattggtcg 1621 ggcgaaaggc aagcggtata taacggtacg agtattaaaa ccaacagctt tgagccgaag 1681 gagccaagag caaatataag cgtattcgaa aagagctttt tatagctcga gcgtgaatcg 1741 ctcaccgaat catcctcctt attataagat agtatataca tcactaccat tataataagg 1801 atatgtgtaa aaatcaagca gttttatgag attgtaaaaa cactcgacat acttgacaat 1861 gtatgctata ataggtacat acgaaaaaga gttgacccgt gattttgtga aaggacggta 1921 atgaaatatg aagaa // LOCUS sequence280 1933 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence280 VERSION sequence280 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1933 /mol_type="genomic DNA" /organism="" /note="sequence280" CDS complement(143..1009) /product="YitT family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435320.1" /transl_table=11 /codon_start=1 /translation="MDKQNLKSLLWKYLTITVGSVIYAAAVSFFLDPNGIVPGGFTGIA MIIGHYVPIKTGTMTLILNIPVIALGIWKFGLKFLASTVYSVALSSVMIDLFALIGPLT SDLLLSALAGGFLMAIGLELVLKEGATTGGTDIIVKLLRTKIKHLSAGSLFTITDGLVV LISAIVFKNIEVALYAVICIVVYSKVIDLILYGRDEAKMLLIVSDKYEIITKRLLVELD AGATFLDGTGAYSGEGKRVVLCVIRKHLAPRALKIVKIEDPLAFTIITTANEVFGEGYK MHDEGHI" /locus_tag="LOCUS_7830" /note="WP_003435320.1 YitT family protein (Clostridioides) [pid:35.2%, q_cov:96.9%, s_cov:98.3%, Eval:1.1e-46]" /note="MGA_1115" ORIGIN 1 acggagggat tgtaagagat gaaaggctgc ccgcaagcaa tcccttaatc agcttcactg 61 gattgagatt atgtcaaatt tactgttgaa taaacaaaaa tgccccccac tcagcaaagt 121 ggggagttgt ttttatatgt tactatatat gcccctcgtc gtgcatctta tatccctcgc 181 cgaaaacttc gtttgcggtg gtgatgatgg tgaatgccag cgggtcttca atcttgacga 241 tcttcagcgc tctgggtgcc aaatgctttc ttattacgca gagcacaacg cgcttgccct 301 cgcccgaata agcacctgtg ccatcgagga aggtagcacc cgcatcaagc tcaacaagca 361 gccgtttggt gatgatctca tatttatccg atacaattaa aagcattttt gcttcatctc 421 tgccgtagag gataaggtcg ataactttgg aatatacaac aatacagatg acagcataaa 481 gcgcgacttc aatgttctta aagacaattg cggagatgag aacaacgagt ccgtcggtga 541 tggtgaagag cgaacctgcc gaaaggtgct tgatctttgt gcgcaaaagc ttgacgataa 601 tgtccgttcc gcctgttgtt gcgccttctt taagcaccaa ctcaagtccg atcgccatta 661 aaaatccgcc tgcaagcgca gaaagaagca gatcagaggt caggggaccg ataagcgcaa 721 aaaggtcgat cataaccgat gacagcgcaa cggaatagac cgttgatgcc aaaaatttca 781 gcccgaattt ccaaattccc aaagcgatta cagggatatt aaggatgagt gtcatcgtac 841 cggttttaat cggcacatag tgaccgatga tcattgcgat acctgtgaat ccgcccggca 901 caatgccgtt ggggtccaaa aagaagctga cggcggcggc atatatcact gagccgacgg 961 tgatggtgag atatttccac aataagcttt ttaaattttg cttatccatg agagggtctc 1021 ctttcatatt tatattaaaa tattcattat ttacaataga aaagcttcat ctttgtagct 1081 ttgcccattg aaaagcgcgt cgtaatatag tataatttct ttacatatta ccgttcttgt 1141 ttcaagatgg gagggcctat gaaaaataag agaatcatat caaaatatat agttgcgata 1201 attgttgcgg ctatgcttgc attatcgctt tgctcttgca gcaacaactc gaatgatcac 1261 atcgatcctc cgcagagtga ggctcctgag gtgacgacaa ccgaaaatgc cgtcgaggag 1321 gttaccacca ccgaagtgac tacaactgaa gccaccactg aggcaacaac agaagcgact 1381 accaccgaag ccacaactga ggcgaccaca actgagtcta ccacaactga ggctaccaca 1441 acggaagcta cgaccaccga agtgactacg acgaccgagg caactaccac tgttacaact 1501 acagtggcaa caaccaccga ggcgaccacc gttacaactc cggcacccga gccggaatac 1561 ggagacccga gcgagatcgt tatcaacgag atctgctctt caaacaagga tagccttgag 1621 gacttcgaag gcgaatcgaa ggactggatc gatctttata atcccacaat ctttgatatt 1681 gacattaagg gaatgggtat ttccgacgat gcgacccagc cttacaagtg ggtattcccc 1741 aagaccgtta ttgaggcggg ggactatctt gtggtctttg catccgataa ggatattacc 1801 acaggaaaag agcttcacac caatttcaag ctttcgggcg gcaacgaaac attatatctt 1861 acatttaacg acaagaccat cgactcggtt cccgttgttg aaaccgcaaa cgatatgtct 1921 tatgccagat atc // LOCUS sequence281 1930 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence281 VERSION sequence281 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1930 /mol_type="genomic DNA" /organism="" /note="sequence281" misc_feature <1..626 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003019988.1:30S ribosomal protein S1" /note="WP_003019988.1 30S ribosomal protein S1 (Francisella tularensis) [pid:30.7%, q_cov:77.3%, s_cov:32.0%, Eval:2.5e-11, partial hit]" /note="MGA_1117" /locus_tag="LOCUS_7840" CDS complement(667..1149) /product="NUDIX domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004574859.1" /transl_table=11 /codon_start=1 /translation="MNKDLCIPCDDGILNIRAGAIITKDGKLLMVGNDRDDYLYSVGGR IKFGETAEEAVVREVFEETGVRMEIDRLGFVHENYFYGDAPSNLGKLIYEISFFFYMKV PSDFAPISESFTEDNSKEHLKWVSLDEDIKMYPEFFKTELKNPIDTVKHFVTDERK" /locus_tag="LOCUS_7850" /note="WP_004574859.1 NUDIX domain-containing protein (Gardnerella) [pid:40.8%, q_cov:93.8%, s_cov:93.8%, Eval:4.5e-26]" /note="MGA_1118" misc_feature complement(1159..>1930) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010964978.1:replication-associated recombination protein A" /note="WP_010964978.1 replication-associated recombination protein A (Clostridium) [pid:58.3%, q_cov:88.7%, s_cov:54.2%, Eval:4.6e-75, partial hit]" /note="MGA_1119" /locus_tag="LOCUS_7860" ORIGIN 1 aaaacggtga aacgatagcg ttgctttctc gtaagcaggt gcaggaagct tgtaaacgcg 61 aatatctttc acaacttgaa aacggcgaag taatagactg caaagtgact catcttgaac 121 aattcggttg ctttgttgat gttggttgcg gaatagcttc gatgattcct attgatgcaa 181 tttccgtgtc acggatttct catccttgtg accgatttga gcttggcgag gatattaagg 241 cgattgtaaa aggttttgac ggtgagcggt tatatttgag ccataaggaa cttttgggca 301 cttgggaaga gaatgccgag atgtttcgag ccggtgaaac cgttaacgga attgttagaa 361 gtatcgaatc atacggcata tttgttgagc ttgcaccaaa tcttgcgggg cttgctgaac 421 caaaaccaga tgtatttgtc gggcagactg cgagtgtata tatcaaatca atcaaccccg 481 gcaagatgaa aattaagctg atcattgtcg atacattcga tgccgaccca atcaaggata 541 acagatactt catcaccgca ggcgtgatca aacgctggag atactctccc gagggatgtc 601 agaagcatat tgaaagcgtg ttctaaaaga aaagcgtcat cattataaga tggcgctttt 661 ctgtatttat ttacgttcgt cggtgacaaa atgctttacg gtatcaatag gatttttcag 721 ttcagttttg aaaaattcgg gatacatctt gatatcctcg tcgagggaaa cccatttcaa 781 atgctccttg ctgttgtctt ctgtgaagct ctcgcttatc ggagcaaagt cgctcggcac 841 tttcatatag aagaaaaatg aaatttcgta tatcaatttg ccgagattgg aaggcgcatc 901 accgtagaag tagttttcat gaacaaagcc aagacggtcg atttccatcc taacgcctgt 961 ttcttcaaat acttcacgca caacggcttc ttctgctgtt tcaccaaatt tgattcttcc 1021 accgacagaa tagagatagt cgtctctatc attgccaacc ataagtagct ttccgtcttt 1081 cgtaatgatt gcgccagcac ggatgtttaa gataccgtca tcgcatggta tacacaaatc 1141 tttattcata ttaccctctt atttcttctt tatctgctcc caatactgct tggcggcttg 1201 ttcggtctta ttgtttccgt attcataata gactttttcc ttaagagtat cgggcaaata 1261 ctgctgttcg atccaagaat ttgggtatgc gtgtgggtat ttatatccca ttgccttacc 1321 gagtttattt gcacctccgt agtggccgtc ctgcaggtgt gcaggtatat cccctgcatt 1381 tccggcacgg atatcatcaa gggcggaatc aattgcacag ataccgctgt ttgatttggg 1441 tgcggttgca agcaagatta cggcatcagc caaaggaatt ctcgcctcgg gcagtccaag 1501 ttgcattgca ctgtcgacac acgatttgac aatgggcaaa gcctgaggat aagcaaggcc 1561 gatatcttca gctgcaataa ccaaaagtct gcgcgaaagg ctgatgatgt cccctgcctc 1621 cataagtctt gcggcatagt gaatcgcggc attttcatca gagcctcgaa ttgatttttg 1681 taaagcagac agaatgttat aatgctcatc gccgtcgcgg tcatagcgca tattactgcg 1741 ctgtgtgagc agcttgacat tatcaagctt gacactcaac acaccgtcag agctgtcagc 1801 agataatacg cacagctcaa ctgtgttgat cgattttctc acatctccgc cgcaaccgtg 1861 ggcaatatgg tcggttacac cattttcaag cttgagcttt aggcctaaat catcagcaca 1921 tatctggaat // LOCUS sequence282 1914 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence282 VERSION sequence282 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1914 /mol_type="genomic DNA" /organism="" /note="sequence282" CDS complement(434..1912) /product="AMP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010941764.1" /transl_table=11 /codon_start=1 /translation="MRPGSKVSVWMTNLPQWYIAFWAATKIGAILVTVNTAYKIHEAEY LFRQSDTHTLVMIDSCKDSNYKEIIEELCPELKNLKPGEPLYSKALPFLRNVITVGFEM DGALTWEQMLDRSDMVPREEVRRRAAAVKPDDVANMQYTSGTTGFPKGVMLTHSNIINN GKTIGDRMDLSTADRMMIQVPMFHCFGMVLSMTSMMTHGGTLCPVPYFSPKSSLSCINN EHITCFNGVPTMFIAMFAHEDFATTDFSYMRTGIMAGANCPPDLMRRAAAEMNMREIIS VYGQTESSPGSTMGEVNEDLDHRVETVGSAFPGIECKIVDPETGEDLPDNTNGEFVARG FHIMKGYYKMPRATAQAIDKDGWLHSGDICCRTSDGYYKVTGRLKDMIIRGGENLYPRE IEEFYLTHPKIRDIQVVAVPDVRYGEEACAWIILKEGETATVEDMIAYGVANMARHKVP RYFIFTESFPMNAAGKILKYKMREESVEVLGLKK" /locus_tag="LOCUS_7870" /note="WP_010941764.1 AMP-binding protein (Geobacter sulfurreducens) [pid:50.8%, q_cov:99.8%, s_cov:88.9%, Eval:1.2e-140]" /note="MGA_1121" ORIGIN 1 gatcggcaga ccatatttta cgcaaagctc gtaaatgcgc aagcatctgg gatcatcaat 61 ataaaatccc tgaatttcgg ggtggagctt gacgccttta agaccaagtt ctttaaggtg 121 gacgatatct gcctcgagat cgtcgctttc gggatgcatt gttccaaggc ctgtgaagat 181 ttccggctca gattcaacgg tgtttgcgat aaattcgttt atcgagcgca cctgcttggg 241 ggtggtggca acgctgaata tgatcgagtg aataactccg accttttcgc cctcctgctt 301 gcaggtggaa atggtgccgt cataagccat ttcaatgtta tagaagttgc ctgttgcctg 361 cgacgcttta acggcgatct tgtcgggata gacatggcaa tggcagttta ttttggggta 421 cattttcctc accttacttt ttcagcccga gaacctcaac cgattcctcg cgcattttat 481 atttgagtat ctttcctgcg gcattcatcg ggaagctttc ggtaaagatg aagtatctgg 541 ggaccttgtg gcgagccata tttgcaacgc cataagcgat catatcctca acagttgcgg 601 tttcgccctc tttaaggatt atccaggcgc aagcctcttc gccatatcgc acatcgggaa 661 cggcaacgac ctgaatgtct ctgatcttcg gatgggtcaa atagaattcc tcgatctctc 721 ggggatagag gttttcgccg ccacggatga tcatatcctt gagtcggcct gtaaccttat 781 aatatccgtc cgatgtgcga cagcagatgt cgcccgagtg gagccagccg tccttatcta 841 tcgcctgtgc ggtcgctctg ggcattttat agtagccctt cataatgtgg aatccgcggg 901 caacaaattc gccgttagta ttgtcgggca gatcctcacc cgtttcggga tcaacaattt 961 tgcactcaat gccgggaaat gctgagccga cagtttcaac gcggtggtca aggtcttcgt 1021 tgacctcgcc catggtgctt ccggggctgg attctgtctg gccgtatacg gaaatgatct 1081 cacgcatatt catctccgcc gctgctctgc gcattaagtc gggcgggcag tttgctcccg 1141 ccataatgcc cgttctcata tatgagaagt cggttgttgc aaagtcctcg tgtgcgaaca 1201 tcgcaataaa cattgtcggt acgccgttga agcaggtgat atgctcattg tttatacagc 1261 taaggcttga tttcggcgaa aaatatggca cagggcaaag cgttccgcca tgggtcatca 1321 ttgatgtcat tgaaaggacc attccgaagc aatggaacat cggcacctgg atcatcattc 1381 ggtcggctgt tgaaaggtcc attcgatcgc cgatggtctt gccgttgttg atgatgtttg 1441 aatgggtcag cattacgccc ttggggaagc ctgtggtgcc cgaggtatac tgcatatttg 1501 caacgtcgtc cggcttaact gccgcggcac ggcggcgaac ttcctcgcgg gggaccatat 1561 cggatctgtc cagcatctgt tcccaagtca gggcaccgtc catctcaaat ccaacggtaa 1621 tgacatttct gaggaatggc aacgccttgg aataaagagg ttcgccgggc tttaagtttt 1681 tcagctcggg gcaaagctct tcaattatct ccttatagtt tgagtccttg caggagtcga 1741 tcataacaag tgtgtgggta tccgactggc ggaagagata ttccgcctcg tggatcttat 1801 aggcagtgtt gacggtgaca aggatagcgc cgatcttggt ggccgcccag aaggcgatat 1861 accattgcgg caggttggtc atccaaaccg agaccttgga gccggggcgc acgc // LOCUS sequence283 1913 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence283 VERSION sequence283 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1913 /mol_type="genomic DNA" /organism="" /note="sequence283" CDS 583..1266 /product="RNA polymerase sporulation sigma factor SigK" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012047887.1" /transl_table=11 /codon_start=1 /translation="MLSRILEILASGILWFALHVEEKNIFPKPLPPSQELELFKQYAKG DKSAKDKLILHNLRLVAHIVKKYSNQQDVQDELISIGTIGLIKAVTTFDCEKGNRFAAY GSRCIENEILMYFRSMKKTAKDVHFDEPIDVDKDGNQLTLMDIIAAEGDLCDEVDTRID LAKLKQCVISVLDEREREIISLRYGLYGSRPLTQREVAGLLEISRSYVSRIEKRAIEKL ADKMK" /locus_tag="LOCUS_7880" /gene="sigK" /note="WP_012047887.1 RNA polymerase sporulation sigma factor SigK (Clostridium botulinum) [pid:50.9%, q_cov:97.4%, s_cov:94.4%, Eval:1.4e-53]" /note="MGA_1123" CDS complement(1311..1763) /product="tryptophan-rich sensory protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003574643.1" /transl_table=11 /codon_start=1 /translation="MNKLKSIVVLLLPLAAGGLSAWLSGDKSMTYYHMPPLSPPEWLFP IVWTILYAVIGVASYLYMKDTDFKLGDTARFFYYGLFLNFVWPIIFFRFKMFTAAVIIL ILMIILSVAATKGFFDKNKTAGWMMVPYIAWLLFALYLNIGVAVLN" /locus_tag="LOCUS_7890" /note="WP_003574643.1 tryptophan-rich sensory protein (Lacticaseibacillus paracasei) [pid:41.3%, q_cov:89.3%, s_cov:86.2%, Eval:1.4e-23]" /note="MGA_1124" ORIGIN 1 tcctcatata tctcccgcgc agctctgccc tttgaaatgc gttcgtcaca taccgccggc 61 gggacatcca aaaagatgca tacatccggc tttaaaacat cggggcaatc catattcgcc 121 ctcatacacc actcaaggtc ggtgtccatt ccctgatatg caaagctgga ataataatat 181 ctgtcgcaaa ttacatttat gcccttttca agcagatttt tcatgccgta tacaggattg 241 gagcaatggg cgattctatc cgacaggaac agccctgcaa gctcggcggg tgtgcgcttt 301 gtaagtccgc aaagggtatc acgaacaagt ccgcctgttg cgtgctcggt aggctcagcg 361 gttaaagcat actggatgcc gtttgctttt aagtattcag caagcatgac aatctgggtg 421 cccttgcccg agccgtcaag accctctata acgataaatt taccttttgt catgtaaaac 481 aagtccttaa agaatatttg attatattat attccctcgg gcgaatttag tcaagcatat 541 ggcgaatagc atattttgaa aaaggttttg gagggtataa gtatgctttc gcggattttg 601 gagattttgg caagcggtat tttatggttt gccttgcacg ttgaagaaaa aaacattttt 661 ccaaagcccc ttccgccgtc gcaggagctg gagcttttca aacagtatgc caagggcgac 721 aaatcggcaa aagacaaact gattttgcac aatttgcgtt tggtggcgca tatcgttaaa 781 aaatattcca atcagcagga tgttcaggat gagctgatat caatcggcac catcgggctg 841 atcaaagcgg taacaacttt cgattgcgaa aagggcaacc gctttgcggc gtatggctca 901 aggtgcattg aaaatgagat acttatgtat tttcgctcga tgaaaaagac cgccaaggat 961 gtccactttg acgaaccgat tgacgttgac aaggacggca accaactgac gcttatggac 1021 attattgcgg cggaggggga tctttgcgac gaggtggata cgaggatcga ccttgcaaag 1081 ctgaagcagt gtgtaatatc ggtgctggat gagcgagaaa gagagatcat cagccttcgc 1141 tatgggctat atggctcacg gccgctaaca caacgtgagg ttgcaggact gcttgaaatc 1201 tcgcggagct atgtatcccg cattgaaaag cgggcgattg aaaaattggc ggataagatg 1261 aaataaaaaa gtaaatatcc ccgagcgaag ctcggggatg tttatactta ttagttcagc 1321 accgcaacgc cgatattgag atatagcgca aacaacagcc acgcaatgta tggcaccatc 1381 atccagcctg cggttttgtt tttatcaaag aatccctttg tagccgcaac cgagagaata 1441 atcatcagaa tcagaatgat gacagcggcg gtgaacattt tgaaacggaa gaaaattatc 1501 ggccaaacga agttcaaaaa cagcccataa tagaaaaatc tcgccgtatc accaagctta 1561 aagtcagtgt ctttcatata taggtaagat gccacaccta ttacagcgta aagtatcgtc 1621 cacacaatcg ggaaaagcca ttcgggcgga gaaagaggcg gcatatggta ataggtcatt 1681 gatttgtcac ccgaaagcca ggcggaaagc ccgcctgcgg caagaggcaa cagcaaaact 1741 acgattgatt tcagcttatt cataaaagtc actcccaaag cgtatttgca attattatat 1801 ggcgaagtgt ggacaaaaat acccgaagat ggtatacttg ataagaggag ttgatttttg 1861 tgaaaacgct tttacatata tgctgtgcgc cttgctcgat aatgtgcatt gaa // LOCUS sequence284 1891 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence284 VERSION sequence284 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1891 /mol_type="genomic DNA" /organism="" /note="sequence284" CDS complement(540..1445) /product="signal recognition particle-docking protein FtsY" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003393780.1" /transl_table=11 /codon_start=1 /translation="MGFFEKLKAGLAKTKAGLMGGLTGIFARSEIDDDFYDELEETLIL SDIGARTAEDIVTALRAKVKEEKIKEPEACKNALKDIISDMLGEDTPLDMSTKPSVILV IGVNGVGKTTTIGKLSYQLKNEGKKVLVAAADTFRAAAIDQLNVWTDRAGVDIIKHSEG SDPAAVVFDALDAAKARNVDVVIVDTAGRLHTKKNLMNELAKISKIVHSKAEGCALEVL IALDGTTGQNAVNQAREFNEVADITGIILTKLDSTAKGGIVIPIANELGVPVKLVTVGE KIDDIQPFIAKDFVNALFED" /locus_tag="LOCUS_7900" /gene="ftsY" /note="WP_003393780.1 signal recognition particle-docking protein FtsY (Clostridium botulinum) [pid:56.2%, q_cov:98.7%, s_cov:98.7%, Eval:7.5e-86]" /note="MGA_1126" ORIGIN 1 cggtggctga tggcgttctt ttcctcgggg tcaagctcgg cggtagattt atcccctacc 61 ataaagatgg ggtcataacc aaagccgtgc tcgccaatgc gctcatatcc gatcctgccc 121 tcgatggtgc ctttaaactg ggcggactcg ccctgctcgt tgatgtatgt gatgacggcg 181 acaaagcgag cggtgcgctt ttcatccggc acgcccttga gtttatccaa aacaaggtag 241 catcttccga tgtcgtcgac ctcatcgccg ccgtagcggg cggaatatac acccggctcg 301 ccgccgagat aatcgacctc aaggccggaa tcgtcggcaa caacggcaca gcctgcaatg 361 tcataaagcg cttttgcttt gatgtatgaa ttttcggcaa atgtggtgcc gttttcctcc 421 gcttcgagga cgataccctc ctcgcgctga gatttgacct caaatccgag gggttccaaa 481 atctccttga attcgcggag cttgtcttta ttgttggatg caagaatcag tttcatagtt 541 tagtcctcaa acaaagcatt gacaaagtcc ttggcgatga agggctgaat atcgtcgatc 601 ttttcaccca cggttacaag cttaacaggc acaccaagct cgtttgcaat gggaattacg 661 atgccaccct ttgctgttga atccagcttg gttaaaatga tgcctgtaat gtcggcaacc 721 tcgttgaact cgcgagcctg attgacagca ttctgtcctg tggtaccgtc gagtgcgata 781 agcacctcaa gtgcacagcc ttcagccttt gaatgaacga tctttgagat cttcgcaagc 841 tcattcataa ggttcttctt tgtgtgaagt ctgcctgcag tatcaacaat tacaacatcg 901 acatttcgtg ccttggcggc atcgagcgca tcgaacacaa ctgcggcggg gtcagagcct 961 tccgagtgct tgatgatatc aacacctgcg cggtcggtcc agacattgag ctggtcgatt 1021 gcggcggcac ggaaggtatc agccgcagcg acaagcacct ttttaccctc gtttttaagc 1081 tgatatgaaa gcttgccgat ggtagtggtc ttaccgacgc cgttgacgcc gatgaccaaa 1141 attacggacg gcttggtgga catatccaaa ggagtatcct cgccgagcat atccgagatt 1201 atatctttaa gtgcattctt gcaagcctcg ggttctttaa ttttttcttc tttgaccttg 1261 gctcgaagag ctgttacgat atcctctgcg gtgcgggcac cgatatcgga caaaattaag 1321 gtttcttcaa gttcatcata gaaatcgtca tctatctccg agcgagcgaa aatacctgta 1381 aggccgccca taaggcctgc tttggttttt gcaagacctg ctttaagttt ttcaaaaaag 1441 cccatacgat tttcctttca attagttgct ttcgtccata agcgcagctt cacgtacatc 1501 cattctcaaa agcttggaaa cgcccttttc ctgcattgta acgccataga gcacatctga 1561 ttcttccatg gtgcctcgac ggtgggtaat gcagataaac tgggtggtgt cggtgaagtt 1621 tcttaaatat tgagcataac gagtgacgtt gacatcgtca agagcggctt caatttcgtc 1681 taagatgcag aagggagaag gacgaagctt gagtattgca aaatagattg caattgcaac 1741 gaacgcctgc tcaccgcccg agagaagcga gaggtttttg attacctttc cgggaggtgc 1801 aacgttgatc tcaatgcccg attccaaaac attttcgggg tcggtgagtt taagctccgc 1861 cttgacgccg ccaaagagtt caacaaatat c // LOCUS sequence285 1885 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence285 VERSION sequence285 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1885 /mol_type="genomic DNA" /organism="" /note="sequence285" CDS 1050..1292 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MALARTDLDEVRHDLAQKSETLFMKEWNEHRHVHENYNSITGEGC DSGSSDKFYHWGALLCAIALADAGYIANFGKSMEE" /locus_tag="LOCUS_7910" /note="MGA_1129" ORIGIN 1 aggtacaaaa gcttatagag tctcgcaaag aagaatatca taaaaagacc tcccgctttg 61 gcaaacttca gcaaatgtat gaggcaatgg aatgctcttt gtcctgggac acgatatatg 121 atgcgaaaaa tgaccgcgtt gtctcccctg tcagccgact ttggagcatc aacagcggcg 181 gctacgtttt gttctgttgg gacaatttct tcgcaggatt tatggcgagc ctcggcaacc 241 gtgagctttc atacagcaat cttcgagaaa tacttaacga acagacaaaa gatggctttg 301 ttccgaatct cgcatatgca acaggccagg ttagcgccga ccgttcacag cctcccgttg 361 gaagtgcaat gcttttggaa acataccgaa ttctgaagga aaaatggctc atcgaggata 421 tgtatcccga ccttttaaag tggaaccgtt ggtttgcaaa aaacaggatg aacaaaagcg 481 gtgctttgtg ttggggaagt aaccctatac ctgttctata cggcaaccga tgggagaccg 541 acggagttca ttcgacatat ggagccgcgc ttgaaagcgg acttgataat tcaccgatgt 601 atgatgatat tccttttaat aagcatacca accgacttga gcttgaagac gttggtttga 661 caggacttta cattcttgat ttccgttcgc tgattgagct tgctaaaata atcggcaatg 721 aggaagtcgt ttcagaactt caagaaagaa tggacaaggc ttgcgcaggg cttgaaagcc 781 tttgggatga ggaaaatgga ttctattata ataaaagaac cgatacagga gaatttgagc 841 gcagaatttc acccactaat ttttatgcgc tgtttgctcc gaatgtttcg aaagaacgtc 901 agcgaagaat ggctgacgag cattattaca accctgatga attttacggc gaatggatgc 961 ttccctcaat agcgcgaaac gatccggctt agcttgatca aaactattgg cgaggacgag 1021 tttgggcgcc tcttaacttt ttagtatatt tggcattggc tcgcacagac ctcgatgaag 1081 tgcgccacga tctggctcaa aaatcagaaa ctctgtttat gaaggaatgg aacgagcacc 1141 gccacgttca cgaaaactat aacagcataa caggagaagg ctgtgattcg ggaagcagcg 1201 ataagttcta tcattggggc gctttgcttt gtgccatcgc ccttgccgac gcgggatata 1261 tcgcaaactt cggaaaatcc atggaagaat agtaaggaat atatgagggc tttttggtaa 1321 aaccgacttt aaagatagaa atgcctgcag cttcaaaata gcctttaaaa ccgcttgttg 1381 cttttggctt tgcataacaa ctgctctctg tggaaaatat cttttccgta tgtgaacgac 1441 aactattatc acaacggtga taacagtcgt ggccttacgg taacgatgga aaaagccaaa 1501 tgtcaaggat atcctcggca tttggctttt gctttgtttt gattaggatt cgcactaagc 1561 agataccccg cttttcaaga atgtcaagtt cttaattatc ctgcttccac atagtaaaat 1621 gcaccccaaa agcttttgac ttttagggtg catatttctt tttatttagc acctaaacaa 1681 ccgccgattg attaaggaac tgttattcct gagcaacaaa ctctgcgata tcagtattca 1741 actcatttac gtaataatct atctgctcgg catatttttc cttgagctga gcccatgtag 1801 aaggttcctg attcaatgtg aagtttacac aattggaaac cgcatctgca agcttgctgc 1861 cgataccttg ttcatagtcg ataac // LOCUS sequence286 1885 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence286 VERSION sequence286 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1885 /mol_type="genomic DNA" /organism="" /note="sequence286" ORIGIN 1 cagaaggtga tgatgtcgta tcctgtaaca agggtggagg tggggtagaa atatttaaga 61 tcttcggtgt tttcgggcca tcccaatgtg ctgaaaggcc acaaagccga gctgaaccat 121 gtgtcaaggg tgtcggggtc ctgacgcatt gccttgccgc acttggtaca aactgcatgg 181 tcgtcctttg tgacaatcat ttcgccgcaa tcgtcgcaat agaatgcggg aatgcggtgt 241 ccccaccaga gctgacggga gatgcaccag tcacggatgt cttccatcca gttgaagtag 301 ttcttgtcaa atctttcggg aacgaacttg atatcgcccg agcgaacagc ctcgatcgca 361 ggctttgcaa ggtcagccat tttaacaaac cactgaagcg atactctcgg ttcgatggtg 421 gtgccgcaac ggtagcaggt gccgacattg tgggaatgct cctcgatctt aacaaggaag 481 ccgccctctt cgaggtcctt aacgattgcc tttcttgcct caaatctgtc cataccggca 541 tacttgggat agtcctcggt tatcttggcg tcatcggtca taacgttgat gacgggcaga 601 ttgtggcgga gtccgacttc aaagtcgttg gggtcgtgag caggagtgat ctttacaacg 661 cctgttccaa attccatatc aacataagga tcggcaacaa cgggaatttc acggcctaca 721 agaggcaatg taacagtctt gccgataaat gcctgatagc gctcatcctt ggggttaact 781 gcaacggcag tatcgccaag aagggtttcg ggacgggttg ttgcaagctg caaccagccg 841 ctgccgtcag taagaggata acgcaggtgc cagaagtggc ctgcctggtc ttcatattca 901 acctcggcat tggaaatgga tgttaagcaa tgggggcacc agttgatgat gcgttcgcca 961 cggtagataa ggcctttttc ataatacttg atgaaaactt ccttaacagc cttcgagcaa 1021 ccctcatcga gggtaaatct ctcacgggtc caatcgcaag atgagccgag atttttaagc 1081 tgggagatga tccttcctcc gtactgctcc ttccaagccc aagcgcgctc taagaagccg 1141 tcacggccga ggtcatcctt ggtgatgcct tctttgcgca tagcttcaac gatcttagct 1201 tcggttgcaa tggatgcatg gtcggtgccg gggagccaaa gggtggcata tcccgacatt 1261 ctcttatagc ggatcaaaat atcctgcagg gtgttgtcaa gtgcgtgtcc catatggagc 1321 tgacctgtga tgttcggagg ggggatcacg atggtataag gcttcttttc ggggtctgct 1381 tcagccttga agcagtcgtt gtcgagccag tatttataaa ttctgtcttc gacttctctg 1441 ggctcataga gctttccgag ttcctttttc atataaacaa tcctttcgtg gttattgagg 1501 cgatgaaaaa aataaaaaat cgcctcaaag atttttcttt gagacgagct gtttacccgc 1561 ggtaccactc aaattgcgca ggttgccctg cacctctttg cgacacaaaa ggtcgccgac 1621 gtaacgtgtc gtaaaatacg gaggaggtct acggcattta taaaaaatgc ttcttctccc 1681 ctgctctgaa gctacaaata atcagggtca tcagcgactc gcaccttccg tcgcctctct 1741 gggatgatag tctgaaaatt cctcttcgtc atcgcattta acagatgtaa tcataataac 1801 accacagctt gaaaaagtca acacccaaag gtatttttgc gggatgtttg gagaggatag 1861 gggcagaatg tgcgggcggc agccc // LOCUS sequence287 1863 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence287 VERSION sequence287 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1863 /mol_type="genomic DNA" /organism="" /note="sequence287" ORIGIN 1 atcctgaaac atttgcgtca gccgttgtgc cggaaatcct gtagcaaaag ctcttatatc 61 cgcccgatac cttgccgtgg cttccggagc cgttttgcga ccagaaaacg aagtcgccct 121 tgttcgaatc aaagtcaatg agcatcattt ctcttatcag ctcgccgtct ttatattctt 181 ccaaaacaac gtcgtcgaaa tatgccgcac cctctgcacc gatctttgat gcccttaaag 241 cgatcgtgcc gacattatac ttatcgctgc gcttgacaag ggaggattca tacagcatcc 301 agccgtcctc aagctcagca gtcttcttcg atgatgcgca gtctacccac gagttgatta 361 cgtttgaaac gaccgcctcg tccgaaggat atcgtttaac gattcccaaa gttcccgccc 421 aatccatatc ctggtgagtg aaattgtgag gggagtagca atggaattca taagctgtgt 481 tattatcatt caaaaggaac tgaagctgtg atattgcaat gttccagtcg gaacttccgc 541 ttgctgattg aacggcgcaa acacgctcag cgaagatgat gtggttttca tcaacctctc 601 ttatcgcgtc ggtaattctt tgcatcagat ttttgcactg accaaccgat tcttcaactg 661 taccgatatc ggggactatg ggttcattca gaatgccata tccgatgaca gtttcttcat 721 ccgaatagcg ctttgcaatt tccgcccaca gagcgataag tcttgcctgg ctttcttcgt 781 ccgtccaaag tcctgtgccg ttgccctggg actgatatcc gccctgggga acgtgcatgt 841 tgagtataag tccgataccg ttctttttcg cccacttgat atttttatca agccactcaa 901 aaccttcttc cttatatata taaggatttg cgtcatcttc aaaaagctgg taattcaaat 961 aaaatctcac gctgttaaag cccattgaag caatatcttc atatgacgac tcatcgtgag 1021 aagtcaaaac cggctcggtt gggttcgacc aaacatcgtt tcccaaagca atgcctttaa 1081 gccaaacggg attacccgaa ccgtcaacaa ttttgccgtt ttcaacgtga ataaagccca 1141 tatcatcacc ctttgagccg catcccgcaa gcaaagccac tgaaagtaaa aatgcaataa 1201 tcagcgataa gattcttttg atcttcatat tatttcctct gaatcataat gcgaagaact 1261 ttgcaattct gctaagttct tcaatgttgt tagccatata gtatactgcc caaggaaaaa 1321 cctcgggcag tataagaaaa agcagtggtc gtttatccga gagttgcaac gtattcagca 1381 acgtcgttgt tgagttcagc gatgtagtat tcgatctgtt cgctatactt ttcggttacc 1441 tgagcccaag tggaagcatc agcatgtctg ccaaggttca tagtgtgctc aatagctgag 1501 tcataaagct tgttgcccaa accgtggctg aaggtaagaa cagtgtaggg accttcggaa 1561 agctccatgc agtggtcata catatcgagc atttcgtcat tccacttata cttttcaata 1621 agctgcttct tgtcgatgga aataacggtg gggtccatga ttttgaagcg ttcgcaagct 1681 gcaaacaaag caactgcttc gggattagca gcaccgttta caataaggaa gccgtggatt 1741 cttgtgccaa tataatagtt gccgtcgccg ttggggtcac gaggtacagg gcagaacatg 1801 atttcgcccg cttcaatatc gccccaaact gcatttactt cttcaacagg gttggtgata 1861 ccc // LOCUS sequence288 1858 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence288 VERSION sequence288 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1858 /mol_type="genomic DNA" /organism="" /note="sequence288" CDS complement(173..1030) /product="AraC family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965896.1" /transl_table=11 /codon_start=1 /translation="MDGQCLYEPLADEVVCVHKRAKGYQTYSYHRHNGYEVYLFLEGNI LFYQGSNCYRLTPGDLLILPPSCMHRIISIDESIYDRIVLNIRHSAIERLSTGMTNLFA CFETTDTDNIMPINLNKEEIKRFTQLSEGLISSMKDHTFGSDVLANSYVSQLLLLVNQC HKVSPEPKFNIMPALVKDVMLYIEDNLAGDLRLSKISEEFYHNGTYISRMFKKHTGLTL KEYIIDQRIEVSRRILKNGGSVQEACYKSGFSDYSNFIRSFTAAMGVSPGKYKQENNKK TVKK" /locus_tag="LOCUS_7920" /note="WP_010965896.1 AraC family transcriptional regulator (Clostridium) [pid:32.2%, q_cov:87.7%, s_cov:87.7%, Eval:1.2e-37]" /note="MGA_1134" CDS 1279..1749 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNTVKREKLFELCIRYLDCLDISRAAKLANIEGDPNIDGAKLIVG RSAKRILKKLCDPEFAETAALAGLMKLALGRCNDAVELLREELPQDISSLDLYNVSEIK KVKGGGVEIKFFNRLDALEKLIDLCETKSGANAAESFFSALSSGADRSDSDD" /locus_tag="LOCUS_7930" /note="MGA_1135" ORIGIN 1 ctcctcgcaa gtatgcttct actgctttct tcctgaattc attgctatat ttcttgttct 61 tgtgtgtcct tcttggcata aaattaaccc ccttaaagta gtcttgaaaa ctttttgttt 121 tttcaagtgt ctactctaag gggattatat catcagatga gcggcgtttt tattattttt 181 tcacagtttt tttgttgttt tcttgcttat attttcccgg agaaacgccc attgcagcgg 241 tgaaactgcg aatgaagttg gaataatcgg aaaagcccga tttatagcaa gcttcctgaa 301 cgcttccgcc gtttttgagt attcttcttg aaacctcaat tcgctggtca attatgtatt 361 ccttcaaggt cagtcctgta tgctttttaa acattcggct gatatatgtg ccgttgtggt 421 aaaattcctc ggaaattttt gacagcctta aatcaccggc caagttgtcc tcaatgtata 481 acataacgtc tttaaccaac gccggcataa tgttgaactt tggctcgggt gaaaccttgt 541 gacattgatt caccaaaagc aaaagctgag aaacatatga gtttgccaaa acatcggagc 601 cgaaagtgtg atccttcatt gagctgatca gcccttccga aagctgggta aatctcttga 661 tttcttcttt gttaaggttt atcggcatga tattgtcggt gtcagtcgtt tcaaagcagg 721 caaacagatt tgtcatcccc gttgaaagcc gttcgattgc agaatgcctt atattcaaaa 781 ctattcggtc ataaatgctt tcgtcaatgc ttataattct gtgcatgcat gacggcggca 841 atatcaaaag gtcgccgggt gtaagcctat agcaattact gccctgataa aacaggatat 901 ttccctcgag gaaaagatat acttcataac cgttgtggcg gtgatagcta tatgtctggt 961 atccctttgc gcgcttatgc acacatacaa cttcatcggc taacggttca tataaacact 1021 gtccgtccat acatatgcac ctccgatgtg ctcattatac atccgaaagt caaattttgc 1081 aatagttttt gcaaaaaata ttgtaaaata tctaaatttg atactttatc acattcccgc 1141 gttttttgca taaaaatggc aaacgagtcc aaaaaatgtc actccaagcc cattttcaaa 1201 aaaactttgc ccgcaggttg cacgtttcga tgcaacctgc gggctttttg taggccttag 1261 tgaaaggagt tgaaattatt gaacactgtc aaaagggaaa agctctttga gctatgcatc 1321 cgatatcttg actgcctcga catttcccgc gcggcaaaac ttgcaaatat tgagggcgac 1381 ccgaacattg atggggcaaa gcttatagtt ggccgttccg ccaaacggat cctgaaaaag 1441 ctctgtgacc ccgaatttgc cgaaactgcc gctcttgcgg ggcttatgaa gctggcgctt 1501 ggcagatgta atgacgcggt ggagctttta agggaggagc tcccgcagga catctcatcg 1561 ctggatcttt ataacgtttc ggaaattaaa aaggtcaagg gcgggggagt ggagatcaag 1621 tttttcaatc ggcttgacgc cttggaaaaa ctcatcgacc tctgcgaaac caagtcgggc 1681 gcaaatgccg cagaaagctt tttcagtgcc ttgagctcgg gcgcggacag gtcagattcg 1741 gatgattgat ttcaagaact tttcaaaaaa gcaaaggagg gtgctctcct ggtggcaaaa 1801 tccccaatat cgggactatg acgcgatcat atgcgacgga gcagtcagaa gcggcaag // LOCUS sequence289 1852 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence289 VERSION sequence289 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1852 /mol_type="genomic DNA" /organism="" /note="sequence289" CDS complement(40..1851) /product="stage V sporulation protein D" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965429.1" /transl_table=11 /codon_start=1 /translation="MTVMSQNKITSVGATPTAKRYYPQGDLASNVIGHLHYDGYGIYGL ESYYDDYLTGVDGKIITAIDAHGVEIQYKYKQSYDAQDGDSIYTNIDTTIQYYVEKALA NAVQTNSAANRGCAIVMNCNTGAILAMATEPDYDLNYPTAIYDENTAAILAGIEITGND ELYNSTRAAAWNLQWTNKAISSLYYPGSVFKVVTGSAALEEGAVNLASSFYCGGDITVA DRLLHCWTKTGGHGRQNFIEAMTNSCNPAFVEIGQALGAKAFTEYFEAYGLTEKTGIDL PAEASSIYYDYNRMGAVNLATSSFGQANKITPIQMITAFSAVVNGGDLVTPYVVNKIVD SDGNIVKEFTPTVKRQVISEDTSEIMRSTLETVVTTKAGSNAYIKGYDIGGKSGTSQKL DENPEGNTYVSSYCAFFPANDPEIIMLVMIDEPTNGLYYGSAVAAPVVSEVFSEILPYL GYFAEYDEAELESLDVNVPDVFGAEIGQAKATIESLGLTAEVIGNGETVIRQVPSSDGS MPKGCNVILYTEEGYEEEQVYVPDLTGYTLEEANKKLAKLGLNLKPLGGAAYKTGATCS GVVNYKEVYVPEGTIIETYFIVNDETG" /locus_tag="LOCUS_7940" /note="WP_010965429.1 stage V sporulation protein D (Clostridium) [pid:37.2%, q_cov:94.4%, s_cov:76.3%, Eval:1.1e-104]" /note="MGA_1136" ORIGIN 1 atcaaaaatc actcctttgc ttggcgtagg tgggatatat catcccgttt cgtcattgac 61 gatgaagtat gtttcgataa tggtgccctc gggaacataa acctctttat agttcacaac 121 gcccgagcag gttgcacctg ttttatatgc cgcaccgccg aggggtttaa ggttaagccc 181 aagcttggcg agctttttgt ttgcttcttc aagggtatag cccgtgaggt cgggaacata 241 tacctgttct tcttcatagc cctcttcggt atagaggatc acgttacagc ccttgggcat 301 cgagccgtcg gaggaaggca cctgacggat aacagtttcg ccgttgccga tgacctctgc 361 tgttaatccc aacgattcga tcgtcgcctt tgcctggcct atttccgcgc cgaatacatc 421 gggcacattg acatcgaggc tttcaagctc tgcttcatca tattccgcga agtagccaag 481 gtatggcaaa atttcggaga aaacttccga aacaacaggc gccgcaacgg cagagccgta 541 gtaaagtccg ttggtgggct cgtcaatcat aacgagcata attatctcgg ggtcatttgc 601 agggaagaat gcacaatagg acgaaacata agtgttaccc tcggggtttt cgtccagctt 661 ctggctggtg cccgatttac cgccgatgtc atagcctttg atatatgcat ttgaacctgc 721 tttagtggtt acaaccgttt caagggttga gcgcattatt tcactggtgt cctcggaaat 781 gacctgtcgc ttgacggtcg gggtaaactc cttgacgatg ttgccgtccg aatcgacgat 841 tttatttaca acataaggtg tcaccagatc gccgccgttg acaacagccg aaaatgctgt 901 gatcatctga atcggagtga tcttgtttgc ctggccgaag gaggatgttg caaggttaac 961 ggcgcccatt ctgttgtaat cataatagat actcgatgct tccgcgggaa ggtcgattcc 1021 tgttttttcg gttaagccgt aagcctcgaa atattcggtg aatgcctttg cgcccaatgc 1081 ctgaccgatt tcaacgaagg cagggttgca ggagttggtc atcgcttcaa tgaagttctg 1141 tctgccatga ccgcctgttt ttgtccagca gtgcaaaagt cggtcggcaa cggtgatatc 1201 gcctccgcaa tagaaactgc ttgcaaggtt aactgcgccc tcttcaagtg ctgcagagcc 1261 tgtcacgacc ttgaataccg agccggggta atatagcgag gaaattgcct tgttggtcca 1321 ctggagattc caagcagccg cacgggtcga gttatatagc tcatcatttc ccgtgatttc 1381 aatgccggca aggatcgccg cagtgttttc atcatatatg gcggtgggat agttaaggtc 1441 atagtcgggc tcggttgcca ttgccaaaat cgcgcccgtg ttgcagttca taacgatcgc 1501 acatccgcgg ttggcggcag agttggtctg tacggcattt gccagcgcct tttcaacata 1561 atactggatg gtggtgtcga tgtttgtata aatcgagtcg ccgtcctgtg catcgtagct 1621 ctgcttgtat ttatactgga tctcaacgcc gtgggcatca attgcggtga ttatcttgcc 1681 gtcaacacct gtgagatagt cgtcataata tgactcgagg ccatagatgc catagccgtc 1741 atagtgcaaa tgtccgatga catttgatgc aaggtcgccc tggggataat atcttttggc 1801 ggttggggtg gcgcccacag aggtgatctt attctggctc attacggtca ta // LOCUS sequence290 1850 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence290 VERSION sequence290 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1850 /mol_type="genomic DNA" /organism="" /note="sequence290" ORIGIN 1 gctaattttg taaataacag atgtagggtt gcacattgtc acaggcggac cacggacatt 61 gcaccgttac agtcaaacaa gctcggcttg atcagatcaa tgttcactta atactaagaa 121 ttaacgctat tttcaataaa tatcagcaaa tatattgtaa aaattgattt tattattgtt 181 taaaaaaggt taattgttgg aaaacccgac gaatttcaaa atcttccaaa aaattgtaga 241 aattaaagaa tcgttgtgtt atactgaacc taatgcgaac atctgcatta cgacataatt 301 gttcataaga aaggaaaacc gtatgaataa gtttattgtt gcgaacggcg gcaacgtctg 361 cccgatatta accgaaactt gtgctcacga aggcgttaag cgtatcgcca acgtccttgc 421 cgaggatatc tccctcgtta ccggcgtttt gcccgagcgt attgattcac tctcaaatgt 481 aaaatcttca tctgtaataa tctgtgcaac ccttggttac agtgaactga ttgacagcct 541 tgcaaatgaa aacaaactcg atctttgcgc aatcagcgga aagcgcgaag tatatatgat 601 tagtcatctt tcctcgccat ttgctgatta tcccaacatc accgatgctt tgataattgt 661 cggaagcgac aagcgcggaa cgatttacgg tatgttctca atctccgagg cctgcggtgt 721 ttctcctttg gtatattggg gtgatgtcgc acctaagcat aaggacgata tcgcgcttga 781 ttattccgat gctgttgttt caaaggagcc ttccgttaaa taccgcggat tctttatcaa 841 tgatgaatgg cctgcattcg gcggctggtc acgtgaccgt ttcggcggct tcaatacatc 901 cgcttatgaa tacgttttcc agctccttct tcgcttaaag ggcaactata tgtggcctgc 961 aatgtggtca agcgcattct ccgaagaggg ccccggaatt gccaacgccg agcttgcaaa 1021 tatctacggc gtaattatgg gtgcatccca ccacgagcct atgtgccgtg ccggtgttga 1081 atggcagaat atatataagc aatatggcga cgacaacacc tggagcttca tttccaaccg 1141 tgaagcaata accgagtttt ggcgcgacgg cttaaagcgt aataaggatt ttgaaaatat 1201 catcaccgtc ggtatgcgcg gcgaaaacga ctcgcttctt ttgggcgctg atgcaacact 1261 tgacgacaac atcaatgttt tacgcggaat aatcaatacc cagaacgagc tgatgaagga 1321 gatcgtaaat cctgatttaa acgaaattcc aagaatgctc gcaatgtata acgaggttga 1381 ggacttttat tacgctccca acggtttaaa gggctgggaa gctcttgacg gcgtgatttt 1441 gatgctctgc gacgataact ttgcaaatct ccgctatttg cccacagaag atgaccgtga 1501 ccacaagggc ggcttcggta tgtactatca ctatgactac cacggtgctt caatttcata 1561 tgaatggatc aactccaacc gcttaaccaa gacttgggaa caaatgacca tggcatatga 1621 ctacggcatt cgcgacctgt ggatcgtcaa tctcggcgac atcaagggcc ttgaatatcc 1681 catctgctgt ttcttggatc ttgcatacga ctttgatcgt tacggttcaa gtgctcttaa 1741 ctctgttgaa gattatgtca agagctggat agatcagcag tacggcgatt ggcttacatc 1801 tgaacagctt gatgatgtgt acaccctcat caacggatac accaagttca // LOCUS sequence291 1849 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence291 VERSION sequence291 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1849 /mol_type="genomic DNA" /organism="" /note="sequence291" CDS 134..595 /product="low molecular weight protein-tyrosine-phosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003546643.1" /transl_table=11 /codon_start=1 /translation="MTKIMFVCHGNICRSPMAEFIFKKMLAERGLSELFYVSSCATSTE EIWNGIGNPVYPPARAELMRHGIDPAGKRAVRLKKSDYDEFDLLVGMDSANIRNMHRIL GGDPDGKIKKLMDYTSRGGDVADPWYSDRFDIAYRDIFEGCEALLNTLI" /locus_tag="LOCUS_7950" /note="WP_003546643.1 low molecular weight protein-tyrosine-phosphatase (Lactobacillus acidophilus) [pid:42.5%, q_cov:99.3%, s_cov:98.0%, Eval:5.5e-31]" /note="MGA_1138" CDS complement(635..1456) /product="sugar phosphate isomerase/epimerase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_013530826.1" /transl_table=11 /codon_start=1 /translation="MRIGLSSPLAHKSPEEWAKNLKALGCRAVNFPLNCNSDPALIRAY ADLAKENDLVIAEVGVWNNMLERDPEKRKANLNYNIRQLILADEIGAVCAVNVAGTPHG PRWDGGYRENFSLETFDMTVETVKYVIEQANPKNAFFSIESMPWMIPSSPKEYLELIEA VDHPRFAAHLDAINMITSPRRYFFNDEFLRECFSLLKGKICSCHLKDVRLKEQFTFQLE ECCIGTGNFDLETFARLCDDENPDMPVLIEHLNTDNEYLWALEHVKNRLSL" /locus_tag="LOCUS_7960" /note="WP_013530826.1 sugar phosphate isomerase/epimerase (Mesorhizobium) [pid:21.4%, q_cov:89.4%, s_cov:89.5%, Eval:1.8e-08]" /note="MGA_1139" ORIGIN 1 ctttttcaat cttttgcacc tccgtgggag atatagttat attttatatg atttgggcgg 61 ggattgcaat cccccttgcc aactatgcac acttatgcta aactatacac atcaaatcgt 121 atgaggatta gttatgacaa aaattatgtt cgtctgccac ggcaacatct gtcgcagtcc 181 gatggcggag tttatattta aaaaaatgct ggctgaaagg ggtcttagcg aactgtttta 241 cgtttcttcc tgtgccacca gcaccgagga gatttggaac ggtatcggca accctgttta 301 tccccctgca agggctgaac taatgcgcca cggaattgac cccgcaggaa agcgtgctgt 361 ccggcttaaa aagagcgact atgatgagtt tgacctcttg gtgggcatgg actcggcaaa 421 tatccgaaat atgcatagaa ttctcggcgg tgaccccgac ggaaagatta aaaagctgat 481 ggactatacc tctcgaggtg gtgatgtcgc cgatccgtgg tattccgacc gattcgacat 541 cgcctatcgt gatatttttg agggctgtga ggctcttttg aacacgctca tataaaaaac 601 aactcccatt gttttgcaat gggagtattt tggtttataa tgacagccta ttcttcacgt 661 gctccaatgc ccaaaggtac tcattatctg tgttcagatg ctcgatgagc acgggcatat 721 cggggttttc atcgtcgcaa aggcgggcaa atgtttcaag gtcaaagttt cccgtaccaa 781 tgcaacactc ttcgagctgg aaggtgaact gttcctttaa gcgcacatct ttaagatggc 841 aactgcaaat tttaccttta agcaggctga agcactcgcg caggaattca tcattaaaga 901 aatatctcct cggtgaggtt atcatattga tggcatccag atgcgccgca aatctggggt 961 ggtcaaccgc ttcgatcagc tccaaatatt ccttggggct tgaggggatc atccaaggca 1021 tcgactcaat gctgaaaaac gcatttttcg ggttagcttg ttcgattaca tactttaccg 1081 tttcaacggt catatcaaag gtctcgaggc taaaattctc gcggtatcct ccgtcccagc 1141 ggggaccgtg gggtgtgccc gcgacattga ccgcgcagac tgcaccgatc tcatccgcca 1201 aaatcagctg acggatatta tagttgaggt ttgccttgcg cttttcgggg tcgcgctcaa 1261 gcatattgtt ccaaacgcct acctcggcaa tgacaagatc attctccttt gccagatcag 1321 catatgccct gataagagcg gggtcgctgt tgcagtttaa tgggaaatta acagctctgc 1381 atcccaaagc cttcagattc tttgcccatt cctcggggct tttgtgagca aggggagatg 1441 ataaaccaat tcgcatatat attttcctcc tgattattat ttgctgaaaa tttaaagcac 1501 caaatcacat ttttcggcta tgttaaagcc ttcaaaatac ctgttttcca tggggatcca 1561 ttcattgaag aaacgctgat gcaaaaatgc aggccgcttc aaaatccgtt cgcgttgctc 1621 atcttcggtg atattgagca taactttcaa gtcataaact tcgccaaaat acgggtgtaa 1681 gctatatgta ccctcaacaa tgctcagctt ttttggaaca accgtcactt ctttgccaag 1741 cgtaaatgtt gagcagtcaa aggggcgata tgcaaacgat tttcccgatt tgagcggaat 1801 cagaacttct ttttcaaaac gctcataatc aacattcccg ccgatctgc // LOCUS sequence292 1847 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence292 VERSION sequence292 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1847 /mol_type="genomic DNA" /organism="" /note="sequence292" misc_feature <1..917 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_081712308.1:glycogen/starch/alpha-glucan phosphorylase" /note="WP_081712308.1 glycogen/starch/alpha-glucan phosphorylase ([Clostridium] dakarense) [pid:49.4%, q_cov:99.0%, s_cov:37.6%, Eval:3.6e-80, partial hit]" /note="MGA_1141" /locus_tag="LOCUS_7970" CDS 1002..1256 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAVVNIISGFLLIVACIAIIAVVLMTDTKSNGLNSAIGGGSSDTF FGRNAKNTKEARLDKATKICVGVFFVITLLVNIVSAIVA" /locus_tag="LOCUS_7980" /note="MGA_1142" ORIGIN 1 agaagctgga agcatataag gacaatgcag aagtgctcac caagctcggc gagatcaagc 61 tcaagaacaa gactgcattt gctaaatatg taaagagcca gagcggaatc attttagatc 121 ccaacacctt ctttgatgtt caggtcaagc gtctgcacga atataagcgt cagcacctca 181 acctcttgaa catcatgtcc gaatataact atctccttga aaatcccaat gctgacttcg 241 tgcccaagac ctatatcttc gctgcgaagg ccgcacccgg atattacctt gcaaagcaga 301 tcatcaagct catctggtcc ttgggcgagg agattagaag aaatcccaag ataagcgaaa 361 agctgggcgt tgtcttcctc gagaactata atgtttctct ttccgaacgt cttatgcctg 421 ccgctgaaat ctccgaacag atctctcttg cgggtaccga agcatccggt acaggcaata 481 tgaagctgat gctcaacggt gctgtaacct tgggcacctg cgacggcgca aatatcgaaa 541 tcggcaatgc ctgtggcaag gataacatca tcaccttcgg tatgtccgca gaagaagcag 601 acagagctaa gtacggttat aaccccgagc ttatctacaa ttccaacgag ataatcaagg 661 cggctatcga ccgcattgaa aagggcgtaa acggcagtat gttcgacgat gttgttaagt 721 ccctcaagta tgaagatcct tatatggttc ttgctgactt cgattcatat caggcagcac 781 aggcaagagc atccaagctc tatagcgata acctcaagtg gcagtcaatg tcgcttatga 841 acatagctaa cgcaggtgta ttctctgcag acagagcagt tgaggactat gcaagagata 901 tttggaagct gaaataaaat ttctttccaa agctattgca ttttacaaac ggatgtgtta 961 taatccaaag gaatgttaat tatttattgg aggatttata aatggcagtt gtaaatatta 1021 tcagcggatt tcttcttatt gttgcttgca tcgcaatcat cgcagttgtt ctcatgaccg 1081 acaccaagag caacggtctt aactctgcaa tcggcggcgg ctcttccgat actttcttcg 1141 gcagaaatgc aaagaacacc aaggaagctc gtcttgacaa ggctaccaag atctgcgttg 1201 gcgtattctt cgtcatcaca cttcttgtca acatcgtttc cgcaatcgtt gcttaacttc 1261 aagcaaaaat gccgcctgac cgtttaagtc gggcggctgt tttcattttt tcttagtttt 1321 tctgaaagga tggatatata aatgaaaaag accttattca cgagaattct tgtaatctta 1381 ttggttatct gtttggtttt gggcattgtc gtttcggctg catatccgtt attggtgtga 1441 tgcgttatgg ttaaactcgg taacgattgg gacaatatca tcggcggcga atttgaaaag 1501 gaatattacc ttcagctccg cgagttttta aagggggagt atgcaaacgg caccgtatac 1561 cccaatatgt atgatatttt caatgccctc aagctgactc catattcttc tgtcaaagct 1621 gtcatcctcg gacaggaccc ataccacgag ccgggacaag cccacggcct tgcattttcc 1681 gttaaagagg ggacacccct gccaccttcg cttcgcaata tctataaaga gcttgaaaca 1741 gacgtgggcg caaagcccgt ttcctgcggt gagcttatcg gatgggcaaa acagggtgtt 1801 ttgcttttga atactgttct aacagtaaga cagggcaacg ccaactc // LOCUS sequence293 1843 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence293 VERSION sequence293 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1843 /mol_type="genomic DNA" /organism="" /note="sequence293" CDS 388..1299 /product="stage III sporulation protein AA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003438117.1" /transl_table=11 /codon_start=1 /translation="MTSGIINSLNLLQNGIKQAVSEIEYINYIDEIRLRCEKPLSVVIG AKNYFVERGGKLCNTVNENCFTVSKGDIEYAFKSAFSYSIHSYSKELAGGYITTEGGNR VGICGTAVIAGESRDRVDSVKYISSINIRISREVFGYAQDLYNQCLANNPVGILIIGPP SSGKTTLLRDLTRLAGNRYKVSLVDELNEISYTYRSEPQKDVGVFTDVFVGYPKHIGIS TAVKVMSPQIIACDEIGSLEDAKALEYALHSGVSLITAVHSSSFDEAKNKAGIAALLRE KAFAVTAILDPISRNYRVIKID" /locus_tag="LOCUS_7990" /gene="spoIIIAA" /note="WP_003438117.1 stage III sporulation protein AA (Clostridioides difficile) [pid:38.2%, q_cov:93.1%, s_cov:90.1%, Eval:8.7e-50]" /note="MGA_1145" ORIGIN 1 agaaggcttc aattgcaaac atgataactg ccgcatcgat tacgagaata acgatggtat 61 ccaggaaaca ggtgacgaga gctgtgatga caaccgtcat tagaggatgt tcctggatgt 121 aattttggat catctcaata atgccgtatt cattgaggac actgaaaatg gcagtgggat 181 cgttagcggc tgtttcagcc aaagtaggaa tcagtgctgc caaagcagcg atgatattca 241 taaaattcat attgtgcata ttcttcggtg tagttggcgg aataaaaggt gttaatacac 301 gcaaaacaaa agtgcgatga atgcatacaa aagctgagaa tcacatagat atttactaac 361 acggacaaga ttggggataa acataaaatg acctctggga ttataaattc tctgaacctt 421 ttgcaaaacg gaatcaagca agcggtcagt gaaatcgagt atatcaatta tattgatgag 481 atacgtctgc gatgtgaaaa acccttgagt gttgtaattg gcgcaaagaa ctacttcgtt 541 gagcgaggag gtaagctatg taatactgta aatgaaaact gctttacagt atccaaaggt 601 gatatcgaat atgctttcaa atcggcattt tcatattcaa ttcacagcta ttcaaaagaa 661 cttgcaggcg gttatatcac taccgaaggc ggcaacaggg ttggaatctg cggaaccgct 721 gtcattgcgg gtgaatctcg agacagagtt gacagcgtaa agtatatctc atcgatcaat 781 atccgaatat cccgcgaagt tttcggttat gcgcaagatc tatataatca atgtcttgcg 841 aataatcctg tcgggatact cattatcggc ccgccttcaa gcggtaaaac aacgttatta 901 cgcgatttga cgaggcttgc aggaaacaga tataaggtct cactggttga tgaactgaat 961 gagatctcat atacataccg ctccgaaccg caaaaggatg taggcgtgtt cacagatgtt 1021 tttgtgggtt atccaaagca tatcggaatt tcaactgctg ttaaagtgat gtctccgcaa 1081 atcatcgctt gtgatgagat cggttctctt gaggacgcaa aagcacttga atatgctctg 1141 cattccggag tgagcctgat tacagctgtt cactcatcaa gcttcgatga agcaaagaac 1201 aaggcgggaa ttgcagctct gcttcgtgaa aaggcatttg ccgttacagc gattttagat 1261 cctatttcaa gaaactacag ggtgataaag attgattaag ctgaccgctt gtgtgctgat 1321 atgtatgttt tcgtttctga tttcatatga actgcttatt cgtgaagaaa acaaagcaag 1381 aagcgctgac agcttgagag aagcggtaga taaaattatt gttatgcttc actttggaga 1441 atatgatgta ttccagatat gcgaatctat atttgaagat gcggacgaat tttcgccgtt 1501 aaacggagat tttcgggaac aatggattga ctattgtcgg aatcatttaa ttgattctga 1561 tttgaaagat tttctgctct ttgaaaaagt cggggaagta ttgggaagta ccgatgcgaa 1621 atcgcagatt gatcggctta catatatcaa agacgagctt attaggtcat atgaaaaaag 1681 acggacagat gttgaaaaga agcgtaggat atattttagt cttgggtgct ttgcagggct 1741 gatggtctgc attattttga tttgaggtaa cacataaatg gatgtcgatt tgatatttaa 1801 aattgcagga atgggcataa ttgttgccgt tctcagccag cta // LOCUS sequence294 1831 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence294 VERSION sequence294 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1831 /mol_type="genomic DNA" /organism="" /note="sequence294" misc_feature <1..1094 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_054937112.1:mannitol dehydrogenase family protein" /note="WP_054937112.1 mannitol dehydrogenase family protein (Moorella) [pid:64.5%, q_cov:45.7%, s_cov:30.9%, Eval:3.3e-57, partial hit]" /note="internal stop codon at [1092:1094](+)" /note="MGA_1147" /locus_tag="LOCUS_8000" CDS 1125..1535 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPDAPQRIATDTSQKVGIRFGETIKSYAALGRTDELVAIPLAIAG WARYLLGIDDNGSVMAVSSDPLLGELQPKLEGIVVGKPETYNGQLKDILANANIFGSDL CALGMDTLIEKIFVEELAGAGAVRATLEKYLG" /locus_tag="LOCUS_8010" /note="WP_054937112.1 mannitol dehydrogenase family protein (Moorella) [pid:54.3%, q_cov:100.0%, s_cov:25.7%, Eval:2.6e-33, partial hit]" /note="internal stop codon at [1092:1094](+)" /note="MGA_1148" ORIGIN 1 aggtcgcgga gcatctctct gatgcgatca aattcaaaac gatttcaaag gtaagagatg 61 agggcgtaga ctgggacgaa tttgaaaagt ttcacgagta tctcgacaag acttaccctc 121 tcgtcgccaa gaatactaca aaagagataa tcgacaaagc aagccttctc tacctctgga 181 agggtaaaaa tcccgacctt gaacctatgg ctatgctcgc tcatcaggac gtcgtgcctg 241 tttccgaagg tactgaaaag gactggaaat atgatgcttt cagcggtcat attgacggcg 301 aatacgtctg gggcagaggt gcacttgata tgaaaaacca cctcatctgc gtaatggaag 361 ccgtagaaac gcttatggtt gaaggttttc agcctgacag agacgtttac ctctgcttcg 421 gtcataacga ggaaacagtt tcgactgttt attcaggcgc aggaactatc gtaaagactc 481 tcaaagagag aggtgtacgc cttgacagcg tacttgacga gggtagtgca ctcatcaagc 541 tgaaagttcc cagaatcatc gatacacacc ttgctgcagt cggtacggct gaaaagggtt 601 atgttgacaa tggcttcatt gagtatcttt ccgatgaaag ctacattacc ttcccctggt 661 cgatgatcga caagatcact ccccgtcccc acgacagcgt tatggctatg cttgaggaaa 721 agggccttga ggatatggct cccattgtta caagcaagaa cacatatatt gcggcattcg 781 ttaacgcaga aagacctcag tatcttgttg ttgaggacaa gttccccaac tcccgtccct 841 gccttgaaaa tgcaggcgta tatctgaccg acagagatac agttaacaag actgagagaa 901 tgaaggttac aacatgtctt aatcccttgc atacagcttt ggctgtatac ggatgcttgc 961 tgggatacaa cctcatctgc gaagagatga aggatgaaga gcttgttaag cttgttaagc 1021 gtttgggcta tgttgagggc ttgcctgttg ttacagaccc cgaaattgta agaccaaagg 1081 aatttatcga ttaagttgta aatgaaagac ttcctaaccc cttcatgccc gacgctcctc 1141 agagaatcgc taccgacaca tcccagaagg ttggaattag attcggtgaa accattaaga 1201 gctatgccgc actcggtaga accgacgagt tggttgcaat tcctcttgca attgcaggct 1261 gggcaagata cctattggga attgatgaca acggcagcgt tatggctgtt tcaagcgacc 1321 cgttgctcgg cgagcttcag cccaagcttg aaggaattgt tgttggcaag cccgaaactt 1381 acaacggaca gctcaaggac attttggcaa atgcaaacat cttcggctcc gatctttgtg 1441 ctttgggaat ggacaccctc attgagaaga tctttgttga agagcttgca ggcgcaggcg 1501 ctgtaagagc gactttggaa aaatatcttg gataatacgc ccatgtgagg cgaagccgat 1561 ccccgatgcg cgaagcgcat cggggatttt tgcgccgcag gcgcaaaacg gtacgttttc 1621 gcaagaaaac ggacgcggct tcgccgtagt tgggcgatgc gcaaaaggag ccgtcgcgga 1681 gcctgcgcac cgtgaggcgt tggggcgaag cggtggcggt cggtatgaga taattgcacc 1741 aaatcttaga aaaatatgcg ctttttcgta ttgccattag aagcacattt tgttataatt 1801 aatgtgtata tttgagcatt ggtggtgata g // LOCUS sequence295 1828 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence295 VERSION sequence295 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1828 /mol_type="genomic DNA" /organism="" /note="sequence295" ORIGIN 1 aactgtgata ttaccgcttt cgagtgcttg ctttaccata tccggagtat agtcggggtc 61 aaaaccgcct tcttcccatc cgtcccaatc gctgtcctgc aaagtttcct cgaatgtttt 121 tatatcggaa acatctctga tccaagtgct aaatgcatta tttgcaggat tgtttttcaa 181 aatgatgtcg agttgctttg atttgagctc ttcttggctt aaggaagaaa ttcccctgtt 241 gactttttcg ggcaacggtg atatactatg tttaaaagaa gcagatgagt tgccgtctga 301 aagcccttta tggcttggca atgagtctgc ttcttttagc gtcatatcat acacataatt 361 atcgttgcca gtatctttga cattgacaag cacatcaaaa tatcttccgt cacttttaac 421 agttttcaca tagagtaatc ccaagatttt gcgttttcgt ttttttgtaa tggtgagagt 481 gtcgccctct atggtgcagg cagtcgggag cggaggggcg tctgcgggcg cgttccgaag 541 gaattgtgcc gcaggtgccc cggagcgccg gatgacccga aaacaggagc ggctcctcca 601 ccgcttgctc gctgccgctc acgcaaccga cgtcgtcgcc gcctttgtca ccaaaacctg 661 cacattttat aaaaatatta aatcaatatt tgcacattac ccccttgcca aacaggtcac 721 aaaatggtaa tattatcttg accgcgttcc aagcaaattt gcggatcatt ctctatggta 781 taggaggacg aaatatgcag tatggtcatt ttgatctgaa aaacaaagaa tacgtaatta 841 ccaagcccaa cacccccgca ccttggtgca actatctggg ctcgcccgaa tacggcgcaa 901 tcgtttccaa caatgcagca ggctatagct tcgttaagag cggtgcaaac ggcagaatcg 961 caagataccg tttcaactca acaatggctc ttcccggaag atatatctat ctgcgcgata 1021 atgacaccgc tgattactgg tctgcatcat ggcagcccgt tggcaagccc ctcgatcagt 1081 ataagtccga atgccgtcac ggcacagctt actctgttct gacaagtgag tatgcagaca 1141 tcaagtcgga ggttacatat tatgtaccta tgggtgcaac atacgaagta tggcgtgcaa 1201 aggtaaccaa caccggcgat aaggaaagaa acctctccgc tttcggtttc attgaattca 1261 ccaacgaaaa taactatgag caggatcagg ttaaccttca gtataccctg ttcatcacaa 1321 gaacctcatt cgagggcaac aaggtgctcc agcacattaa cgaaaactcc ggcaaggatg 1381 caacaggctc taaccaccgc gaaagattct tcggtcttgc aggcgaaaag gctgtcggcg 1441 cttgcggcga ccttaacgct ttcatcggcg attacagaac ttacgctaac cccatcatgg 1501 ttgaagatgg caagttaaac ggtgctatga actataactc caacgcttgc ggtgctttgc 1561 agtcggatat taccctcggc gcaggcgaaa ccaaggagct tatctacgtt ctcggccaga 1621 aggataacga gcaggccaac aagatcttgg ctctttatga agaagaaggc agagttgacc 1681 gcgaagttga tgaactcaag gcttattggc acgcaaagct tgaaaacttc tcaattgaaa 1741 ctcccagcga agagttcaac aatatgatca acgtttggaa cgcatatcag tgcttcatca 1801 ccttcacctg gagccgtgca gcttccct // LOCUS sequence296 1827 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence296 VERSION sequence296 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1827 /mol_type="genomic DNA" /organism="" /note="sequence296" CDS complement(270..1340) /product="branched-chain amino acid aminotransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003244231.1" /transl_table=11 /codon_start=1 /translation="MLSIKYDLKTERKEKPDWDNLGFGKYFTDHMFIMDYDKGMGWHDA RIVPYQNLSLDPACMVFHYAQEMFEGLKAYRTPDGDIQLFRPDKNIERMNNTNTRLCIP HLDPDDVLDAIKAIVSVEKDWVPTADGTSLYIRPFIIATDVHIGVHPSHSYKFIIILSP VGSYYPEGIKPVKIFVEREYVRAVKGGTGYAKVGGNYACSLIGQEKAEKLGYSQVLWLD GIEHKYIDEVGAMNVFFVLDGTVVTPTLDGGNILPGVTRASCIQLLEKLGYKVEERKLS LEEVIDAYKKGKLNEAFGTGTAAVVSPIGLLDTGDLKMTVNNGEIGEIAQKLYDTLTGI QWGKLPDDFGWTVKVD" /locus_tag="LOCUS_8020" /EC_number="2.6.1.42" /note="WP_003244231.1 branched-chain amino acid aminotransferase (Bacillus) [pid:61.2%, q_cov:99.2%, s_cov:97.0%, Eval:1.1e-126]" /note="MGA_1151" ORIGIN 1 atcttgttct ttttgaatat tatacaccat taaagccaat atgtcaatac accgaacaac 61 aatattttga caagtttttc gcattcaaat tgtcattatg cacaactatg cataatatga 121 atagtttata caattgcttt ggcgtataat tggcttaaaa tttccatgtt tcaacaacag 181 aacagctgaa taatattcac ataatttgca tagctcatac cgcactcaac cgcaggtaca 241 gtttatgtac ctgcggttga aatttttatt tagtcgacct taaccgtcca tccgaagtcg 301 tcaggaagct taccccattg aatacctgta agtgtatcgt agagcttctg tgcgatctcg 361 cctatctcac cgttgttaac ggtcatctta aggtcacctg tatcaagaag tcctatcgga 421 gatactacag ccgcagtacc tgtaccgaat gcctcgttaa gcttaccttt cttgtaagcg 481 tcaataacct cctcaagaga cagctttctc tcttcaacct tataacccag cttctcaagc 541 agctgtatgc aagaagctct ggtaacgccg ggaagaatgt tgcccccatc aagcgtagga 601 gtcactacag ttccatcaag tacgaagaaa acattcatag cgcctacttc gtcgatgtac 661 ttatgttcga tgccatccag ccagaggacc tgagaatatc caagcttttc agccttttcc 721 tgtccgatga gagagcaagc atagtttcca ccaaccttgg cataacccgt gccgcccttg 781 acagccctta catattctct ttctacgaat atcttgaccg gcttgattcc ttcgggataa 841 taagaaccaa cggggctgag aatgattata aatttatagc tgtgtgaggg atgaacgcca 901 atatgaacat cggttgcgat tataaaggga cggatgtaca gagatgtacc gtctgccgtg 961 ggtacccaat ccttctcaac ggaaacgatc gccttgattg catcaagaac atcatcggga 1021 tcaagatggg gtatgcaaag acgagtattg gtattattca tacgctcaat atttttgtcg 1081 ggtcggaaga gctgaatatc tccatcagga gttctatatg ccttaagacc ctcgaacatc 1141 tcctgcgcat agtggaacac catacatgca gggtcaagcg aaaggttctg atagggaacg 1201 atccttgcat catgccaacc cataccctta tcatagtcca taatgaacat atgatcggta 1261 aagtactttc caaatcccag attatcccaa tcgggctttt cctttctctc tgttttaaga 1321 tcatacttga tactaagcat tttaattatt cctttctaat acataaaaat tatatattgg 1381 aggcaataat tgttcccatt tcggagcaac caaccttctt aaatccgtct ttgtaaatat 1441 cgacggtgcg gtatccgtca tcaagtgcct tgttcactgc tctctctatt gcatctgctt 1501 cttctgccat atcaaaggaa taacgaagca tcatagcggc agacattatt gttccgatgg 1561 ggtttgctat atccataccg gcaatatcgg gagcagaacc atgtatcggc tcgtacatgc 1621 ccaatgtacc ggaggaaagg cttgcagagg gcatcatacc gatcgaaccc gtaagcatac 1681 ttgcctcgtc ggaaagaata tcaccaaaca tattttcggt aacgatgacg tcaaactgag 1741 caggattttt gataagctgc atagcggtgt tatctacaag aacatcggaa tactccacat 1801 cgctgtactc atcttcaagc ttgtgca // LOCUS sequence297 1824 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence297 VERSION sequence297 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1824 /mol_type="genomic DNA" /organism="" /note="sequence297" ORIGIN 1 gcgcaggggg ctgagtgaaa tgctgattgc cgtcaaggga tttaagcttt aaaacatctc 61 cctttgaaag cttgggcaaa attgcagttt cttccgattc ttccttgggt tcttcataga 121 gcacggtaaa accgtcaaac ttaacactga agccggacgc tttgaatata catccgttag 181 cttcgattga gcaagcagtg gtgtccaaaa cgcaatctgc catctggctt gcgatgaagc 241 gtgaccaaat gagcttatag agcttatact ggtcgtttgt cagcgaggac tttgcctttt 301 cgggagtcag atcgggcatt gtgggacgaa ttgcttcgtg ggcatcctgg atgtttgcat 361 cctttgattt atatgtcttg ggagttgcgg ggagatattc cgcaccgtag ttatttttaa 421 tgaaatcgtg ggcagcggct ctggcttcgt cggaaatgcg aagcgagtcg gttctcatat 481 atgtgatcag accgacagca cccaagcctt caacatctat accttcatat agctcctgag 541 caacgctcat ggttcttctt gactggaatc ccaaacgctg ggaggcatcc gagaggagag 601 ttgaggttga aaaaggtgcg gcggcggatt tgattcgcga accttttctt acagactgaa 661 cgacaaactg ttcgccgtca agacgagaaa gaactgcatc ggtctcgtcc ttggttttaa 721 gctcgatttt cttgccgtca acagttgcaa gctttgcaac aaagggcttc tttgcgctgt 781 cggcaaggaa cttcgcctca atcgaccaat attcaacagg gatgaaggac ttgatctcct 841 cttccctatc aacgatcatg cgaacagcta cagactgaac acgacctgca gaaagaccgc 901 ggcgaacctt cttccagagg aaaggagaaa gcttatatcc aacaatgcgg tcgagtattc 961 ttcttgtctg ctgggcgtta acaatgttca tatcgatgct tcggggtgcg gcaatacccg 1021 cttcgacacc cgacttggtt atctcattga aggtgacacg gtttttgtcg cttaaatcga 1081 aaccgagcat tgttgccaaa tgccaggaga ttgcttcgcc ttcgcggtca gggtcggttg 1141 caaagtaaac atgttttgcc tttttggaaa gcttcttaat gtcgtcaatg accttttcct 1201 tgcccttgat gtccacatag gtgggcttga aaccgttgtc aatatcaaca ccaagctttg 1261 acttgggtaa atctcttacg tgacccacac aagcgacgac tttatagtcg ctgccgaggg 1321 tgcgctgaat tgtgtgtatc tttgtagggg actctacaat gataagatct gccataattg 1381 tattgctcca ttcttgcgat gttatatcgc ttatattgaa aatctgttgc cgggaagtgc 1441 gcggatgatt ccgtcgatct ccatatcggt aagctccgat tcaaggtcgg gaatttcact 1501 tccgagggca tcaaatattg cgtccaaaag ttgtgcgccg ttgtcggcga ggtattcata 1561 gataagccgc tgtgccttcg gcagggcttc ggtatccata agcttgggtt tttcggcagg 1621 acgggaaact tcttcactct cggaataagc tttcttcggt gacggcttcg gtttgggtgt 1681 atcctgcttg gcaaaaagtc ccgagtcgga ccgacgacta aatatgcccg aattcggatt 1741 cagcttatga gcataggtgc tgaagtattc atttaaaatg tcacgtgctt caaaaacagg 1801 aatagccccg tcacgaatca gccc // LOCUS sequence298 1823 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence298 VERSION sequence298 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1823 /mol_type="genomic DNA" /organism="" /note="sequence298" misc_feature <1..647 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003426579.1:Holliday junction branch migration DNA helicase RuvB" /note="WP_003426579.1 Holliday junction branch migration DNA helicase RuvB (Clostridioides difficile) [pid:66.7%, q_cov:95.3%, s_cov:60.2%, Eval:3.1e-73, partial hit]" /note="MGA_1155" /locus_tag="LOCUS_8030" ORIGIN 1 aggttttgta tcctgcgctt gaagatttct gcatagatat tattatcggc aagggtcctg 61 cggcgcgctc gataagaatc gatctgccaa agtttaccct agtcggtgcc accacccgtg 121 caggtcagct cacttcgcct ttgcgcgacc gtttcggcgt tattcagcgt cttgagcttt 181 acaccaaaga agaacttgct gagattatta tgcgctctgc agttattttg ggcgtaagct 241 gcgataaaga aggtgcgctc gagcttgcct cccgttcaag aggcacacca cgaattgcca 301 accgattttt gaaacgcgtg cgtgactatg ccgatgttat ggcagacggc cacatcacca 361 aggaaatcgc aagtgttgcg ctcgaccgaa tggaagttga ccccttgggt cttgattcgc 421 tcgacaagcg tatgcttgaa atgataatca agggttataa cggcggacct gtcggtcttg 481 aaactcttgc ttccgcaatc ggtgaggagg ctgtaacttt agaggacgtc tgtgagccct 541 atttaatgca gctcggcttt attgcaagaa ctcccagagg ccgatgtgct accgaccttg 601 catataaaca tttaggattt ttaaaggacg gtcagaccac actttaaaat attcattgaa 661 aattaaccta aaactaacac aacatacata aaaggggata ttatttatca tgggaagact 721 tttcggaact gacggcgcca gaggcgttgc gatcagcgag attactgttg acaaagcgat 781 gctcattggc aaagccgcgg cgctgaccct ttcaaaaact gctaaccata aacctaaaat 841 tttaatcggc aaggacaccc gtatttccgg cgatattctg gaagccgcac tcattgcggg 901 tatctgctca gtcggtgccg atgttcatct tttgggcgtt attccgacgc ctgccgttgc 961 atacttaact gttaagtacg gcgcagatgc aggcgttgta atttcagctt cgcacaactc 1021 ttacgaattc aacggaatca aactcttttc atcgacaggc tataagcttc ctgacgaggt 1081 tgaaaacgag atcgagcgcc ttgttttgga tgctcaggat gagatcatca acgccgattg 1141 cgatactatc ggccatatct acaccgaaaa gaacgctgaa tgggactatg ttcgctattt 1201 gatcaagcag atagataccg atcttggcag aatgaagatc gctatcgact gcgccaacgg 1261 tgcggcatca tcaaccgctg aaaaattctt ccgtggaatc aacgcaaatg ttacattctt 1321 aaataacacc cccgatggct tcaacatcaa tcgcaactgt ggctcgaccg acctttcaat 1381 gctttcaaaa tatgttgttg aaaaccgctg tgttgctggc attgcctttg acggcgatgc 1441 cgacagatgc ttggttgttg acgaaaaggg cgaacttgtt gatggcgaca agcttattgc 1501 tttgcttgct cttgatatga aggaaaacga aaagcttgca tccaacacct gcgttgtcac 1561 ccagatgaca aacctcggat ttttccgctg ggcaaaggaa aacggaatcg ttgtttcaac 1621 ctcatcgaag atcggcgaca gatatgtttt ggagcgtatg ctcatcggtg gatataatct 1681 cggcggtgaa cagtcgggac acataatcct ttccgatatc gccacaacgg gtgacggtga 1741 gctttcgggc gcaaaaattc ttgagatact tgccaaatcg ggcaagaaga tgagcgacct 1801 tgcgaacatc ttcactccat atc // LOCUS sequence299 1807 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence299 VERSION sequence299 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1807 /mol_type="genomic DNA" /organism="" /note="sequence299" CDS complement(167..1021) /product="RNase adapter RapZ" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963833.1" /transl_table=11 /codon_start=1 /translation="MKIVIITGMSGAGKSSAINLFEDMGYYCMDNMPPELLASVADFIV KSDSVIDKICVAVDVRSGELYKKLEECTQDLKRSGIDVSILFVDCDDDCLLRRFKETRR KHPLDEEASGNLVSAIALERVATSRAREIADYYIDSSSTGVVAFKDKIKEMFFEKSDAI IIDAVSFGFKHGVPKDADLVFDVRCLPNPFYVPELKPKTGLDDEVYNYVMSFDDAKAFY DKIYDMVKFLIPLYAKEGKSRLVIAFGCTGGKHRSISFARRLSNELAGEGFTVRADHRH IDY" /locus_tag="LOCUS_8040" /gene="rapZ" /note="WP_010963833.1 RNase adapter RapZ (Clostridium) [pid:45.8%, q_cov:99.6%, s_cov:96.6%, Eval:3.3e-72]" /note="MGA_1158" misc_feature complement(1018..>1807) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_001057087.1:UDP-N-acetylmuramate dehydrogenase" /note="WP_001057087.1 UDP-N-acetylmuramate dehydrogenase (Bacillus cereus group) [pid:53.8%, q_cov:90.8%, s_cov:77.7%, Eval:2.0e-65]" /note="MGA_1159" /locus_tag="LOCUS_8050" ORIGIN 1 accaaatcgt tttcggtttg aaagacgatc tcatcggctt ttaaggtatt tgcaaataaa 61 agcataccca aaaggcaggc atcgcacctg cggcggcctg taatgccatc gcatatttcc 121 gctttggttt tatatgaaaa tgtttgatta tatgcagttt tcatggtcag taatcaatat 181 gtcggtggtc ggctctgaca gtgaagccct ccccggcaag ttcgtttgaa aggcggcggg 241 caaagctgat cgagcggtgc tttccgcctg tgcagccaaa ggcaattaca agtcggctct 301 tgccctcctt agcatataga gggattaaga acttgaccat atcgtagatt ttgtcataaa 361 aagcctttgc atcgtcaaag ctcatgacgt agttatatac ctcgtcgtca agacctgtct 421 tgggcttgag ctcaggtaca tagaatgggt tcggaagaca tctgacatcg aataccaagt 481 cggcatcctt gggcacgccg tgcttgaagc cgaaggaaac cgcatcaatg atgattgcat 541 ccgacttttc aaagaacatc tccttgattt tgtccttgaa ggcgacaacg ccggttgaag 601 atgaatctat gtaataatcg gcaatttcgc gggcgcgaga ggttgcaacg cgttcaagcg 661 caatggcgct gacaaggttg cccgaagcct cttcgtccaa aggatgctta cgtcttgttt 721 ccttgaaacg gcgcaacaga caatcatcgt cgcagtcgac aaataaaatg ctgacatcaa 781 tgcccgaacg cttcaaatcc tgagtacact cctcaagctt tttataaagc tcacccgagc 841 ggacatccac agcgacacat atcttatcaa tgacagagtc agacttaaca ataaaatcgg 901 caacacttgc caaaagctca gggggcatat tgtccatgca gtaatagccc atatcttcaa 961 agagattgat ggcgctggat tttcccgcac cggacatacc tgtaatgatg actatcttca 1021 cttgtcgctc tcccccaatc tttcgggaat tgtcttgacc tcacactcaa ggtcgtatcc 1081 tgtgtgttcc tttacagctt ttttgacata tgcgatcaga tcaattatgt ccttagctgt 1141 ggcattgccc ttgttaatta caaagttagc gtgcttttcc gatacctgcg ctccgccgac 1201 agaatagcct ttaagaccgc tttgctcaat tacaaggccc gcatatgttc cctcagggcg 1261 cttaaaagtc gatcctgccg aaggatactc aagaggctgt tttgatttgc gcctcgacat 1321 aaggtcatcc atctttgcct tgatatcttc tttatttccg attgaaagtt caaaggatgc 1381 cgacagaatc acatattccg aatcggtgaa aacgcttcgg cgatagccca tatcgagcat 1441 atcgtttgta aaggttacaa gcttgccaca cgagtcaaga gctgtgactt cggtgataac 1501 atcctttatc tcgccgccgt atgcgcccgc attcatatat accgcgccgc ccacggttcc 1561 tgggattccc caagcaaact cgaggcctgt taaactgtta tcataggcgg tttggcagag 1621 tctggccaaa gatgctcccg cacctgcgac cagcttgttg ccatctgcag atacgccgcc 1681 catttcacag gagattatga atattactcc tctgaaaccg cggtcggtaa acaatacgtt 1741 tgaaccgttg ccgagaatat atgtgtcaag tccaaccgct ttacactcgg aatacatctt 1801 tgaaagt // LOCUS sequence300 1802 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence300 VERSION sequence300 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1802 /mol_type="genomic DNA" /organism="" /note="sequence300" CDS complement(96..1322) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKFKRLLCGLLLVAMLLTALVGCADTDINKPEEDTRLNTDYENSN KTRVINITDLLADPDDEQSLVRMFVTSNQVELEGIIVSTSCWRQHQDQQGMDVLYKIID AYGEVLPNLQIHAEGYPSLEYIKSISVMGQTGYSMNGVGQGKDSEGSELIIAAVDEYDD RPVWINLWGGANTLAQALWKVQNTRSEAEVAKFVSKIRVYDVLGQDEAGAWIVTNFPDI LYIRANLVYGLNHSIQQQGEGYIKQIQNLGPLGSVYPTAVWSYEGDSPSFMYQLPTGMN DPEHIDWGSWGGTFCAEKEPFIRSMDAVLNERDYDPYLMYGDSENNAWDFVNLWGDAIQ NDFLARMIWSVTDAYSEVNHHPIAVLNEDATMDILNITVKAGENVKLSAKGSSDPDGDD LSIIGMFTV" /locus_tag="LOCUS_8060" /note="WP_236615821.1 DUF1593 domain-containing protein (Rhodopirellula europaea) [pid:51.8%, q_cov:87.3%, s_cov:34.3%, Eval:2.8e-108, partial hit]" /note="frameshifted, insertion/deletion at around 116" /note="MGA_1161" ORIGIN 1 atggatgcag ttacctttgg cgtcctcagg gatctcaaca tatgcattga tatcattatt 61 acctttgatc gttacatttc ccgaatagag tccgttcaca cggtgaacat accaataatc 121 gacagatcgt caccgtcggg gtcagatgac cctttcgcgc tcagcttaac attttcgccg 181 gccttaacgg ttatattgag gatatccata gttgcgtctt cgttaagcac cgcaatggga 241 tgatgattta cttcactgta agcatcggtt acagaccaga tcattcttgc caaaaagtcg 301 ttttgtatag cgtcgcccca gagatttacg aagtcccatg cattgttttc gctgtcgcca 361 tacatcagat aggggtcgta atctctttca tttaaaacag catccattga tctgatgaag 421 ggttcttttt cagcgcagaa agtgccgccc cagctgcccc aatcaatgtg ctcgggatcg 481 ttcatacctg tgggaagctg atacataaat gaaggggaat ctccctcata tgaccacact 541 gcagtgggat aaacagatcc caaaggtccg agattctgaa tctgtttaat gtagccttca 601 ccctgttgct gaatgctgtg attaagtcca tagacaaggt ttgcacggat atacaagata 661 tcagggaaat tggtaactat ccaggcgcca gcttcgtcct gaccgagaac atcgtatact 721 cttattttgc tgacaaactt agcaacctca gcttcgcttc gtgtgttttg aaccttccaa 781 agagcctgcg ccaaggtgtt tgcaccgccc cagaggttta tccagacggg tcggtcatca 841 tattcatcaa cagcggcgat gataagctcg cttccttccg aatccttgcc ctggccaacg 901 ccattcatgc tgtatcctgt ctgtcccata acggagatag acttgatata ttcaaggctc 961 ggatatcctt ctgcgtgaat ttgcaagttg ggcaaaacct cgccatatgc atcaataatt 1021 ttgtagagta catccattcc ctgctggtcc tgatgctgac gccaacagct tgttgagacg 1081 attatgcctt cgagttcgac ttgattcgag gtgacaaaca ttcgcacaag cgactgctcg 1141 tcatcgggat ctgcaagaag atcagttatg tttatgactc tggtcttgtt tgagttttca 1201 tagtccgtgt tcaaccgggt gtcctcctca ggtttattga tatcggtatc ggcgcagccg 1261 acaagcgcag ttaagagcat tgctaccaag agcaatccgc aaagcagtcg cttaaatttc 1321 atatctgcct ccaagtatat ctgtataatt atatcatata tttcaaagga cttaatttca 1381 accaaaaatt aagtgaagtt tgagagcttg agcacttaat ctgctcaagt ttattatata 1441 ttcggctcgc cttgcaatca ccgctgacat acccgtgatg aaaagcaaaa ccatttccct 1501 cttttttcaa gaatgtcgag taaggtgtcg cctccaccaa aataaaagga gtccccaagg 1561 ggggcttctt tgtttttgtg acggttttcg ttaaccgaac acgcaagttg cttccatgtg 1621 gttgggaaaa atattcatcc gttactcaca atcagtgtat taaaccggca ctgcaacttt 1681 taaagttttc cgaccaaagg gaggaacact tttgggttca gattcccgtc gcctccacca 1741 tacgtgggat acgaaaaaga tatataccgt taaaagcccg atttatcggg cttttttcat 1801 tg // LOCUS sequence301 1801 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence301 VERSION sequence301 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1801 /mol_type="genomic DNA" /organism="" /note="sequence301" misc_feature <1..528 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010963601.1:aspartate kinase" /note="WP_010963601.1 aspartate kinase (Clostridium) [pid:48.2%, q_cov:97.1%, s_cov:38.9%, Eval:1.9e-42, partial hit]" /note="MGA_1162" /locus_tag="LOCUS_8070" CDS complement(571..1191) /product="flavodoxin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986495.1" /transl_table=11 /codon_start=1 /translation="MKVLLVNGSPRKEGCTYTALCEVAKSLNEEGIETEIFWVGNKPLS GCIACYSCFKTGKCALDDCVNEFNEKACEADGFIFGSPVHYAAAGGTLTAFMDRVFYSS RGLYRLKPAAAIVSARRAGTTAALDQLNKYFTISEMPIVSSQYWNMVHGGTPSDVLQDE EGMQTMRVLGKNMAYMLKCIEAANLAGISKPEKEPRKWTNFVR" /locus_tag="LOCUS_8080" /note="WP_011986495.1 flavodoxin family protein (Clostridium botulinum) [pid:68.9%, q_cov:100.0%, s_cov:100.0%, Eval:8.0e-79]" /note="MGA_1163" misc_feature complement(1210..>1801) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_004081723.1:glycerol-3-phosphate 1-O-acyltransferase PlsY" /note="WP_004081723.1 glycerol-3-phosphate 1-O-acyltransferase PlsY (Thermotoga) [pid:32.6%, q_cov:94.9%, s_cov:94.4%, Eval:3.3e-23]" /note="MGA_1164" /locus_tag="LOCUS_8090" ORIGIN 1 aagcctgacg atgcgggaac aatgatcgtt gaaaccgcag acgtttcaag ctgtgcatac 61 accattacag gtattgcggg cacaaagggc tttgccaccg tgagcattga aaaggatatg 121 atgaatgcgg agctgggctt cggcagaaag gtgcttgaga tatttgaaaa gcacggcatc 181 agctttgaac acattccctc gggcatcgac accatgtcga tcgttgttcg caagagcgaa 241 tttgaaaagg ccgaacatag cattattgac ggcattaagc gcgcagttaa ccccgaccac 301 attgaaattg accgcgacgt tgcgcttgtt gcgatcgttg gccgaggaat gaagagccag 361 cgcggtactg cggcgagaat ttttgcgagt ctggcgcata acaacatcaa catcaagatg 421 atcgaccagg gctccagcga gcttaacatc atcgtcggtg tcagcgaaga ggacttcgag 481 gcttccattc aggcggttta cgatattttc attacacaga atctttgatg agaaataaaa 541 aatcccccgt tattcggggg attttatttt ttatctcaca aaatttgtcc acttgcgcgg 601 ctctttttca ggctttgaaa tgcctgccaa gttggcagct tcaatgcatt taagcatata 661 tgccatattc ttgcccaaaa cgcgcattgt ctgcattccc tcttcgtcct gcaaaacgtc 721 cgaaggggtt ccgccgtgaa ccatattcca atattgcgac gaaacgatgg gcatctcgct 781 gattgtaaaa tatttattga gctgatcgag agcggcagtg gtgcccgctc ttcttgcgct 841 gacgattgcg gcggcaggct ttaagcggta aagtccgcgg gaagaataga atactctgtc 901 cataaacgcg gtcagcgtac ctcctgcagc agcataatga acaggagagc caaaaatgaa 961 gccgtcagcc tcacaggctt tttcgttgaa ttcgttgaca cagtcatcaa gcgcacactt 1021 gcctgttttg aagcaggaat agcaagcaat acatccgctc agcggcttgt ttccgaccca 1081 gaagatctcc gtttcaattc cttcttcgtt cagcgacttt gcaacctcgc aaagcgcggt 1141 gtatgtacag ccctctttgc gggggcttcc gttgacaagc aataccttca tcgttaatca 1201 gttcctttct taagttttat ttttcgactt tccgattttt gaaagccgca tctccgtttt 1261 gtttatcatt cttttatagt tttcaatatg cttgatgatt atgaccattg atgcaaccaa 1321 aaggatcagc ggcagtatat agcttctttc ggtaaagccg tatacgatcg gcacaagggt 1381 gaccgttaag gtagtcgcaa caacgatata gtcggacagg agcattatta cgaggatgat 1441 cgcagttaaa atcagagcaa ctttccagtt gatgccgtat gccacaccga tatatgaggc 1501 aaagcctttt ccgcccttaa atttcaaata aaacgggaag atgtgtccca atacacagga 1561 aacgcccgca agcaccccaa tatagggcaa gtcggagaag aatatctgcg acaaaatgac 1621 gcacagcacg cctttgagaa tatcgtgaac gcccacggca attcccgcac gccagcccgc 1681 aagcaaaacg gtgttcgatg cgccgaggtt ttttgaaccg tctgcgcgaa aatcaacgcg 1741 cttgatccgg gatatataat aagacatatt cgaggaaccg atgagatatg atgaaacgat 1801 c // LOCUS sequence302 1798 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence302 VERSION sequence302 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1798 /mol_type="genomic DNA" /organism="" /note="sequence302" CDS 743..1600 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIEKNENLIPEEDLEYERRLAEEAANQPTEEELEAEAVKARDEKR KTYEKDLNDRKIELMKLKQGVIEESDIVKEEQTQEYKLSFGEWISNVWYRNKWLIIFAA AMIFAFSYIVYDQVTTTKPDLTVLVLSPDYSLYYRTQELEMFLDDYCDDLNGDGEVYVQ VYNISTDYSDPNTVTANQAQVMSQLQSGENIILIADDKTDFAMHDFTGEYPDNERFNEL GMRLNCQLVRDALKWEAMNDNVYIGMREPTKLLATTEEDMQENFDEARAVFERIVKAVS ESEK" /locus_tag="LOCUS_8100" /note="MGA_1166" tRNA 1681..1756 /product="tRNA-Val" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0140" /note="Aragorn_14" ORIGIN 1 cctatcgcgc ccgacgcgag ccttattgac atccgcgatg tggcacacgc tttgtcgctg 61 acctgccgcg gaaacggcca cgttaaaagc ttcttttccg tcggtcagca ttgcttaaac 121 tgcgcccgcg aagcggtctt gagaggctac ccaaagcgtt tggcgctcgc gtgcctcatt 181 cacgatgcat cggaggcata tatgtccgat gtaccccgcc ctttcaagca ggtcttgcct 241 gaatatcgcg aggcggagga gagcttgctt gcgctgatat ataaaaaatt cctaggaggc 301 cccctttccg gcgaggagga agcgctcatc aagcaaattg atgacgatat gttatatttc 361 gacctgttgg tgctcttgga tgagaagatg gatcgcgaag agccgaagct gaagatcaac 421 ctcagctatg actttgtgcc cttcgagcag gtcgagaggg agtacctcga gctgtttgag 481 gagttgaaga tgtaaaaagc ttccctatga cgagtggagg tggatttttg cgaagcaaaa 541 agacggaggg aaggatatgc gcctgagcga ggcgtctttt tgcctgcgcc gaagcgaagc 601 ggaggctgtg gcaaaatggt gccgagcgtg gttggatgtt cgcaccttgt ttccattttt 661 cactcccctt tcattctccc cgcttgctat ttgacacatt tgtggtataa tatactcaca 721 gtaacatttg ccgaggtgcg aaatgatcga gaaaaacgaa aatctgatcc ccgaagagga 781 tcttgaatat gagcgcagac ttgccgaaga agccgcaaat cagcccaccg aggaagagct 841 tgaagcggag gctgtcaagg cgcgtgacga aaagcgcaag acatatgaaa aagatctcaa 901 cgaccgcaaa attgagctta tgaagctcaa acaaggcgta attgaagaat cggacattgt 961 taaagaggag cagacacagg aatataagct cagctttggc gagtggatat caaacgtgtg 1021 gtatcgcaac aaatggctga taatcttcgc tgcggcgatg atatttgcgt tttcctatat 1081 cgtatacgat caggtgacca ccaccaagcc cgaccttaca gttttggttt tatcccccga 1141 ttacagctta tattaccgca cccaggagct ggaaatgttt ttggatgact attgcgacga 1201 cctcaacggc gacggcgagg tatatgtgca ggtatataat atctctaccg actattccga 1261 ccccaacact gtaacagcca accaggcgca ggtcatgagc cagcttcagt cgggcgaaaa 1321 cattattttg atcgctgatg acaagaccga ctttgcgatg cacgatttca caggtgaata 1381 tcccgacaac gagcgtttta atgagcttgg aatgaggcta aactgccagc ttgtgcgcga 1441 tgccctcaag tgggaagcga tgaacgataa tgtatatatc ggcatgcgtg agccgaccaa 1501 gcttttggcc accaccgaag aggatatgca ggaaaatttc gacgaagcga gagcggtttt 1561 cgagcgaatc gtcaaggctg tcagcgaaag tgaaaaataa ataaaaaatt tcaaaaaatg 1621 tattgacaaa tccgtttatg tcggttataa tatcaaagtc gcctatcgag gtggctttat 1681 gggagcatag ctcagctggg agagcacctg ccttacaagc agggggtcat aggttcgagc 1741 cctattgttc ccaccaattt ggcccggtag ttcagttggt tagaacgcta gcctgtca // LOCUS sequence303 1798 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence303 VERSION sequence303 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1798 /mol_type="genomic DNA" /organism="" /note="sequence303" ORIGIN 1 aatcagcaga attaaaatgt cctcctcatc ccctgttgct gtattgatat ataccaaaac 61 atccaaaccg tcgtcggttt tacatcttaa ttcccaacat agggtttcgt ctatattgtc 121 ggtgggaata agggcaagtc tgctcgatac aacgctgagg cttggcgaga gctttgattg 181 cgcttcggtt ttggatattg tgggttcatc caagtcgcgc tcgtaatggt ttaccaagaa 241 accgcgcccg tcaaaaccga ggatttcacc gttatccagc gcgacgctga ctttgataag 301 gtcggtatag cagactgtgt cctcctgctt atatgcaaaa ttcaccgtta aaacgttgtt 361 atagcactca taataagtct ttgtcattga cggtataccg agagtatcca aatatagctc 421 tgcgcgtctg atggcttctg taatgtcgat atcttcgttt gtaacatcgc gtgatttgag 481 catatagctt aaatatcccc cgagctttgt gacagatacg gtcacgccgt cagccttgaa 541 gcgatatgac ggcattttac cttcctcgga gctttcggca tcctcaagct gccaatcttc 601 aaggcctgtg gcctttgccg cttttttagc tgcttcctcg cgggaaaatc cgatggcatc 661 tgcggtcatc tttggctctt tttcaagaat gtggtcggaa tatgggccgt catagatgag 721 ctttggcata tctttaaagt tgtcctcaat gccgctgatg ccgtccatca caaatgagcc 781 gtcctctaaa tcagcaaaaa gctcgcttaa tcgctcccct cttgaatata ggctcgattc 841 cagttcatag agtttgtccc gaagattttt tgcgtattcg cagagtttgg aaagcgtcag 901 atagtcttca taatcaagct catccgctgc cgattttttc gcaagatatg cagcatagtt 961 gccgatttga gagaaaaact tttcggtgtt tgaaagctca acctgcgaaa gcggaaggtc 1021 caaaagggcg ttttttgcgt tggttgcttg ctcgcgcagc tcacccgaaa gctttgtcag 1081 catcgtatcg gatgcggagc atttggattt cgtcagggcg gaatatattt tgtcggtacc 1141 ttggcaaagt tcctctacag agcgaagata tgtggcctca atggcgtttg aagcaacaga 1201 gagcttactc atatatacga tatttgaagc cgccagaacg cccattatcg ccaaagaaaa 1261 gcacactatg cggatgagcg tgcggcgtga aaacctataa ttcatattgc tactcctttt 1321 ttctttttct gttatctttt cacgcattag ggaaaataat catcgtcaga gtaaccgaaa 1381 aaatcttcca tattatttga tattttgttg tcaaaatgtt tgcattttta tgtcaaatga 1441 tttataatat atatgtatgc tattcatagc gactaattta caatacggag gtcaaatcaa 1501 tgcttgtatc agcaaaagaa atgcttaaca aagcaagaca gggacactac gcagtaggac 1561 agtttaacat caataacttg gaatggacaa agtgcattct tcagaccgct caggagctta 1621 aggctcccgt cattctcggt gtttccgagg gcgcaggaaa gtatatgtgc ggttacacca 1681 ccatcgttgg catggttgaa ggaatgatta aggaacttgg cattactgtt cccgttgctt 1741 tgcacctcga ccacggaaca tttgaaggcg caaaggcttg catcaatgca ggtttcag // LOCUS sequence304 1797 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence304 VERSION sequence304 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1797 /mol_type="genomic DNA" /organism="" /note="sequence304" CDS complement(752..1228) /product="transcription elongation factor GreA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048372.1" /transl_table=11 /codon_start=1 /translation="MAKATTMSRSGFIKLQEELEHLVTVRRKEVAEKLKEARSYGDLSE NTEYDEAKNEQGMLEAQIADLEAMIANAVIVDEDSLNKDEIGIGSIVTLYDYDMEEEWE IQIVGSNESDPDDNKLSDESPIGKACLKKHKGEVFEVEVPAGTLKFKVVDISMK" /locus_tag="LOCUS_8110" /gene="greA" /note="WP_012048372.1 transcription elongation factor GreA (Clostridium botulinum) [pid:51.6%, q_cov:98.1%, s_cov:96.9%, Eval:5.3e-40]" /note="MGA_1170" CDS complement(1444..1680) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTATGLYSRLAKIGEAGTLVPITGFANGIASSAIEFKAEGWISGI GSKIFAIAGPVILYGTACSVAYGVVLFTMHKLG" /locus_tag="LOCUS_8120" /note="WP_003403642.1 stage V sporulation protein AC (Clostridium botulinum) [pid:53.2%, q_cov:98.7%, s_cov:51.0%, Eval:7.9e-19, partial hit]" /note="MGA_1171" ORIGIN 1 gcagcaccgc ctgcatttga aacaagcata ggtgtttcaa cctcgataaa accgagggtg 61 tcaagataac ggcggatggt tgagatgatc ttcgatcttg cgataaaggt cttcttaaca 121 tcggggttaa caataaggtc agtatatctc tggcgatagc gggtatctct gtccttaagg 181 ccgtgccact tttcgggcaa gggctgaagc gactttgaaa gaagggtgat atttgttgcg 241 tgaagggaga tctcgccctt tcttgttctg aaaacaaagc cttcaacgcc gacaatgtcg 301 ccgatatccc acttcttgaa gtccttgaac ttttcttcgc cgatgtcgtt catgcgaata 361 tatacctgca tacggtcgga ggtgtcgcga acgtcaatga agtttgcctt acccatgtcg 421 cgccagctca taattctgcc ggcaatgcgc catgtatgag ccttgatttc gtccaaacct 481 gcgttcttct tttcttcgtc atcccctgct tccgccaaga cctttgcttc ttcggcttca 541 tagaactcgc ggagcgcggt gtttgtggtg ttaaaatcga actttgtgat ctcaaaagga 601 ttcttgcctt cagccttgag cgcttcaagc ttttcatatc gaattctctt gagctcgttc 661 atttcttccc ttgagagacc ttcttcctct tcgggaatat ttgtcaaaat ttcttcggtc 721 atttttaaaa ctccaatttt aagtcaggtt attacttcat gctgatgtca acgaccttga 781 acttgagagt gcctgcggga acctcaacct caaagacttc gcccttgtgc tttttaaggc 841 aagccttgcc gatggggctt tcgtcggaga gcttgttgtc atcgggatcg gattcgttgg 901 aaccgacgat ctgaatttcc cattcctctt ccatatcgta gtcgtaaagt gtgacgatgg 961 agccgatgcc gatctcatcc ttgttgaggc tgtcctcatc aacaatgaca gcgtttgcaa 1021 tcattgcttc aaggtctgcg atctgagctt caagcatacc ctgctcgttt ttcgcttcat 1081 catattctgt attttcggaa aggtcgccgt atgaacgagc ctctttaagt ttttctgcaa 1141 cctctttacg tctaactgta actagatgtt caagttcttc ctgaagcttg atgaaaccgc 1201 ttcttgacat tgttgtagcc ttagccataa gtaaattcct ccgtcgaaaa tgtattttcg 1261 gtgcgatagt atatagttat cgcatattat cctcaagtat aattatagcg atgtttttgc 1321 tcgatgtcaa gatggaattt gtcggcgagg gtggctgaaa gatgagccac gctcagtgtg 1381 ttttctctcc ctccgtctcg ctatacggca accgggcgac cacatagggt cgcccctctc 1441 tttttatccc agcttatgca tcgtaaacag caccacgcca taggcaaccg agcaagcagt 1501 gccatagaga attacaggtc ctgcgatggc aaagatcttc gagccgatac cagatatcca 1561 gccctctgct ttgaattcga ttgcgctgga ggcaatgccg ttggcaaacc ccgttatcgg 1621 cacaagcgtg cccgcttcgc ctatcttcgc caggcgggaa tataagcccg ttgcggtcat 1681 aaccgctgaa attaacacca atgtcattga acaaaggctt gatgattcat ccttatcgaa 1741 ccccgtggct ttatatagct cgatcagccc ctgccccagc aggcaaattg acccacc // LOCUS sequence305 1788 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence305 VERSION sequence305 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1788 /mol_type="genomic DNA" /organism="" /note="sequence305" misc_feature <1..520 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010966138.1:ATP-dependent RecD-like DNA helicase" /note="WP_010966138.1 ATP-dependent RecD-like DNA helicase (Clostridium) [pid:47.9%, q_cov:94.8%, s_cov:22.5%, Eval:1.9e-34, partial hit]" /note="MGA_1173" /locus_tag="LOCUS_8130" CDS 498..1184 /product="ComF family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357235.1" /transl_table=11 /codon_start=1 /translation="MKLKLIYDYLIDFILPNRCSFCGKFTAWNEPVCKNCKDSILFSEH PIRQDENGVFILCVSACEYDGTARDGILNLKYHNGINTAKHLSPHLCELLKVNIDLNRI DVVTCVPMTRKRLADTGYNHADVIGKLVAELIKKPYDRKLLKRISNAPIQHELSADERR KAVKDTYFPANKKKSLNGKTVLLVDDIITTGSTLSECASVLKSMGADEVYCCTLAKSLY NESRKE" /locus_tag="LOCUS_8140" /note="WP_003357235.1 ComF family protein (Clostridium botulinum) [pid:31.2%, q_cov:95.6%, s_cov:95.6%, Eval:7.1e-21]" /note="MGA_1174" ORIGIN 1 ccgcgaaaaa tcagagataa aaccccttga ccaacccttc cgcaccggcg acaaggtaat 61 gcagaccaaa aacgactatg atgtggagtg gaaaaaggac gacgagcgtg gaacaggcat 121 cttcaacggc gatatcggag ttatcacaaa gctcaaccgc attttgggca ccatcgagat 181 tgacttcgag ggcagaatat gccaatataa tactatgatg ctggacaact tagagcttgc 241 ctatgccgca actgtacata aaagccaggg cagcgaattt gaagctgtga tcctgccgat 301 attgggcgga tttgacaagc tatattaccg caatcttttg tataccgccg tgacccgcgc 361 caaaaagctc attgtcattg tcggctcgtc caatcgcgtc aagtatatga tagataatga 421 ccgccgcacc aaccgctaca cctgtttgaa aaccatgctc cgtgaagatt cattcggcaa 481 ccacagcgag gtaaacgatg aagctgaaat tgatttatga ttatttgatc gactttattc 541 tgccgaaccg ttgcagcttc tgcggaaaat tcaccgcttg gaacgagcct gtctgcaaaa 601 actgcaaaga tagcatcctt ttctcggaac atcccataag acaggatgaa aacggcgtat 661 tcatactctg cgtcagtgcc tgcgaatatg acggcaccgc gcgcgacggc attttgaacc 721 taaaatacca caatggcatc aacacagcaa agcacctttc gccccatctc tgcgaattgc 781 ttaaagtcaa tatcgaccta aaccgaatag atgttgtaac ctgcgtcccg atgacccgca 841 agcgacttgc agacacgggc tataatcacg ccgatgtgat tggcaagctg gtcgctgagc 901 tgattaaaaa gccatatgac cgcaagcttt taaagcgcat ttccaacgcc ccgatccagc 961 acgaattatc agccgacgag cgacgcaaag ctgtgaagga tacatatttc cccgcaaata 1021 aaaagaaaag ccttaacggc aaaactgttt tgctggtgga tgacatcatc accaccggct 1081 cgacactttc cgagtgtgcc tcggtgttaa aatcaatggg tgctgacgaa gtatattgct 1141 gtacccttgc aaaatcttta tataacgaat caagaaagga gtgaaagtct tgtcaatctt 1201 agacctcgga atcgaccttg gcaccgccaa tataatcatc accacaaacg gccgcggctc 1261 gattttcaac gagccgacag tcattgcata taacaaacgc accgagcagg ttgtcgcctt 1321 cggtgaagag gcatataaga tgataggacg tgctcccgag catatcgcag ttatccgacc 1381 gcttaaagac ggtgtaatct ccaacaacga tatggcgcag gagcttatcc gcctttcaat 1441 tttaaaagtt atcggcaagc gcttgatcaa cccgcagata ataatgtgcg tgccctcagc 1501 gatcacaact gtcgagcgcc gtgcagttgt tgaaagcgct gtttccgcgg gcgcccgaac 1561 cgtttatctg atcgaagagc cggttgccgc cctcatcggt gcaggcgcag acattttaaa 1621 accatatggc cagatggttg tcgatatcgg cggcggaact gttgacgttg ccgtaacctc 1681 cttgggaggt gtagtcgttt caaaatccct taaaagggca gggaacacct tcaacgccgc 1741 aatcgagcga tatttctccg aaaccttcaa gcttttaatc ggcgagcg // LOCUS sequence306 1787 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence306 VERSION sequence306 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1787 /mol_type="genomic DNA" /organism="" /note="sequence306" misc_feature <1..561 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003358892.1:tyrosine recombinase XerC" /note="WP_003358892.1 tyrosine recombinase XerC (Clostridium botulinum) [pid:46.9%, q_cov:92.5%, s_cov:52.8%, Eval:6.1e-37, partial hit]" /note="MGA_1176" /locus_tag="LOCUS_8150" CDS complement(695..1657) /product="mannose-6-phosphate isomerase, class I" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002287262.1" /transl_table=11 /codon_start=1 /translation="MNMYPLILKAPLKDYIWGGNRLKNEYGYETELDKVAEAWVLSSRN DGDSTVINGELSGKNLSEVLALWGDTAIGKNASKFEYFPLLIKLIDACDRLSVQVHPDD EYAMRVEGEFGKTEMWYVVDCDEGAKLIYGFTHEISKDEFKRRINDNTLEEVCNFVPVK KGDVFFIEAGTLHAIGKGILIAEVQQNSNTTYRVSDYGRLGADGKPRPLHVEKALDVTK TIAPTREYGNVGKICKADGTIIRELAKCELFSADLITLGGKIEIGNDDSFVSLVVLNGN ATLEWNGEKISVNKGASVFIPAGITVMISGSAEILKSWV" /locus_tag="LOCUS_8160" /gene="manA" /EC_number="5.3.1.8" /note="WP_002287262.1 mannose-6-phosphate isomerase, class I (Enterococcus) [pid:40.0%, q_cov:98.1%, s_cov:97.8%, Eval:3.5e-60]" /note="MGA_1177" ORIGIN 1 gacagcgcag attcaaataa tcctgaccgc gactactgta ttcttacgct attccttaac 61 tgcggtatgc gtttaagtga actggttggt cttaatattg aggattacag caaggctcag 121 cgcacgttac gtctgtttgg taaaggtcag aaagaacgta tcgtttatct caacgatgct 181 tgcatcaacg ccttagaaaa atatctttcc gttcgtcaca aagaagccgg aaaaccgatg 241 tttgtatcct tttatcgcaa tcaatataaa cgaatttcca accgtcgtgt acagcgaatt 301 gttgaagatc agctgcgacg tgcagggctt ggaaatctcg gtatatcaac gcataagctt 361 cgtcacacct gtgctacgct tatgtatgaa tacggcaatg ttgatcctat ggttttgcga 421 gatgttttgg gacacaagag tgttgctacc acgcagattt acactcacct atcggataag 481 gacaagcgaa gagccgccga gagatcccct ctcgcaaatg ttaaaaaatt aacaagcaaa 541 gatgactcct ctgataagta aaattttttc tgtgatacat aattgattaa aaataagacg 601 gatagctgag cgctgtccgt cttttctttg ttattcgcag ttttataatg ataaagtttg 661 atttattgtg agatttatga atagtactcc cctatcacac ccagcttttc aaaatctcag 721 cgctaccgct aatcattacc gtaattcccg caggaataaa cacgcttgcg cctttattaa 781 cgctgatttt ttcgccattc cattcaagag ttgcattacc gttaagaaca accagcgata 841 caaagctgtc atcgtttccg atttctatct tgccgccgag agttatcaga tccgcactaa 901 aaagctcaca ttttgcaagc tctctaatta tagtgccgtc agccttgcaa attttgccga 961 cgttgccata ttcacgtgtg ggagcaatgg ttttggtgac atccagagct ttctcaacgt 1021 gcaagggtct cggtttgcca tcagcaccaa ggcgtccata gtcggaaacg cgatatgttg 1081 tgtttgaatt ctgctgaacc tcagcaatca aaatgccctt gccaatagcg tgaagtgtgc 1141 ccgcctcaat aaagaacaca tcgccctttt taacgggcac aaagttgcag acttcttcaa 1201 gagtgttgtc attgattcgg cgtttgaatt catctttact gatttcatgt gtgaaaccgt 1261 aaatcagctt tgcgccttca tcgcaatcga ctacatacca catttcagtt ttgccgaatt 1321 cgccctcaac gcgcattgca tattcatcat caggatgaac ctggactgac aatcggtcac 1381 aagcatcaat cagctttatg agcaaaggga aatattcaaa cttagaggca ttttttccga 1441 ttgcagtatc accccaaaga gcgagaactt cggataagtt tttaccgctg agttcaccgt 1501 tgataactgt cgaatcgcca tcgttgcgag aagacaatac ccaagcttca gcaaccttat 1561 caagctcagt ttcatatcca tattcatttt tcagacgatt accgccccaa atataatcct 1621 tcagcggtgc ctttaaaatt aaaggataca tattcattta tttgacctct tttctaataa 1681 ccgagcctga ttcaaactgc atatctatcg gcaacgagaa cctcattgtt gccttgtttg 1741 ccgcaggaac gctttcgcca agttcgttat agataatatc ggcttta // LOCUS sequence307 1769 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence307 VERSION sequence307 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1769 /mol_type="genomic DNA" /organism="" /note="sequence307" misc_feature complement(551..>1769) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000441046.1:excinuclease ABC subunit B" /note="WP_000441046.1 excinuclease ABC subunit B (Bacillus) [pid:62.6%, q_cov:99.5%, s_cov:62.2%, Eval:1.3e-142, partial hit]" /note="MGA_1180" /locus_tag="LOCUS_8170" ORIGIN 1 acgcacacga acatagcccg acttttttgc ctgttcaagc tctttgacat attcgccctt 61 gcggcctctt acaattggtg caagaagctg aattttggta ccctcgggaa gctccaaaac 121 cttgtcgacg atctgatcga ccgactgacg ggaaatctcc ctaccgcata tgggacaatg 181 cggaataccg attcgggcat agagtaaacg caggtagtca tatatctcgg tgacagtacc 241 aacggtcgaa cgcgggttgt ttgaagtggt cttttggtcg atggaaatgg cgggagaaag 301 gccctcgatc gagtcaacat ccggcttgtc catctgtccc aaaaacattc tcgcatagga 361 cgaaaggctc tcgatatatc ggcgctgacc gtcggcaaaa atggtgtcaa acgcaagcga 421 cgatttacct gagccggaaa ggcctgtaaa tactatcatt ttatcgcgcg ggagagtcaa 481 atcgacattt ttaaggttat gctccctcgc gcctttaatt acaatttcgt tgttcataac 541 aaaccttctt ttacatattg cgcagttcgt ttatcttatc acgcaggtat gccgcctgct 601 cgaattcaag ctgacgtgca gcttccttca tctgtttggt catcttctca atgagttcag 661 ctttttcgcg ctttgtatat tgtttaagcg gcttttttgt ttccttcttg gagatttcaa 721 tgacgtcacg cacgccttta atgatcgttt tgggaacgat tccatggtcg gcgttatatt 781 tcatctgtat ctcacggcga cgctcagttt cggttatagc gcgttccatt gagcctgtaa 841 cactgtcggc atacattatg actttgccgt tggcgtttcg agcagctcga ccgacagtct 901 gaataagcga gctttcgctt ctaaggaagc cttccttatc ggcatctaaa atcgcaacaa 961 gagaaacctc gggaaggtcc aagccctcac gcaggaggtt aattcccacg agcacatcaa 1021 attcgcccaa gcgcaggtca cggattatct ccatacgttc catagtgtcg atggagtggt 1081 gcatatattt gaccttgatg ccaactcctt ggagataagc ggtcagatcc tcagccattt 1141 taactgtcaa ggtggtgacc agtacacgct cctttttggc ggcgcgctcg ttaatttcaa 1201 gaatcaagtc gtcaatctga ccctgagtgg gcttaacttc aatcagaggg tctaaaaggc 1261 ctgtaggacg gataatctgc tctactatgg cctctgactc ttgtttttca agatttccgg 1321 gagtagccga aacaaatatt gcctggtcga tgtgtccata aaattcatca aacgttaagg 1381 ggcggttatc aagcgccgaa ggcagacgga agccgtattc aacaagggtt tcctttctcg 1441 cacggtcacc tgcatacatt ccccttacct gcggaagagc aacgtgagat tcatccacaa 1501 ccagcagaaa atcatcaggc aaaaagtcta aaagtgtgaa aggtactgca ccaggttcgc 1561 gtctggcaag cacacgagaa tagttttcaa cacctgagca gaagccgacc tcttgtaaca 1621 tctccatatc gtatttcact cgctgttcaa tgcgctgagc ttcaataagc ttatcctgcg 1681 atttgaaata ttcaacctgc tgacgcattt cagcttcgat atcctcgata gcatcgtgga 1741 gcttatcctt gcttgtgata tagtgggat // LOCUS sequence308 1760 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence308 VERSION sequence308 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1760 /mol_type="genomic DNA" /organism="" /note="sequence308" ORIGIN 1 aaaagacaat gcacggcaca caggctttgg acgaggtttt gggagttatc cgcgagaaac 61 agcccgagcc gattgttgaa gatatcgtca ctacacagcc ggagacggaa gttaaagcgg 121 agcccacgcc caaggagacc cgcgagcctt ccaagattcg cggaattgcc gaggacggct 181 cgaacaccgg cattattgaa ggcttaatga agcttaaaaa agagcgcggc acacctaagc 241 ctgatgcgaa aattccccct gtcaaccgcg catctattga tgacattgat cttgaaattg 301 aaaagaaggt ccttcccaac acggaaatcg gaattgacga aaacgcaact gaagaggaac 361 gcttggcata cctcaacgcc aagcgccgcg aaagagttaa gcagtttgtt gttgaagcgg 421 aagaggaaga agctccttca aaggacgacg ttgccgattt taacaatttc tcgcaagcca 481 aggatatggc tttgagtatt gcaaacctca aaaagagcct tgttgttcgc ctttgcgtac 541 ttattatctg cgcggcggtg gcggtatata tcacacttgc aaacgatttc ggcatgcccc 601 ttatcagcct gctttcaaga gcggaaaact cgggcacggc gttccttttc accaacgttg 661 ttttgggact tgccgcctgc tttgtatcat ataccgtgtt gatcgttgga ttcaaaaagc 721 ttgtgaccct caagcccgac tcggacagcc ttgcaagcat tgcaatgata ttcagcttga 781 ttacaggcat cgtgatgctg accgactcgg aaatggttca gatgcaaaga gttcatgtat 841 atattcccgc ggcgatcatc ggacttttga tgaataccgt cggaaagctt ttgatagtca 901 cccgcacaga gcgcaacttc cgatatgttt cgggcggata ttcaaaatat gccgctatgc 961 atattgatga cgaagacatt gcaagcaagt tcaccaaggg cgctttaagc gacttcccca 1021 gcctttccac atcaagaaag acagaatttg tcagcgattt cattaagaac agctactcgg 1081 cagatatgac cgatgctttt tgtaagttct ttgtgcctgt tgttacattg ctttcgatca 1141 tcgtcggtgt tatcggcgcg tttgtatgcc ccgaaacggt tgtcaccgca caggataaga 1201 cattctatgc tttgtcctgc gcttcgggcg taatggcgat gtgctcggct gtgggcatga 1261 tgcttgtcac aaacattccc cttgcgaagg catcgaagaa gtatttgcag tcaagtgctg 1321 taatgctcgg ttattcggca gttgataaat ttgcggatac caactcggtt ctgattgatg 1381 ctattgatct gttccccgac ggtatggtgg atataatcaa ccttaaaccc accaagaaaa 1441 cgcccattga ggaaggcatt ttgtatgccg caagcctctg ctgtcagaca gaaagcattt 1501 tgcgccccgc attttacaag atgatcaagg gcaagacaga aatgctttac cccgttgaga 1561 gctatattta tgaagacagc ttgggtcttt ccggctggat tcagaacaag cgagttcttt 1621 tcggcaaccg tcagctgatg gagagccact cgattgaggg acttccctcc cttgaaaagg 1681 aagcacagta tgtcaagaag gatacaaatg tgttgtatct ttccatcggc ggaaatcttg 1741 cgatgctctt tgtaattcag // LOCUS sequence309 1759 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence309 VERSION sequence309 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1759 /mol_type="genomic DNA" /organism="" /note="sequence309" ORIGIN 1 atttttcctg cacacaggaa tatgtgattg ctcaaacaat aatcgtcggt gatatacctg 61 agggatacgc tgttttagga taagttaaga gaaaggttgt gtgaaaatga ataagttaga 121 tgcaaaaaaa cgaattgatg aactgactga gcttttaaat tatcacaacc gcaaatatta 181 tattgaggat gatcccgaaa ttgaggatta tgaatacgac gcgctgatgc gtgagttgcg 241 ctcgcttgaa gaggcgtacc ctgagttttt gtcgccggct tcaccctcgc aacgtgtagg 301 tggagcgccg atatcggact tcaaaaaagt cacccatact gtccaaatgg gaagtttgca 361 ggatgttttc tcatatgagc aggtaagaga attcgttgaa agaatctacc gcacagttga 421 caaccctaag tttactgtcg agccaaaaat tgatggccta agctgttcgc ttgaatacag 481 agatggtatt cttacagttg gttcaactag aggggacgga ttcatcggcg aggatgttac 541 cgcaaacata aaaacaatag gctctgttcc tctgaaactt cccgaagagc ttcctttgct 601 tgaagtcagg ggcgaggtat atatgcctaa gtcggtgttc tataaaatct ccgatgagat 661 ggagcttaca ggcgaaaaac cttttaagaa tcccagaaac gcggctgccg gttcgctcag 721 acaaaaggat tccaaaatcg ccgcaaaaag acgtttggat atattcgtat ttaacattca 781 gcaaattgaa ggcaagaccc tttcttcgca taaagaatcc cttgactatc tttcttccct 841 cggtttcaag gttatcccga aatataccct tgtttcaaca gcagatgaag tgattgagaa 901 aatcgaagca atcggcaatt cgagatttga tctgccttat gatatcgacg gcgtagtaat 961 caaggttgat gatatcgcta gccgagaaga aatcggatat acctcaaaag ttcccaagtg 1021 ggcagttgcg tataaattcc cgcctgagga aaaaaccacc aagcttttgg atattgaagt 1081 taacgtcggc agaacgggtg tcatcactcc tgttgcaata tttgagcctg taatgcttgc 1141 aggaacaagt gtgtcaagag ccacacttca caaccaagac ttcatcagag agcgaaatat 1201 tgctgttggc gacgaaatcg tcgtaagaaa agcaggggat atcatccccg aggttttaag 1261 tgtgtcaaaa tcctgcggtg ctgatagcca ttttatgctc cccgagcatt gtcctgtatg 1321 cggagcgagt gtcattaaag atggcgatga agcggcggtg agatgcccaa atatcgactg 1381 tcccgctcag attcaaagaa gcattgccta ctttgcatct aagcctgcga tgaatattga 1441 gggtttggga ccgcaaattg ttgaaacttt atatcaaaac gggctgataa attcaatttc 1501 agatatttac aagttgacac aaagtgatat aatgagtgtt gacggtttta aagagaagtc 1561 tgcaagcaat cttttgtctg ctattgagaa atcgaaatca aacggacttg aacgactgat 1621 ttgcggactt ggaatcagaa acatcggtct tgcatctgcc aagcttcttt gcgagagatt 1681 tggcgacatc gactcgctgt tgtccgccac atttgatgat atcgtatcta tcgacggctt 1741 tggcgatgtc acagcggcg // LOCUS sequence310 1759 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence310 VERSION sequence310 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1759 /mol_type="genomic DNA" /organism="" /note="sequence310" CDS complement(189..614) /product="Holliday junction resolvase RuvX" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001221192.1" /transl_table=11 /codon_start=1 /translation="MKIFAVDYGDARTGLAHCDKFESIASPVGTVFEWNVNKCLAKVAD AIKADGAELIVVGLPVNMDGTQGERAQKCRDFADKLREMTGVETVMWDERVTTVQAIGI LNETNVRGKKRKEVIDTVAATLILESYMDYRKKKGLA" /locus_tag="LOCUS_8180" /gene="ruvX" /EC_number="3.1.21.10" /note="WP_001221192.1 Holliday junction resolvase RuvX (Bacillus cereus) [pid:37.8%, q_cov:94.3%, s_cov:98.5%, Eval:1.3e-19]" /note="MGA_1184" CDS complement(632..1114) /product="LURP-one-related family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012775190.1" /transl_table=11 /codon_start=1 /translation="MSKLLIKQRVFSWSDTYDVYDKDGNPKYYVEAEFLSIGHKLHIYR HDTGEEVAFIRQCLFRFLPTAEISVGYRVLGEIRKEFTFFIPKYTIDYNGWTIDGNFMG WDYSITNSSGSTVAQISKELFRWGDTYVLTVYDDSDEVDALVTVIAIDMMNCSHND" /locus_tag="LOCUS_8190" /note="WP_012775190.1 LURP-one-related family protein (Bacteria) [pid:36.2%, q_cov:95.0%, s_cov:93.8%, Eval:6.6e-17]" /note="MGA_1185" CDS complement(1133..1594) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSKFVIKPKSIFSKKEYEIFDEAGKSLYYIKYKWKWKYIAYDSDV HDEVIYVHERRDLVNGYITSVYIRHKLLGEIEFGFGRGLSIGYKGWEVYGTPSNWNYMI TNVVENPVVTVSNNLGEIIVDVDESVDDLTALATVVALSLVGSMKSEIF" /locus_tag="LOCUS_8200" /note="MGA_1186" ORIGIN 1 ccccctcacc acgcgcgaca gcgcgggtaa ccaattttgc ggagcaaaat gggttggctg 61 ccgccgaaac agctccgtcc gcggatgcgc cgccgaatgg cggttgtatt cgcgggtgga 121 gcggggcgat gcgcaaactg aatagaacaa aacagacccg ccacggtttc gtgacgggtc 181 attttgtttt atgctaagcc ttttttcttg cggtagtcca tataagactc caaaatcagc 241 gttgcggcaa ctgtatcaat tacctctttg cgttttttgc cgcgcacgtt tgtctcattt 301 aaaattccga ttgcctgaac ggttgtgact cgttcatccc acataactgt ttcaactccg 361 gtcatttcgc gaagcttatc agcaaagtca cggcattttt gagcacgctc accctgtgtg 421 ccatccatat tgacaggaag acctacaaca atcagctcag cgccgtcagc tttgattgca 481 tcagcaacct ttgcaaggca tttgttgacg ttccattcaa agactgtgcc aacaggagat 541 gcgattgatt caaatttgtc gcaatgggca aggcctgttc tggcatcgcc atagtcaaca 601 gcaaaaattt tcacagcgta cccccctttt atcagtcgtt atgcgagcag ttcatcatat 661 caatggcgat aacggtcaca agggcatcaa cctcgtcaga gtcgtcatat actgtgagca 721 catatgtatc gccccaacgg aagagttcct tggagatctg cgcaactgtg cttcccgacg 781 aattcgtgat cgaatagtcc cagcccataa aattgccgtc gatggtccaa ccgttatagt 841 cgatagtata cttgggaata aagaaagtga attcttttct tatctcacca agcactctat 901 agccgacaga aatttccgca gttggcagga atctaaagag gcattgacga atgaaggcga 961 cttcttcgcc tgtatcgtgg cggtagatgt ggagcttatg gccgattgag agaaactccg 1021 cctcgacata atattttggg ttgccgtcct tatcgtatac atcataggtg tcgctccagg 1081 agaacaccct ctgtttgatt aaaagcttgc tcatttttta ctccgggttt aattaaaaga 1141 tctctgattt catactgccg acaagactga gcgctacaac cgtggcaagc gcagtcagat 1201 catcaacgga ttcatcaaca tcgacaatta tctcgcccaa attattgctc acggtcacta 1261 ccggattctc gacaacgttg gttatcatat aattccaatt ggacggggtg ccgtagacct 1321 cccagccctt atatccgata gagagccctc tgccaaagcc aaattcgatc tcaccgagaa 1381 gcttgtgacg gatatagacc gatgtgatat agccgttaac aaggtcacgc cgttcgtgaa 1441 catagatcac ttcgtcgtgg acatcgctgt cataagcgat atacttccat ttccacttat 1501 acttgatata ataaagtgac ttgccagcct cgtcgaatat ctcatactct tttttcgaga 1561 agatagactt cggcttgatt acaaacttgc tcatttcgca agacccaaga atgccgcgcc 1621 gatgatgcct gcgtcgttac ccagcgaagc aataacaatt tcagttttct ttgcaccgtt 1681 tctggtgtaa atttctttat caaccgcttc tttaagagga atcagcaaag catcgccttc 1741 attgcagaca ccgccgccg // LOCUS sequence311 1756 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence311 VERSION sequence311 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1756 /mol_type="genomic DNA" /organism="" /note="sequence311" ORIGIN 1 atcgctgttg cgagctcctc ggggatgccg agcatacggt agcaaagtcc cgagtacata 61 tcgatatttg cgcacatggt cttttccttg cctgtgacct ttaagaacac ctcgggcgtg 121 aggcgttcaa ccgagtcaag cagcttgaag tcggcttcat attcggtgcc ctttgccatc 181 ttcattgcct cgcgctttaa gattacgcat ctggggtcgg aaagggtata tacagcgtgg 241 cccatgccat agataagacc cgagcggtcg gaagcttcct ttttgagaat cttttcaagc 301 atttcggtga cctcggcatc gtcttcccag ttttcgatgt ttgccttgag gtagtcaagc 361 tgttccaaaa ccttgaagtt tgcaccgccg tgacggtggc ctttaagtgc acctactgca 421 gccgcatatg cagaataagg gtcggtaccc gatgaggtca gcactctgca agcgaatgtc 481 gagttgttac cgccgccgtg ctcagcgtgg agcataagca taagatccaa aagttttgcc 541 tcttcaaagg tatattttct gtccttacgc aagagggaaa gaattgtttc tgcggtcgat 601 tcctcgggcc tgggctgatg cagatacata ctcttgtcat aaaaatatct gcgcttgacc 661 tgatatgccg aggtgattat gaggggcatt tttgcaatga tcgaaattgc agttgaaagc 721 tcttcatcgg gagagggaga ttcagggtcg tcctcatagg aataaagtgc caaaattgaa 781 cgctcgatct tgttcataat gttctttgaa ggggctttca agatcatatc ctcaaagaaa 841 ccgctcggca gatcgcggtt ataggcaatg gtcttgttga aatggttcag ctcttccatt 901 gtgggaagct tgcccatcaa aagaagatat acgacctctt caaagccgaa gcggtcggat 961 ttcataacat cctcaaccaa ttcctcaacg ttgtatccgc ggaagaacag ctgaccctcg 1021 atgttttcct tttcgccttc attcatgata tatccgtgaa cgttgcaaat gttggtgatt 1081 cccgcaagaa cacctgtgcc gtctgcgtta cgaagtccgc gcttaacgtc aaacttcttg 1141 taatacttcg gatcgatggt gttgttcttc acgaaatttt cgcaaagcgc ctgcttaacg 1201 gcattgtcaa tgttgagttt cattcgtgca ctccttcttt aaatgataat ttctttgatt 1261 atagcacgca agatcgtggg tgtcaataaa tttgcaacat ctaattgata attatgcaaa 1321 aatgacataa tgcaagcata gccatcggat gattttgcaa gaagtttgca agaaagcttc 1381 aaaatgcctg caggtttgag ggcgaagccc tgcccgaaat cccctcaagg ggctttcggg 1441 cattcccccc aagtccgccg ccaagccgaa acggcggcgg acttgggggg aacaggcggc 1501 gcgggtgctt tggcgcccac cgcgccgccg gggcttcgcc cgtaggtatg caccacacaa 1561 aaaagctccc cgagaaaaac tcagggagcc aaattcgttt tattctatcc gtcaccgagc 1621 attcgatatg tataatattt atacatattc aagccgacgt cctcatattc ctcttcccga 1681 tcataccaac agttgaagcg gtcataataa ccccacgccg ccatcgaggc ggcagtttca 1741 cgcaagccat caatca // LOCUS sequence312 1753 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence312 VERSION sequence312 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1753 /mol_type="genomic DNA" /organism="" /note="sequence312" CDS complement(304..1704) /product="dipeptidase PepV" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048281.1" /transl_table=11 /codon_start=1 /translation="MNKEKVFEYIDAHKDEMVETLCQLISYPSYQQESQEGAPFGKPVR ECLDKALEICESFGFKIRNYDGYVGTAEYTEGEPILGILGHLDVVPEGTGWTYDPFKGT VADGKVFGRGSIDDKGPCVAVMYALKALKELNIPLKKGVRLILGTNEENGSGDLAYFEK VAEMPKWLFTPDGNYPLINIEKGMIRGRISATPEACSCKRKLVCFHCGKTINAVPELGY FEVAGVSESEIEKAISACKCEVGFTLEATDNGIKVNAKGKSAHASTPDLGYNALTAMLS LIKALGLDDNAGKLLAGLSEVFPYGETDGEHSGIKASDEVSGALTEVLSVLDYDDGKEI VGWIDIRFPVCENVESVKTKLEKSVSGAGFALMAGGAEPHYVDSNSTFVKELLSVYEDV TGNKGECIAIGGGTYVHHTEGGVAFGAEFPGEDNHMHGADEFMTIDSLLLNAKIFACAI ERVCNSDL" /locus_tag="LOCUS_8210" /gene="pepV" /EC_number="3.4.13.-" /note="WP_012048281.1 dipeptidase PepV (Clostridium botulinum) [pid:36.9%, q_cov:97.4%, s_cov:98.7%, Eval:1.2e-81]" /note="MGA_1190" ORIGIN 1 acatgaattt taatgcatag catcaaatga attgaaactc gcccttgcgg tcgaatttcg 61 ttcgcacacg cgccgtcgcc ggcacctgcc gcccgcgccc attcaggcgc acctcgccag 121 acgccggctg ttttctgcga acgctcaacc tcgggcgaag ccctgcccgt tttgcaaaac 181 gggcaagccg cgccttcggc gcggctccgc cccgcaggcg cggagcgccc ccgcggggcc 241 ggggcttcgg cctcaaagcg caaaaatccc cctatacgtc accgtatagg gggattatct 301 tttttaaaga tccgaattgc acactctttc aatcgcacaa gcaaaaatct ttgcgttcaa 361 aagcaagctg tcaatcgtca taaactcgtc tgcgccgtgc atatggttgt cctcgcctgg 421 gaattccgca ccgaatgcaa cgccgccctc ggtgtgatgc acataagttc cgccgccgat 481 cgcaatgcac tcgcctttat tgcccgtaac gtcctcataa acgctcaaaa gttccttgac 541 aaatgtgctg ttcgagtcaa catagtgcgg ttcggcgccg cccgccataa gcgcaaagcc 601 cgcgccgctg acgctctttt caagctttgt tttaacgctt tcaacattct cgcaaacagg 661 gaatctgatg tcgatccatc cgacgatctc tttgccgtcg tcataatcca aaacggaaag 721 aacctcggtg agcgcgcccg aaacctcgtc gcttgcctta attcccgaat gctcgccgtc 781 ggtctcgccg taggggaata cctcggacaa gcccgctaaa agcttgcctg cattgtcatc 841 aagaccgaga gccttgataa gcgaaagcat cgcagtcagc gcattgtatc ccaaatcggg 901 agtggaagcg tgggcgctct tgccctttgc gtttactttt atgccgttgt cggttgcttc 961 aagggtgaaa ccaacctcgc atttgcaagc gctgatcgct ttttcaatct cactttccga 1021 aacgcctgca acctcaaaat atcccagctc gggaacggca ttgatcgtct ttccgcagtg 1081 gaagcaaaca agctttcgct tgcaactgca agcttcgggt gtggcggaaa tgcgtccgcg 1141 aatcataccc ttttcaatgt tgatcaaggg atagtttccg tcgggagtaa agagccactt 1201 tggcatttcg gcaacctttt caaaatatgc cagatctccc gagccgtttt cctcattcgt 1261 gcccaaaatc aagcgcacgc cctttttgag ggggatattc agctccttga gggctttaag 1321 cgcatacatc accgcaacgc aagggccttt atcgtcgatc gagcctcttc cgaaaacctt 1381 gccgtcagca acggtaccct taaatgggtc atatgtccag cctgtgccct cgggaacaac 1441 atcaaggtgt cccaaaatgc ccaaaatcgg ttcgccttcg gtatattccg cagtgccgac 1501 gtatccgtca taattgcgga tcttaaagcc aaagctctcg caaatttcaa gagccttatc 1561 caaacattcc ctaacgggct tgccgaaagg agcgccttcc tgagactcct gctgatagct 1621 tggatatgaa atcagctgac aaagggtttc aaccatctca tccttgtggg catcaatata 1681 ttcaaaaact ttttccttat tcatcaatag gacctccact catatttttc tttttaagca 1741 ccatcaccga tat // LOCUS sequence313 1746 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence313 VERSION sequence313 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1746 /mol_type="genomic DNA" /organism="" /note="sequence313" CDS complement(202..1653) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNCIYCSGKIPETEERCPYCGASVNPEQYADEKPKRRFPWEVVAV AALCVVIIVGVILVASALKLPEMEYSKYVCDYDEGIIYTNTFGHIGDAVCAIKFEYEID MERLSNQALGLQAEYDELIKQGEGFESFSCDYYTEGDTMYVTAIYDGLNLSSTLEEYIE RGILDIESPYVYYSMSEIEESIYDEGYILYDGDEPDLSNLDKAVYVWSDGKYTSVIVIY HRYDITYKREHYYTADAKTWSDSYKLEWLQTERDSVAKAKNLLFFDYEEIISDNKLYTK KTINDLYDVNNIIDSQYAEILSINGFSDDFHSYISVAKTENSLKALGYERNDDFDLDSL LPNEKKDAVDDDPPYFDEMSFEYTYPNGWKQVYTYEYYDDVAYTVRIKWSKSCKSWSNA DYEGTRKYFADVYEPVKDCDWLEVNETIEDNIYYIEVVFNDMHIPENLEEADKTSVISV GDSFRRISMVSWEPWHIGRGYKKVD" /locus_tag="LOCUS_8220" /note="MGA_1191" ORIGIN 1 ttcaggctga aaacaagcgc aaggcacgct atgccgatac atattacagt gagtaggatt 61 tttttgaatg tcagtttgcg tttcacggca cagccccctc tttctatata aaacaattat 121 acccaacaaa atattgcaat gcaactgcga tttttctatc acaaaaaatc ggcagaggaa 181 gctctctgcc gaccgttttt atcaatcaac ctttttatat ccgcggccta tatgccaagg 241 ctcccaggat accatcgaga ttcttctgaa gctgtcgccc acacttatga cgctggtttt 301 atccgcctct tccagatttt ccggaatgtg catatcgtta aagaccacct caatgtaata 361 gatgttgtcc tcaatggttt cgttcacctc aagccaatcg caatccttaa caggctcata 421 aacatcggca aagtatttgc gcgtgccctc ataatctgca ttcgaccaac ttttacagct 481 ctttgaccac ttgattcgca cggtgtaagc aacatcgtcg taatactcat atgtatagac 541 ctgcttccag ccgttgggat aagtatattc aaagctcatc tcgtcaaaat agggcgggtc 601 atcatcaact gcatccttct tttcatttgg caaaagcgag tcgaggtcga aatcatcatt 661 tctttcatat cccaatgctt tcagcgaatt ttcggttttg gcaacggaaa tgtaagagtg 721 gaaatcatcg ctaaagccat tgattgaaag aatctctgca tattggctgt cgatgatgtt 781 gttgacatca tagaggtcat ttatcgtttt ctttgtatac agcttgttat cgctgattat 841 ttcctcataa tcgaagaaga gcagattttt cgcctttgca acgctgtcgc gctctgtttg 901 gagccattca agcttatagc tgtcgctcca ggttttggca tcggcggtat aataatgctc 961 tcttttatat gtaatgtcat aacgatggta tatgacgatc acagaggtat atttgccgtc 1021 gctccagaca tataccgcct tgtcgagatt tgaaaggtca ggctcatcgc cgtcatacag 1081 gatgtagcct tcatcataaa tggattcctc aatctcggac attgagtaat aaacataagg 1141 agattcaata tcgagaatcc ctctttctat gtattcctca agggtggacg acaagttgag 1201 accatcatat atggcagtga catacattgt gtccccttcg gtgtaataat cacagctgaa 1261 gctttcaaag ccctcgcctt gttttatcag ctcgtcatat tccgcctgaa gcccgagggc 1321 ctgattgctc agccgctcca tatcgatctc gtactcaaat ttaattgcgc aaaccgcatc 1381 gccgatgtgg ccgaaagtat tggtatagat aatgccctcg tcataatcgc agacgtattt 1441 ggaatattcc atttcaggga gcttcaatgc gcttgcaacc aaaatcacac cgacaatgat 1501 tacaacgcaa agagcggcca ccgccaccac ttcccaagga aatcttcttt tgggcttttc 1561 atcggcatac tgctcggggt ttacgcttgc accgcaatat ggacatcttt cctctgtctc 1621 gggaattttt ccgctgcaat aaatgcaatt cataaatacg cctcctttat ttatgttgta 1681 aaaatcataa catacttaca tgcaaaaatc aacattttcc aggcccatgt acaaattttt 1741 aataaa // LOCUS sequence314 1746 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence314 VERSION sequence314 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1746 /mol_type="genomic DNA" /organism="" /note="sequence314" misc_feature complement(874..>1746) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_013095330.1:Gfo/Idh/MocA family oxidoreductase" /note="WP_013095330.1 Gfo/Idh/MocA family oxidoreductase (Enterobacter) [pid:50.0%, q_cov:98.6%, s_cov:74.2%, Eval:1.6e-77, partial hit]" /note="MGA_1193" /locus_tag="LOCUS_8230" ORIGIN 1 catttggcat tggggaagct ggatttttca gtcgagcaga tctcacgctc gtcgcgaggc 61 aaacgccacc atttgagcac ttcgttttca aggactatct tgcccttggt gccgctgatt 121 tcaaggcggt tggtgccggg aagctcgcct gtcgaggtca taaatgcacc tgttgcgccg 181 tttgcatatc gggcaaagat ggtaacgtcg tcctcaacct cgatattgtg atactttgct 241 tcgtcgcaaa atgcggtgat ctgtatcggc attccgcata tccactgcca aaggtcaagg 301 ttgtggggtg cttggttcaa aagcactccc ccgccctcgc cattccatgt ggcgcgccac 361 gagcccgagt cataatacgc ttgggagcgg taccagttgg tgattatcca gacggtgcgt 421 ttaagctcgc ccaactctcc gtttttaacc atatcgcgag ccttgataaa caaggggttg 481 gtgcgctggt tgaacattat tgcgaaggtc ttgcccgact ttgcggcaac atcgttcaaa 541 tatcttgcct tggtgactct tatatcctcg ggtttttcaa ccaaaacgtg gagccctgcg 601 tttaagcagt cggcggcaat atcagcgtgc aaaggatggg gtacagaaac gatgaccgca 661 tcgcacaggc ccgaagcaat aagctcctta taatcggaaa agcttttaag ctcgggattg 721 tcttttgtga agtgatggca tctgtcggtg ttaatatcgc atattgcgcc gaggcacgca 781 cccttaattt tgcccgaaag aaggcagttt gtgtgggcag agccgatatt tccgacaccg 841 ataacgccga ttcttaaatc gttcatagct ttattatttg cttccgccat aggtgtcgct 901 tgtatcagaa acgactgcct tgacgttgtc ttttctcttt gaggttgcaa ctctcttcat 961 cagctcgtca tagtaaagct gttcgtcgaa gggaagctca atttccttgc ccaagaatgc 1021 ggaaaggtgc attgcatttg cgagcataag accgttgata ccctcttcac cgggagcgac 1081 aagcgattcg ccgcgcagaa ttgcgcctgc ccaagcattg agtacgccaa cgtgctgttc 1141 gttcttgcca tcggtctcaa tttcaacctt gtgggtcttg aggttaccga agggaacggt 1201 attggtcttg gagaattcct gctcggtcat ttcaaattca attacttcaa ggccggagta 1261 atcagcgatg attcttgcct tgtcaagctg aatatcaaaa cggttggtgc cgcgagcgtc 1321 acctgtggtg gtaacgaaaa cgcctgttgc gccgtttgca tattcaacat atgtagtaac 1381 atcgtcctca acttcaatat cgtgccactt gccgaagtgc atctttgtga gtacctttac 1441 gggcattccg cagatccact gccaaaggtc aagctggtga ggacactggt tcatcaatac 1501 gccgccgcct tcgcctgacc aggttgctct ccatccgcct gagttgtaat atgcctgggg 1561 acggtaccag tcggtgatga tccagttggt gcggcgaatc tcgccgtatt tacccgactg 1621 aataagctca cgcatttttc tgtaaacatg gttggtacgc tggttgaaca tcataccgaa 1681 aacaacttcg ggatgctttg cagcttcttc gttcatacgt ctaacatcga gggtatatac 1741 acctgc // LOCUS sequence315 1745 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence315 VERSION sequence315 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1745 /mol_type="genomic DNA" /organism="" /note="sequence315" CDS 415..1722 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGMNCALDGPAGAGKSTVAKELAKKRGYIYVDTGALYRAVGYYAL SKGADTTSADDVAPLLGEINVELKFENGVQAVYLNGENVSDKIRTPEMSMAASNVSAIP AVRAFLLDLQRSIAANNDIIMDGRDIGTVILPNAQVKIFLTASIDERAKRRYDEHIAKG QDVNYEDIKADIAQRDYNDSHRATAPLKKADDAIEVDTSDMTIEEVIETIANIIESKKF KAPEGNIADKKPKCSFRLIGYTIIRWIVKVFIHIAFNVKIVNKQNIPHAGGCVIASNHI SWADGLIIGINPIVSGSYVSKAELFKSPLVAFLLKLLNCFPVLRGKGDMGFVTISCDFL NKGHNVIIFPEGTRSKTGEIGRAKTGVAYIVAASKAPIIPVSVKCDGKVKFRSKITVTF GDPIYYPQLGISGTSPSEMHKVRDIIMNKIKEQLDD" /locus_tag="LOCUS_8240" /note="WP_003700259.1 (d)CMP kinase (Ligilactobacillus salivarius) [pid:52.3%, q_cov:50.1%, s_cov:97.3%, Eval:2.3e-55, partial hit]" /note="MGA_1195" ORIGIN 1 agaatcctcc gggatttttc cgagactcct aatgtagaat atatgcattc gctgggcaga 61 cttctgccga gagatttaga gcaggtcgta gttgatatat caaaaatcga ccctcgcaag 121 ccttgcaatc agataacaaa agaagagcgt cttggccttg tgcatctgct caagcacttt 181 gaacttacac cgactgccct tcgccctgtt gatgaagcaa ttataactcg cgggggaatc 241 tctgttaaag agatagaacc tgcaacgatg gcttcaaagt ttgtaaaggg attatacttt 301 gcaggagaaa ttattgactg cgacgggtat acaggcggat ttaacctcca aatcgcgttt 361 tcaacggcat atgccgcggc aagcgcaatc gcaaatatga aaggacgata aattatggga 421 atgaactgtg ctcttgacgg ccctgcaggc gcaggcaaat caacagttgc aaaggagctt 481 gcaaaaaagc gcggatacat atatgttgat accggtgcgc tctatcgcgc tgtgggatat 541 tatgcactca gcaaaggcgc tgataccacc tcggctgacg atgttgcgcc tttgcttggc 601 gagataaatg ttgagcttaa atttgaaaac ggtgttcagg ctgtatattt gaacggcgaa 661 aatgtttcgg ataagataag aacccccgaa atgtcaatgg cggcatcaaa tgtttccgcg 721 attcccgccg ttcgtgcatt tttgcttgac cttcagcgct ctatcgccgc aaataacgac 781 atcattatgg atggcaggga tatcggcact gtaatcttgc ccaatgcaca ggtgaagata 841 ttcctcactg cttcaattga tgagcgtgca aagcgcagat atgacgagca tatcgccaag 901 ggacaggatg ttaactatga ggatattaaa gctgatattg cccagcgcga ctataacgac 961 tctcaccgcg ccaccgcacc ccttaaaaag gctgacgatg cgattgaggt cgatacctct 1021 gatatgacca ttgaagaagt tattgaaacc attgcgaata taatcgagag caaaaagttt 1081 aaagctcccg agggcaacat tgccgataaa aagccgaaat gctcctttcg cctcatcgga 1141 tatactataa tccgttggat cgttaaggta ttcatccata ttgcattcaa tgttaagatc 1201 gtgaacaagc aaaatatccc tcatgcgggc ggatgtgtta tcgcttcaaa ccatatctca 1261 tgggctgacg gacttatcat tggtatcaac ccgatcgttt caggttcata tgtttcaaaa 1321 gcagagcttt tcaaaagtcc tttggttgca tttttgctta agcttctcaa ctgtttccct 1381 gtactcagag gtaagggcga tatgggtttt gtgaccatct cttgcgactt ccttaataag 1441 ggacacaacg ttatcatctt ccctgaaggc acgagatcca aaacaggtga gattggcaga 1501 gcgaagacgg gtgttgcata tattgttgcc gcttcaaaag ctccgattat tcccgtatcc 1561 gtcaagtgcg atggcaaggt taaattccgc agcaagatta ccgttacctt cggtgacccg 1621 atctattatc ctcagctcgg tatcagcggt acatcgcctt ccgagatgca taaggttaga 1681 gatattataa tgaacaaaat taaggagcaa ctggatgact gatcaatgcg ttactgttgc 1741 caaaa // LOCUS sequence316 1744 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence316 VERSION sequence316 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1744 /mol_type="genomic DNA" /organism="" /note="sequence316" CDS complement(360..695) /product="inorganic diphosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010890780.1" /transl_table=11 /codon_start=1 /translation="MSDIIGKRVSVTVDRPLGSAHPNHPDLIYPINYGYIEGLIAPDGE EQDVYILGIDEPIEKFEGIVVAVIHRFDDIEEKWVVAPENMDFSKDEISASVEFQERFF KTEIIMT" /locus_tag="LOCUS_8250" /note="WP_010890780.1 inorganic diphosphatase (Clostridium) [pid:57.8%, q_cov:98.2%, s_cov:98.2%, Eval:4.3e-28]" /note="MGA_1197" CDS complement(655..1281) /product="flavin reductase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011017175.1" /transl_table=11 /codon_start=1 /translation="MNTSKKTTFKGSSILAPVPAVVVTCGTVDKPNALTIAWTGTINSI PPKTYISVRPERYSYDLIKESGEFVINLTTRELTRATDYLGVRSGKNEDKLKNLGLSVS PATQVSAPILDASPVSIECRVCDIISLGSHDMFVADVLAINVADELIDKNGKICLDKAD LIAYSHGEYFAIGEKLGSFGYSVKKPTKKAGKSERYYRQACKRHR" /locus_tag="LOCUS_8260" /note="WP_011017175.1 flavin reductase family protein (Fusobacterium nucleatum) [pid:49.0%, q_cov:93.3%, s_cov:99.5%, Eval:6.1e-50]" /note="MGA_1198" CDS complement(1253..1633) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIIYNNSRKGGFALGGNHLTKSNLIAGGVAAIGLALAAVIGLWQP KKNDKKAKSTKKKRLLDLAVLIPLAFKLTKSAVSKIELDKIVTNISEAVNEADDNCDIE IIDAIPISSEEEVYEYIEKNDL" /locus_tag="LOCUS_8270" /note="MGA_1199" ORIGIN 1 caaatgtgaa tatgaggaga tacgttttga caattccggc tctgctcacg caggcgtaat 61 tcaagcgtat gtgaataata ttcttgacgg cacacctctt gtcgccaacg gatacgaggg 121 catcaatgag ctttcaattt ccaatgcggc gtacttatcg caatggctcg gcaacaagcc 181 gattgatctg ccctttgacg aatcgctctt tgatgagctt ttggcgaaga aagctgccac 241 atctcaaagc gcaaagaccg agggcgataa gaagatgaat gaggaatatc gccaacgctg 301 gcaaacaaac tggaactaaa caaaaacaaa cagcacggtt tatcgccgtg ctgttttctt 361 tatgtcatta tgatctccgt cttaaaaaat ctttcttgaa actcgaccga tgccgaaatc 421 tcatcttttg agaaatccat attctcggga gccacgaccc acttttcttc aatatcgtca 481 aatcggtgta ttaccgcaac gacaatgccc tcaaattttt caatcggctc atcaattccc 541 agaatatata catcctgttc ctcgccgtcg ggagcgatca aaccctcgat ataaccgtag 601 tttatgggat agatcaggtc gggatgattc ggatgggcac ttcccaaagg tctgtcaacg 661 gtgacgctta cacgcttgcc gataatatcg ctcacttttt cctgccttct tcgtcggctt 721 cttgaccgaa tagccaaagc tgcccaattt ctcgccaatc gcgaaatatt caccgtggga 781 ataggcaatc aaatcggctt tatcaaggca aattttgccg tttttatcaa tcagttcgtc 841 ggcaacattg atcgccaaaa catccgccac aaacatatcg tgtgaaccga ggctgataat 901 atcgcatact ctgcactcga tcgaaacagg ggaagcgtcc aaaatcggcg cggaaacctg 961 cgttgcaggg ctgacagaaa gccctaaatt ttttagcttg tcctcatttt tcccagagcg 1021 aacacccaaa taatcggttg cgcgggtcaa ttcgcgggtg gtgaggttga taacaaattc 1081 gcccgactcc ttgatgagat catatgaata tctttctggg cgaacggaga tataagtctt 1141 cgggggaatc gagtttatcg tgccggtcca agcgattgtc agcgcgtttg gtttatcgac 1201 cgttccgcag gtgacgacca ccgcgggcac aggagccaga atcgagcttc ccttaaaggt 1261 cgtttttttc gatgtattca taaacttcct cctcgctcga aatgggaatt gcatcaataa 1321 tctcaatgtc gcaattatca tctgcttcat ttaccgcttc gctgatgttg gtgacaattt 1381 tatccagttc gatttttgat accgccgatt ttgtcagctt aaatgccaag ggaatcagca 1441 cagctaaatc caaaagacgc tttttcttgg tgcttttcgc ctttttgtca tttttcttcg 1501 gttgccacag tccgattaca gccgccaacg ccaaaccgat tgccgcaacg ccgcctgcaa 1561 tcaaattcga ctttgtaagg tgatttccgc ccagagcgaa accgcccttg cgcgagttgt 1621 tatatattat catttgaagt tcaccgcctt aatgtatata tcatatcaca gatttgagcg 1681 aattacaata tcgggatagg aaaagcagag cgccgtctgc gcactcattt cgcggggggg 1741 cggc // LOCUS sequence317 1738 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence317 VERSION sequence317 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1738 /mol_type="genomic DNA" /organism="" /note="sequence317" CDS complement(390..1556) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKIFCLLLCVCLLCSCADFSIRREEDVTTITPPSTAESVVSEQT TTSEAVTTTAPDEPEEQPTTEPLATEPAISATEPITSQTEESSEATTTVITEPVPTFEF PEEFYSELSAIFAQFSFNLNCDGDPTKCTCNPEYEKLDAEGNIVTPRDRCMSIYFYDLE TGYEMTVNSGVHYPVASVVKIPYCTMIYEKMTAGEIDPELLLTYEKRHYFHGTGLVNKG TYGDTYTVMQLLKLAITESDNTAYEMLKDLVSWDDFMAYCQEAGYTHEQDLRSRKQKLC LESAGASGRLLANFLRSESGFVDAYEYDLTHTKNKMITSTYTVYRKYGWTNFAFHDVAY IDAPYPYVLVILSNIEGEERPDYTLFANVSMLIERYSQNRGDVPAEIG" /locus_tag="LOCUS_8280" /note="MGA_1201" ORIGIN 1 aattggtgcg actaagccga taagccgagt tttgtcgtgt acggcaatct atctagccga 61 tatgtcgcca tatcggtcaa gccaccttca acggtgtatc catcgagcag atgttgagat 121 acatcgaacc aatcggtgtt gcatcgggta gggtttacat ggcagcgcag tctcctgcgc 181 tccggtgagc tcttacctcg cctttccatc cttaccgctt gcgcggcggt ttctttctgt 241 tgcactttcc ctaaggtcgc cctcggctgc cgttagcagc taccctgctc tgcgatgctc 301 ggactttcct catccgccgg tttaagccga cgtccgctgc cgtatagctt actcgcaagt 361 gtgtatttta ctacttttgt ccccgtttgt caaccgattt cggcaggtac atcccctcta 421 ttctgcgaat agcgctcgat taacattgac acattcgcaa agagagtata gtcggggcgt 481 tcctcacctt cgatgtttga aagaatcacc agaacataag gatatggcgc atcaatatat 541 gcaacatcgt ggaaagcaaa gtttgtccag ccgtatttgc ggtataccgt ataggttgag 601 gttatcatct tgtttttggt gtgtgtcagg tcatattcat aggcatccac aaacccgctt 661 tccgagcgaa ggaagtttgc gagcagtctg cccgaagcac ctgccgattc caagcaaagc 721 ttttgcttac gagagcgcaa gtcttgctcg tgggtatatc ccgcctcttg acaatatgcc 781 ataaaatcat cccaagaaac gaggtctttg agcatttcat atgccgtgtt gtccgactcg 841 gtgattgcaa gcttcaaaag ctgcataacg gtgtatgtat cgccgtatgt gcccttgttg 901 acaagcccgg tgccatggaa ataatggcgt ttttcatagg tcaaaagaag ctccgggtca 961 atttcccctg ccgtcatctt ttcatatatc atcgtgcaat agggaatttt gaccacactt 1021 gcaacgggat aatggacacc gctgttgacc gtcatttcat agcccgtttc gaggtcatag 1081 aagtatatgg acatacatct gtcgcgcggg gtaacgatgt tgccctcggc atcaagcttt 1141 tcatattcgg gattgcaggt gcattttgta gggtcgccgt cgcagttcaa attgaacgaa 1201 aactgcgcga atatcgccga cagctccgaa taaaactcct cggggaattc aaaggtcggc 1261 acgggctcgg tgataaccgt tgttgtcgct tcgcttgatt cttccgtttg cgaggttatc 1321 ggttcggttg cggaaattgc aggttcggtt gccaaaggct cggttgtcgg ttgctcctcg 1381 ggttcatctg gcgctgtggt ggtgacagct tcgcttgttg tcgtctgctc gctgacaacg 1441 ctttcagcag ttgacggcgg agtgatggtg gtgacatcct cttcgcgtcg aatggagaaa 1501 tctgcgcagg agcacaaaag gcaaacgcac aaaagcagac aaaatatttt tttcaacggt 1561 ttcaccccgc tttcaaaaga caaataaccg accgcaacca cacatggaag cggtcggcaa 1621 aatattaata aacagaatta cttgatggat gtcggggtca tctgagaata gtattcgtta 1681 tatgtaatct cagcgttttc caaaagttca gtgatatctg cattgaactt agaggaaa // LOCUS sequence318 1736 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence318 VERSION sequence318 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1736 /mol_type="genomic DNA" /organism="" /note="sequence318" CDS complement(586..1605) /product="L-threonylcarbamoyladenylate synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011249899.1" /transl_table=11 /codon_start=1 /translation="MNTVVLSSCKDDIKYAASLINAGEVVGMPTETVYGLAADATNEDA VKKIFTAKGRPCDNPLIVHICRFDMVNDIASSVPELAYKLAEKFWPGPLTMIMPKSDNI PLVTSGGLDTVGIRFPSHKVALDLIEKSGKPLAAPSANLSGSPSPTTLRHVFEDMNTRI PAIIDGGDCEVGVESTVISFDADGTVRILRPGKISYDDLLSVTDKVCIDNGVLAQLDIN AKVASPGMKYKHYSPKANVIILDGSADAFKAYVSEHLTENTYCLLFDDSEAIEGVNYLT YGITSEEQAHLLFERLREFDVLGAKTVYARCPSKDGVGLAVYNRILRSAGFNVIKLDD" /locus_tag="LOCUS_8290" /EC_number="2.7.7.87" /note="WP_011249899.1 L-threonylcarbamoyladenylate synthase (Thermococcus kodakarensis) [pid:47.7%, q_cov:95.6%, s_cov:95.3%, Eval:7.1e-75]" /note="MGA_1204" ORIGIN 1 cttttcttta agagaatctt ggtcactacc gtttgatatg ttatagtcgc acttagaaat 61 aaaccattct tgatcgtgct gtgctgaaag tcttgccttt gcttgactct ctgttatgtc 121 atcgcgaagc ataattcttt ctgctaacac ctcatcaggc gccgtaacac taacaaccgc 181 atcgcagata tcatcaattc cgctttcaaa aagcgtagga gcatctaaaa gaatgtactt 241 tatcccttga tctttatatg cgcgaatctc attaaaaaca gcagttgtaa tgtacgggta 301 gatgattaat gaatatagtg tcattttctc tttatcgtta aatacagtcg aggccatttg 361 cttgcggtca agccctaaat cggttacaca tttgggaaaa tgcgccctga cttcttcaag 421 aaaaggctga tatgatgcaa cttttcgcgc aattgaatca gcatcaatca ccgcgaagcc 481 gaaatcggaa aacattgaag aaacggtggt ttttcctgca ccgctctgcc ctgtcagccc 541 gattatattg atacactcga aggtgttcat ttgtttaaca tcctttcagt cgtcaagctt 601 aattacgtta aagcctgccg aacgaagtat tctgttatat accgctaaac ctacgccgtc 661 ctttgaaggg caacgagcat atacagtttt tgcgccaagc acatcaaact cgcgcaagcg 721 ttcaaacaaa agatgcgctt gctcctcgct tgtgatgcca tatgtaaggt agttaactcc 781 ttcaatcgct tcactgtcat cgaacaaaag acagtacgta ttctcagtca aatgttcgga 841 aacatatgct ttgaaagcat cggcacttcc gtcgagaata atgacattag ccttgggtga 901 atagtgctta tatttcatac cgggagaagc aaccttggcg ttaatatcaa gttgagccaa 961 aacgccgttg tcaatacata ccttgtcggt aacggaaagc aggtcgtcat atgaaatttt 1021 gcccggacgg agaattcgca cagtgccgtc agcatcaaag ctgataactg ttgattcaac 1081 cccaacttca caatcgcctc cgtcgatgat tgcaggaatg cgtgtgttca tatcttcaaa 1141 tacatggcgc aaagttgtag gactgggact tccggagaga tttgcagagg gcgcagccaa 1201 aggttttccg gatttttcaa ttaaatcaag cgcaaccttg tggctgggaa atcttatgcc 1261 gacggtatca agtccaccgc ttgtgactaa tggaatatta tccgattttg gcataatcat 1321 cgtcaaaggt cccggccaga atttctcggc gagcttatat gcaagctcgg gcacacttga 1381 tgcgatgtca tttaccatat caaatctgca aatatgaaca ataagcggat tatcgcaagg 1441 tctgccttta gcggtgaaga tttttttgac agcatcttcg tttgtagcat cagcagcaag 1501 gccgtagacg gtctcggtgg gcataccgac aacttcgcct gcatttatca gcgaagctgc 1561 atatttgata tcatccttgc aagatgacaa aactactgta ttcatacgct ttcactctgc 1621 tttgcaagtt ttgcagcttg atctgctgtt gcaagtgcat caataacctc gtccagattg 1681 ccgtttaaaa tgctttcaag cttataaagc gtaagaccga ttctgtggtc gctgac // LOCUS sequence319 1733 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence319 VERSION sequence319 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1733 /mol_type="genomic DNA" /organism="" /note="sequence319" CDS complement(320..742) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTSNNLGDPNTLNFTYMTYGYIGHVGNRYSDVEALADLDPATALT ISELNIYADKITVTVYSAGGRMSSFSQEFARKNVVEIVEEPEDVVEVENDSSADTTVES PAGENGAPAIVFVAIGAVVIIGAIVVIVVLKAKKKQ" /locus_tag="LOCUS_8300" /note="MGA_1206" misc_feature complement(749..>1733) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011948457.1:metallophosphoesterase" /note="WP_011948457.1 metallophosphoesterase (Clostridium botulinum) [pid:31.0%, q_cov:56.3%, s_cov:54.3%, Eval:5.2e-11, partial hit]" /note="MGA_1207" /locus_tag="LOCUS_8310" ORIGIN 1 gcttgaccaa cgggccgatg tttcacctaa tcagcgaaca ttaatattat aataaaagac 61 gtagaaaaag tcaatacctt ttgagaaatt tcatgataat tttcctgctt tttatattgc 121 ttttgcttct gttttgcgcg ggaaatgtaa gcataatcaa ctgactattt aaaagacaaa 181 aagaggataa cctaagttat cctcttaatt tgttgaaaag tcattcaaaa aacatatttg 241 cttgaaaaat acctagataa acgatacaat caagttttag ttcttcattc aattacgtta 301 atgctgttct tgatatatat tattgctttt tcttagcctt caagaccaca ataacaacta 361 ttgcgccgat aataacaaca gcaccgattg caacgaatac tatggcagga gcaccgtttt 421 ctccagcggg agattcaaca gtggtatcgg cagaagagtc attttcaact tcaacaacat 481 cctcaggctc ttctacaatt tcgacaacat ttttacgtgc gaactcttgc gagaaggaac 541 tcattcttcc gcctgcggaa tatacggtaa cagttatttt gtccgcataa atattaagtt 601 cactaattgt aagtgctgtc gcgggatcaa gatccgcaag agcctcaacg tctgaatatc 661 tgtttccgac gtgaccgata tatccatagg tcatatatgt gaagttaagg gtgtttggat 721 cgcctagatt attgcttgtc ataagtccct agccggaggc atcatagcaa tcctcggttg 781 aaacgtaaat tgtgtcaccc acggttttga aagcaataga accgccgatt tcggggtcgc 841 cggtcgagtg gttatgaccg aacataaaga taatgtcaag atcctttgca gcttcgttaa 901 tagcatcgaa aactatataa gcatatctat tgttgccatc agttcttgca acgtcatagt 961 gaagaccggt atgagaagtg atgataactg gtcttgtttc acctctttca ataagcgaat 1021 tcatatactg agttattttc tcggctgtgt tttggcatat ggtcttgttg gatgtatcat 1081 acattcccca aggcatatcg tcctcattta aaatataaac gataaagttg tcatattcat 1141 atccgccggt gggaacaaat ccgttgatgc cggagttatc gtgatttcct tcaacctgga 1201 tatagttgtt gttttccgga ctgatatggc tccacatatc ggaaacaagc tttaacacct 1261 gagatcttcc atggttggaa ccttctgttg agttgctaca tccatagtcg ccaccgaaga 1321 taaagtagtc aggttcaacc ttacgcattg tgttaaagat atcgttgatc tgagaaataa 1381 gtccatcgcc gttgttgctt gcgatgtcgg agccccaaag ctgatagtca gagaaagaaa 1441 cgatgcttgc aagcggatcg ccatagtcaa cagcggtgct tccatcggtg taagacactt 1501 caacggtgat tctgaagctt atttcgacct cgggagtgaa tgcaaaaggc aaaagccaaa 1561 tgctttgaac aacttcggga tcaacatcgg cagaatatgt gatctttgtt tttgaaccaa 1621 actgcttggt ttcaactaat gtattccacc atccgttcca gaaaagctga caggacggtg 1681 cagctccgtt tgcattgcta aatttttcaa cattgtcagc ttcaacggta aca // LOCUS sequence320 1731 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence320 VERSION sequence320 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1731 /mol_type="genomic DNA" /organism="" /note="sequence320" CDS 278..1327 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLFAILVAAMLVMAMSVTAFAATASIITDAAKETTAEVASIAF ALPEGLTLETGDVVTVHIKGKATNDKVRIYFTDNVDNGRVNDAVDIYVVDGAFETTVDI VIDASGAIQGTAAPTVLLLKGPSYGVNLTDVSVEVVEITCDKIVAEEAPVEEAPAEDGY TAFLMFATSSWYPAAMEAADHNSVTVTGNGTYTIETDQLAGSSDALVFCVDIMDILVDH PNVTAVLDSIEVDGEVVEFNADAVQYGDIEQDNDHYRIEIRNEYGATLDTVITGWQFAI DSTIKVTFTVSGMEDVVEAPVEEETPAVEDTPAAEDTPAEEEPADTGLALAVVPMIVAA AAVVLSKKR" /locus_tag="LOCUS_8320" /note="MGA_1209" ORIGIN 1 aattcccgag gaagaggaaa caattcctga aaaccctgca acaggaatta cctattctgt 61 tttgcccctt tgtgctgccg caattgcaat tgtaatatca atatctagaa gataattaca 121 ataggcgtgg tatatatact acgccaaata cataaagagg tcacaaaaag caataaaata 181 tattgataat ttgcagtata tttattgaca aataatcaat aagattatat aatacattta 241 ggtaatagat taccaaatca tttaaggaga cataattatg aagaaattat tcgcaatcct 301 cgttgctgca atgctcgtta tggctatgtc cgttaccgca ttcgctgcaa ccgcatccat 361 catcaccgat gctgctaagg aaacaactgc tgaagttgca tctattgctt ttgcacttcc 421 tgaaggcttg actcttgaaa caggcgacgt tgtcactgta catattaagg gtaaggctac 481 caacgacaag gtaagaattt actttaccga caatgttgat aacggccgtg ttaacgatgc 541 agttgatatt tatgtagttg acggtgcttt cgaaaccact gttgacatcg ttatcgatgc 601 ttccggtgct atccagggta ctgctgctcc taccgttctc ttgctcaagg gcccctctta 661 cggtgtaaac cttactgatg tgtctgttga agttgtagag atcacctgcg acaagatcgt 721 tgctgaagaa gctcctgttg aagaagctcc cgctgaagat ggctacactg cattcctgat 781 gttcgccaca tccagctggt atcctgctgc aatggaagct gctgatcaca actctgtaac 841 cgttacaggt aatggtacat acaccattga gaccgaccag ctcgcaggct cctctgacgc 901 tttggtattc tgcgttgata tcatggacat tttggttgat catcccaacg taactgctgt 961 tcttgacagc atcgaagttg acggcgaagt tgttgaattc aatgctgatg ctgtacagta 1021 tggcgacatc gaacaggata acgatcacta cagaattgaa atccgtaacg aatacggtgc 1081 aacacttgac actgttatta ctggttggca gttcgctatc gattctacca ttaaggtaac 1141 tttcactgtt tccggtatgg aagatgttgt agaagctcct gttgaagaag aaactcctgc 1201 agttgaagat actcctgcag ctgaagatac tcctgctgaa gaagaacccg ctgacaccgg 1261 tttggcactc gctgtagttc ccatgatcgt tgcagctgct gcagttgttc tttccaagaa 1321 gagataattt atttacctaa caaaaaacta aggcgtccga ttgggcgcct tgttttttta 1381 tggatatatt aaaaaggcat ccgtccggat gccttttaat ttatccccaa agggaatcta 1441 aatattcaat tctatcctcg acccagttga tgattgcttt tgcgcgtccg gtgcgcttcg 1501 tgccgtcttt gttaaggtca gatgtgttgt tttcaaccgt tgttcttatc tctgcggcaa 1561 ctgcgctcat ttcgtcaact ctgtcctgcc aggtctcctt gaccatatcc ttaaaccaat 1621 ctgctgaata gaacaaaatc agccaagggt tggatctgtc gccccagtta tcaacaaagt 1681 aatcatcctt gaagtttgcg acgtaaagtc cgccatcggc atccgagcta t // LOCUS sequence321 1725 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence321 VERSION sequence321 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1725 /mol_type="genomic DNA" /organism="" /note="sequence321" ORIGIN 1 gataagacag aaaccatata cggcagtgtt gacagcgtta catatcgaaa tgacgacaac 61 ggctttgccg tcataacctt ggaccacgag ggcaagccat taacagttgt gggcgagttg 121 ggaaatgttg aagaaggcga agagcttgaa ctgacaggca tatattccaa ccacgccaag 181 ttcggcagac agtttaaagc cgatgtctgt gtccgctcgc ttccatccga aatatctgca 241 atcaggcgtt atcttgcagg cggtgtaatt aaaggtatcg gccccgtaac cgccgcaaat 301 atcgtcaaaa agttcggtga ggaaaccttc gatgtccttg aaaacagccc cggcaggctt 361 gcaaccgtcg aaggaatcac ccaagcaaag gcgcttgctt tctgccagga attcaagcgg 421 gtcatcggct tccgcgacgt cttggaatat ttcaaccgac tcagactaca gtcggtgtat 481 ggcgtccgcg cttggaagaa atatgaaatt aaaacccttg caatgatcga gcaaaaccca 541 tacatactct gctcctatgg catcgaactg cccttcacca tcgccgagga gatcgcccgc 601 gaaaagggcg tgccatacga tagctataac cgcctttgtg cgggcatcaa atatgtcctc 661 gctgagaatg ccgatgcagg ccacacctgc ctgcccaagg acaagctgat tgaaactgcc 721 tcgagatttt taagagtcga gcccgagctg gtcgaaaaag cagttatgag cgaggtcgat 781 gaagaaaatc tctatatcta cctcaaaaag caccgcccgt tcataatgct ccgcgaatat 841 ttcatcgctg aggactatat ctcccgacgt cttgcaatta tgaacagcct ttcctatgat 901 acaggtatca actacgacga ggttatcgac attcacgagc aggtgactga tattacctat 961 gccgacaaac agcgccaagc gataaatatc gcgctttccc gcggatttat ggtacttaca 1021 ggcggccccg gcacaggtaa aaccaccact ttaaatgcaa tgatatcgct ctttgaacag 1081 cagggcttaa agccgttcat atgtgcaccc acaggcagag ccgccaagcg tatttccgac 1141 cttacaggct acgaagccaa gacgattcac aggcttctgg gagtcaagag tgggggagag 1201 tttgccagct ttgagcacaa cgaaaataac cttctcgatt gcgacgttgt catcatcgac 1261 gaaatgtcaa tggtggatac ccttttgttt gaagcgcttt tgcgcgcgct tcccgtcaac 1321 tgcaaaatga taatggtcgg cgactccgac cagcttcctt ctgtcggtgc gggaaatatc 1381 ctgcgggata taatcgaaag cgaaaccgtg cccgttatcg cgttaaacga gatcttccgt 1441 caggcaagcg ccagcgcgat tgtcaccaat gcccataaga tcgtcaaggg cgaaatgatc 1501 gacctttggg agaactcccg cgactttttc ttcatgcaac tcctcgattt cgacgaagcc 1561 gctgccctta ccgtcgagtt gtgcttaaaa cgactgcccg atgcttacgg ctactcatcc 1621 atcagcgata ttcaaattct ttcgccgacc cgcaaaggcc ccttgggtac aaacgagctt 1681 aataaactct tgcagcaagc tctcaacccg ccatcccgcg aaaaa // LOCUS sequence322 1719 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence322 VERSION sequence322 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1719 /mol_type="genomic DNA" /organism="" /note="sequence322" CDS complement(284..724) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNANKIEKVRGEIDERIKELNRGKEKAQDECPHNRGGYIDGVVDI YKKDGKVYMACKICGAKDMDAKAPTLDEVKAAKKTMETAVNFIKMRMSDTHPKGQETLE ECATFLRSARRLEKVYANLEKNTQEQKKKKNENGGGRVSLKL" /locus_tag="LOCUS_8330" /note="MGA_1213" CDS complement(875..1405) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTYIFHDDPTERTNNHYSGVNVVTMYVEKTNSITSPVHVVLVKPF VQCGETCKELDLIILRDGFLFESPVLKKIDDYQNMLSAITYHFTPIDVVIEKLRNGGMN SYAIDYIKMISLCTNPTRVQIDSVNLMGKQLGLISRYVDKMEDISNHYDQLNNKIEGLS DSLNQLRRMGAFN" /locus_tag="LOCUS_8340" /note="MGA_1214" ORIGIN 1 aaaaagatga aaggcaccct ctttgccttt tgcagaaata tacataccga tacattcctg 61 aatctgttga aattgattgg ttatggcctg gtacacatcg tccttatagg ccatttctat 121 tgatggtttc ttagttgcca tctttattac ctccttttaa atgattaagt ccgagtactt 181 actcgggtat ataatatatt gttaaatatc atttattata taaatcgaca aaaaaatgag 241 agtgtaccga agtacactct catttgagtt gctgaagata tgattacagc ttgagggaaa 301 ctcttccgcc gccgttctcg ttcttctttt tcttctgttc ctgagtattc ttctcgaggt 361 ttgcataaac cttttcgagt cttcttgccg atctcaggaa agttgcgcac tcctcaagag 421 tttcctgacc cttggggtga gtatcggaca ttctcatctt gatgaagttt accgctgttt 481 ccattgtctt ctttgcagcc tttacttcat cgagagtagg agccttggca tccatatcct 541 ttgcgccgca gatcttgcag gccatgtaca ccttgccgtc tttcttgtag atatcgacaa 601 caccgtcgat atatccaccg cggttatgag ggcattcgtc ctgtgccttc tccttgcctc 661 tgttaagttc cttgattcgc tcatcaatct cgccgcgaac cttttcaatc ttgtttgcgt 721 tcatagcttt ttgacctcca tatggattat ttaatgaaac gtttcataac agctttcaca 781 gaaagcttta ccttgaagtt tagcaaatca taaaaagcta tcatgaatcg tgtatcacgt 841 atatgatata ttgttaaata ttggaagatt ttatttagtt aaaagcgccc attcttctca 901 gttgattcag actgtcagat aacccttcaa tcttattatt gagctgatca taatgattgg 961 agatatcttc catcttatcg acatatcgag atataagccc aagttgtttc cccattaaat 1021 taacagaatc aatctgcacc ctggtcggat tcgtgcacaa ggaaatcatc ttgatataat 1081 cgattgcata tgaattcatg ccgccattgc gaagcttttc gataacaaca tcaatgggcg 1141 taaagtgata cgttattgct gaaagcatat tttgatagtc gtctattttc ttcaataccg 1201 gagattcgaa taaaaatccg tctctgagaa taatgagatc cagctcttta caagtttcgc 1261 cgcactgtac aaagggtttt acaagtacaa catgtactgg tgaagtgatt gagtttgtct 1321 tttcgacgta catagttaca acattcacac cgctgtagtg gttgtttgtt ctttctgtag 1381 gatcatcatg aaaaatatag gtcattttta cttacctcca cttgttagtc attcgcgccg 1441 taacgcacct tgctgtagtt atcagaatcc tgatcaccaa aagctatctc gatattgaga 1501 gattttgtgc tgctactgga cagtgctttg caaaagcttt tgaccatgtc aacagcaata 1561 gcgggcgcat ccttgtcctt gtcagatacg tcgtatttct tgagcactct ctggatgttt 1621 gatgctgcat tctcatatat gcgatcgcga tcttcctcgg tttcggtact tccgccaagg 1681 tcatcccatt cgccatccca gaggtcatca tcctcatcc // LOCUS sequence323 1718 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence323 VERSION sequence323 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1718 /mol_type="genomic DNA" /organism="" /note="sequence323" CDS 73..744 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAEIKKSQKSAPAGRKYIEVPVKSALPVWSAAAVWVLSALFVPMY NVVHILGIALASLGVALLVKKLLPKETKTVELPFASGNLELDAMVGEINKAVDSLEASR KLILAHDPETADVISSISATAEKIRDAIAQDPKDLVSLRRFFNYYLPTTLKLTEKYSFV LGQGVESANATETKESIKPALKQINNAFEKQLDALYADDALDISTDVTVLEAMLKRDNL N" /locus_tag="LOCUS_8350" /note="WP_009890534.1 5-bromo-4-chloroindolyl phosphate hydrolysis family protein (Clostridioides difficile) [pid:36.2%, q_cov:61.9%, s_cov:44.4%, Eval:4.1e-18, partial hit]" /note="MGA_1216" ORIGIN 1 ggtttgagta ttgaaatcgc tttaaattgt tgatataata atattgtata agtctatata 61 ggagatgatg ccatggcaga aatcaaaaag agccaaaaaa gtgctcctgc cggaagaaaa 121 tatatcgagg tgcccgtaaa atccgccttg ccggtctggt cggcggcggc tgtgtgggtg 181 ctgtcggcgc tgtttgtgcc gatgtataac gttgtgcaca ttctcggaat tgctcttgct 241 tccctcggcg ttgcgctgtt ggtaaaaaag ctgcttccaa aggaaacgaa aaccgtcgaa 301 cttccctttg cttcgggcaa tttagagctt gatgcgatgg tcggcgagat caacaaggcc 361 gtcgattcgt tggaagcttc ccgcaagttg attttggcac acgaccccga aaccgcagat 421 gtaatttcaa gcatctcggc aaccgctgaa aagatccgcg atgcgatcgc acaagacccc 481 aaggatctcg tttcgcttcg cagattcttt aactactact tacccaccac cctgaaactg 541 acagaaaaat attcgtttgt tttgggtcaa ggcgttgaaa gcgcaaacgc caccgaaacc 601 aaggaatcaa ttaagcctgc gctgaagcaa attaacaatg cgtttgaaaa acagcttgat 661 gcgctatatg cagacgatgc gctggatatt tccaccgatg tcaccgtttt ggaagccatg 721 ctgaaacgcg acaacttaaa ctaaagcata atcaaaaaat atattttgga ggttattaac 781 catgacagaa gcaccgaaat ttgaacttac acttgacccc ttcggaaccg aagccgaaaa 841 ggaagcagaa gacgttgttg caaaggaaga agcaaccgag gaaaagattg ccgagcttgc 901 aaagctgacc gaatcgagcc tttccgagga agaaaaggcg gcttgcgcgg aatttgccga 961 aaagatagac attaccaaca ccgcaatggt tctttcctat ggtgcaggca cacagcagaa 1021 gattgctgat tttagcgatt ctgcccttgc aaacgtccgc acacaggagc ttggcgaaat 1081 gggcgatatg atctccaagc tcgtgggcga gcttaaagca tttaacgacg atgccgacag 1141 ctcggacaag aagatcttgg gtctgttcaa gcgcgccaaa aagtcgataa tcaccctcaa 1201 ggcaaagtat gacaaggcag aagtcagcgt caacaacatt gtcaccgtct tggatggcca 1261 ccaggtaacc ctgctcaagg acatcgcagt tttggataag ctttatgaaa ccaacctgac 1321 ctatttcaag gagctttcga tgtatatcat cgcaggtaag cagaagcttg agaccgagcg 1381 tgcgactacc cttgttgagc tccagaacaa ggcaaaggaa tcgggacttc ccgaggatgc 1441 ccagaaagca aacgactttg ccgcaatgtg cgagcgcttt gaaaagaaga tctatgatct 1501 tgaacttaca agaatggtat ccattcagat ggctccccag atccgtcttg ttcagaacaa 1561 cgacacaatg atgagcgaga aaattcagtc caccatcgtc aacaccatcc ccctctggaa 1621 atcccagatg gcaattgctt tgggtcttgc acattcggaa gaagctttga gagctgagcg 1681 cgaggtcacc gatatgacca acgagcttct caagcgca // LOCUS sequence324 1707 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence324 VERSION sequence324 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1707 /mol_type="genomic DNA" /organism="" /note="sequence324" CDS 431..847 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTPDMYKAFGYRVLKRVFEKASPNPNDYRYQHSDSPMGHIIPLLA DFNLTACNFGPTVTVQEIRKHMPNTRIDGQLAPFTFMRNVEDDIIAEVKRDCEAAKIGD LRGLNLATAGSINNGSLLESMRVVMAAIQNFGRY" /locus_tag="LOCUS_8360" /note="MGA_1219" ORIGIN 1 cggcgaagtc tttggtggta aatatgtctt tgacggaaac accacatggc ttcagggcac 61 aatttccgat gatgaatctt tgcgcaaaaa gctcgccgag gttaaagctt tggttgcaga 121 tcccgaggct ttccgcaaat ttgtcctgcc cgccgattgg gacgagcgtt gcaaacaggt 181 atactaactt tacggcaatc gccccggcca gttccgccat gttcgcggcc cagtaaccct 241 tgcaacatct gtttacggca ccgaaaatct tatctatctt tattatgacg acgaggagtt 301 atataccgag tttgctgaca ccatcgccga tgtaatcatc gcatatatag atctcttcat 361 ccgcgaatcg ggaagaacag aggaaaactt ccaccatggt ttctcctttg ccgatgacga 421 ctcttatctc ttgactcccg atatgtacaa agctttcggc taccgtgttc tcaagcgtgt 481 ctttgaaaag gcttctccca accctaatga ctatcgctat cagcactccg actcgcctat 541 gggtcatata atcccgcttc ttgcagactt taatctcact gcctgcaact tcggccccac 601 cgttaccgtg caggagataa gaaagcatat gcccaacact cgaattgacg gtcagcttgc 661 gcccttcaca tttatgagaa atgttgagga tgatatcatc gctgaagtca aacgcgactg 721 cgaagccgca aaaatcggcg accttcgcgg cctcaacctt gccaccgcag gttcgatcaa 781 taacggctcg cttttggaaa gtatgcgtgt tgtaatggca gcaattcaga acttcggaag 841 atactaaaca tataacaaat cagccgcgcc ataatcggtg cggctgtttt ttagccgtat 901 ctcatattga caaaaattta tcattctatt ataattgtag ttggatgatt tttcgtttgt 961 taaacaaaaa taaatacata aaggagtttt ttactatgag cagctttgaa aatcttcgca 1021 tcgtggataa cttctatcaa acatcgctat acttcccgat gccaactgtt atcatcagca 1081 cattgtgtga ggatggtact actaaccttg gaccatattc tcttgtacag ccgtactatg 1141 tcgcaggcaa ggattattac gcaatgcttt tgagctgtcg caattcctcc aacactgcac 1201 agaatattct tcgcacaggt aggtgcgcgc tcaacttcat tgatgacagt cccaagacct 1261 tcaaggaagc tgtaaagctc tcctggccgg gcgataagcc gagcgagaag atgcctaagt 1321 gtaactttag gcttgaaaca agccttgttg aagaagaaac gggtgaggca agacccaagg 1381 ttatgaccga tgcaattcag gtcattgaat gtacatgggt gcgcgagctt gacggtgccg 1441 acagagatat gccgggcgag ctcaacggat acgagccgcc gtatcacgat ttcaacggca 1501 ttacaagtaa attcggtgca cacttcattt tgaagatcga caagatcttg atgaagaaaa 1561 agtacagcga tgcgataatt cgcggtgtca cagccaagga ttttcctgca cttcccgttg 1621 attacggcta ccgtgacagc aaaaacttct ggttccacag aaagacaaga atgagagcag 1681 agcttttgca gatgcgtaag gcttctc // LOCUS sequence325 1707 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence325 VERSION sequence325 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1707 /mol_type="genomic DNA" /organism="" /note="sequence325" CDS 365..1015 /product="HAD family phosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048390.1" /transl_table=11 /codon_start=1 /translation="MNIFKDFDCVIFDFDGTLVDSIGVWKDIDIKFMAKRSLPIPDDFY AKVSVLNLWQAAEYVIDECGVTDSPEDVVAEWLAMSEYEYANNIEMINGAKEFIFKLKE NGIKICLATAAGESQYKPCLEHHGVYDMFDAFVTTNEVKRKKGYPDVYLLAAERVGAKP EKCCVFEDIYLGVVGAKAGDFACVAVMEEHSKEWHDKIRELADVCVNDYTELM" /locus_tag="LOCUS_8370" /note="WP_012048390.1 HAD family phosphatase (Clostridium botulinum) [pid:37.3%, q_cov:98.1%, s_cov:99.1%, Eval:2.5e-41]" /note="MGA_1222" misc_feature complement(1061..>1707) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012028588.1:4-alpha-glucanotransferase" /note="WP_012028588.1 4-alpha-glucanotransferase (Streptococcus suis) [pid:46.6%, q_cov:94.9%, s_cov:40.2%, Eval:1.1e-46, partial hit]" /note="MGA_1223" /locus_tag="LOCUS_8380" ORIGIN 1 atcattgcgg ggggcttttt gctgacaact gttgcggcaa tgatgtttgt ttcatccaag 61 actgcatcct cgatggatac gggcgaggaa atgtcgagat agttcgccgg gtagtggttc 121 aaaagcccgc cgactgttgt gatattcagt gttgacaaaa gctgagcctt tgcaggaccc 181 acgaccttta aatatttcac atcgtcaata taaggcattt ttgcaccgcc ctttcgcaat 241 tacaatataa ttttattata cagttttatt tgtgcgtttg caagacttag ccgagcaata 301 aacaaattga cagaagacgt aaattcgggt aaaataagtc tgattaaaga aaggattttg 361 gtttatgaat atatttaagg attttgactg cgttattttt gactttgacg gcacgctggt 421 ggattcgatc ggtgtctgga aggatattga cattaagttt atggcaaaaa gaagcctgcc 481 aattcccgac gatttttatg caaaggtgtc ggtgctgaat ctttggcagg cggcggaata 541 tgtaattgac gaatgcggtg tcaccgattc gcccgaggac gttgttgccg aatggcttgc 601 gatgagtgag tatgaatatg ccaacaatat tgagatgatt aatggcgcga aggagtttat 661 ttttaagctc aaggaaaacg gcatcaagat atgccttgca actgccgcag gtgagagtca 721 atataagccc tgtcttgagc atcacggggt ttacgatatg tttgatgcat ttgtcaccac 781 caacgaggtc aagcgcaaaa agggctatcc ggatgtttac ctgctggcgg cggaaagagt 841 tggcgcaaag ccggaaaaat gctgtgtctt tgaggacata tatttaggcg ttgtgggcgc 901 aaaggcggga gatttcgcct gtgtcgcggt gatggaggag cactctaagg aatggcatga 961 caaaatcaga gagttagcag atgtatgcgt taatgattat acagagctga tgtgataaaa 1021 aagcaaagag cagttactga ggtaactgct cttttttgtt ttattcttcc gtttcctctt 1081 cgggtgcggg aatatagcgg ttatatgtct ttgaaagctt cataagcttt gcagcggctt 1141 catcggaaag ctgttcgctt gtaattctcc agcgccagtt ggttccgaca gttgagggaa 1201 tattgattct tgcctcgttg cccaagccca aaatgtcctg aggctgtgca atacaaacgt 1261 ctgcaatgct gctccatgcc gcacggatca tgctttcggc caagtttgac ttatcctcaa 1321 gtccgaagta gtcaagacag aagtcaagag cttcaccttc aagaccttcg acccagccga 1381 cgagggtgtc gctgtcgtga gttgaggtat agcagatata gtttgatgac ttatagttgc 1441 aaggcagata atcggacgtg cctgtgggat cgaatgcaaa ctgcaagacc ttcattcccg 1501 gatagccggt atcggcaaga agctgaacaa catcctcggt gacaaagcca aggtcttcag 1561 cgatgattcg ctttttgcca agccaatagt tggtggaatt gaaaagctcc attctcgggc 1621 cgtcacgcca tacgccgttg acagcagtct tgtctgttgc aggaatggaa taatatcctg 1681 cgaagcctct gaagtggtca attctca // LOCUS sequence326 1705 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence326 VERSION sequence326 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1705 /mol_type="genomic DNA" /organism="" /note="sequence326" CDS 264..1598 /product="histidine--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003422928.1" /transl_table=11 /codon_start=1 /translation="MAVIVQRPKGTQDAVPSTINKWHTVEAVVRDSADQFGFKEIRTPV FEDTSLFVRSVGDTSDVVTKEMYTVSSKGDATFTLRPEGTAGAVRAMLENGVMNEGFPQ KIYYIASCYRHEKPQAGRLREFHQFGVEMFGSASPYADAEVIMLAKHILNQCIGDKISL NINSIGCPECRANYHKALKEYFEAKKADLCGTCLERLDKNPMRILDCKSPVCSEIAKDA PKILDYLCDDCSAHFEKLKEILDAHEIAYTVNPKIVRGLDYYTRTVFEFISTDIGAQGT VCGGGRYDGLVSQLGGQPTPALGFGMGLERLILVMEKLGIKFMDPVTPDIYIAPMGDKA QLFASKLAAELRDAGYKADYDIVGRGLKPQMRYADKVGAKFVVVLGDNELETGDVKIKN MRTGEQTDAKLDGFVKSLEELYVNEICETDNPFSRAVIEALGGEK" /locus_tag="LOCUS_8390" /gene="hisS" /EC_number="6.1.1.21" /note="WP_003422928.1 histidine--tRNA ligase (Clostridioides difficile) [pid:49.0%, q_cov:93.9%, s_cov:99.5%, Eval:1.2e-120]" /note="MGA_1224" ORIGIN 1 gatatcgaag agcatagcgc agccgggaga gaaaagatag tcaggaagag ggttccaaag 61 ggggaaacct cagaaagaaa agagagggcg gcggttgcgc ccttcctcct tttgagcgcc 121 tttcttgtct ttctgcggtt ttccccttta atgaattatg cttcgcacat gaatagcaga 181 aactagtttc tgcatgaata gtcgcttccg cgacataaat agtcgaaaca agtttcaaca 241 ttaaatatat aaggagaaat aaaatggcag taattgtaca aagaccaaag ggcacgcagg 301 atgctgtgcc ttcaacgatc aacaagtggc acaccgttga ggcagtcgtg cgtgactcgg 361 ccgatcagtt cggcttcaag gagataagaa cccccgtttt tgaggataca agcctctttg 421 tccgctcggt cggcgacacc tccgacgttg tcaccaagga gatgtatacc gtttcctcaa 481 agggcgatgc aaccttcacc cttcgccccg aaggcacagc aggcgcagtt cgcgcaatgc 541 ttgaaaacgg agttatgaac gagggcttcc cccagaagat atattacatt gcttcctgct 601 atcgccacga aaagcctcag gcaggacgac tcagagaatt ccaccagttc ggtgttgaga 661 tgttcggttc tgcttcgcct tatgccgacg cagaagtcat tatgcttgca aagcacatct 721 taaatcagtg catcggcgat aaaataagcc ttaacatcaa ctcgatcggc tgtcccgaat 781 gcagagcaaa ttatcacaag gctctcaagg aatattttga agcaaagaag gccgaccttt 841 gcggcacctg cttggaacga ctggacaaaa atcccatgag aatcctcgat tgcaagagcc 901 ctgtctgctc ggagatcgct aaggatgccc ctaagatctt ggactatctt tgcgatgatt 961 gctcggcgca ctttgaaaag ctcaaggaaa ttttggatgc tcacgaaatt gcatatacag 1021 taaatccgaa gatcgttcgc ggacttgact attatacccg cacggtattt gagtttatct 1081 ccaccgacat cggcgctcag ggcaccgttt gcggcggcgg aagatatgac ggacttgttt 1141 cacagctcgg cggtcagccc acacctgccc tcggcttcgg tatgggactt gagcgactta 1201 tccttgtaat ggaaaagctg ggtattaagt ttatggaccc cgtgacaccc gatatctaca 1261 tcgcacctat gggcgataag gcacagcttt ttgcttcaaa gcttgcggca gaactgagag 1321 atgcgggata taaagcagat tacgatattg tcggaagagg cctcaagccc cagatgagat 1381 atgccgacaa ggtgggcgcg aagtttgtcg ttgttttggg cgataacgag cttgaaacgg 1441 gcgatgttaa aattaaaaat atgcgcaccg gcgagcagac tgacgcaaag cttgacggct 1501 ttgtaaaatc gctggaagag ctttatgtca acgagatctg cgagactgac aacccttttt 1561 ccagagcagt gatcgaagct cttggcgggg aaaagtaaaa aatcaaatat agggtcgggc 1621 ctatgtgccc gaccgatagg cctgtgtgcc tgcccgagcg accacacagg gtcgctatca 1681 tcccctgcaa gagatataag ctata // LOCUS sequence327 1705 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence327 VERSION sequence327 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1705 /mol_type="genomic DNA" /organism="" /note="sequence327" misc_feature complement(585..>1705) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011948133.1:ATP-binding protein" /note="WP_011948133.1 ATP-binding protein (Clostridium botulinum) [pid:39.5%, q_cov:96.5%, s_cov:73.5%, Eval:4.9e-64, partial hit]" /note="MGA_1226" /locus_tag="LOCUS_8400" ORIGIN 1 caccgtgata ttcataagtg cgcttaatat ccttcataag gcttgtcagc gcgatatatg 61 cgatgaatac accaatcttg atgagtccct caatgcaggt ctttgcaaaa tcgcccaaag 121 ggagcaaaag tccgattccc tttgtgacaa gtgagggcac gaacataaag agcattaaag 181 caagcgccac gcccaaaaca gatgcaatta ccattacgat agtcatcagc ttgtcgccga 241 gcttttcggt cagcaacttt tcaaaatttg aaggctcctc ttcctcaatg ccctgcatcg 301 ctttgtcggc agatttggtg aggcacttgt aaccgtcaag catcgatgag atgaagttga 361 cagggcctct tacaaagggc acttttttat accactttgc cttgggaagg tcccaaacct 421 caaggtcgat ggtgccgtca ggcaatctta cagccatcgc ttccttttcg gggccgcgca 481 tcataacgcc ttctaaaagt gcctgtccgc cgatggacga ctttttgcag ccgctgttgc 541 aattatcttt gctcatattt tttaaacctc cgtgatctat ctctttaggc tgtcggcagg 601 actatcatta cggtagtgcc cttgcccagc tcgctgttta ttgtaaggct gccgccatgc 661 atctcaacaa tttcgttggc aaccgccaaa ccgattcctg agccgcggcg tgtgtgattc 721 gccttataga actttgtttt aattttgggc atatccttgg cggcaattcc ctcgcccgtg 781 tcggagataa gtacaattat ctcacctttt ttctcatatg cctcaattga cacctttccg 841 ccgggatttg aatacttcac ggcgttgtca attatattta taaacacctg acgaagtcgc 901 gacgggtcac cgtatacaaa gggaagctgt tccggctcgt aatatgcaat ttcaagaccc 961 aaggctttcg ctcgctcggt atatatgagc acagcatcgc caagctccgc caaaatgtcg 1021 gtggtttctt ttttaagggt aaagcgtccg tcctgaattc gtgaaaagtc caaaagctcc 1081 tcaaccattt cgctcaaacg ctgtgtttcg ccggttatta ccctcatgcc cttttggtat 1141 gtttcggggt cgtcggtgat gcccaaaagg gtctcgctcc agcccttaat ggctgtcaaa 1201 ggtgtgcgca attcgtggga aacgctggaa ataaactcgt ttttcatctt gtccgagtgc 1261 tcaagctcct cggccatgtt gttaattgca tcgcaaagtt cgccaagctc gtcgtcgcgt 1321 tctttttcga ttctctcgct gaagtcgccc tcggcatatg acttcgcggt ttctgtaatt 1381 ctgcttacag gcaaaacgat tgatttaatg aagtataagc ccgaagccag catcattccg 1441 atgatcgcaa ggattacggc gaagagcaaa acgcccagcc ttataagctg catatttaca 1501 gcatccatcg aggtcataat tcgcatcgcg gaaatatccc tcgcagggcc ttgacacata 1561 acggtatatc ccattacgtc ttcgccggtt gaaagctcat atacctcata gccttggcca 1621 tccgtcgagg cttttgcaag ctcatagtcg ggcatattca gccaatcgcc cggtctaaaa 1681 ccgctggatg taacggtaac tcgcc // LOCUS sequence328 1703 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence328 VERSION sequence328 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1703 /mol_type="genomic DNA" /organism="" /note="sequence328" CDS complement(832..1269) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTPEMLEALKLQNRFAPLPMKLHIAFCVVATVLFLILYLRKKRMS DLYWMLVCDTTLILQFYYDPLTATAVGICELVLLSLIVWEAIKESKAQKAAKLAEKESE KNSENEIDELDKLVKTERRAIMDENKVDVIGDAFDGEDAVK" /locus_tag="LOCUS_8410" /note="MGA_1228" ORIGIN 1 aattatcaag tccgcggagc acacagtcct ctctcattgg ctcaagcgtc aaaacatcaa 61 gtcccgccgc agcaggcttg ccgtttttaa gggcagtggc caaagcaggt tcatcaataa 121 ctccgccgcg ggaggtgttt atcagtagcg agccttcctt catcaaagaa agggtgcgct 181 catttatcat cttctcggtc ttgtcggtca aaggacagtg aagtgtcaca acatccgagc 241 gtgtcataag ctcatccagc gatacgacct cgaccgtatc atcgttttga ggcgcagttc 301 ttgtataaat gagcaccttc attccgaatg ccagcgcaat ttttgcaacc tttttgccta 361 tcgctccata tccaacaatg cccaaggtct ttcccgaaag ctcatagaat gggatattaa 421 aataggtaaa cagctttgaa tatacccagt cgccgtttgc aaccgtgtcg gcatattttg 481 caatagagct gtaatggtga aggattagcg caaaggtgtg ctgtgccaca gagtcggtgg 541 aatatcccgg cacattgcaa acgcaaattc ctttttcctt tgccgcaaca atatcaatgt 601 tgttatatcc cgttgcaaag actccgatga atttcaaatt ccggcaagca tccatcactt 661 cgcgggtgat tctgcacttg tttgtcaaaa cagcttccgc atcgccgatt cggtcgataa 721 gttcctcatc ggtggaaaac ccgtatattt cacagtcgca gatatctgta atgggggaaa 781 gggaaacatc tccgcccgta acggtatccg catccaaaat taccgtctta atcatttcac 841 agcatcctca ccgtcaaaag catcgccaat gacatcaacc ttgttttcgt ccataattgc 901 gcggcgttcg gttttaacaa gcttgtcaag ctcgtcaatt tcattttcac tgtttttttc 961 agattccttt tcggcaagct tggccgcctt ctgtgccttg ctttccttaa ttgcttccca 1021 aacaataagc gaaagcaaaa caagctcgca gattccaaca gcagtcgctg tcagcggatc 1081 ataataaaac tgcaaaatga gtgtggtgtc gcatacaagc atccaataaa ggtcactcat 1141 tcgctttttt ctaaggtaca aaattaaaaa cagaaccgtt gcaacaacac aaaatgcaat 1201 gtgcaatttc atcggcaagg gggcaaagcg gttctgaagc ttcaaggctt caagcatctc 1261 gggtgtcatt atattagtcc tcctttaaag ggataaattc cgatttgaaa atactttcgc 1321 tattatattc aatttagtat atcacgctaa gcgtcaaatt gcaagatgaa cattaaacct 1381 ttataaaatg tggcaatttt tacaaaatat tcgttaaagt tttggctcac ctaatacata 1441 ttacaagttg acatttttct cggaataggg tactattagt gtataatgtt tcacaattct 1501 accacatttg gaacattatt cattcacgca aaattttata agtgaaagga ttgtttaaat 1561 tggaaaagat ctttaagctc aagcaaaacg gtactaccgt acgtaccgag atccttgcgg 1621 gtcttaccac gttcatgaca atggcttata tcattgcctt gaaccctaac ctcctcaccg 1681 gcttcggcgc tctcggaaat gaa // LOCUS sequence329 1702 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence329 VERSION sequence329 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1702 /mol_type="genomic DNA" /organism="" /note="sequence329" misc_feature complement(1093..>1702) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011459711.1:ABC transporter permease" /note="WP_011459711.1 ABC transporter permease (Desulfitobacterium hafniense) [pid:46.2%, q_cov:91.1%, s_cov:68.4%, Eval:5.0e-46, partial hit]" /note="MGA_1231" /locus_tag="LOCUS_8420" ORIGIN 1 aagcagatga aaacttccgt gttgttcgat aaatattcct gcgagggata gcaaagagga 61 ttattctttg tttcctcgtc caaaaggtca taagctgcct gatttggtgt tgaatagccg 121 gtatattcgc agtttgccaa agcaatttca gcctcgcaga ggaaggtaat ataaatctct 181 gcagcttctt tgttttctgc cgaaacggga atacacatag cgtccacaaa ctggttggta 241 ccttcagagg gtatgcagta tgtcagatcg gggttgtccg cgatcatcgt aaccgcgtcg 301 cctgcataat agggtgcaac tgccgcggat ccgccctgca tcttgtcaaa gatctcgtcc 361 ataacatatc cttggacgat cgacttctgt tcaatcagca aattcagcgc ggcttcaagc 421 tcctgcgggt tttctgtatt ttgagaatat cccaaatatg tcagcgcaat gccaaaagca 481 tctcgagggt tattgaacat cagtatgttg ttttcatact tttcgtcaaa cagcgccgac 541 caggaggtta tctcctcatc aaccattgtg gtgttataaa tgatgcacac cattccccaa 601 agatacggca ccgtatattc attttcgggg tcataatcgg ggttcaagaa ggtgggcata 661 atgtttgcca gattgggaac gttttcatag tttatctttt gaagcattcc ctcttttatc 721 attttagaaa tcatatagtc gctgggaatg acaatatcat atgccgcgcc gcccgaatta 781 agctttgaat aaagcgtttc gttcgatgca taggtctgat agttaacttc aattcccgtc 841 aactgggtga aagcgtcgtt aacgtcgatc atatccgctt cgtcaatgga catatattcg 901 ccccagtttg caacattgat ggtaattccc tcgtccttga gtctgtcgta gtcataatcg 961 gacagcaggg aagtatccac caaaagctcc tcttcagctt gaacgttgcc gcaggagcac 1021 aaaatgctca tcataaccgc aaagcagagg ataagactaa aaattcgttt caaattcatc 1081 cgtcacccct ccttatgcct ttgcttggcg cataagtgcg cggtcacgtc ttaacttacg 1141 gttttcaaaa tagttctttg taatgagcaa cagcgcgatg atgataaata tgcacgctga 1201 aagcgcattg acctcgggcg ttaccttcat tcttgtcatc gagtcgatgg taattgaaag 1261 ggtctcaacc ttaacacccg atgtgaagta tgatacaacg aagtcgtcaa tagaatatgt 1321 catcgccatc aaaaatcccg agaagatacc gggcataatt tcgggaatga ccaccttgaa 1381 gaatgccatc gagggagtgc atcccaaatc tcttgccgct tcaacaaggc tgggattcat 1441 ctgtcgcaac ttcggcataa cgttgtaaat gacataaggc acatcaaagg aaatgtgcgc 1501 caaaatcagc gatacaaagc cgaactcaaa gccgaacttt gttgcaaaaa acttgaacaa 1561 aagcatcagc gatacaccca taataatttc ggggttgata acgggaatgt atgtgatgtt 1621 cataattatc gccttggagg tctttttcat cgaatggatt cccaaagccg ccatggttcc 1681 caaaatggtg gaaagaattg at // LOCUS sequence330 1697 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence330 VERSION sequence330 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1697 /mol_type="genomic DNA" /organism="" /note="sequence330" misc_feature <1..1262 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005788204.1:phenylacetate--CoA ligase" /note="WP_005788204.1 phenylacetate--CoA ligase (Bacteroides) [pid:56.8%, q_cov:99.3%, s_cov:96.3%, Eval:2.1e-135]" /note="MGA_1232" /locus_tag="LOCUS_8430" ORIGIN 1 agctgaccaa actccagagt gagaggcttt gcgcgcaggt taaaagaacg tatgaacgcg 61 ttgctgtatt taaggaacgt atggacaaaa tgggactgaa gcccgaagat atccacggcg 121 ttgaggatct tcacaagctc cccttctcat ataagcagga tttaagagat tattaccctt 181 acggcctctt tgccgaaccg ctcgataaga tcgtgagaat tcacgcatcc agcggcacaa 241 caggcaagca gatcgttgtc ggatatacaa gaaaagacct tgacgactgg gcagacggcg 301 ttgcacgtat gatggttgcg atcggcttgt ccgacaagga tttcgttcag gtttcttatg 361 gctacggcct tttcacgggc ggtctgggtg cccacggcgg tgccgaaaag atcggtgcaa 421 ccgtaattcc caccagcgcg ggcaataccc aacgccagat cacaacaatg gtcgactttg 481 gctcaactgc cctttgctgc actccctcat atgctttata tttgggtgaa gccgttgaag 541 aagcgggact taaagatcag ctcaagctca aggtcggcat tttcggcgcc gagccttgga 601 cagaggatat gcgccacgcg atcgaatcga agctgaacat caaggcttat gatatttacg 661 gcctctccga aatcatggga cccggtgtgt cttatgaatg tcagtgccag gcgggtatgc 721 acgtctgcga ggatatgttc attcccgaga tcatcgaccc cgacacaggc gatgttttgc 781 ctgccggtca gtggggcgaa ttggtattta caaccatcac aaaggaaggc tttccgctca 841 tcagatatcg cacacgcgac atctgctcgc ttaactatga gccttgcgaa tgcggcagaa 901 cccacgttcg tatgcgcaag ccccagggca gaaccgacga tatgctcatt atccgcggcg 961 taaacgtatt ccccagtcag atcgaagaag ttttgctcaa gtcctcgggc ggcgtatcgc 1021 ctaactatca gatcattgtt gacagagtta acaacaacga cactctcgac attaacgttg 1081 agatgagccc cgaaatgttt gccgacgata tcggctcgat tgccaaggtt gaaaagcatt 1141 tggttgacca gctccgctct gttttgggca tcggtgccaa ggtccacctt tgcaacccca 1201 acacccttcc taagtcggaa ggcaaggcaa agagagtatt tgacaacaga aagctccact 1261 aaattacata ataaatacgg aggaaaacaa atgataaagc aagttaatgt ttttgttgag 1321 aacagacagg gccgagtatg cgacgttatt gaagtcctcg cccgcgaggg tatcaacatt 1381 ttgaccctat caattgcaga caccaccgat tacggcgtta tgcgccttat tgttgacaag 1441 ccttattccg cacaaaaggc aattatggcg gcaggattca ttgcaaaggt gacccacgtc 1501 attgctgttg cggttgacca cacaccgggt gagctggcaa agctcttgaa aattttgcgc 1561 gactgcggac agtcggttga atatctctat gctttctgcg tcgagaaggg caacgaaccc 1621 atcatcgtaa tccgccccac tcaccgcgag cctgcggtta aggcgcttga agcggcagga 1681 ggaacaaagc ttattgc // LOCUS sequence331 1694 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence331 VERSION sequence331 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1694 /mol_type="genomic DNA" /organism="" /note="sequence331" CDS 465..1472 /product="siderophore ABC transporter substrate-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002370087.1" /transl_table=11 /codon_start=1 /translation="MKRILALIMAAMMVFCLAACGSTNDGGESSTGGDENKPSTITIQS MNGKKEYADLTVPYDPQRIAILDMPSLDIIDSLGLGDRVVGSAKVTIEYLTDYNPDDSN GKIANLGSVKTADLEQVAICEPDIIFIGGRLSASYDALSEIAPVVYLGVDYEKGVVQST ADNAKTIASIFGKEAEIDAKMSGFQTRINALNAVLKDKNILLAMYNNNAMSLMDTESQL NIMAKELGGKNLGETVGEVDKATHGEDASWETIINLNPEYIFVLDRSTATGAAEDGVLG AKEVIENDLIKQLDCYKDGKIVYFIEHANVWYTSTGGIQALDTMLADLEAALIK" /locus_tag="LOCUS_8440" /note="WP_002370087.1 siderophore ABC transporter substrate-binding protein (Enterococcus) [pid:30.4%, q_cov:99.1%, s_cov:99.1%, Eval:8.0e-39]" /note="MGA_1235" ORIGIN 1 agttgataag gcaatcgcct atatggagct tgaagagttc gaggaacgtt atattgacga 61 gttgtccggc ggtcagaggc aacgggcata tatcgcaatg gttatagccc aggatactga 121 ttacgttctg cttgatgaac cgaccaacaa tcttgatatt taccatgcat ccaatctgat 181 gcacatcgtt cgcagacttt gtgacgagct tggcaagacc gtcattctcg tactgcatga 241 gatcaactat gcggcattct attccgatta catttgcgct tttgtagacg gcaagatcgc 301 aaaattcggc acagtggatg aagtgatcac caaagaagcc ttgcacgaaa tttacaaggt 361 tgactttgag atcatccgta ttcacgacaa acccctgtcc gtctactatt aaatttgtta 421 ggtttaattc taaaaataaa ttcagaaaag gagcgtataa acctatgaaa agaattcttg 481 cacttattat ggcagctatg atggtattct gcctcgcagc ttgcggcagc accaatgacg 541 gtggcgagtc ctccactggc ggtgacgaaa acaagccttc caccatcacc attcaatcca 601 tgaacggcaa aaaggaatat gccgatctga ccgttcctta cgatcctcag agaatcgcga 661 tccttgatat gccttctctt gacatcatcg actccctggg cctcggtgac agagtcgttg 721 gcagcgcaaa ggttaccatt gagtacctga ctgattacaa tcccgacgat tctaacggta 781 aaatagctaa cctcggttcc gttaagactg ctgatcttga gcaggttgcg atttgcgagc 841 ctgacatcat cttcatcggc ggccgtctca gcgcttctta tgatgcactc agcgagatcg 901 cacctgttgt atatcttggt gtggattacg aaaagggtgt tgttcagagt accgctgaca 961 acgcaaagac catcgcctcc atcttcggta aggaagctga gatcgatgca aaaatgtccg 1021 gtttccagac aagaatcaat gctctgaacg ctgttctcaa ggacaagaac atccttctcg 1081 ctatgtataa caacaacgct atgagcctta tggataccga aagccagctc aacatcatgg 1141 caaaggagct gggtggtaag aacctcggcg aaactgtggg cgaagttgac aaggctaccc 1201 acggcgaaga tgcttcttgg gaaaccatca tcaacctcaa ccccgaatac atctttgttc 1261 ttgacagaag caccgcaacc ggtgccgctg aggatggtgt tcttggagca aaggaagtta 1321 tcgaaaatga cctcatcaag cagctcgatt gctataagga cggcaagatc gtttacttca 1381 tcgagcacgc aaatgtttgg tacacctcca ccggtggtat tcaggctctc gacactatgc 1441 tcgcagacct tgaagcagct ctgattaaat aatagggcaa aaggacaact gtaattggca 1501 ggcgggatta tataatctcg cctgcttttg ccaattagaa gatatggaga tataatatat 1561 gttaaagcat ctgtgcccct gctgtggacg gcattgctat ctcgatgagc ttcagtgcga 1621 aagaggtgtc gaatataaag aaacaggtgt gattccacct cgtaagcccc gtcctcacgg 1681 aaacggcgaa ggaa // LOCUS sequence332 1667 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence332 VERSION sequence332 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1667 /mol_type="genomic DNA" /organism="" /note="sequence332" misc_feature complement(612..>1667) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011088289.1:serine hydrolase domain-containing protein" /note="WP_011088289.1 serine hydrolase domain-containing protein (Bradyrhizobium diazoefficiens) [pid:33.9%, q_cov:93.4%, s_cov:76.8%, Eval:1.7e-39]" /note="MGA_1238" /locus_tag="LOCUS_8450" ORIGIN 1 agggtcacag attcagcctt gctgacaaac agaggcgcag aatttgaaca ggtgatgttc 61 acgccgttca agataagcac aacatcctca ccatcggctc gtacaacgat tctgccgtca 121 tcaaatgtgc ctgaaagctc atagataccg ccgcgaatga tctttaaaag atttccttca 181 agctttgcgc ccgaaccttc aacatttgcg gtcataccaa ggaatgttat cttggttgtg 241 cctgtttcgg cggtttcctg cacaggaatg gtgacgtcgg gcaggtccgc ctcggcgatc 301 aggtcctttt tggtggagtt gtcggtgcct tgaatattgt cacccacaat atctccgcct 361 aagttgcccg agtttttatc agcatccgaa ggctggagca ttaagaacaa aacgattacc 421 gcaacaacag caaccactgc caaaacggcg acaagcgctt tgagatccga tttctttttc 481 ttttttgcca tatatatttt ctcctttatt cgagggcgtt gaaatgtttt cgcaagttaa 541 ttatattacc ttaaaagggc ttggtcaatc gaaaaatcgg ccgactgaaa aatttcattt 601 tttcatcaca ttcagccaag cagattgcga taaactgtgt tgacaagctt tcttgtgagg 661 gcacaggtgc cgcaatcgac acgctgcata ccgattaaaa ttgtcatatt ttcctcgggg 721 caatttgcaa agtagcatcc gagccagcca tcccaaccat agtcaccttt gcgggcaaaa 781 tggagcacct gaccggggtc ggaaacattg cgcataaggt tgccgtagct atatcctgca 841 aggcttcgcc aatcgcggtt gagagattcc ttttgccacg gtgtcaggct tgcgcttgtg 901 agatacttcg cggctgtttc cgagagaatt cttgtgccgc cgagttctcc gccgttaaga 961 agcatctgag cgaatttcgc gtagtcgtcc aatgtcgaac aaaggccggc accgcccgat 1021 tcaaaggcgg gagctttgtc catattataa gtgataccga ggtgattagt aattacaggc 1081 tcgacacgcc aattggcata gtcggtctta tatacttttg caagacgacc gagcttttcg 1141 ggagcaacaa agaagcctgt atcggacatt cccaaaggct caaatatctc ttttttgagg 1201 aactcgccga atttcattcc cgaaacgcac tcgacaacat agcctaaaat atcggcagat 1261 gtgccataca tccacttgtc gccggggatg aagcaaaggt caaccttgcc catacgctcg 1321 ccgaattcgc gagtggtcat cggattatcg gaatataagc gctgatccat ttcccagaaa 1381 attccgccaa cctgctcgcc acttattcca ccgccgggat aaggcaggcc cgaagtcata 1441 ttgagaagat ctttaattga tatctgctga ggagatttga cacgctcacc acgctcgttg 1501 atataataag cctcggaaaa accagggata gtccaacaaa tgcaatcggc caaatcgagc 1561 atacccctat cagcaagaat cataacagcc gcggcagtta ttggctttga catcgagtat 1621 aggcgcataa ttgtatcacg gctgaagggc accttgtttt caaggtc // LOCUS sequence333 1662 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence333 VERSION sequence333 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1662 /mol_type="genomic DNA" /organism="" /note="sequence333" ORIGIN 1 accgcgcata ttaaacgaaa atcttccttg attatatccg cgcattttgg aatcttgagt 61 catcgcaaaa agctcgcgga tgtcgttgaa tacacctgtg taggttgcgg gatttgagcg 121 aggcgttctg ccaatcggcg actggtcaat gttgattatc ttatcaagat gttcaatgcc 181 ctcaatacgt ttgaacatac ccggacggat tctcgctcta ttgagcttgc aagcaagctc 241 tttatataag atctcgttga caagtgaaga ttttcccgag ccggacacgc ctgttataca 301 ggtaaaggtt ccgagaggaa tggacacatc aattgctttg aggttatttt cttgggcgcc 361 gatgatttta aggctctcgc cgttgccttt tctacgttcc ttaggcacag gaattgagcg 421 tttaccgctt aaatatgcac ctgtgatgga atcttcacag gccataatgt cctcaatcgt 481 tcctgcacag acgatattac cgccgtgtac acctgcgccg ggcccgacgt caacaatata 541 gtcagcagca agcattgtat cctcatcgtg ctcgacgact atcaaggtgt tgccaagatc 601 gcgtaagcgc ttgagagctt caatcaaacg gtcattatcg cgctgatgaa gaccgattga 661 aggctcatca agaatataca acacgcccat tagcattgaa ccgatctggg ttgcaaggcg 721 aattcgctgg ctttcgccgc ccgaaagagt tgagcttgag cgggaaaggg tcagataatc 781 taatccgaca ttctttagga agttaagacg cgccttgatt tcctttaaaa tttgggcgcc 841 gatcatcttt tcgcgctcgg taagctcaag cgaatcgaca aattcaagag cttcaattat 901 cgacatatga gtgaactcgg caatattctt gccgccgatt gttacagcaa gaatttcctt 961 tttaagtcgg ttaccgccgc aggtttcaca ctttacctcg ctcatatatt cttcgatctt 1021 tgcctttgtt gcatcgcttt cggaggactt atatctgcgt tcaaggttgt tgattacgcc 1081 ctcaaaggga gtgatccaat atccaccgcc gaattcatca ggacgcttga aggaaagttt 1141 ttgaccctgt gtgccataga ggaagatatc aagtgcatcc ttttccaagt ccttaacggg 1201 agtgtcaagc gagatgttat atgtttcagc aatggtgttg taatatatca tcgaaaagga 1261 gttgtcatca agcgtgttcc agccgtcagc gcggatagct ccctcacgta tcgacagttc 1321 atcattcggg ataaccagct ttggatcgac ttttttgaat acgcccaagc ctgtgcaatc 1381 gggacaagcg ccgaagggat tgttgaagga gaacattcgg ggcgaaagct cttcaattga 1441 aactccgtgg tcagggcaag cgtaattttg cgagaacaaa agctcttctc cgccaatgac 1501 atcaacgccg acaagcccgc ccgagaggga tgttacaacc tcgatactgt cgctgagtcg 1561 ggaacggatt tccggcttga caacaagacg gtcaacgatg atctcaatgg tatgcttttt 1621 gtttttttcc attgttatct tttcggacag atcgtacact at // LOCUS sequence334 1650 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence334 VERSION sequence334 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1650 /mol_type="genomic DNA" /organism="" /note="sequence334" ORIGIN 1 ataccgacag cttcaccgac ggatacaacg gttgaatgtg caagatccat accgtagcac 61 ttagcgcaga cgcctctctt agtcttacag ccaagaacag agcggatagc gattctatcc 121 ttgccctgag cttcgagggt ctcaataacc ttcttggcat cagcagcatt catcagcttg 181 ttgttggaaa caacaacttc gccgttgtca ttcaaaagat cctcaaccaa gaatcggccg 241 acgagtcttt cagagaaggg ctcgatcatt tcgttgccgt tcttaatttc gaatacgtcg 301 ataccctcgt gagttccgca gtcgtcctcg gtgataataa cttcctgagc aacgtcaaca 361 agacggcggg taagatatcc cgagtcagcg gtacgcaaag cggtatcggt aagaccctta 421 cgagcaccac gggaagaaat gaagtattcc aaaactgtca agccttcacg gtagttagca 481 cgaatgggca tttcgatggt ggcaccggag gtgttggcga taagtccgcg catacctgca 541 agctgacgga tctgagcgat agatccacgg gcaccggagt cagacatcat ataaatgggg 601 ttatatttat cgaggttttc ctgcaaagca acggtaacat cgtcggttgc cttggaccag 661 atctcgatga acttcttgga cttttctcct ctggagatta gacctctctt atactgggcg 721 tcgatcttgt cgatcttctt gtcagcatca gccaaaattt ccttcttctt cggaggaact 781 tcagcatcgc ataccgcaac ggtaattgca gcacgggttg agaacttgaa gcccaaagcc 841 tttacagcgt ccaatacttc actggtcttg gtggtgccgt gcttagcaat acatctttcg 901 atgatgttgc cgagctgctt cttctttacc aagaagccga tttcaaggtc gaactgcttg 961 tcaggatcgg ttctgtcaac aaagccgagg tcctgaggaa tattctcgtt gaagataagg 1021 cggccgacgg ttgcgtcaat aaccttggaa acggtattgt cgccgacagt cttggacatt 1081 cttaccttga tcttagcctg caagctaaca acgcctgcct gataagccat catagcttcg 1141 ttaacgtcgc ggaagacctt gccttcgccc ttttcgccat ccttttcaag ggtcagatag 1201 tatgaaccca agaccatgtc ctgtgtaggt acagcaacag gcttaccgtc agcaggcttg 1261 aggaggttgt tggctgcaag catcaaatat cttgcttctg cctgtgcttc aacgctcaaa 1321 ggaacgtgaa cagacatctg gtcgccgtcg aagtcggcgt tatatgctgt acataccaag 1381 gggtggagct ttaatgctct gccttcaaca agaacaggct cgaatgcctg aataccgagt 1441 ctatgaagag tcggagcacg gttgagcaaa acagggtgac cctgaatcac attttcaaga 1501 gcatcccaaa cctcgtcacg tccgcggtca accatctttc ttgcgctctt gatgttgatc 1561 tggggattgg tgtcaacaag gcgcttcatt acgaaaggct tgaagagctc aagtgccatt 1621 tccttaggca aaccgcactg gtacattttg // LOCUS sequence335 1634 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence335 VERSION sequence335 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1634 /mol_type="genomic DNA" /organism="" /note="sequence335" CDS 489..896 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNVIELTRELGKALQQDERYIAYHAAKLANDNDADLQNLIGDFNM KRMQLNNLMSKADKDTDKINELNNELRLVYGKIMGNENMVAYNKAKADVDDVLDQINNI ITASANGEDTETCPAVAHKCSGSCSTCGGCH" /locus_tag="LOCUS_8460" /note="MGA_1242" ORIGIN 1 cgttatatgt aaatccttcc ggagaatcca ttacaccctg agaaacccaa aatgcaacag 61 cctggtttac catatcggcg ctaaggcctg tcttttccat cacatattcc gaatccatac 121 tttcatcatc ggaattcaaa agacataata gcaccttcaa ggcggcttca tttgcaagct 181 tcaaatattt atcaaccaaa gcgcagggaa tagggaagtg tcttttccat tttgatgaat 241 caattttaag cttcaaaatc gtcgcctcct ttttgtgatg taaagagatt atatcacaaa 301 attttttgtt tttcaatctt tttgcagatt attgttattt agcgggagat agatttgttt 361 tttgcaaata atcacaatct ttggtgtaac aagtacttgt aatttacaat gttttgtggt 421 atattaatac taattattga tgtgatattt tgcattgata aaaataattt tacaggagat 481 aacgatatat gaacgtaatc gaacttacca gagagctcgg caaggctctg cagcaggatg 541 aaagatacat tgcataccac gctgctaagc ttgctaatga caatgatgct gaccttcaga 601 acctcatcgg tgacttcaac atgaagagaa tgcagctcaa caaccttatg tccaaggctg 661 ataaagacac cgacaagatc aacgaactca acaacgagct cagacttgta tacggcaaga 721 tcatgggcaa cgaaaatatg gttgcataca acaaggcaaa ggctgatgtt gacgacgttc 781 tcgatcagat caacaacatc atcaccgctt ctgcaaacgg cgaagacacc gaaacctgtc 841 ctgcagttgc acataagtgc tccggaagct gctcgacctg cggcggctgt cactaattcg 901 cattaactaa aacgatacgg agtgagagta atggctcttt tattggaatc aattgatatg 961 tcaaagcttt ctgccggtat gaggcagtat gttgagctca agctcgacca tcttgacagc 1021 atagttttct tccgtctggg agacttttat gaaatgtttt ttgacgatgc tattttggcg 1081 tcctccatac ttgaccttac tctcacaggc aaagactgcg ggcttgagag tcgtgcgccc 1141 atgtgcggtg tgcctcatca cgcctgcgat gtctatgtca aaaaacttat cgaagcggga 1201 cagagtgttg tcatctgtga acagatggaa gaccctgcca ccgctaaggg catcgttaag 1261 cgcgatgttg taagaattat cactccgggc actcttattg aaagtactat gcttgacgag 1321 agcaaaaaca actggctctg ctcaatttat ctttacgata aagagggctc tctttgcttt 1381 gcagatatgt ccacaggtga agcccacatg tttaaggttt cgggcaaaaa tattgaaact 1441 gagatcatta acaagctttc ccgcttttct cctgttgaga tacttgcaaa tcattccttc 1501 aaccgtatgg aggaagttgc ttggtttgtt cgtgataagc tcggcgcatc cgtgcgaatt 1561 ctcgaggaac gtgactttag catcgaaaag aatattgaag ctatgctcac tcagttttca 1621 gcttcggcga tcga // LOCUS sequence336 1632 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence336 VERSION sequence336 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1632 /mol_type="genomic DNA" /organism="" /note="sequence336" misc_feature <1..975 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003417090.1:trigger factor" /note="WP_003417090.1 trigger factor (Clostridioides difficile) [pid:44.4%, q_cov:96.3%, s_cov:73.6%, Eval:1.4e-77, partial hit]" /note="MGA_1244" /locus_tag="LOCUS_8470" CDS 1026..1610 /product="ATP-dependent Clp endopeptidase proteolytic subunit ClpP" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357557.1" /transl_table=11 /codon_start=1 /translation="MALVPNVIENTCHGERFYDIFSRLLNDRIIVLSDEVNDATASIVV AQLLFLESQDSEKDIYLYINSPGGSITAGMAIYDTMQYVKCDVSTICVGMAASMGAVLL AGGAKGKRIALPHSEVMIHQPLIGGGLSGQCTDIKIHSDHMVRTREKLNKILAHDTGKT IEEIELATERDNYMTAEEAVEFGLIDKVIER" /locus_tag="LOCUS_8480" /gene="clpP" /EC_number="3.4.21.92" /note="WP_003357557.1 ATP-dependent Clp endopeptidase proteolytic subunit ClpP (Clostridium) [pid:68.0%, q_cov:100.0%, s_cov:99.0%, Eval:2.1e-70]" /note="MGA_1245" ORIGIN 1 acaggtgtta agttcaaggg cgtattcatc accaagcctg tagttgaaat taaggactac 61 aagggtataa aggttgcaaa gactgtcaat gatgtaacca acgaaatggt tgaccacgaa 121 atcagccata tgcttgaaag aaactccaga accgtcaatg ttgatgacag agcttgcgaa 181 ctcggcgacg atgttgttat cgactttgaa ggcttcaagg acgatgttgc atttgaaggc 241 ggcaaggctg aaaaatttaa cttgaagctt ggttccggcc agttcattcc cggctttgag 301 gatcaggttt ctggacataa aatctgcgat gattttgata ttaacgtaaa attccaagaa 361 aactacaagg ctgaagagct tgcgggtgca cctgtagtat tcaagatcaa gctccacgag 421 atcaagaaga ctgaacttcc tgagcttgat gatgatttcg ttaaggatac caccgagttt 481 gaaactgttg acgagctcaa gtctgacgtt aagaagcacc ttgaagaaga tgctaacaag 541 agagctgatg ctgaagttga aggcaagatc tttgacgcag taatcgaaaa gctcgaaggt 601 gaaattcccc agatcatgtt cgataacaag gttaacgata tggttgaaga tctcaaccag 661 cgtcttgcac agcagggtct tacccttgaa atgtatatgc agttcaccgg tcttaccatt 721 gaatccgtaa aggaaaccta taaggaacag gccgagaagc aggttaagct ccgcctcgct 781 cttgaaaaga tcgcagagct cgaaagcatt gttgcaacgg aagaggatat tgaaaaggaa 841 ttcgaagcaa tttctgctgc atacaatatg cctgttgaaa ctgttaaaca gtacatccag 901 cctgaaaacc tcaagcttga tgttgaagtc ggcaaggctg ctgacctcgt aaaggctgaa 961 gcagttgttg aataatttaa accgcaatca aaccgccata ttttaaagaa acggaggacc 1021 gacaaatggc acttgtacca aatgtaattg agaacacatg ccacggcgag agattttatg 1081 acattttctc ccgacttctt aacgacagaa ttatcgtttt gtccgatgag gtaaacgatg 1141 caactgcaag cattgttgtt gctcagcttt tgttccttga aagtcaggat tctgaaaaag 1201 atatctatct ttacatcaac agccccggag gttcgatcac cgcaggtatg gcgatctacg 1261 atacgatgca gtatgtcaag tgcgatgttt cgaccatctg cgtaggtatg gcggcgtcga 1321 tgggtgcagt tttgcttgcg ggcggtgcaa agggcaagag aattgccttg cctcacagcg 1381 aagtaatgat ccaccagcct cttatcggcg gcggactctc gggacagtgt actgacatca 1441 agatccactc tgaccatatg gttcgtaccc gtgaaaagct caacaagatt cttgcccatg 1501 acacaggcaa gaccatcgaa gaaattgagc ttgcaaccga gcgcgataac tatatgacag 1561 ctgaagaagc tgttgagttc ggccttattg ataaggtcat cgaaagataa aaatttttga 1621 gtctgttgct gg // LOCUS sequence337 1627 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence337 VERSION sequence337 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1627 /mol_type="genomic DNA" /organism="" /note="sequence337" misc_feature <1..937 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_176742130.1:glycoside hydrolase family 9 protein" /note="WP_176742130.1 glycoside hydrolase family 9 protein (Amycolatopsis mediterranei) [pid:31.3%, q_cov:98.1%, s_cov:32.3%, Eval:3.1e-34, partial hit]" /note="MGA_1246" /locus_tag="LOCUS_8490" CDS 948..1571 /product="endonuclease III" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964008.1" /transl_table=11 /codon_start=1 /translation="MNKVDFIIGELEKLYPEAQCSLEYVKPYELLIATRLSAQCTDARV NIVTKVLFAKFPTLEAFAEADVAEIEEIVKPCGLFRTKAKSISELTKMLISDFGGEVPN TLEKLTSLPGIGRKTANLIMGDVYHQPAVVADTHCIRISNRLGLASSKDPYKVELQLKE ILPPERSNDFCHRLVNFGRDVCTARSPKCGECPLRDVCKDKQEK" /locus_tag="LOCUS_8500" /gene="nth" /note="WP_010964008.1 endonuclease III (Clostridium) [pid:47.2%, q_cov:96.1%, s_cov:94.3%, Eval:6.0e-50]" /note="MGA_1247" ORIGIN 1 cgactttgta atgcccgagg atgaccttcc tcagatgttc gttctgcctg tttcgacaat 61 ggcaacggcg gacttagcgg cagtttgcgc ccttgcaagc acgatttata gaaaatttga 121 ccccgaattt gccgacagac ttataaatgc cgcaattaaa acaggggagt ggcttgaggc 181 gaaccccgaa ttcatcggat ttaacaaccc cgaaggctgc ggcacgggtg gatacggcga 241 atggaacgac agggataacc gattctgggc ttggtccgag ttatatcttg caacgggaaa 301 tgaaaaatat cacacattga tgaagaatgc cattgacgag aaattcccct tgaccgctct 361 cggcgtggga atggtgacgg gacttggcac gttgtcatat attttgagtg acagagcgga 421 taaagatctc aagttggttg aaaaattcaa gcaggcgttt gttgcgtctg cggagcattt 481 ggcaaaggtg tccgacaatt gcggatacgg tgtggcgatg gatgagaaaa gctacggctg 541 gggaagcaat atgggcgttg gcaaaaacgg aatgatcttt gccattgcag attattgcga 601 gaatggctca cgcttcaaag aatatgccca taaacagctt gatttccttt tgggcgtcaa 661 cgcaacggga tatagtatgg ttacaggcgc gggtgaattt tgcattaact atccccatct 721 tcgccctgca tatgccgacg gcattgaaaa gtgtatgccg ggttatgtca gcggcggacc 781 gaacagtcac cgtcaggatg ccgacgcaag aaggctgatt cccgagggta cgccgccgat 841 gaaatgcttc attgacgagg ttggaagcta ttccatcaac gagatcacaa tttattggaa 901 ctcgcccctg gtgtttatgc tcggatattt aaactgaagg aagaactatg aataaagttg 961 attttataat cggtgagctt gaaaagcttt atcccgaggc gcaatgctcg cttgaatatg 1021 tcaagccgta tgagctttta attgcaacac gactatcggc acaatgcacc gatgcgcggg 1081 tgaacattgt gacaaaagtg ctgtttgcta agtttcccac ccttgaggca tttgccgagg 1141 cagatgtcgc agagattgaa gaaattgtca agccctgcgg acttttcaga acaaaggcaa 1201 agagtatcag tgagctgaca aaaatgctga taagcgattt cggcggagag gtgccgaaca 1261 cccttgaaaa gctgacctcg cttccgggga tcggcagaaa gaccgcaaat ctcatcatgg 1321 gggatgttta tcatcagcct gcggttgttg cggatacaca ttgcataaga atttccaacc 1381 gtttgggctt ggcaagctcg aaagaccctt ataaggttga attgcaactc aaagagatcc 1441 tgccgccaga aagatccaac gatttttgcc accggctggt gaatttcggc agagatgttt 1501 gcacggcgag aagcccaaag tgtggcgagt gcccgctgag ggatgtttgc aaggataagc 1561 aggaaaaata gtcacaaaaa gcggaacgct cgcgggagcg ctccgctttt ttcggcgcca 1621 ccgctcg // LOCUS sequence338 1626 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence338 VERSION sequence338 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1626 /mol_type="genomic DNA" /organism="" /note="sequence338" misc_feature <1..909 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_008764094.1:glutamine-hydrolyzing GMP synthase" /note="WP_008764094.1 glutamine-hydrolyzing GMP synthase (Bacteroides) [pid:70.0%, q_cov:100.0%, s_cov:69.9%, Eval:3.3e-118, partial hit]" /note="MGA_1248" /locus_tag="LOCUS_8510" ORIGIN 1 gagaatgtcc gtgcgcaggt cggcaacaaa aaggttttgc tcgctctttc cggcggtgtt 61 gattccagcg ttgtagctgc attgctcatt aaagcgatcg gcgaccagct tgtatgtgta 121 cacgttaacc acggacttat gagaaaaggc gagagccagc aggttatcga catctttaga 181 gataatatgg gtatgggcga caaccttatc tatattgatg ctaccgacag attcttggat 241 aaattggcag gcgtttcagc acccgaaacc aagagaaaga tcatcggcgg cgagtttata 301 agagtatttg aagaagaagc aagaaagctc accgatgttt ccttcctcgc tcagggcacc 361 atttatcccg atattttgga atcggacggc gttaaagcac accacaatgt cggcggcttg 421 ccggaagata tcaagtttga aggcttggtt gagcctgtaa agcttcttta taaggatgaa 481 gtccgcgttg tcggcgaggc tttgggcctt cctcactcaa tggtataccg tcagcccttc 541 ccgggtcccg gattgggcgt aagatgcttg ggtgcgatca cccgcgaccg acttgaagca 601 ctcagagaag cagatgcaat tttgcgcgaa gaattcgaca agagcggcct tgccgaaaga 661 gtatggcagt atttcatcgc tgttcccgac ttaaagagtg tcggtgtcag agacggcaag 721 agatatgaag gctggcctgc aatcatccgc gcgatcaaca caaccgacgc catgaccgca 781 accatcgagg aaattcctta tgagttgttg caccacatta ccgcccgtat cacccacgag 841 gttgaaggaa tcaaccgcgt gcttctcgac ctcacaccca agccgatcgg cactatcgag 901 tgggaataat aagcgttgta aaagcctctt gtatccaagg ggctttttac gcataaaaaa 961 gaggaataac tatgggatta tttgataaaa ttaaaaatgc tatttggggt tcatcaaaca 1021 ataatcaggt cggatatcag cgaccacaaa gatcaaatta tattccgact tatcatattg 1081 aggattggca gcctaaatta aaatatcccg aatatgataa gctgttttca ctgcaaaagt 1141 atttggaaag tatagatttg cctaaaaata taatcagtca aataatcgaa tcaaaaaatg 1201 tgtttggcga agcaaaaaga attattacac acgtcacaga acaagtccca ctttctgaaa 1261 tgtgctatca cgagactgta cgtatagaga aatggataaa acttatggct ttgtgggagt 1321 ctccgtctga atatattttt gaaaatacat ttaagtatat tcttcttcga ctaagttgga 1381 tgtgtcattg ggatatgtta caacaaaaag cattaaacga ttgtgggctt aatgatattt 1441 tagatgcttg caaacaaaat gattataaaa aagttgttag ttatttcgat aatgatatat 1501 tatcttgctt tgcattatca catttaaaga gcaagaaatc tcttgtggaa gctgttagta 1561 taggatttga ttttttggaa atgaacacaa cacacaatgg ttcagcacac ggcagttttt 1621 ataatc // LOCUS sequence339 1623 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence339 VERSION sequence339 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1623 /mol_type="genomic DNA" /organism="" /note="sequence339" misc_feature <1..1146 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011986883.1:translational GTPase TypA" /note="WP_011986883.1 translational GTPase TypA (Clostridium botulinum) [pid:58.4%, q_cov:100.0%, s_cov:62.5%, Eval:1.4e-122, partial hit]" /note="MGA_1249" /locus_tag="LOCUS_8520" CDS 1164..1562 /product="thioesterase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002261952.1" /transl_table=11 /codon_start=1 /translation="MKDIIIGTEFVCSTIVTGSNTAVAVGSGEAEVYATPMMIALMENA AYLCLKPFLDEEESSVGIHMSSTHESATPIGVAVSALAKITAVEGKIVTFEVTASDAFG VIGKGEHKRAVINSQRFIDKARKKLSVL" /locus_tag="LOCUS_8530" /note="WP_002261952.1 thioesterase family protein (Streptococcus mutans) [pid:41.2%, q_cov:84.8%, s_cov:93.3%, Eval:9.0e-15]" /note="MGA_1250" ORIGIN 1 aagatcgagc gcggctcggt caaggtcaac caggaagtta tgatcggcga ctatcatcac 61 accaaaaagg aatatcgcgg aaagatagtt accctttatc agatttcggg acttgagcgc 121 acacccgtag agaccgccac tgttggcgat atcgtctgca tcagcggtat tgagaatatc 181 accatcggcg acaccatctg cgactttgcg aactatgaac cgctcccgtt tgttaaaatc 241 agcgagccta cagttgaaat gaccttctcg gtcaacgact ctccctttgc aggacgcgag 301 ggcaagtttg taacaagccg ccatcttcgc gaccgcttga tgaaggagct tttgaaggac 361 gtttccctgc gtgtcagcga aacggacacc accgactcct tcaaggttgc aggcagaggc 421 gagatgcacc tttctatcct cattgaaaat atgcgccgcg agggatatga gcttgcagtt 481 tccaccccca gagtgctcta taaggagatt gacggcattc tgtgcgagcc aattgaggag 541 cttgttgtcg atgttcccga cacctgttca ggctcggtaa ttgaaaaaat gggcaagcgc 601 aaggcagata tgatctctat ggaccctgtc ggctcacgta tgagaattaa gttcttggtt 661 ccttcgcgcg gtcttttcgg atatagaaac gaattcctta ccgacacaaa gggcgagggc 721 attatgagct ctgtattcca cggttattca ccctataagg gagatattcc cagacgttct 781 cagggctctt tggttgcatt tgaaacgggc gaggctgtaa catatggtct ttataacgcc 841 caggagcgcg gaagcctctt catcggtgca ggtgtgcctg tatatgaggg tatgatcgtc 901 ggcgtatcgc ccaagacgga tgacttggtt gtaaacgtgt gcaagaaaaa gcacctcacc 961 aacacccgtg ccagcggctc ggatgatgcg ttaagactca ttcccccgag aattttaagc 1021 cttgaggact cacttgaatt catcgcggac gacgaactgg ttgaggtcac acccaagaac 1081 attcgtctca gaaaaagaac actttcaaac actcagcgcg ccaaggacaa tgcaaagctg 1141 aaataaaact aacggagaga aaaatgaagg acattataat tggaacggag tttgtttgca 1201 gcaccattgt caccggctcc aacaccgcag ttgccgtcgg aagcggcgag gctgaggtat 1261 atgcaacacc aatgatgatc gcgctgatgg aaaacgcggc ttatctttgc ctcaaaccat 1321 ttttggatga ggaagaaagc tcggtcggaa ttcacatgag ctccacgcac gaaagtgcaa 1381 cgccaatcgg cgtggcggtt tccgctctgg caaagatcac agcagttgag ggcaaaattg 1441 tcacctttga agtgaccgcg tcggatgcct ttggcgtcat cggcaagggc gagcataagc 1501 gcgctgtgat aaattcgcag agatttatcg acaaggcgcg caagaaactg tcggtattat 1561 aaaaagcaaa acgcaggtgc attagcatct gcgttttttt gtgagaccct ccttggggag 1621 ggg // LOCUS sequence340 1612 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence340 VERSION sequence340 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1612 /mol_type="genomic DNA" /organism="" /note="sequence340" misc_feature <1..1522 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011861457.1:heavy metal translocating P-type ATPase" /note="WP_011861457.1 heavy metal translocating P-type ATPase (Clostridioides difficile) [pid:48.8%, q_cov:99.6%, s_cov:61.0%, Eval:7.1e-136, partial hit]" /note="MGA_1251" /locus_tag="LOCUS_8540" ORIGIN 1 cgtaacggtc atccgcaacg gcgaggagaa ggagattccc gtctgcgata ttttagaggg 61 cgatgttgta gccgttcgac cgggcgaaag cttttcatgc gacggtttga ttctttcggg 121 cgccacaagt gccgacgaat cgatgctcac gggagaaagc ctgcctgtag ataaagacga 181 aggagacttt gtctatgcag gaacaataaa tctcaacgga tatgtcacta tgcgcgcatc 241 caaggtcggt gcggatacat ctttgtcaaa gataatcaag atggtcgagg atgcttccgg 301 ctccaaagcg ccgattgccc gccttgcgga caaggttgcc ggcgtttttg tcagttgtgt 361 aatggtgctt gccgttgcag ttttcttaat ttggctgctt gcaaccagaa attttgaact 421 tgcgctcaaa atctttgtca gcgtaatggt aattgcttgc ccttgtgcat taggccttgc 481 caccccgaca gcgataatcg ttgccgcggg caggggagca tcagacggac ttcttttcaa 541 aaacgctgaa gcccttgaaa tatgcaataa gataaacacc gttgtgttgg ataaaacggg 601 cactgtgacc gtcggcaagc cttttgtgac ggatatcatt cccatttctg aggacgaaaa 661 agccattgtg tctttggcgg catcccttga atcaaaatcc ggccacccca ttgccaatgc 721 tgtgatcgaa tatgcttcgc tcaacgagat agcatatccc gagtgtgaaa actttgaaaa 781 catttcaggc ttcggtctgc gcggcatcat cgacggcaag gatattatca tcggcaagcc 841 ggaaattatc cttgataagc tgacctcgga catcacgctt aaatgcaacg cccttgctga 901 cgagggcaaa actctgtcgg tggtcatctg tgatgatgag cctgtcggcg tgattgcgtt 961 tgccgataag cttaaaccca ccagcgccga agcgatcaaa tcgctgaaca aatcgggcat 1021 cagaacaatt ttgttgacag gtgataatgc ccgcgctgcg aaaaaggttg ctcacgagct 1081 tgaagtatac gactatgttg caaatgtcac ccccgacaaa aaagcggaga tgattgaaaa 1141 acttaaatat ggcggacgag ttgttgcaat ggtaggcgac ggcattaacg atgcagttgc 1201 cctcactacc gcagatgttg gcattgcaat tggcgcgggc tcggacattg caatcgagag 1261 cgcacaggtg gtgttggtgc gaaatgacct tcgcgatgta gcacgcgcaa tcgcactttc 1321 gggtgcaaca atgaaaacaa ttaaaatgaa tctcttctgg gcatttgcat ataataccct 1381 gatgattccc attgccgcag gacttttgca cgcgttcggc ggcccccttt tgaacccgat 1441 gatcgccgcg gcctgtatgt cgctgtcgtc catcactgtt gtaaccaatg ctttgcgctt 1501 gaagacgaag aagtattact gataagatga aaaatccacc ctttctggtg gattttttgc 1561 ggccgccccg aaattcgcac taccttgcaa accgcgctta aaagtgttat aa // LOCUS sequence341 1603 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence341 VERSION sequence341 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1603 /mol_type="genomic DNA" /organism="" /note="sequence341" ORIGIN 1 cgaccctgca agcaaattgc ctgaaatgaa aaacgaagtg ttggcgcagg tgtttattga 61 taagctggca aattaagata gtatcgaatt tttatatagt cacctcggaa cagccgtgta 121 cccacagggg tatgcggttg tttcatttat acgaaaaaat ccacaaaaaa tataaataat 181 tggtttttgg cattgaaaaa tgtatcatag aatgataaaa tgtttataag aaatgtgtcc 241 tgccaaattt ggaaaaattg gttcacggga atgtttcgaa gatatacagc catgtatata 301 taaaggcaaa aatctgtaaa ttgatccgta aggagggtaa aattatgagc aagaaatttg 361 aacccagctt tgaatcgttg catgagtatg ttgttcccga atggttccgc gatgcaaagt 421 tcggcatttg gagtcactgg ggacctcaga gtgtcccgat gttcggtgac tggtatgcaa 481 gaaatatgta cattgaagga agctcgcagt atgaatacca tctgcgccat tacggaaatc 541 cttccaagtt cggctataag gacctttgca acctttggaa ggctgaaaac ttcgatcccg 601 aaggattgat ggagaaatat tataaggcag gcgcccgtta ctttatgtcg cagggcaccc 661 accacgatca cttctttaac tatgactcaa agtttaaccg tatgaacagc gttaacgttg 721 gcccccacaa ggatattctt gcaatgtgga aggctgctgc cgacaagttt ggcatgcctt 781 tcggaatcag tgaacacttg ggtgcatcct tcagctggtg gagagttaac aagggttgcg 841 acaagaaggg cccttatgca ggcgtgcctt atgacggaaa tgaccctgaa tatcaggact 901 tctactatgc aaatcaggag catggcaccg atgatcccta caactgcttc ccttggtata 961 cagaaaacga agagtttaag gaatattgga agaagtgcat cggcgaaatg attgaaaagt 1021 tccagcccga gcttttatat actgacggtt cactcccctt cggcactcat tgggcaggcg 1081 gagacaacat cagcggcgaa aactcttatc agcagggcct tgatattgtc gcacagcttt 1141 acaatgcctc cattgaaaag cacggctcaa atgaagcggt atatctccag aaggatcgca 1201 gacccgagat ttataatgtg ggtgtattgg atattgaaaa gagccaactc cccggcatta 1261 tgcctgcacc ttggcacact gacacctgca tcggcaactg gttctatgat gttcactctc 1321 cttataagga gccggatcag atcatcgaga tgctcgttga catcatctcc aaaaacggcg 1381 taatgctcct taatattctc cagcgtccag acggcaccat agacgaatat gccgactata 1441 ttctcgacaa gatcggcgag tggtttgctg tttgcagtga ggctgtatac cgcacacgtc 1501 cttggagagt attcggcgaa ggcgatacat tcgttaagat cgaaggcttc agagaagata 1561 agaccgattg gaacgcaact gacttcagat ttgttcagaa gga // LOCUS sequence342 1594 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence342 VERSION sequence342 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1594 /mol_type="genomic DNA" /organism="" /note="sequence342" CDS 78..1586 /product="phosphoglucomutase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004454621.1" /transl_table=11 /codon_start=1 /translation="MDYSKLCNESDIRGIALEGIEGQHVNLTETVCRDIGRGFTLWLTE RTGKKANELRVAIGRDSRISGPDMVKWLSEAMAEAGLNVTDMGMASTPAMFMTTKTDGF MFDASVMVTASHLPFNRNGYKFFTPEGGLESRDIKTILAYAESDKTTGEDKGTIVKGEF MDVYSKRLADMIRASAGSERPLEGLRIVVDAGNGAGGFYAEKVLKPLGANTDGSRYLEP DGSFPNHIPNPENKEAMESIKEAVAETGADLGVIFDTDVDRAGAVLPDGSELNRNRLIA ILSAILLREHPGTTIVTDSVTSSGLAKFIAEKGGIHRRFKRGYKNVINESIRLNNEGID SQLAIETSGHGAFKENYFLDDGAYIVTRLIIELSRARKEGYTLASLIDTLEEPKESIEF RMNILLDDFKPYGKKVIEELTEYASGCKGWALADDNHEGVRVNLDKEHGDGWFLLRLSL HEPLMPLNIESNTVGGAKIIAGEIAMFIERCDKLDSVKLVDFAK" /locus_tag="LOCUS_8550" /note="WP_004454621.1 phosphoglucomutase (Clostridioides difficile) [pid:52.9%, q_cov:97.4%, s_cov:98.8%, Eval:2.0e-143]" /note="MGA_1254" ORIGIN 1 acactttcca cttgaataaa aactaacaac gtgctattat aaataaggaa acattataac 61 aatttggagg cacatttatg gattattcaa agctttgcaa cgaaagtgac atcagaggta 121 tcgcgctgga aggtattgaa ggtcagcacg ttaatctgac cgagactgtc tgccgtgaca 181 tcggcagagg ttttaccctt tggctgaccg agcgaacagg caaaaaggca aatgagcttc 241 gagttgcaat cggaagagat tcgagaattt cgggacccga tatggtcaag tggctaagcg 301 aagcgatggc cgaggcgggg cttaatgtca ccgatatggg aatggcgagc acacccgcta 361 tgtttatgac caccaagacg gacggattta tgtttgatgc gtcggttatg gtcacagcaa 421 gccacctgcc cttcaacaga aacggatata agttcttcac tcccgagggc ggtctggaat 481 cacgggatat caagaccatt ttggcatatg ccgaaagcga taagactacg ggcgaagaca 541 aggggacgat cgttaagggc gagtttatgg atgtttactc aaaacgcctt gcagatatga 601 taagagcatc ggcgggaagc gaaagaccct tggagggact ccgaatcgtt gttgatgcag 661 gaaacggcgc aggcggattt tatgccgaaa aggttttgaa gcctttgggg gcaaacaccg 721 atggctcacg ttatcttgaa cccgacggaa gcttccccaa ccacattccc aaccccgaaa 781 acaaggaagc aatggaatcg attaaggaag cggttgccga aacaggtgcc gatttgggcg 841 ttatttttga tacggacgtt gaccgcgcag gcgcggtttt gcccgacgga agcgagctta 901 accgcaacag actgattgcg attttgtctg cgattttgtt gcgtgagcac cccggaacaa 961 cgatcgtcac cgactcggtc acatcgtcgg gtctggctaa gtttatcgca gaaaagggcg 1021 gaattcaccg cagattcaaa cgcggatata aaaacgtcat caacgagtcg atccgtttga 1081 acaacgaggg aattgattcg cagcttgcaa ttgaaacctc gggacacgga gcgtttaagg 1141 agaactactt ccttgatgac ggcgcatata tcgttacaag gctgataatt gagctaagcc 1201 gtgcgagaaa agagggttat acccttgcat cgctgattga tactcttgag gagccgaagg 1261 aaagcattga gttcagaatg aatattttgc ttgatgactt caagccttac ggcaaaaagg 1321 tgatcgaaga gctgacagaa tatgcaagcg gctgtaaagg ctgggcactt gcagatgata 1381 atcacgaggg tgtgagagtg aatttggata aggagcacgg cgacggatgg ttcttgctca 1441 gattatcgct tcacgaaccg cttatgccgc ttaatatcga gagcaacacg gttggcgggg 1501 cgaagataat tgcgggagag attgcgatgt tcattgagag gtgcgataag ctcgattctg 1561 tcaagctggt tgactttgca aagtaatata atac // LOCUS sequence343 1590 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence343 VERSION sequence343 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1590 /mol_type="genomic DNA" /organism="" /note="sequence343" CDS complement(342..1475) /product="nucleotidyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861133.1" /transl_table=11 /codon_start=1 /translation="MKIAGIIAEYNPFHNGHAYQIRSTREAGATHIVCVMSGNCVQRGD IAITDKHFRARTAVKNGADLVIELPMPYSLGTAPDFARTGVNILDRLGCVNMLSFGSEC GDVNKLIFAANAIDLLSDKDIKQKMSEGMTYPSVIALLVGDDCSEILNGANNTLAIEYI RALRGTNIEPFTVKRTSAHDSPEAIGEFTSASHIRELLLSGDDALRFMPEAIPAQMISS VKRVEEAILYRLAMMTKGDFADVPYDDGLETRLYDASRTAITLEALYDSVKTKNITHAR VRRAVMLAAVGVQKSDLCAIPYARVLAMNDRGAEILALCKKTATIPISASLAELSKLND VAARFATLDERSSRLRALATAEREQLSEFSRKFEIVT" /locus_tag="LOCUS_8560" /note="WP_011861133.1 nucleotidyltransferase (Clostridioides difficile) [pid:32.7%, q_cov:89.1%, s_cov:88.7%, Eval:2.8e-43]" /note="MGA_1255" ORIGIN 1 caattacaga ctcatcgtcc atattgagaa gctgatactt caaagaagag cttcccgcat 61 ttactactaa taccaaattc agaataattg cctcctgatg taaataataa gtaaaaaatg 121 actataaaat tatacactct cggcgtggaa aaatcaagcc ttgagcggga gtttggcgac 181 ttttttgagc acttaccgcc gaaagacgat gggagtgaga ggcgaagcct gcccgaaatg 241 ccccgacggg acatttcggg cacattaaaa cgcctgtcgg ggtgatcccg tcaggcgttt 301 tgatgcactc gcgcgacgcg cgagttgggc ttcgcgtgcc gctatgtcac gatttcaaac 361 tttcttgaaa attccgacag ttgttccctt tcggcggtgg caagagcgcg caaacgggat 421 gaacgctcat cgagcgtggc aaagcgcgcc gccacatcat ttagctttga aagctcagca 481 agcgatgccg atatgggaat tgtcgccgtt tttttgcaaa gcgctaagat ttctgcgccg 541 cgatcattca tcgcaaggac acgtgcgtat ggaatggcgc aaaggtcaga tttttgaaca 601 cccactgccg ccagcattac agcacggcga actctggcat gggtgatatt tttggtttta 661 acgctatcat ataaagcttc aagggttatt gctgtgcggg atgcatcgta tagccttgtt 721 tcaagtccgt cgtcataggg tacatctgca aagtcgccct ttgtcatcat tgcaaggcgg 781 taaagtatcg cctcttcaac ccttttgacg gaggatatca tttgggcagg aatcgcttcg 841 ggcataaacc gcaaagcatc atcacccgaa aggagaagct cccttatgtg ggatgccgag 901 gtgaactcgc ctatagcttc gggtgaatca tgggcggatg tgcgcttgac ggtgaaaggt 961 tcaatattgg ttccgcggag agcgcggata tattcgattg cgagggtgtt gttggcaccg 1021 ttcagaattt cagaacagtc atctcccaca agcaaagcta tcaccgaagg ataggtcatg 1081 ccctcggaca ttttttgttt tatgtctttg tcgctcagca aatcgatcgc atttgcagca 1141 aaaatcagct tgttaacatc tccgcactcg gaaccgaagg agagcatatt tacacagccg 1201 aggcgatcga gaatattcac acctgtgcgg gcgaaatcgg gcgcagtgcc aagtgaatac 1261 ggcatcggca gttcgattac aagatcggcg ccgtttttaa cagctgtgcg ggcgcggaag 1321 tgtttgtcag ttatggcgat atctccccgc tgaacgcagt ttccgctcat gacacaaaca 1381 atatgggtgg cacccgcttc gcgggttgaa cggatctgat atgcatggcc attgtggaaa 1441 gggttatatt ccgcgattat tcctgcaatt ttcaaggtta gacctcctgt gggagtgatt 1501 gttttacggc tcctccaccg ttcgggcaca gccgagcctt cgctcggcgc agcccgctcg 1561 acgtcgtcgc cttatgaggc gcatcgcccc // LOCUS sequence344 1587 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence344 VERSION sequence344 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1587 /mol_type="genomic DNA" /organism="" /note="sequence344" CDS 168..791 /product="aminoacyl-tRNA hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048384.1" /transl_table=11 /codon_start=1 /translation="MGLFNKYKDKSASGGSVEWLIVGLGNPGTKYTYTRHNCGWLTIDR LAEKLGIKVNRVKFKSLVAEANFGGKKCLIMKPTTMMNASGEAVVEAMNFYKVPIENVL VISDDVSLDVGNLRIRRKGSDGGQKGLRSIIYLTGKDDFPRIKCGVGAKPHPDYDMAAW VLSNFTKDEQSKMLSAFDNAVAAAELIVAGKTDEAMNKYNVKAN" /locus_tag="LOCUS_8570" /gene="pth" /EC_number="3.1.1.29" /note="WP_012048384.1 aminoacyl-tRNA hydrolase (Clostridium botulinum) [pid:45.4%, q_cov:89.4%, s_cov:96.3%, Eval:5.1e-41]" /note="MGA_1257" ORIGIN 1 aaggatattg aggaaagggt tcacgcatcc cttgcaaaca ccgactttga cgacgacatt 61 gaccatgagc cttgggacta aacaaataaa ataattgcaa gtacccccta tcctgcacgg 121 atatggggca tttgcgcgtg gaaatataaa tgcaggagga aataaatatg ggactgttta 181 ataaatataa ggataagagc gcttcgggag gaagtgttga atggcttatt gtgggtcttg 241 gcaatccggg aacgaagtat acctataccc gccacaactg cggctggctg acgattgata 301 ggctcgcgga aaagctggga atcaaggtca accgagttaa gtttaagtcg ctggtggcgg 361 aagctaactt tggcggaaag aaatgcttga ttatgaagcc gacaacaatg atgaacgcca 421 gcggcgaagc ggttgttgaa gcgatgaatt tttataaggt gccgattgag aacgtgcttg 481 taatcagcga cgatgtttcg ttggatgttg gcaacctgcg aattcgacgc aagggctcgg 541 acggcggtca aaagggtctt agaagcataa tttatttgac aggcaaggat gattttccga 601 gaatcaagtg cggtgtcggc gcaaagcccc atcccgatta cgatatggcg gcttgggtgc 661 tttcaaactt caccaaagac gaacagtcca agatgctttc ggcatttgac aatgctgttg 721 cggcggcaga actcattgtt gcaggcaaga ccgacgaagc aatgaataaa tataacgtta 781 aggcgaacta agttatgata aatttgtttt atgaagcggc ggcggggctc cccttttgtc 841 gggagctgag cgcatcgctt aaaaacgggc ggatgcctgc atcggtgacg gggctttcag 901 ccgtccacaa ggcgcacacg gttttatatt tggcacaaag tgccaacatt ttggttgttt 961 gcgacgacga agcgggcgca ttgaagatga ccgaggacat caacgcgatg gccgacgagg 1021 aaattgcggt tttgttccct gtaaaggact atgcctttgc aaacattgaa accgcttcgc 1081 ccgaatatga gcacaaaaga atcagagcac tgacgagaat catatcgaag caatctaagg 1141 ttttgatatg ctcggcagag gcggcaatgc aaccgacaat acctttggat gttttggagg 1201 agaacaccct cacagttaaa ccggacgatg agattgttgt cagagaattt gcatcgagat 1261 tggtttcttt gggatatacc cgtgcggcgc agactgaggg cagagggcag ttttccattc 1321 ggggagatat tattgacgta ttccctgtta atgctgttat gcctttaaga atcgagcttt 1381 ggggcgatgt tgtggacact gtgtcatact ttgacattga gtcgcaaagg cgaattgata 1441 cggttaaatc ggcaattatt gcgcccgcaa aggagctttt gatctcaaag gatgatttgg 1501 cagaggccat tgaggttttg atcaataggg caagcggcaa gctcaaagac caaattaaaa 1561 agaatctata ttcggatttg gaccaca // LOCUS sequence345 1573 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence345 VERSION sequence345 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1573 /mol_type="genomic DNA" /organism="" /note="sequence345" CDS complement(770..1126) /product="YraN family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583880.1" /transl_table=11 /codon_start=1 /translation="MTTKEIGNIGEDYTTRYLESKGCEILARNFTVRGGEIDIIAKKGE LIHFVEVKSRKRSPLSSGGDAITKNKIKCIVRAAKEFINRNEIDLSCVFDVAIVEVDNG KVTDFTYIQRAFTA" /locus_tag="LOCUS_8580" /note="WP_012583880.1 YraN family protein (Dictyoglomus turgidum) [pid:35.6%, q_cov:98.3%, s_cov:100.0%, Eval:4.0e-15]" /note="MGA_1260" ORIGIN 1 gaacatatga agatacatag tagatgatct gaggtgcgag tctgccccag ttaattgagt 61 ttgcgctgga gaacatcata ttgttttctg cgagtttagc agaaacatta tgatcggtaa 121 atattttctt aacgcctgtc tgtgcatcgt cgaaattgcc cttgattgca caaacaccga 181 cgttttcgcc ctcctgagtg accatctgga gtctttgcat cgggctgaca ccttcaacgg 241 gatagaacac caaaatttct gtacccggaa catccttgaa tccttcaagt gccgcttttc 301 ctgtatcgcc ggaggttgca accaaaatta caaccttctt ttcggagcca agcttcttga 361 tcgatgttgt caaaagataa ggtaaaatct ggagagccat atccttgaaa gcacaggtgg 421 ggccatgcca cagctcgagc atatagatac cttcaaataa gcatgccaac tccattatgt 481 tttcggtgtc gaagttcttg gtgttatatg caccgtcaac acagtatctg atctcaacat 541 cgctgaagtc ggtgagatac tttgagaaga tatcaaacgc tctgtcgcaa taagacttat 601 cacataactc caaaagctcg gattcattga gcttgggaat ttcgtttgga acgaaaagtc 661 cgccgtcttc ggaaataccc tgagcgatag cctgcgcaga ggttacttta aggtctttgt 721 ttcgtgtgct tgaataaaac atggtagttg ctcctttcgg cgtttgcgtt tatgcagtaa 781 acgctcgctg aatatatgtg aaatcggtca ccttgccgtt atcgacctcg actattgcga 841 catcgaaaac gcaagataaa tcaatttcat ttctgtttat aaactctttt gcggcacgca 901 caatgcactt gatcttgttc tttgtaattg catcgccgcc cgaacttaga ggcgaccgct 961 tgcgggactt gacctcaaca aagtgtatca gctcgccctt tttggcgatg atatcaattt 1021 cgccgccgcg aacggtaaag tttctggcaa ggatctcgca tccctttgat tccaaatatc 1081 tggttgtgta gtcctcgccg atgtttccga tctcttttgt tgtcattatt tctcactcag 1141 attcttcaaa aagcttggac ggtgaacatc gcttatgccg tgctttttga gcatttcgta 1201 atgaagcttg gtgccatatc ccttatgctt tgaaaactga tattcgggat acttctcgtc 1261 gatctccttc atatatctgt cacgtgaaac ctttgcaaga attgatgctg ccgcgatcga 1321 ttggctggtg gcatcgccct taacaaccgc aaatgccttt gtgtcaacat tgggagtttt 1381 gttgccgtca ataagtgcta aatcgcactg aatacccaag ccttcgtatg cgcgcttcat 1441 tgcaagcatt gcggcgttaa gaatattaag ctcttcaatt tcagcaactg atgcagttgc 1501 aatgcaatat gcctttgctt ttgagataat ttcatcaaac agcttctcac gcttcttttc 1561 ggatagcttt tta // LOCUS sequence346 1566 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence346 VERSION sequence346 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1566 /mol_type="genomic DNA" /organism="" /note="sequence346" misc_feature complement(591..>1566) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010964641.1:mannonate dehydratase" /note="WP_010964641.1 mannonate dehydratase (Clostridium) [pid:61.6%, q_cov:98.8%, s_cov:91.2%, Eval:5.4e-117]" /note="MGA_1263" /locus_tag="LOCUS_8590" ORIGIN 1 caagttctta aggcatatac cgcctgtggg cataaccttg aacatcggga agggagcgct 61 gattgccttg atttttgcaa gtccgcccga ctgttcagca gggaagaact ttaaaacctc 121 aaggtcaaac ttgagagctg cgtgataatc ggtgggggtg gtgcaaccgg gatagatcgc 181 aatatttctg tcacagcaat acttaacgat ctcaggatcg aagccggggg taacgataaa 241 ttcagcgcct gcggcaattg ccatgtcaac gtgctcggtc ttggtgacag ttcctgcacc 301 gcagagcatt tcggggcaag cttccttcat aagtctgatc gccttgtcag cacctgcagc 361 tctgaaggta acttcggcaa cgggaacgcc gccttcgcaa agagcctttg caaggggagc 421 agcatcacgc tcggggtttg tgagcttaat tacgggaacg attccgatat tggaaatctt 481 ctgattaatg gtgttcatat ttatctgtcc tcctgaaata taaggtttaa actaccttat 541 aaagtatatc acaagcaaaa agttcgtcaa tagtttatat cacaaaagcc ttattttgca 601 agattttttt cagctgcttc aaacaagccg ttgatataag ttgcacccaa agctctgtca 661 aacaagccat atccgggctt gcctgtttcg ccccagatca ttctgccgtg gtcgggtctg 721 acatatccgt catatccgtt ttcaacgaga gcattgacaa tttcataaat atcgagtgaa 781 ccgcaggaag aaaggtgagc tctttcctca aatgagccgt cctccataat tttgacgtta 841 cggatgtgca taaatgcaat tctgtccatt tcggcatatt ttcttaccat tgcaacaacg 901 tcgttggact tagcacagcc caaagagcct gtgcagaggc aaaggctgtt ggctggggag 961 tcaacaagct tcaagaatct gtcaagattt gcttcgcagg tgatgattct gggaagaccg 1021 aagatggggt acggcgggtc atcggggtga attgccattc tgacgccgca ttcctgcgca 1081 acgggaataa cctttttaag gaacttttca aggtttgccc aaaggccttc ctcgccaagc 1141 tcgccatacg ctgtaataag ctctctgacc tcttcctgag aatagctgga gtcccaaccg 1201 ggaaggtgaa tgtcgtcctt gagggggtca agtcctctca tctggtccca atacattgca 1261 aggctggtag atccgtcggg agccttcttg tcgagctggg ttcttgtcca gtcgaaaaca 1321 ggcataaagt tatatgtcac gcacttgatg ccatactttg cacatctgcg gatattttca 1381 cagtacactt ccaaaagctc gtcaacattg tttctgccga gcttaatatc ctcgtgaacg 1441 ggaatggatt caacaacgtc aaacaccaag cccttatcct cacaagcctt aaccattgcc 1501 gcaagacttt cttcgggcca gacttcaccg ggcttaacgt cataaactgc cgaaacaatt 1561 gatctc // LOCUS sequence347 1565 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence347 VERSION sequence347 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1565 /mol_type="genomic DNA" /organism="" /note="sequence347" ORIGIN 1 atttgcccat atgctttgaa acagaagcag caagcggctg tgagaacggt gtgaaataat 61 atgcctcaac gcctctgact ccgttaccct ttgcaacact gttgcagtga acagatatga 121 acacatctgg attataccgc gcggcatatt cgcttcggtc ataaaggttg atgtattgag 181 tatcagtcgg gagcatatat acagttgcac catatgcctg caaaagcgat gtgagagttc 241 tcgcgagaga aatgttgatc ttctgctcaa caacgtgtcc aacagcaccc ggatcaaata 301 cgcttgcgct ctttgaatat ccgtgtccgg ggtcaacaac gattacagca ccatacaaac 361 tctggttata tccgttaaaa gtgaatgtca atccgccgct gtcgtcatat gacgcagtgt 421 agcctgcgaa tatgcccgat tttctcagcc tcagtttaag ctgaagcttt ggttcgccgt 481 taacttcgac atttttccat tcagccctct taaacagtga atccgcgggg aattctgcac 541 ttccagcgaa ttcggaaaca taatcaaatg tgatcaaaac ataatcgggg tcgaattcgc 601 tgatcaaata tgaattatcg tcggggtcgt catagctaag tggtgaatat gaaacggtga 661 acggagtctg gtggttaagc tgaagcgaaa tcaccgtatt tccgccctga gtataaacgc 721 tgtttaatgt tacgatattg tcaacgatcg tgtagccgtc aacgacctcg caatcagcag 781 ccttaattct aagcttcgat tttgtaaggt agtaatcaac tgtttggtta acgccatcag 841 ccgatacgtt atatgaaacc ttgttgacaa taacatccaa tgttcctgca ggaagtctgg 901 ggcaagtggg agttgccacg ttgtcggtgg tgtagtaatc gtaggtgatg ggattgtcgt 961 gtttaactct gataagctgt gcgcgctcgg catatggcga gatctcattg acgatcacgc 1021 gagaaccgct cattgtctca aaaacaaagt tattataact accgttaacc acgatattgc 1081 caaggtcctg ttcctcgcca accttgcctt ccggcgcaat aaagtagccg gtaaacttgg 1141 tgtagttggt gttggagtcc agatcttccg agagagtgtc actttctgta agagttattg 1201 tcttgccgtt aaggctcgct gtaatttcag agcctttata agcaagaaca gatatagaga 1261 tcttggttgt gccttcaact cttgtttcgg ttccctcttc aggttcaacg ctttgcaaaa 1321 ccttgacctt tcgagtgatc ttatatgtga tcgtagtcga tttattcttg aaggtgaatt 1381 tattcacacc aacttcaagg tcaacttcaa agaagaagtt tcccgcttcg ttaagctcga 1441 tcttctcgcc gttgaagtaa atatcaaaat tggcatcaaa cgaaccttgg aacttaactg 1501 tgggttcata tgttgtaaag tcagtctttt tcggcaatac cattgaaagc tctttataga 1561 gcgag // LOCUS sequence348 1561 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence348 VERSION sequence348 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1561 /mol_type="genomic DNA" /organism="" /note="sequence348" CDS complement(285..878) /product="stage II sporulation protein R" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011947973.1" /transl_table=11 /codon_start=1 /translation="MKKLTVSMALSLIICLVFSIFSNACEVSRMTDKLIRLHVVANSDS DADQALKLAVRDEVAFLCANITSACQDKASAYSALTDNLNLIESAAKSVITREGYSYPV SCSLSPTVFDRRIYDDFTLPAGEYDALCVTIGDGEGKNFWCVCYPSLCLGSVMKIDDCE QFSEDELIIVKHPEKVCYKLFCYEIIEWFRSLLK" /locus_tag="LOCUS_8600" /gene="spoIIR" /note="WP_011947973.1 stage II sporulation protein R (Clostridium botulinum) [pid:33.2%, q_cov:91.4%, s_cov:89.0%, Eval:4.4e-23]" /note="MGA_1266" ORIGIN 1 aatactgtta tcttattgaa gtcgcgggca cccaactcgg aatataggct tttgtcgaag 61 gcgaaggaaa actggtcggg aattattgcg acaacttccc tacccgatgc tatatccttt 121 ttcattgagc aagcaagatt tttaagcttt gcatcctcat tttcgcctaa ccaaagttta 181 agcatggttc gttttcctcc tataaatgtt tatacattga ttttaccatt agaaaagcga 241 caaatcaagt cgcgagttga aagaaattgt acaagaatcg ggacttattt taagagcgaa 301 cgaaaccact ctattatctc atagcaaaag agcttatagc acactttttc gggatgtttg 361 acgattatca gttcgtcctc ggaaaactgc tcgcagtcgt caattttcat cacagagcca 421 aggcataggg atggatagca tacgcaccaa aagtttttgc cctctccatc gcctattgtc 481 acgcacaagg catcatattc tcctgcgggg agagtgaaat cgtcatagat gcgcctatca 541 aataccgtag gtgatagcga gcaggaaacg ggatatgagt acccctcgcg agtgatgacc 601 gattttgcgg cggattctat cagattgaga ttatcggtca gagcggaata tgccgaggct 661 ttatcttggc aggctgaagt gatattcgcg caaagaaatg caacttcatc gcggacagcg 721 agcttgaggg cttggtcggc atcggaatcg gagttggcga caacgtgcag acggattagc 781 ttgtcggtca ttcggcttac ctcgcaggcg ttggaaaata tgctgaaaac aaggcaaatg 841 atgagcgata gtgccattga aacggtgagt tttttcattt tatctttcct ttttatggat 901 tttgataaga gtgttgacgg gaaaagaagg aaatatacaa aagcctccct ctgacgaggg 961 aggtggcaaa aatctttgat ttttgacgga tggagagata cgcaaacaac aaatctttgt 1021 ctcggcctct ccctcagtca gctacgctga aagctccctc gtcagaggga gccttcatat 1081 gcctcacatt gcaagaaacc cacctgaaat tatcacaggt gggtatccaa attacatata 1141 tcttttatct cttaaacaca gaaatgcgtt cgaagccgtt gcggagcttg tctttaatgc 1201 ggaaggcgcg atgggtaccg cgggcaacac agccaagcgg gtcatgggcg acatggcatt 1261 taactcccaa ctcgcgggtg atatacaggt cgagtccgcg caggagcgcg ccgccgcctg 1321 ttaaaagtat gcccgattca tagatatcgc cgataagctc gggcggggtg acctcaaatg 1381 cttcgcggat tatttcaatt ataccgtcaa cgtcatcaat tatcgcgcgg gcgatatcat 1441 cctcggaaaa ctcgcatcgg gcaggcatac cgttgattag gcttcgtcct gttgcaacgc 1501 ccgtgttttc aatagagggc caaaaaacgt tggcatattg aaccttgata tcctcggcgg 1561 t // LOCUS sequence349 1560 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence349 VERSION sequence349 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1560 /mol_type="genomic DNA" /organism="" /note="sequence349" CDS 227..1522 /product="diaminopimelate decarboxylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000280659.1" /transl_table=11 /codon_start=1 /translation="MICNNISTVDGVLHFAGQDTTKLAKKHGTPLYLMDEEKIRENCRQ YKTALDEFYGNGALALYASKAASFKRMYEIVAEEGLGIDTVSCGEIYTALKAGFPMERA YFQGNNKTDEDICFAIDNGVGYFVCDNVEEVDAISRIAGEKQITQNILLRLTPGIDPHT YDEVATGKVDSKFGTAIETGQAAEIVEHTLALPNISLEGFHCHVGSMVFESSVFTRSAL VMLSFIKQMYQEHGYITKILDLGGGYGVRYTGEDPYIDVYDNIRQVCEYVKATCNELEI PLPSLRFEPGRSIVADAGMTLYTAGTVKKITGYKNYVSVDGGMTDNPRFALYGSKYTVA TANKANEPLELVADLVGRCCESGDVIQPEVMFPKSIQRGDIVAVMTTGAYNYSMPSNYN RVTRPPVVMLNKGKDYVAVKRESLEDIVGLDI" /locus_tag="LOCUS_8610" /gene="lysA" /EC_number="4.1.1.20" /note="WP_000280659.1 diaminopimelate decarboxylase (Bacillus cereus group) [pid:44.3%, q_cov:97.4%, s_cov:95.4%, Eval:2.5e-102]" /note="MGA_1269" ORIGIN 1 atatctgcaa gaattacctt aacggtgacc tcgagagagc acttgatgct cagcttgagc 61 ttttgccttt ggttgatgcg ctgttcagcg aggtcaaccc tattcccgtt aaggcggcaa 121 tggcggcaat gggctttggt gaaaacagcc tgcgtctgcc cttgacacca atggaagaaa 181 agaatgaagc agttttgctt aaccttatga aggagtaggg actcatatga tctgcaataa 241 tataagcact gttgacggcg ttttgcactt tgcaggacag gatacaacga agcttgcaaa 301 aaagcacggc actccccttt accttatgga tgaagagaag atcagagaaa actgccgtca 361 atataagact gcgcttgatg agttttatgg caacggagcg ttggctcttt acgccagcaa 421 agcggcaagc tttaagagaa tgtatgaaat cgttgctgag gaaggcttgg gaatcgacac 481 cgtttcctgc ggcgagatat acaccgctct caaggcggga ttcccgatgg agcgcgcata 541 ttttcagggc aacaacaaga ccgacgagga catttgcttt gccattgaca acggcgtggg 601 atatttcgtt tgcgacaatg ttgaagaggt tgatgcaatc agccgaattg cgggcgaaaa 661 acaaatcacc cagaatattc ttttgcgctt gacccccgga attgaccctc acacctacga 721 cgaggttgca acaggcaaag tcgattcgaa attcggcaca gccatcgaaa caggtcaggc 781 ggcggaaatt gttgaacaca cgctcgctct tcctaacatt tctcttgaag gattccactg 841 ccacgtgggc tcaatggtgt ttgaatccag cgtattcaca agaagcgcct tggttatgct 901 aagctttatt aagcagatgt accaagaaca cggatatatt accaaaatac ttgacttggg 961 cggcggatat ggtgtaagat atacaggtga ggacccatat attgatgttt atgacaatat 1021 aagacaagtt tgcgaatatg ttaaggcgac ctgcaacgag cttgaaattc cgcttccctc 1081 ccttcgcttt gagccgggaa gaagcattgt tgccgatgcg ggtatgaccc tttacacagc 1141 gggcaccgtc aagaaaatca ccggatataa gaactacgtt tctgttgacg gcggtatgac 1201 cgacaacccg agatttgcac tttacggctc gaaatatacc gttgcgaccg ccaacaaggc 1261 aaacgagcct ttggagctgg ttgcggatct ggtcggaaga tgttgtgaat cgggcgacgt 1321 tattcagccc gaggttatgt ttccaaagtc gattcagcgc ggcgatattg ttgcagttat 1381 gaccacagga gcttacaact actcgatgcc atcaaactat aaccgcgtta caagaccgcc 1441 tgtcgttatg ctcaacaagg gcaaggatta cgttgcggtt aagcgcgaaa gcttggagga 1501 tattgttggg ttggatatat gaacgcgggg cggaggccgt ttgacacctg cggtgtcaaa // LOCUS sequence350 1558 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence350 VERSION sequence350 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1558 /mol_type="genomic DNA" /organism="" /note="sequence350" ORIGIN 1 attggcttca agcccaccgt cagcgacagc ggaaaaagat gctgtgaaac tcacatactt 61 gatttttcct gcgattcata cggcaagacg gcaacggttg aatttttgga attttaccgc 121 gatgagaaaa aatttgacaa caccgaagaa ctgattgaaa caattaaaaa tgatataaac 181 agaagaaaag gagcgaacaa ataaaatgaa tgaagtaaga acaagatttg cgccttcccc 241 cacgggatat atgcatatcg gaaacctcag aacggctctt tatacttatc ttattgcaaa 301 gaagtcgggc ggcaaattca ttttgagaat cgaagacacc gaccaggaaa gatatgttga 361 gggcgctgtt gatattattt acagaacact tcgcactgtc ggcctcaact gggacgaagg 421 acccgacgtt ggcggtcctg ttggacctta tatccagtcg gagagaatgg gcattttcaa 481 gaaatatgcc gaagagttgg ttgaaaaggg cgaagcatac tactgcttct gcgacaagga 541 cagactcacc gagcttaaag ctgttcagga ggcaagcggc gttaatccca tgtatgacag 601 acactgccgc aacctttcaa aggaagaaat tgccgaaaaa cttgctgcag gcgttcctta 661 tgtaatccgc cagaagattc ccgaaacagg caccaccacc ttccacgacg agctttacgg 721 cgatatcact gttgacaact ccacccttga cgaccagatc ttgcttaaaa ccgacggtat 781 gcccacctat aactttgcaa acgttgttga cgaccacctt atgggcatca cccacgttgt 841 aagaggtaac gaatatctgg catccagccc taagtataat ttgctttata aggcatttgg 901 ctgggaagtt cccacatata ttcacgttga gcacattatg aaggataagc agaacaagct 961 ttcaaagcgt aacggcgacg catcctttga agaccttatg accaagggct acctttgcga 1021 agctgtcatc aactatattg cgcttctcgg ttgggcaccc aagggcgaaa gagaaatttt 1081 cacccttgaa gagctgattg aagagttcga catcaacggt ctttccaaga gccctgcaat 1141 ttttgacccc ctcaagctca gagcgatcaa cggcgaatac attcgcaagc tcacccccga 1201 aaagttctat gaatatgctg agcctttcat taagcaggtt gtaacccgtt ctgatgttga 1261 ccttacaaag atcgcggcac ttttgcagaa cagaacagaa gtcttctccg aaattcccga 1321 gcaggtcgat tttatcgacg ctatgcccga ttatgagctt tccttgtatg ataacaagaa 1381 gatgaagaca aatgccgaca ccgcacttga cgctttggaa aaggtactgc ctgttttgga 1441 agctattgat gaggcaagct ggaactttga aaccattcac gacaagctct tcgagctgat 1501 cgcttcaatg gaagttaaaa acggctacat tctctggcct gtaagagttg ccatcagc // LOCUS sequence351 1557 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence351 VERSION sequence351 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1557 /mol_type="genomic DNA" /organism="" /note="sequence351" CDS complement(535..1425) /product="YitT family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003430304.1" /transl_table=11 /codon_start=1 /translation="MKRILRKIAIYIILILLSMLSAVSYVVFVFPNNFAPSGFNGIATI IQHVFDINAGYLTILMNSPLIILVFIFVDKEFAVKTFVFLGTFSSALVLLEYLDLSAFV YHTESGTSTILGPIIAGIISGATVGVAVLFNCCSGGTDLCAALIHKYKPSFDFVWIAFI LNVSVAIVSYFVFGRNLEPVIMCIIYSYFTSSITDKFIKGSRAAIKFEVVTTMPNEVGK AIIEQLGHSATVIKGEGIYTKTEKSILFCIVNKDEIVKFKDILKDYPDTFAYASNVNFT IGKFRNPRPTNDKIA" /locus_tag="LOCUS_8620" /note="WP_003430304.1 YitT family protein (Clostridioides difficile) [pid:27.7%, q_cov:91.2%, s_cov:92.3%, Eval:2.7e-27]" /note="MGA_1273" ORIGIN 1 agaccttaac tgcttcggtg gattcggaca gcaaggatac ggctataatg ttgcatccct 61 gcgcgaaaag atcggcgaga ttttgggtgt cggtaactct gttccgacaa ttctcatcgg 121 tgtcggcaac ctgggcaagg caatcgccat gcacattggc tttgaagcaa gaggatttga 181 ccttttggct ctctttgact ctaaccccga tctgacaggc gaacaggtcg gagattatgt 241 cattaagaat tatgacgaga tcgatgagtt ctgccgagaa aataagccta aggttgcggt 301 gctgtgtgta cccaagaccg cctcgcaggg aatctgcaac aaactgattg agctgggcgt 361 tgagggcttc tggaacttct cacattatga ccttgctgtg aatcacgaag gcgttgtggt 421 cgagaatgta catatgggcg actcgctttt acgcctcgga tataaactga caaacggcac 481 agaaaaatga acataaaaat aacccccgaa gagattcggg ggtttgtttt tgtattatgc 541 aattttgtcg tttgtaggtc tgggattgcg gaatttgccg attgtgaagt tgacatttga 601 agcgtacgcg aaggtatcgg gatagtcctt gaggatgtcc ttgaacttaa caatttcatc 661 cttattgacg atacagaaaa gaatgctttt ttcggttttg gtgtatatac cctcaccctt 721 gatgacagtt gcagagtggc cgagctgttc gattattgcc tttccgacct cattgggcat 781 tgttgtaaca acctcaaatt tgattgcagc acgtgagccc ttaatgaact tatcggtgat 841 ggaacttgta aagtatgagt aaataatgca cataattacc ggctcgagat ttctgccgaa 901 aacaaagtat gatacaatag ctacggatac gttaagaata aatgcgatcc aaacaaagtc 961 gaacgagggc ttatatttat ggataagtgc cgcacaaagg tcagtgccgc ccgagcagca 1021 gttaaagagt accgcgacac ctaccgtcgc gccgcttatg atacccgcaa tgattggacc 1081 gagaattgtg ctggtaccgc tctcggtatg atatacaaac gcggaaaggt ctagatattc 1141 caaaagaacc agcgcactcg agaatgttcc caagaaaacg aaggttttaa ctgcgaactc 1201 cttatcaaca aagatgaaaa ccaaaattat cagcggactg ttcatgagaa tggtcaaata 1261 accggcgttg atgtcaaata catgctgaat aatggtggca attccgttga aaccggatgg 1321 cgcgaagtta ttggggaata cgaaaacaac atatgatact gcactgagca tggaaagcag 1381 gatcaatatg atatagattg caatttttct taagattctt ttcatatagc ttaacctcaa 1441 acctgattac atttcaaata cgaccttggt ggttgtaacg tgggcatcgt cgttaatctt 1501 gtcgattctg gggagcgaga atttaccgac tcgggaagga acatcaatta cggttat // LOCUS sequence352 1549 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence352 VERSION sequence352 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1549 /mol_type="genomic DNA" /organism="" /note="sequence352" ORIGIN 1 aattcgcgta tgaagtcaaa ctgattgagg cgttgggaat tgaggacgag ggcaaagcta 61 agatatacta taaaattgca caaaaactct ttggcgtaac cataaaaagt gtataaaaac 121 gcctgttgac aacaccgctt tagagtggta aaatgatatt actgttttaa atattacagt 181 attaaaagcg atgacgaaga cgggacgctt tcaaagctat tccaaagcga gtcgggtttg 241 gtgtgagccg acggaatttc aagcgaacct atcacttccg agctgagaat ccgaaagggt 301 atctcccaag taggcgttct ccgtgactgc tgcgttaatg catacggctt aataatgagc 361 ctgaggggtg tgaatttttg cattcacaca atttgagtgg taccgcgggt atgaatttat 421 attcagctcg tctcaagcaa attgagacgg gctgttttgt ttaaaaaaca ggcggcccgt 481 aagaaaaaat cttacagaca aaggagaaaa ccgaaaatga gcaacaccgc caaaaaccag 541 cttcttgaaa tcgccgcacg tatcaaggag atgcgtgaga ttttgggcta taccacagcc 601 gaaatggcag caaaggttga agtttccgaa gcgacctatg tggcatacga atcgggcaac 661 gacgatatgc ccttcagctt tattcacaag tgcgctcttg aattcggcat cgacctgacc 721 gacctgctcg agggtaataa ccaggcaaga ctttcaacct ataccgtaac ccgccgcgga 781 aaaggccagc gcaccgccaa ggaagagggc attgacattt caaacctcgc tcccaaattc 841 cgcaacaaga tcgccgagcc ttactgggta aaatatgaat attccgcact tcagcaggat 901 aagccgattc atctttcgac ccactcggga caggagttcg actttatcgt ttcgggcagc 961 ctcaaggttc aggtcggctc tcacgttgaa atacttaacg aaggcgactc gatctattac 1021 aactcatcgg aaccccacgg tatgatcgct gtcggcggaa cagactgtac ctttgtcgca 1081 gttgttttgc cgggtgagga caccaaggaa gaaactttgc gcagctctgt tgttaaggct 1141 gcaagctctg aaaagctcat ctgcgagaag tttgttaaaa ccaccgagga cgaaaaccgt 1201 cagcttaaaa acatcgaatt cctcaatacc gacaccttca acttcggctt tgatatcgtc 1261 gatgagatcg caaataaata tcccgacaag cttgcgatga tccatgttga caagaaccat 1321 gttgaaagac gtttcacctt caaggacatc aagcgtgcct ccaaccagac tgccaactac 1381 ttccgctctc tgggcatcaa gaagggcgat aaggtaatgc ttgttttaaa gcgccattat 1441 cagttctggt ttgcaatggt tgcgcttcac aagctcggcg cagttgcaat tcccgcaaca 1501 aatcagctca aggaacacga ctttgaatat agatttaact cagcaagcg // LOCUS sequence353 1541 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence353 VERSION sequence353 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1541 /mol_type="genomic DNA" /organism="" /note="sequence353" CDS 489..1178 /product="spore cortex-lytic enzyme" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964005.1" /transl_table=11 /codon_start=1 /translation="MKVNISASGKQFIILFCACLAVLMVASLMTPAVQIENEALSKLGS SGAEVTAIQKTLKEWGLFNAEVTGYYGSATQSAVKRFQKIRGLNADGVAGPATLAALGI SVGTVPAATEANVKLLAQMISAEARGEPYEGQVAVGAVILNRIEHPSFPDTLSGVIYQK GAFTAIDDGQFWEPIASSAYNAARDALNGWDPTGGAIYYYNPAKTSNKFIRSRPVITTI GEHLFCS" /locus_tag="LOCUS_8630" /gene="sleB" /note="WP_010964005.1 spore cortex-lytic enzyme (Clostridium) [pid:48.2%, q_cov:95.6%, s_cov:96.6%, Eval:9.2e-53]" /note="MGA_1277" ORIGIN 1 atcttgtcga tgaataaaat cttgactccg gtataaaccg gcttgtacta ttttttgttt 61 cagtgtcgta cattcactgt tacaagaatt actgttcaaa gtaattttac aagggtctct 121 tgtttttttg tgttcattgt tcaattttca agctgccatc tttttgctcc gttttttcgg 181 agcgcttgac tatcttacca cattcaatgt ggtttgtcaa gtactttttt caaacttttt 241 tgaaaagttt tttaaagttt tcttgcgccc gcgagctgtt gctcgcagac agctttgtta 301 taatacaata ttttgcagtc gaagtcaagg gttttttcgc aatttgtatg tttgaccaat 361 aaaattgaaa caatgtcaaa acaaccgagc aagttaacct aacaaagcca gaattataca 421 gaaaagtcgg ggtatttgaa gtgattttcg gggcaaatta taataaaaca aaggaaaggg 481 attttgcaat gaaggtaaat atatcagcaa gcgggaaaca gtttatcatt ttgttttgcg 541 cctgtctggc ggttttaatg gttgcatcgt tgatgacgcc tgctgttcaa attgagaacg 601 aggcactttc aaagcttggc tcatcgggag ccgaggtcac agccattcag aaaacgctca 661 aagagtgggg acttttcaac gctgaggtca ccggttacta cggctcagcc acacaatcgg 721 cagttaagcg gttccaaaag attcgcgggc ttaatgctga cggcgttgca gggcctgcaa 781 cccttgccgc cttgggcatc agtgtcggaa cagttcccgc cgcgacagaa gcaaacgtca 841 agctgctggc tcagatgatc tcggccgagg cgcgcggcga gccatacgag gggcaggtcg 901 ccgtaggagc ggtaattctc aacagaatcg agcatccctc tttccccgat accctctcgg 961 gcgttatcta tcagaagggt gcattcacag cgatcgacga cggacagttt tgggagccga 1021 tcgcatcgag cgcatataat gccgctcggg atgccctcaa cggctgggac cccaccggcg 1081 gagccatata ctattataat cccgcaaaga catcaaacaa gttcatccga agccgaccgg 1141 taattacaac catcggcgag catcttttct gctcataaca gcaatcacgc ttcatttaca 1201 aagcaaataa aaagagcaag agtaaaagga tatttcctta cattcttgct cttgttttat 1261 tatttgatga attgatgctg acgcatcata aatagcagaa acaagtatct gccagaaaca 1321 agtatctgca tgaatacctc ccgaaattgc gaagcaattt cgctcacatg aattgaattg 1381 caactaaatg tgccgtaagg cacaattcat ttccgtagga aaattcatga aggcaaagcg 1441 ttctattcat gcaacaatgt tgaaattcat tgattatctc ccgcagggag ataatcttat 1501 cattccttct caacctcaaa atacttatgc atacaaggcg a // LOCUS sequence354 1534 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence354 VERSION sequence354 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1534 /mol_type="genomic DNA" /organism="" /note="sequence354" CDS complement(538..1422) /product="nucleotidyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011203586.1" /transl_table=11 /codon_start=1 /translation="MNATLLILAAGLGSRFGGDKQISHVGPSGEFLMEYSIHDAIKAGF NKVVFILKQEMVDVVKREVGDKISDKVEVCYAIQDFATAMPEGYVVPENREKPYGTVHA VLCAKEYLTEPFATVNADDYYGTECFEIMYDYLSKLENGSEAAMVTYIIKNTVSENGAV TRGICSTADGYLVKVDETSNILPKDGKIVGDNGEIDPEAEVSMNFWGFHNETLERMTKY FEDFCAGLTPEQIKAECLLPIMVNDLLATKELSVMAKPSNDKWFGITYKADKEDVENKL KALHTEGVYPEKL" /locus_tag="LOCUS_8640" /note="WP_011203586.1 nucleotidyltransferase (Bacteroides fragilis) [pid:40.9%, q_cov:100.0%, s_cov:99.7%, Eval:1.3e-58]" /note="MGA_1279" ORIGIN 1 acagcggaga agtatgatgt gccgtaggca aatgccgaaa gccaagggcc gatgttgcgt 61 ccgcccagaa caaagccgcc cacgtccttg gtgcgctttg cggagtatac ggcgatggcg 121 atcataattg cgaagaatgc caaaagcatt gcgattttaa taaacatatg gtcaaatcct 181 ttctcttgtc cgattggata ttgctttaac gattaaaagt ataaaacttt aaagcgtaaa 241 agtcaagctc tagttggaaa taatttgaaa aagcataggg gcgggcctat gtgcaaaaat 301 attgctccct ttggtcgcaa aattttccaa gaacccgctt tgcggcttct tgccattctt 361 caaatagtaa gggcgggcct atgcctgccc ctataagtaa tcggttgaat gaattgcgct 421 tcgcgcatgg attgacaaaa tgtcatgaat agtcaaaaca agttttgaca tgaatagcag 481 aaacaagttt ctgcattaaa aaagggcacc ccctatgtgg gtgccccata tgaaatatca 541 caacttttcg ggataaacgc cctcggtatg aagagccttc agcttgtttt caacatcttc 601 cttatctgcc ttataggtga tgccgaacca cttgtcgttt gagggcttcg ccataacgct 661 cagctccttg gttgccaaaa gatcgttgac catgatcggc aacaaacact ctgccttgat 721 ctgctcggga gtgagtcctg cgcagaagtc ttcaaaatat tttgtcattc tctcaagggt 781 ttcattgtgg aatccccaga agttcattga tacctctgcc tcgggatcaa tttcgccgtt 841 atcgccgacg atcttgccat ccttgggcaa aatgtttgag gtttcatcaa ccttgaccag 901 ataaccgtct gcagttgagc agattccgcg ggtaactgcg ccgttttccg aaacggtatt 961 tttaataatg tatgttacca ttgccgcttc actgccgttt tccagcttcg agagatagtc 1021 atacataatt tcaaagcact ctgttccgta atagtcatcg gcatttacgg ttgcgaaagg 1081 ctcggtgagg tattccttag cgcacaaaac agcatgaacg gtaccatatg gcttctcgcg 1141 gttttcggga acaacgtaac cctcgggcat tgcggttgca aagtcctgaa tagcatagca 1201 aacctcaacc ttgtcggaaa tcttgtcgcc aacctcgcgc ttgacaacat caaccatctc 1261 ctgcttgagg atgaaaacga ccttgttaaa tcctgcttta attgcatcgt gaatggaata 1321 ttccatcaga aattcgccgc tcgggccaac gtgagatatc tgcttatcgc cgccaaagcg 1381 ggagccaaga cctgctgcga gaatgagtaa tgttgcgttc ataatttatc agttcctttc 1441 ggtcaaatta cgttgtgagc cttccccttg tgggaaaggt tcctccgaag gaggcagatg 1501 aggtgaatct ctcccctttt ccgcccttat ttta // LOCUS sequence355 1517 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence355 VERSION sequence355 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1517 /mol_type="genomic DNA" /organism="" /note="sequence355" ORIGIN 1 cgtcataatt aaaagatacc aatataagca acatggtaat aacgattgcc accaaaacat 61 atttgagtat ctcgctatac ttcttatttc cgaaaaactt caatgctcca cttccttccg 121 agaagaatat tatcaattct attatacaat aaattaaaac aaaatgccat agcgaaatac 181 attttttgtg aaaaatgtat ctacaaatat ttaataataa cctattttca ttcacgaggt 241 tttatgttat aataatatgt aatctttatt gtggggtaat gttgtgactg acagagaatt 301 tttggattta aaaagacaag ctcttgacaa atacttttca agactgaacg ataaacaacg 361 tgaggcggta tttaccgtca atggacctgt gctcatattg gcgggtgcgg gaagcggcaa 421 gaccaccgtt ttggttaacc gtgttgcaaa tatgatatat ttcggcaatg cttactatga 481 caccactcgt tttgccggcg ttggcgccgc cgatgagaaa tttctggaaa actatgctaa 541 gggcatcgaa accgatactg agcgcctcaa aagaatcgtt gcggtggatt gtgtcaatcc 601 ttggaacatc cttgccataa ccttcacaaa caaggctgcg ggggagctca aagagcgttt 661 aagtgcaatg ctcggcgaac agggcaacgg cattatggcg gcaaccttcc actctgcctg 721 tgtgcgaatt ttgcgccgtg aaattgaaaa gctcggttat gataaaagct ttaccattta 781 cgatgccgat gattcaatca gagtaatcaa aagctgctta caggatctga atatttccga 841 taagcttttc cctgcgaaaa gtattgccgc ggaaatatcc aatgccaaag agtcgcgcat 901 cactcccgac gagtatatgg catctgcttt gagtgactac cgcaaacagc agtacggtaa 961 ggtttacagc ttatatcaat caaagcttaa aaactcaaat gctgttgact ttgatgacat 1021 tattctgctt acagttcagc ttttcgaaga atttcctgat gttctcgacc actaccagaa 1081 cttatataaa tatattctcg tggacgaata tcaggatacc aatatggccc agtatcaact 1141 ggttgcaatg ttaagcgcaa agcgcaaaaa catctgcgtt gtgggtgatg acgaccagtc 1201 tatatataaa ttccgcggag cgacaattga aaatatcctc tcctttgaag atcagtttga 1261 aaacgcaaaa gctatccgcc ttgagcaaaa ctaccgctcg acccagaaca ttttgacctg 1321 cgctaatcac gttatcgaaa acaacaaggg cagaaagggc aaaaaccttt ggacagactg 1381 cggcgatggt atgaagccca tcgtatacca ggcatcaagt gagcaaggcg aagcaagata 1441 tgttgccaat gcgattttga atttcgtcaa aaagggcgga aagttctccg ataacgctgt 1501 tttataccgc atgaacg // LOCUS sequence356 1516 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence356 VERSION sequence356 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1516 /mol_type="genomic DNA" /organism="" /note="sequence356" CDS complement(195..1475) /product="UDP-N-acetylglucosamine 1-carboxyvinyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003359322.1" /transl_table=11 /codon_start=1 /translation="MDKFVINGGIPLKGDVIISGAKNAAVAIVAATILSDEPCVLENVP EISDISICIKILYEMGASIKILGKNEIRIDTRGICDPIVPYELARSMRASSYFLGTLLG RFHKADVPMPGGCDLGDRPIDQHLKAFNALGAKHSIDGGVVSLRADELIGNQIYFDINT VGGTINALFAAVKADGLTIIENAAKEPHIVDLANFLNSMGADIMGAGTDVIKVKGVKFL KGVNYAIIPDQIEAGTYMAAAAATKGDVWVKNVIPKHLESITAKLRKVGVTVEEYDESV HVFVEGPLMKTNLKTMPHPGFPTDMQPQFSTLLTVADGTSIVTDDIFDNRFRYVSELRR MGAEITVEGTTALITGVSGLTGATVRASDLRAGAALVIAGMMASGTTVIENIYHIERGY ENIEDKFRALGADIKRITDYDTTRMVG" /locus_tag="LOCUS_8650" /EC_number="2.5.1.7" /note="WP_003359322.1 UDP-N-acetylglucosamine 1-carboxyvinyltransferase (Clostridium) [pid:54.9%, q_cov:97.7%, s_cov:100.0%, Eval:2.3e-121]" /note="MGA_1283" ORIGIN 1 cgtgtgtaac aaatatggct ttaacgctgg tttcatccaa atcgttctgc tttagggcgt 61 ttaccagccg tttacagctt acgcccgcgt cgatcaagat tccgccttca cgtgtgccga 121 taaagctcga atttcccgag ctcgatgaga aaaggggata tacccttgcc aaaaaaacac 181 gtcctttatt tatttcagcc gaccattctg gtggtatcgt aatcggtgat acgcttgata 241 tcagcaccca aggctctgaa cttgtcctca atgttttcgt atccgcgctc gatatgatag 301 atgttttcaa ttacggtggt tcccgatgcc atcatacccg caattacaag cgccgcacct 361 gctcgcaggt cacttgcgcg cacggttgct cccgtaagtc ctgaaacgcc cgtgatgagt 421 gcggtggtgc cctcaacggt gatttcagcg cccatacgtc taagctcgct gacatatcgg 481 aaacggttgt caaatatatc gtcggtgaca atgctggtgc cgtccgcaac tgtcaataga 541 gttgagaact gtggttgcat atcggtgggg aaaccggggt ggggcattgt tttgaggttg 601 gtcttcatta aaggaccttc aacaaaaacg tgaacgcttt cgtcatattc ctcaacagtt 661 acgccgacct tgcgaagctt tgcggtgatc gattcgagat gcttcggaat gacattcttg 721 acccaaacgt cacctttggt tgcggcagcc gccgccatat atgttcctgc ctcgatctgg 781 tcggggatga tcgcatagtt aacgcccttg aggaacttga cacccttgac cttgataaca 841 tcggtgcctg cgcccataat gtccgcaccc atggagttta agaagtttgc aaggtcaaca 901 atgtggggtt cctttgcggc attttcaatt attgtcaaac cgtctgcctt aactgcggca 961 aaaagggcgt tgatcgttcc gccgacggtg ttaatgtcaa aatagatctg gttgccgatg 1021 agctcgtctg cacgcaggct tacaacaccg ccgtcaattg aatgctttgc gccgagggca 1081 ttgaatgctt tgagatgctg atctatcggt ctgtcgccca aatcgcatcc gccgggcatg 1141 ggaacatccg ccttgtggaa tcggccaagg agtgtgccga gaaaatagct ggatgcacgc 1201 atactgcggg caagctcata gggtacaatg ggatcgcaga ttccgcgtgt gtcgattcgg 1261 atttcgtttt tgcccaaaat tttgatggat gcgcccatct catataaaat tttaatacaa 1321 atgctgatat cgctgatctc gggaacgttt tccaaaacgc aaggctcgtc cgagagaatg 1381 gttgcagcaa cgatcgcaac ggcggcgttc ttcgcgccac tgattataac gtcgcccttg 1441 agagggatgc caccgttaat tacaaacttg tccatagttt tctcctatat atcatccgtt 1501 ttcggtaagt agtcgc // LOCUS sequence357 1512 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence357 VERSION sequence357 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1512 /mol_type="genomic DNA" /organism="" /note="sequence357" ORIGIN 1 actcccgagg gtactcccgg taccgtgggc cagggccacg gttggggcgg ctccatctac 61 aagtccgatc ctaccactct gacggttgag tacacgcctc tgaccgctga ggagctggat 121 gctaaggaag catgggctga cgagaatagc attcctctgc tgggcttcaa caagcctttc 181 ggcggcatga cccttgataa cgaggactac accgcaggtt ccggttctaa catcttcaag 241 ctcggctccg ctcccagcgc taccttcgat cccattgacg gtaccggcat ggataccttg 301 accttcgacc tgtacatctc cgacctggct ctgttcgatg ttaagtttgc taacacaggt 361 cttgagctga cctccgccgg tgcatacgac aaggaggaga tctcttggaa gctgcagggc 421 atccgtgaca acaaccttgg cgatgagctg aaggctggct ggaaccatat cattctgccc 481 ctggagaccg ctgacatggg tcagggcggt gctgacttca acattgctgc tatcaacttc 541 ttccgtttct tcatggttaa ccctgagggc ggcgaggaca tcgttgttaa gatcgataac 601 atgagacttg acaactccgg tattgcacgc aaggaagctc agatgaagat tgaccaggat 661 caggctgata aggtaatcag gctgatcaac gatatcggtg aggtcactat cgactcagag 721 cgcgctatcg agaaggctga aaatgcattc aacaagctga cgcttgacca gaaggcactt 781 gttaccaaca aggacgctct ggatgcagcg aaggatacgc tgaagactct gcaggatcaa 841 cagaaccagc ccgatcccga gcccgagccc gagcccgatc ctgagcccga tcccgagcct 901 gagcccgatc ccgagcctca gcccgacgag tccaacaata ctgttgttat catcatcgtt 961 gttgttgcta tcgttgtcgt tgctgctgct gtttgtgtat acttcttcgt tatcaagaaa 1021 aagaagtaat ataacgcaaa aagcaatcga gtgaatatat ttgcaaggtg ttatcctcgg 1081 atagcacctt gcttttttgt ctaaagtgtg aattttgttt ctaaaatatg aataaatatg 1141 gatgagacta ttgacaaatt ataaaaacta tgatatactg aattcaccat cgggctgaca 1201 gtgcttgttt gtccgaaaat tattattttt atggaggaaa atccaatgaa aaagttcctt 1261 gcgattctgc tggtgctttg tatgttgatt tcttctgtgg tagtagtttc cgcagagggt 1321 gtcgaagatt ttacaaagta cgttaagaaa aaggcagaat tctcctttac gactggccag 1381 gcagtaactc ctggcgccat catgttcact ccgaacttca aggatggcga aaccgtcaac 1441 ctcaacgact ataagtacgt tgatctggca atctacgcct acaatgctga ggcagctgct 1501 aacgtcacca tg // LOCUS sequence358 1507 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence358 VERSION sequence358 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1507 /mol_type="genomic DNA" /organism="" /note="sequence358" CDS complement(155..775) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGKFWKVLAGLGVAAATAGVVLSLAKKKNEEVYDEFDLEEDLCEG CEDENCDACKCEDCACEDDCSECECDEDCEECDCYIDFEEADEEDIGLDIKDAVNSVID GVMGGIVIAADKVSELAGKLADTVSNKLVERQEAAMFDMDDCDFDCDCEECEDECCCGC CGEACEEACEVVVETCGDVSDAIEEAAEAVEEAVVEATEETAE" /locus_tag="LOCUS_8660" /note="MGA_1286" CDS complement(839..1468) /product="16S rRNA (uracil(1498)-N(3))-methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003430913.1" /transl_table=11 /codon_start=1 /translation="MRLGDEIVLCYDRCDYICEILKISDEAVITKVLSHKPSSEPTIDL TLYMAMPKLDKLETVIQKSVELGAVKIVPVLTSRCVARPEKQQFSKKLERLQRISLEAA KQSGRGIIPEVSDIISLDECISQMSELDLALVLYENGGKPLNAFSYPDCGSVGVFVGSE GGFDKAEIERCLDNGIEAVWLGERILRCETAPLAAISIIMHLTGNI" /locus_tag="LOCUS_8670" /EC_number="2.1.1.193" /note="WP_003430913.1 16S rRNA (uracil(1498)-N(3))-methyltransferase (Clostridioides difficile) [pid:34.9%, q_cov:97.1%, s_cov:82.9%, Eval:1.9e-27]" /note="MGA_1287" ORIGIN 1 acccgccaaa aatatctgca gttagcgagc aagtgacgct ccggggcacc tgctcggacg 61 gctccgccac ccttcgcaga cgcccctccg ctccaaatcc aacaaaaaaa cgggaaccca 121 cacaggttcc cgttttcctc ttacttttca aaaattactc tgcagtttct tcggttgctt 181 caacaactgc ttcttcaaca gcctcggcag cctcttcaat tgcatcgcta acgtcgccgc 241 aagtctcaac aacaacttcg caagcttctt cgcaagcttc gccgcagcat ccgcagcagc 301 actcgtcttc acattcttcg caatcgcagt cgaaatcgca gtcgtccata tcgaacatag 361 cagcttcctg tctttcaacc aacttgttgg aaacggtgtc tgcaagcttg cctgcaagct 421 cactcacctt gtcagcagcg ataacgattc cgcccataac gccgtcgata acagagttta 481 cagcgtcctt aatatcaagg ccgatgtctt cttcgtcagc ttcctcgaag tcgatgtagc 541 agtcgcactc ttcacagtct tcgtcgcatt cgcattcaga gcaatcatcc tcgcaagcac 601 agtcttcaca cttgcaagcg tcgcagtttt catcttcaca gccttcgcag agatcctctt 661 caaggtcgaa ttcgtcgtaa acttcttcgt ttttcttctt agccaaggaa agaacaacgc 721 ctgctgttgc agcggcaacg cccaaacctg ctaatacctt ccaaaactta cccataataa 781 cagctccttc gctatatttt tctttatttt agcatatata tccgataatt gcaagtgctt 841 aaatattccc cgtcaggtgc ataataattg aaattgccgc aaggggtgct gtttcgcatc 901 gcaaaattcg ctcgcccagc caaacagctt caatgccgtt atcaaggcac cgctcaattt 961 ccgccttatc aaatccgccc tctgagccga cgaaaacgcc aacacttccg cagtcgggat 1021 aggaaaacgc attcaaaggc ttgccgccgt tttcatataa aaccagcgcc aaatcaagct 1081 cgctcatctg cgaaatgcac tcatcaaggc ttattatgtc cgaaacctcg ggaatgatac 1141 cgcgtcccga ctgcttcgct gcttcaaggg agatcctttg aagtcgctca agcttttttg 1201 aaaactgctg tttttcggga cgagcaacgc atcttgatgt caacacaggc acgattttaa 1261 ccgcacccaa ctctaccgac ttttgaataa ccgtttcaag cttatccagc ttcggcatcg 1321 ccatatacag cgtcaaatca attgtaggct cgcttgatgg cttatgcgat aaaaccttcg 1381 taatgaccgc ttcatcgctt attttgagaa tctcgcatat gtagtcacat ctgtcataac 1441 aaagaactat ctcatcgccc aatcgcatac ggagcgacct tccgatgtgt cttgcatcat 1501 cgcccgt // LOCUS sequence359 1503 bp DNA linear BCT 21-JUN-2023 DEFINITION . ACCESSION sequence359 VERSION sequence359 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1503 /mol_type="genomic DNA" /organism="" /note="sequence359" CDS 52..450 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLQEKYKDAAKTLETSLELIQCIFKDNEVMPPIHHREHGDLYMLL AESYLKDDDTDKALLYLEKMVDYDLNDYATIDSNTPTKSPLLNLIPHGLYRKCIDRHRD LMIKLTDSRFDSLKVNNGYQKLVERASK" /locus_tag="LOCUS_8680" /note="MGA_1288" CDS complement(558..776) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIINGQADVLRSEGEAFGEKLRRAGVEVTALRAQGIIHDFVMLNS LDQTNACRTAMDASTAWINRKNQSDTF" /locus_tag="LOCUS_8690" /note="WP_002303627.1 alpha/beta hydrolase (Enterococcus) [pid:65.2%, q_cov:91.7%, s_cov:21.0%, Eval:2.3e-18, partial hit]" /note="MGA_1289" ORIGIN 1 cagtatcttg aaggaatgtt gaatataacc gcacgattgg caaaaagtta tatgcttcaa 61 gagaaatata aagatgccgc taaaaccttg gaaacatctc ttgaacttat acaatgtatt 121 ttcaaggaca atgaagttat gccgccgatt catcaccgtg agcacggaga tctgtatatg 181 cttcttgcag aaagctatct gaaagacgat gataccgaca aagcattatt gtatcttgag 241 aaaatggtcg attacgattt gaacgattat gcaactattg atagtaacac accaactaag 301 tctccgcttt taaatttaat tcctcacgga ttgtatcgaa agtgtattga tcgtcatcgg 361 gatttaatga tcaagcttac tgactcacga tttgatagtt tgaaagtaaa taatggctat 421 cagaaattag ttgaacgggc aagtaaataa tccgcgcctc cgatagggaa gatccttgtc 481 ggaggctatt ttcacgcgga ctaatgacag gatcggattc ttcgccttca aaattggtat 541 gcggtaaacg atagcctcta aaatgtgtca gattgatttt tacggttgat ccacgcggtt 601 gatgcatcca tggccgtgcg gcaggcattt gtctgatcca aagaattgag catcacaaaa 661 tcatgtatga taccttgtgc tcgcaatgcg gttacctcca cgcctgcccg gcgaagcttt 721 tcgccaaacg cctctccctc actgcgcaaa acatccgcct gcccattgat gatcatcgtt 781 tgcggcaagc gccttaaaca atcgagagtt gcgcgaagag gggatgcggt gatttgattt 841 cgttcctcca tggaggttgt gtattgacgc cagaaccact tcattccctc acgataaaga 901 taataaccca ccgcaaattc acaatagctc ggcgtgttaa aacaggcgtt ggtcaccggg 961 taatatacca gtaatttgtg aatgtcgggt ccccggcgca tccccgacat cagcgccata 1021 ccgattgcca tatttccgcc gacgctgtcg cccgcaaccg tgattgtgtg gcgattgatc 1081 gtggaacagc gattgcctat gatctcccat aggtgggata ggataaagta acactgctcg 1141 atggcagtcg gatatttcgc ttcaggcgat cgcgaatatt cggggaatac gacaagagaa 1201 tttgttcttg cacaaagctc cctgaccagc ttttcgtgcg tatgaaagct gccgaacacc 1261 cagccggcac cgtgaatata aaatatcacg tttctgatcg ctgtatcttt tggcgcaaca 1321 aaatatacag gtatactgcc ccagccttca gtgttaatgt agtttgagga tatatcggca 1381 ggatatttat atacaggcat atcctgcgcc gcttccaata cttggcgacc ttgcccgggc 1441 ggcagctgaa aaatcagtgg cggaactgag ttttgctcgc agaccgcttc tgcggcaggc 1501 tcc //