LOCUS sequence001 10729 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence001 VERSION sequence001 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..10729 /mol_type="genomic DNA" /organism="" /note="sequence001" CDS complement(679..1770) /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002902455.1" /transl_table=11 /codon_start=1 /translation="MLNNGDIILSVKDLHVKFSLRGKVLNAIRGISLDLHKGESLAIVG ESGSGKSVFTKNFIGLLDKNGWVDSGEIWYYGLEEGPVDLATYKTEEQWQHIRGKEVAM VMQDPMTSLNPLKTIGWQIEEALKLHQGLQGEDAKKKAVEILSDVGILEPERRAKQYPH EFSGGMRQRVVIAIAMACNPQILICDEPTTALDVTIQAQILQLIRNLKEKYGLTTIYIT HDLGVVANVADRIAVMYAGDIVEVGTCEEVFYDPRHPYTWALLSSLPQLGIKGSDLYAI KGTPPNLFNEIRGDAFAPRNPHPLKIDFLYRPPYFDVSPTHKARTWLLDPRAPKVDPPE IISHIRNIRLDTMEQQAKGGEQA" /locus_tag="LOCUS_0010" /note="WP_002902455.1 ABC transporter ATP-binding protein (Streptococcus) [pid:58.0%, q_cov:95.0%, s_cov:95.8%, Eval:4.2e-113]" /note="MGA_2" CDS complement(1786..3483) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSKFSPSEKLTKKIENSQEEFLKKHGILAAELLDDNLNEQQIASL DPALFDLAIVDESEAERTGYSNYSYWGSTVRMFFKNKVAVFNLIVMLVLVLFTFIQPHL PNQIDPNLVNYYDSKAVWYVVDSDGSFTVDGMKRTQGDYVQVPGSDEILAYIQAPADWG TPVAIAYDEEGEETELDVQADPANSGWYWTLLKKDAPYLAILSEDLTASTYYNAVWLTV TGDKNAVYSSGVKQTAGELITDVPDGKSLAYVSAPDSWGVPKLKAQGSLNGSDAEYVSL KAVEDEDGWFYGFFPTEKNTLILTSEDGSQKGMNRATVSIGLPQEAKIVKGFIENKPPN KVYWFGTNDIGQDLWARMWAGTRTSLFIGIVVAVIEAIIGILAGLLWGYVRKLDFLFTE MYNLIDNIPSTIILLLAAYVMRPGIRTIIIAMSLTRWIGLARFIRNQVLIIRDRDFNLA SRCLGTPTRRVITRNLLPQMVSVVMLRMALAIPDAIGSEVFLSYINLGLPISIPSLGNL INKGRTMMMAPSLRYQLFIPAIILSIITICFYLVGNAFSDAADPKNHV" /locus_tag="LOCUS_0020" /note="WP_002893621.1 ABC transporter permease (Streptococcus sanguinis) [pid:38.1%, q_cov:40.0%, s_cov:72.7%, Eval:1.2e-46, partial hit]" /note="MGA_3" CDS complement(3480..4421) /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002293573.1" /transl_table=11 /codon_start=1 /translation="MLKYSIKRLARSLITLIILITIVFALLRFMPEEGYFNNYEKMSPA QIELGLIKMGLKDPLYVQVGRFIRNLLQGDLGVSYRYRVNSPIARIIAPKIAISAKLGI ICMAISLPLGLALGVLMARYKGRFWDRLGNAYIVFIQAVPNAVYFIFIQLYGSTWLKIP MLYNENDWRTLILPTISLALPSISSYAMWLRRYMVDETNKDYIKLARAKGVPNTTIWFR HVFRNAVVPIVNLIPGSLLMTISGSIYTESFYSIPGMGGLLVDVIKRQDNNMVMVLVVL FAAVGILGLLLGDIAMALVDPRISFTKKEGSR" /locus_tag="LOCUS_0030" /note="WP_002293573.1 ABC transporter permease (Enterococcus) [pid:31.4%, q_cov:99.7%, s_cov:98.4%, Eval:7.0e-42]" /note="MGA_4" CDS complement(4518..6554) /product="peptide ABC transporter substrate-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000748873.1" /transl_table=11 /codon_start=1 /translation="MNTKKILAVLLALAMIFSMAACTNSGETTPEPSGEGEGTEAGTGP DGRTYAAEQVYRTLYSSEMTTMNYLVSGTTYELEVGANTIDSLVENDTYGNIVPCAAES WEESEDGLTWTFHLRPDQHWYDTDGNEMAPVTANDYVAAARYVCDSANDCSNSYLMDGW IVNATELLEYTAAKLVAVPAGTEGEDDEYVVDDAGVIYEITDNGYEEVPAVAPEDLGVV AVDDLTLEYHLEKARPYFLTVLQFGTYWPAPAELLEQLGTDYALDNESMWFNGAYILQT AQPQQKRVYVKNEHNWDAEHIYIERIEETYNQEAATLAPEMFLRGEVDSADIGSDIVAD WLSDPEKSNMVCTSRIVGDYSYFFGFNFEPKFDEQYEPENWIKAVNNENFRKCIFHAID REAYLTAKYPGDDPHMHMINTITPLGFATYEGKDYVNYGGLAKYTENDSFDEALALEYR DKAKAELEAAGATFPIKMPINYNPSSTTWGNCTVVLEQQLEDLLGSDFVDVIVVEFSGN SFLNETRRNGNYAIQELNWGADFMDPETWADPFDRENSYNFFCHDTDSYRVFQDTKSAE TNALIDEYFRLCDYARTCVDDFDERYEAFAAAESFYLDHAIVVPGFISGGSYQATKLNG FEGQYAMMGQSSSRFKGQHVYNEAMSQEMYEEQYEAWLEALGK" /locus_tag="LOCUS_0040" /note="WP_000748873.1 peptide ABC transporter substrate-binding protein (Streptococcus pneumoniae) [pid:26.2%, q_cov:92.6%, s_cov:93.4%, Eval:1.2e-56]" /note="MGA_5" CDS 6832..8583 /product="threonine--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009888359.1" /transl_table=11 /codon_start=1 /translation="MTIIRQNTPFETAEEKKIFWETSSQIMAQALLRLYPDVKFAIGPA IDNGFYYDIDLGQRLTDADLSQIEDEMRRIVREDLPIVCRPVTRMEALGEAVAKNQPYK IEIINSLPQDVQLTFFDDGEFSDLRVGPLLERTSQVRAFKLMSIAGAYWRGSEKNKMLQ RIYGISFPKPSMLDEYLQNLVEAKRRDHRKIGREMDLFMFPAEGPGFPLYLPKGMVIRN ELMSFWKELHSEKKYNEIRTPIILNEDLWHTSGHWDHYKEHMYFTEIDGDPYAIKPMNC PGALLAYKRRMYSYRDMPVRLSELGHVHRHEPSGSLHGLMRVREFTQDDAHIFMLPEQV KGELKDIIKLIDDIYSVFGFSYKVVLATRPQNAIGSAEDWTRAQDALKEAVEDLGIEYD IAPGGGAFYGPKLDFHLRDCIGRTWQCGTVQLDFQLPQRFDLTYTGADGEKHRPVMIHR TVFGSIERFMGVLIEHFEGKLPLWLAPVQVKIVSVSEKYNEAAWKLADEMEAAGLRTEV DARNEKTGYKVREAILARDSYIIVVGEKEASTDMLTVRSSKAGDMGEFPKAEFIAMLQK EIAEKAL" /locus_tag="LOCUS_0050" /gene="thrS" /EC_number="6.1.1.3" /note="WP_009888359.1 threonine--tRNA ligase (Clostridioides difficile) [pid:56.6%, q_cov:98.1%, s_cov:89.5%, Eval:1.6e-198]" /note="MGA_6" CDS 8834..9214 /product="GntR family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011987070.1" /transl_table=11 /codon_start=1 /translation="MIQLDLKSRKSIYEQIMDGFKELIALGVLHAGDKLPSVRELSRTL TVNPNTIQKAYRQLEADRYIYTVSGLGCFVSEKPEDPDLGKAAAIYEVIEDNVKQLRYL GISDEEIRGKLEEIACRKEEKG" /locus_tag="LOCUS_0060" /note="WP_011987070.1 GntR family transcriptional regulator (Clostridium botulinum) [pid:40.7%, q_cov:93.7%, s_cov:93.7%, Eval:1.9e-20]" /note="MGA_7" CDS 9211..10113 /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003385582.1" /transl_table=11 /codon_start=1 /translation="MINVKGLCKQFDGFQALNDLNVNVEKGSIYGLIGVNGSGKTTLIR HLTGVLKPDTGSVQMDGQDVYDNVELKKRLGYIPDELFFFGSYSLKSMRDFYKGVYPNW DDARYEMMLQDFGLPERGKIAKFSKGMQKQAQFILTMSCRPDFLILDEPIDGLDPIVRK KVWKYVVDDVAERQMTVLVSSHNLKEMEGICDAIGILSKGEMKIEQDLDELKSDIHKVQ AAFHNAEDAEKAFAGLNVVHREKSGSIEHLIIRGAREDVEKAVYAADPIIFDILPLSLE EVFIFEMGGENDDIQSILA" /locus_tag="LOCUS_0070" /note="WP_003385582.1 ABC transporter ATP-binding protein (Clostridium) [pid:33.7%, q_cov:98.0%, s_cov:98.7%, Eval:2.3e-55]" /note="MGA_8" ORIGIN 1 ccgcgatccg gtccgtgatg aaccgcatga ccgacaggtc gtgggcgatg aagagatagg 61 tgagacctct ctctttctgc agcttgctca tcaggttgag cacctgcgcc cggatggaga 121 cgtccagcgc ggagatcggc tcgtctgcaa tgatgaactc aggctccatg acgaaggaac 181 gcgccatgcc gacacgctgc cgctgaccgc cggagaactc gtgggggaag cgggtggcga 241 actcgggcag cagtcctacg tcggacagcg cctgggagac gcgttcctcc cgctcctcct 301 tcttcatgtc cggatggacg ttcattaagc cttcggaaac gatgtagtcc accttggcgc 361 gttcgttcag cgatgccatc gggtcctgga agatcatctg gatcttctgg gtcaccatct 421 tatccatctc tttggagatc ttgccggaga tgcgttctcc cttgaacagg acttctcccg 481 cggagatggg attgatgcgg atgatggcgc ggccgatcgt ggtcttgccg gagccggatt 541 cgccgacgag gccgaaggtc tcgcctttgt agatgtcgaa gtttacgccc ttgacggcca 601 cgaaggcctt gcggcccttg ccgaacgtca cttccatgtt ccgcacggag cagagcactt 661 ctcttccttt gtagtcgatc atgcctgctc acctcccttc gcctgctgtt ccatggtgtc 721 cagacggatg ttgcggatgt gactgatgat ctccggcgga tccaccttcg gcgctctcgg 781 gtccagcagc caggtcctgg ccttgtgggt cggggagacg tcgaagtagg gcggccggta 841 caggaaatcg atctttaaag gatgcggatt tctcggcgca aacgcgtcgc cgcggatctc 901 gttgaagagg ttcggcggtg ttcccttgat ggcgtacaga tcgcttccct tgatgcccag 961 ctggggcagg gaggacagca gcgcccaggt gtagggatgc cgcgggtcgt agaacacctc 1021 ttcgcaggtg cccacctcca cgatgtcgcc ggcgtacatg acggcgatcc ggtcggccac 1081 gttggctacg acgcccaggt cgtgggtgat gtagatggtc gtaagaccgt acttttcttt 1141 taagttgcgg atgagctgca ggatttgggc ctggatcgta acgtccaggg ccgtggtggg 1201 ctcatcgcag atgaggatct gcgggttgca ggccatggcg atggcgatga cgactctctg 1261 gcgcatgccg ccggagaact cgtgggggta ttgcttggcg cggcgctcgg gttcgaggat 1321 gccgacgtcg gagaggatct ccacggcttt cttcttcgcg tcttcgccct gcagcccctg 1381 gtggagcttt aaggcttctt cgatctgcca acctatggtc ttcaaggggt tgagggaggt 1441 catcggatcc tgcatgacca tggcgacctc cttgccccgg atgtgctgcc actgctcctc 1501 agtcttatac gtcgcgaggt ccacgggacc ttcttccagt ccgtaatacc agatctctcc 1561 tgaatccacc cagccgttct tgtcgagcag gccgatgaag ttcttggtga agacggattt 1621 gccggagccg gactcgccga cgatggccag ggattcgccc ttgtgcagat ccagggagat 1681 gccccggatc gcattgagca cttttccgcg gaggctgaat tttacatgca ggtctttgac 1741 ggaaagaatg atgtctccat tgttcaacat gtctttgcct cctttctata cgtggttctt 1801 cgggtcggcg gcgtcggaga aggcgttgcc caccagatag aagcagatgg tgatgatgga 1861 caggatgatg gcggggatga acagctgata ccgcagcgac ggcgccatca tcatggtgcg 1921 gcccttgttg atcaggttgc ccagcgacgg gatcgagatg gggagcccca ggttgatgta 1981 actgaggaac acttccgaac cgatcgcgtc ggggatggcc agggccatgc gcagcatgac 2041 cacggagacc atctgcggca gcaggtttct cgtgatgacc cgtctcgtag gcgtgcccag 2101 gcagcgggac gccaggttga agtcgcggtc gcggatgatc agcacctggt tgcggatgaa 2161 ccgtgccagt ccgatccagc gcgtaaggct catggcgatg atgatcgtcc tgatgcccgg 2221 ccgcatgacg taagccgcca gcagcaatat gatggtgctg gggatgttgt cgatcaggtt 2281 gtacatctcc gtaaacagga aatccagttt gcggacgtaa ccccacagca ggcctgccag 2341 gatgccgatg atggcttcga tgacggctac gacgataccg atgaacagag acgttctcgt 2401 accggcccac atgcgggccc acaggtcctg cccgatgtcg ttcgtgccga accagtagac 2461 cttgtttggc ggtttgtttt cgataaagcc cttgacgatc ttcgcttcct gcggcaatcc 2521 gatggagacc gttgcccggt tcataccctt ctggctgccg tcctcggagg tgaggatgag 2581 ggtgttcttc tccgtgggga agaagccgta gaaccagccg tcttcatctt ccactgcctt 2641 cagggagaca tattccgcat cgctgccgtt taaggagccc tgtgccttca gcttgggaac 2701 gccccagctg tcgggtgcgg atacgtaggc gaggctcttg ccgtcgggca cgtcggtgat 2761 gagctctccc gccgtctgtt tgacgccgga ggagtagacc gcgttcttgt cgcccgtcac 2821 cgtgagccag accgcgttgt agtatgtgct cgctgtcaga tcttcggaca ggatggcgag 2881 gtagggcgcg tccttcttca ggagggtcca gtaccagccg ctgttggcgg ggtcagcctg 2941 gacgtccaac tccgtctctt cgccttcttc gtcgtaggcg atggcgacgg gtgtgcccca 3001 gtcggcaggc gcctggatgt aggcgaggat ctcgtcgctg cccggtacct gaacgtagtc 3061 gccctgggtg cgcttcatgc cgtcgacggt aaaggatccg tcgctgtcca ccacgtacca 3121 gaccgctttg gaatcgtagt agttgaccag gttcgggtcg atctggttgg gcaggtgagg 3181 ctggatgaag gtaaacagca ccagcacgag catgacgatg aggttgaaca ccgccacctt 3241 gttcttgaag aacatccgga cggtggaccc ccagtaggaa tagttggagt agccggtccg 3301 ttccgcttcg ctttcatcca cgatggccag atcgaacagc gccggatcca gagaagcgat 3361 ctgctgctcg ttcagattgt cgtccagcag ttccgcggcc agaatgccgt gctttttgag 3421 gaattcttcc tgggaattct cgatcttttt cgtgagtttt tcagagggag agaatttgct 3481 catctggatc cctccttttt cgtaaagctg atgcgtgggt caaccagcgc catggcgata 3541 tcgcccagca gcagtcccaa gatgcccacg gccgcaaaca gcacgacgag caccatgacc 3601 atgttgttgt cctggcgttt gatgacgtcc accagcaggc cgcccatgcc gggaatggag 3661 tagaaggatt ccgtataaat ggagccggaa atggtcatga gcagggagcc ggggatgagg 3721 ttgacgatgg gaacgaccgc gttgcggaac acgtgccgga accagatggt ggtgttgggc 3781 acgcctttgg cgcgggccag tttgatgtag tccttattgg tctcgtccac catgtaccgc 3841 cgcagccaca tggcgtagct ggagatggaa gggagggcga gcgaaatggt gggcaggatg 3901 agtgtccgcc agtcgttttc gttgtacagc atggggatct tcagccaggt ggagccatac 3961 agctggataa agatgaagta gaccgcgttc ggtacggcct ggataaatac gatgtaggca 4021 ttgcctaaac ggtcccagaa tctgcccttg tagcgggcca tcagcacgcc cagggcaagt 4081 cccagcggca agctgatcgc catgcagatg atgcccagtt tcgcggagat cgcgatcttc 4141 ggtgcgatga tcctggcaat gggggagttg accctgtaac ggtacgatac gcccagatcg 4201 ccttgcagca gattgcggat aaagcggcca acctggacgt agagaggatc cttcagaccc 4261 attttgatga gtccgagttc gatctgcgcc ggggacatct tctcgtaatt gttgaaataa 4321 ccttcctctg gcatgaaccg cagcaaggca aatacgatgg tgatcagtat gatcagcgtg 4381 atgagggacc gtgcaagtct tttgatggaa tacttcagca cgttgcgtct cctttgtaaa 4441 atcagaggag cggccgtgct ccgtgtgggg gcagagccgc tcctgatggt tcgtttagtt 4501 ttccttgtca gtaaggatta cttgccgagc gcttccagcc aggcttcgta ctgttcttcg 4561 tacatttcct gagacatcgc ttcgttatag acgtgctgtc ccttgaatct gctggaagac 4621 tggcccatca tggcgtactg gccttcgaag ccgttgagct tcgtagcctg gtaggaaccg 4681 ccggagatga agccggggac cacgatcgca tgatcgaggt agaaagattc ggctgctgcg 4741 aaggcttcgt atctttcgtc gaagtcgtcg acgcaggtac gggcgtagtc gcacagtctg 4801 aagtattcgt cgatcagggc gttggtctct gcggacttgg tatcctggaa gactctgtag 4861 gagtcggtgt cgtggcagaa gaagttatag gaattctctc tgtcgaacgg gtcggcccag 4921 gtctcgggat ccatgaagtc ggcgccccag ttcagttcct ggatggcgta gttgccgttt 4981 cttctggtct cgttcaggaa ggagttgccg gagaattcga cgacgataac gtcgacgaag 5041 tcggagccca gcaggtcttc cagctgctgc tcgagaacga ccgtgcagtt gccccaggtc 5101 gtggagctcg ggttgtagtt gatcggcatc ttgatgggga atgtagcgcc ggccgcttcc 5161 agttccgcct tggccttgtc tctgtattcc agagccagcg cttcgtcgaa gctgtcgttt 5221 tcggtgtatt tggccagacc gccgtagttg acgtagtcct tgccctcgta agtggcgaag 5281 cccagcgggg tgatggtgtt gatcatgtgc atatgcggat cgtcgccggg atacttcgca 5341 gtgaggtacg cttctctgtc gatggcgtgg aagatgcact ttctgaagtt ttcgttgttg 5401 acggccttga tccagttttc aggttcgtac tgctcgtcga acttcggctc gaagttgaat 5461 ccgaagaagt aggagtagtc gccgacgatg cggctggtgc agaccatgtt gctcttctcg 5521 gggtcactca gccagtcggc tacgatatcg gaaccgatgt cggcggagtc gacttcgcct 5581 ctgaggaaca tttcgggagc cagcgtggca gcttcctggt tgtaggtctc ttcgatgcgc 5641 tcgatataga tgtgctcggc atcccagttg tgctcgttct taacgtagac tctcttctgc 5701 tggggctgag cggtctgcag gatgtacgcg ccgttgaacc acatggattc gttatccaga 5761 gcgtaatcgg tgccgagctg ctcgaggagt tcggccggtg cgggccaata ggtaccgaac 5821 tgcagtacgg tgaggaagta gggacgggcc ttctccagat gatactcgag agtgaggtcg 5881 tctaccgcta cgacgcccag atcttccgga gcgacggcgg gaacttcttc gtaaccgttg 5941 tcggtgatct catagatgac gccggcgtcg tccacgacgt attcgtcatc ttcgccttcc 6001 gtgcctgccg gtacggcgac cagttttgca gccgtgtatt ccagcagttc ggtggcgttt 6061 acgatccagc cgtccatcag atagctgttg ctgcagtcgt ttgcggagtc gcagacatag 6121 cgggctgcgg ctacgtagtc gtttgcggtg acgggggcca tctcgttgcc gtccgtatcg 6181 taccagtgct gatccggtct caggtggaac gtccaggtga ggccgtcttc gctctcttcc 6241 cagctctcgg ctgcgcaggg aacgatgttg ccgtaggtgt cgttttccac gagggagtcg 6301 atggtgttgg cgccgacttc cagctcatag gtggtgccgc tcaccagata gttcatggtg 6361 gtcatctcgc tggaatacag cgtgcggtag acctgttccg ctgcataggt gcggccgtcc 6421 ggaccggtac cggcttccgt accttctcct tcgccgctgg gttccggagt cgtctctccg 6481 gaattcgtgc aggctgccat ggagaagatc atggccagtg ccagaaggac tgcaaggatt 6541 ttctttgtgt tcatatcaga ttttcctcca atctttccgt cctgttccgt tccgatacac 6601 ggggaagggg acaggaccgt ttacacagga gcagacaggc tgctcctggt caattatact 6661 acaatattca gtgagaaaac agtaaatata caaaaatatc ttcctccctt gtgttttata 6721 aataaatgta tgcgaattcc tttggtgaaa tcgcaaaacc gtcttttctt gattttggcg 6781 accggaatcg ttatagtaaa tagtggaact atcttggatg gaggccggca tatgacgatc 6841 atcagacaga acacaccttt tgaaacagcg gaggaaaaga agatcttctg ggagaccagt 6901 tcccagatca tggcgcaggc gctgctgcgg ctgtatccgg acgtaaaatt tgcgatcgga 6961 cctgccatcg acaacgggtt ttattacgat atcgacctgg gtcagcgact gacggacgca 7021 gatctctcgc agatcgagga cgagatgcgg cgcatcgtgc gcgaagacct tccgatcgtc 7081 tgccgcccgg tgacccgcat ggaagctttg ggcgaagcgg tcgccaagaa ccagccctat 7141 aagatcgaga tcatcaacag cctgccgcag gatgtgcagc ttacgttctt cgacgacggc 7201 gaattctccg acctgcgggt tggaccgctg ctggaaagaa cgagccaggt gcgggctttc 7261 aagctgatga gcatcgcagg cgcctactgg cgcggcagcg aaaaaaataa gatgctgcag 7321 cgcatctacg gcatctcgtt ccccaagccc agcatgctgg acgagtatct gcagaatctg 7381 gtggaggcca aacggcgcga ccaccgcaag atcggccggg agatggatct gttcatgttc 7441 cccgcggaag gccccggatt cccgctgtat ctgcccaagg gcatggtcat ccgcaacgag 7501 ctgatgtcgt tctggaagga actgcacagc gaaaagaaat acaacgagat ccgcacgccc 7561 atcattctga acgaagatct ctggcatacc agcggtcact gggaccacta caaggagcac 7621 atgtacttta cggagatcga cggcgatccc tatgccatca agcccatgaa ctgccccggc 7681 gcgctgctcg cctataagag aaggatgtac tcctaccggg atatgccggt tcgcctctct 7741 gaattgggtc acgtgcaccg gcacgaaccc tccggcagcc tgcacggtct gatgcgggtg 7801 cgggaattca cccaagacga tgcccatatc tttatgcttc ccgagcaggt gaagggggaa 7861 ctgaaggaca tcatcaaact gatcgacgac atctattccg tgttcggctt ttcctataaa 7921 gtcgtgctgg cgacccgccc gcagaacgcg atcggcagcg ccgaagactg gacgagagcc 7981 caggacgcgc tgaaggaagc ggtggaggat ctcggcatcg aatacgacat cgcccccgga 8041 ggcggcgcgt tttacggtcc gaaactggat ttccacttaa gagactgcat cggacgcacg 8101 tggcagtgcg gtaccgtaca gctggacttc cagctgcccc agcgcttcga cctgacctat 8161 accggtgcgg acggcgaaaa gcacagacct gttatgatcc accgcaccgt gttcggcagc 8221 atcgagcgct ttatgggcgt gctcatcgaa cacttcgaag gcaaattgcc gctgtggctc 8281 gctccggtac aggtaaagat cgtatccgtg tcggagaagt acaacgaagc ggcctggaaa 8341 ctggcggacg agatggaagc tgcgggcctt cgcaccgagg tggacgcgcg gaacgaaaag 8401 acgggctaca aggtgaggga agcgattttg gcgcgtgact cctacatcat cgttgtcggc 8461 gaaaaggaag cctccacgga tatgctgacg gtccgctcct ccaaagcggg cgacatgggc 8521 gagttcccga aagcggagtt tatcgcaatg ctgcagaagg agatcgccga aaaagctttg 8581 tgatcgcggc ggacgggagt taatgaacaa gaattaatta aaatatttgt gcatttcaca 8641 cgaaaattta ttgacaaatc cagtttttta aagatataat gcttgcagtg cagcagctcc 8701 aaccctgttg ccgttgaata cacacagcaa aagtcccgga ttcagttccg gggtttttgt 8761 tttttgcgtt aacttcttct tgacactgta ctatgtgacg tagtacagtt agtacatcaa 8821 aaggaggtac gccatgatac agttggatct gaaaagccgg aaatccatct acgaacagat 8881 catggacggc tttaaggagc tcatcgccct cggcgtcctt catgcagggg acaaactgcc 8941 ctccgtacgg gagctctccc ggacgcttac cgtcaatccg aacaccatcc agaaggcata 9001 ccgccagctg gaagccgacc ggtacatcta caccgtatcg ggcctgggct gcttcgtttc 9061 ggaaaagccg gaggatccgg atctgggcaa ggcggccgcc atctacgagg tcatcgaaga 9121 caacgtaaag cagctgaggt atctggggat ctcagacgaa gagatccgcg gaaaactgga 9181 ggagatcgcc tgcagaaagg aggagaaggg atgatcaacg taaaaggatt gtgcaagcag 9241 tttgacggct tccaggcact caacgacctg aatgtaaacg tggagaaggg ctccatctac 9301 gggctgattg gggtcaacgg aagcggcaag acgacgctca tccgccatct gacaggggta 9361 ctcaagcccg acacgggcag cgtacagatg gacggacagg acgtgtacga caacgtcgag 9421 ctgaagaaga ggctggggta catccccgac gagctgttct tcttcggttc ctacagttta 9481 aagagcatgc gggatttcta caaaggcgtc tatcccaact gggacgatgc ccggtacgaa 9541 atgatgctgc aggatttcgg tctgcccgaa cggggcaaga tcgccaagtt ctccaagggc 9601 atgcagaaac aggcgcagtt tatcctgacg atgagctgcc ggccggattt tctcatcctg 9661 gacgagccca tcgacggtct cgaccccatc gtccgcaaga aggtatggaa atacgtggtg 9721 gacgacgtgg cggaacggca gatgaccgtg ctcgtgagct cccacaacct gaaggagatg 9781 gagggcatct gcgacgccat cggcatcctg tccaagggcg agatgaagat cgaacaggat 9841 ctggacgagc tcaagtccga catccacaag gtgcaggcgg cgttccacaa cgcggaagac 9901 gccgaaaagg cctttgccgg gctcaacgtg gtgcaccgcg aaaagagcgg cagcatcgag 9961 cacctgatca tccggggcgc gagggaagac gtggaaaagg ccgtctatgc ggctgacccc 10021 atcatcttcg acatcctgcc gctgtccctg gaagaagtgt ttatctttga gatgggaggt 10081 gaaaacgatg acatccagag catcctggct taacgtttct ctcattaagg agaattttaa 10141 acggttctgg cccatcatgt gcggcgggtt cctgttctgg ctggtctgcg gtcccatcgc 10201 cctcgtcctc accaagagtt cggaaggcta cagctacagc tttatgcgca gcatcctgcg 10261 gcacatcaac ccggcaccga tcctgctcaa cggccttctg ccggtggcgc tggcgctggc 10321 ctgcttcggg tatctgcacc ggacgaattc cgccggggtc atccacagca tgcccttcac 10381 ccgccgcaac ctgtttctca gcaactatgt gagcggtctc gtgatggcgg tgctgccggc 10441 ggcagtcatc tccctcatgc tgctcgcgat gagaggcaac gtggacatcg gctggtacgt 10501 ggacgatccg gtctacttta cgggcatgaa catcttccgc tttttcctgg aggagttcac 10561 cgtcatcgcc ttcgtgtact cgatctcggt gtttgcggcc agcatcagcg gtctgtccgt 10621 catccacgcc cttacggcgg tggcgctcaa cttcatctgc ccggtggtgt acctgttgct 10681 gatgggttat atggacacct acgagtacgg ctttaccgca ggctcgctc // LOCUS sequence002 9212 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence002 VERSION sequence002 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..9212 /mol_type="genomic DNA" /organism="" /note="sequence002" CDS 92..2905 /product="FtsX-like permease family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964141.1" /transl_table=11 /codon_start=1 /translation="MLLRSLLRTIRSTLGRFLAIFAIIALGVGFFIGLRVTHDSMLKTA DDYLTDLLLYDFRLVSTLGLTDEDVNTFARDPAVALSEGSFSIDALIETAKGQDDVLHF HTLLPDVNRVDLVSGRLPETSDEIVLDARYAGPGMVGKTVTLAESNDEDTLKHFGHSSF KVVGTANTSYYVNFERGSTSLGSGKVSGFAYALPAAFDADYYTEVFLRLKDMPSMGSQA YDKAADAQQDRLEGLLEERGQIRYEDLKQEANDKIEEAQAEIDDGWAKIDDGKREIADA ERKLADADRELKDARKELDDGWAELKDAETELADARKELDDAEIELADSRKELDDAKAE LADARQELDDGWKEYEDGKKEYEDGLAEYEKGMSAYRSGRREANEQLAAASKQLDDAQA QLSETRTQLDAAAEQKTTLEQSLPYLEGDKLAEAQTAIGTISEQLAYGEAAYAQGLSEL ESGREAYEAAEASARGQLRSAKRKLDKAKEELDAAALELEDALAELEDGEQEYADGLAE YEDGEQKYADGLAEYEDGLKEYEDGVAEYEDAKKELEDGEAEYQDGLREYQTKSADAAV TIRDAKADIAQAEIDLEEGQKKVDDAREELADLKEPSTYVLGRDKNAGYAALENDTAIV KGIAKVFPLFFFLIAVLVCITTMTRMVDEQRTENGTLKALGYGDAAIISRYLIYSGSAS ILGCFAGFFAGSKFMPFTIWKIYRIMYDIDRPVAFVLDWKMFGICAGLYLLCSLGSTWY VAHGELKEMAAQLIRPKAPEAGKRVLLENVPAIWNRLSFLRKVSIRNIFLYKKRMVMMI IGIGGCTALLLTGFGIRDTISGIVDYQYEEISLYDGDVSFAEDMDEDAQRAFRKEYGDL IEDAVFLAAAKMDVSGKATEEANVICFEEPPEGFVDLHSGDTKLPWPQEGEAVLNYRLA RDLGVTA" /locus_tag="LOCUS_0080" /note="WP_010964141.1 FtsX-like permease family protein (Clostridium) [pid:29.3%, q_cov:98.3%, s_cov:78.1%, Eval:2.4e-109]" /note="MGA_11" CDS 2921..3580 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDSDMRSVDLRVTGVFDNYLFDYVYVSRNTLENAWGTVPETKNAY VDFKEGMEVHQASADLLASDDVLSVSLAADLRSTIGNLLESMDLVVLIVLVCSGALAFI VLYNLTNISITERRREIATLKVLGFFQNETAQYVFRENLILTGIASLFGIPAGLALLHY VMAQIVIKQMYFGCRLAPLSYVWSVLITFAFAVLIDLALRVKIDRIDMAESMKAIE" /locus_tag="LOCUS_0090" /note="WP_112297324.1 ABC transporter permease (Lactiplantibacillus plantarum) [pid:34.4%, q_cov:95.9%, s_cov:24.6%, Eval:1.3e-32, partial hit]" /note="internal stop codon at [2903:2905](+)" /note="MGA_12" CDS 3664..6306 /product="alanine--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009889064.1" /transl_table=11 /codon_start=1 /translation="MKYMGVNELREKFLKFWETKDHLRHASYSLIPENDKSLLLIAAGM APLKPYFSGAQVPPRKRMTTAQKCIRTNDIDNVGHTARHATFFEMMGNFSFGDYFKEGA INWGWEFITSPEWLDIPKEKVWATIYEDDDEAYNIWRDQVGMPAERIVRLGKEDNFWEI GTGPCGPCSEVYYDRGPEYGCGKPDCKPGCDCDRYMEFWNFVFTQFDRQEDGSYVPLAH PNIDTGMGLERMACIMQGVDSIYNIDTMHEILQEVCKLSGVKYQDGAAPTDVSLRIITD HVRTVSFMIGDGILPSNEGRGYILRRLLRRAARHGRLLGIKGAFINDVAEKVFEQYGEA YPELIERKDYIRKIISIEEEKFDQTVESGMSVLEGYMAEAKAAGKTQLSGEQVFKLYDT YGFPIELTQEIAEEQGYTVDEEGFRAHMQAQKDQARAARKAEDNEGWLDESVMFKDYPA TEFTGYDSLAMDAKVLGLVRGMNALKSAGEGEEVRIVLDRTPFYAEGGGQVGDTGLLEA DGFTAAVTDTIKVGNVYVHKAVVTAGEVSVGDTVTACVDALRRHAIARNHTATHLLQKA LRTVLGDHVEQAGSLVNENELRFDFTHFEGISAEDLARVEDIVNAEILKFTDVETKEMP IDEAKKLGAMMLFGEKYGETVRVVNVPDFSMEFCGGTHVANIGQIGCLHIVSESGVAAG TRRIVAVTGSAVNTLLAEEQARIAAAAASLKTNAAGLEKRAEDMAAELKAVKKELEELK AKAAQEGAGDLLKEAKVFGTARLIEHTFEGAGIDQLRSLSDQIKAAEKNVVMVFAAVNG EKATLMVSVTDDLTEKGYHAGNMIKEIAKAAGGGGGGKADMAQAGAKDLAKLPDAFAKA EELMAAKAK" /locus_tag="LOCUS_0100" /gene="alaS" /EC_number="6.1.1.7" /note="WP_009889064.1 alanine--tRNA ligase (Clostridioides difficile) [pid:51.2%, q_cov:98.2%, s_cov:98.2%, Eval:8.8e-260]" /note="MGA_13" CDS 6386..6634 /product="IreB family regulatory phosphoprotein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000348590.1" /transl_table=11 /codon_start=1 /translation="MERKTILFSSPEKPEQRTTEDILKTVYDALEEKGYNAIDQMVGYI LSGDPSYITGHNNARNLIRHIERDDLVEELLRNFLKK" /locus_tag="LOCUS_0110" /note="WP_000348590.1 IreB family regulatory phosphoprotein (Bacilli) [pid:55.1%, q_cov:95.1%, s_cov:88.6%, Eval:3.3e-20]" /note="MGA_14" CDS 6690..7151 /product="Holliday junction resolvase RuvX" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003428279.1" /transl_table=11 /codon_start=1 /translation="MEYGDIFMRILGLDIGDKTIGVAVSDPLFISAQGVTTIERIGVKK DTTKVLEYAKEYEAGTIVSGLPLMLSGEDSPQTQKVREFVEKLQNKARSTGMKLQFVFQ DERFTTKIAEDVLIAADMRREKRKTIIDRQAAVIILQSYLDANRGKLTL" /locus_tag="LOCUS_0120" /gene="ruvX" /EC_number="3.1.21.10" /note="WP_003428279.1 Holliday junction resolvase RuvX (Clostridioides difficile) [pid:51.1%, q_cov:89.5%, s_cov:93.6%, Eval:4.3e-28]" /note="MGA_15" CDS 7175..7762 /product="4Fe-4S dicluster domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459585.1" /transl_table=11 /codon_start=1 /translation="MGRLGFFFNMNTCLGCGACQVACKDLHGLQPGEFFRRVETISVEA GGQKVYAHYSGACNHCEEANCVKACPTGAMHKAADGTVVHDDNLCMGCGSCMWNCPNGA VSFSLTKGVAQKCDACAELRERGYEPACCGACPTRSLKFGDIDELQKEYGVSAAERGFL PIADITDPNLIVKLPANVVKALKGGSAHAEDL" /locus_tag="LOCUS_0130" /note="WP_011459585.1 4Fe-4S dicluster domain-containing protein (Desulfitobacterium hafniense) [pid:49.7%, q_cov:90.3%, s_cov:92.2%, Eval:9.2e-50]" /note="MGA_16" CDS 7746..8942 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MQKIYKYIIVGAGIAAVSAAAGIRETDPDGAILMVGDEAVPAYSR PMLTKTPLRSYELGRTIVYGPEWYKDNKIDLVLGTKVKGIDNSSRLVTLSNGDTFFYNR LIYSAGANGFVPPIKGADLPEVVVIRRYEDILKVKRLSVNTGKAVIIGGGVIGLEAGFE LARYGLDVTVLEALPMLMPRFLDEDCARMLERSIHSFPVYTGVTIEEIAGNGHVESVRL QDGREFPCDLVIMSTGVRADTALAQAAGIKCDRSGILINEKCETSAKDIFACGDCAAYG INWQLWSQALEQGRVAGINAAGGTASIQPTDSSMIINSPEVSMFSCGDVGKDPNKVYTT EVDDNMQPDLFAVNKKFIRSYEKRFYCGEKLVGAIIIGNLARMQELKEQILGIAPREV" /locus_tag="LOCUS_0140" /note="WP_011861274.1 FAD-dependent oxidoreductase (Clostridioides difficile) [pid:31.8%, q_cov:92.2%, s_cov:41.9%, Eval:6.4e-49, partial hit]" /note="MGA_17" ORIGIN 1 ccgaccgcat tataagggtc aacagcggca ccatcctcga acagcgcgtc aacgataccg 61 taacgcccgt cgaagacatc gagtggtagc catgcttctg cgttctcttc tccgcaccat 121 ccggtccacg ctgggcagat ttctggcgat attcgccatc atcgcgctgg gcgtcggatt 181 cttcatcggt ctccgtgtta cccacgattc catgctcaaa acggcagatg attatctgac 241 ggatcttttg ctgtacgatt tccgcctggt ctccacgctg gggcttacgg atgaggacgt 301 taatacgttt gcgcgcgatc ccgccgtcgc actgtcggaa gggtcgttct ccatcgacgc 361 tctgatcgaa acggcaaaag ggcaggacga tgtgctgcat ttccatacgc tgctgccgga 421 tgtcaaccgc gtggaccttg tgagcggcag gctgcccgaa acatcggacg agatcgttct 481 ggacgcccgc tatgcgggtc cgggcatggt aggcaaaacg gtgaccctgg cagagtccaa 541 cgacgaagat acgctgaaac acttcggtca cagcagtttt aaggtcgtcg gcacggccaa 601 cacctcctat tacgtcaact tcgaacgggg ttcaaccagc ctgggttccg gcaaagtctc 661 cggatttgcc tatgcgcttc cggcggcttt cgacgcagat tattataccg aagtattcct 721 gcgccttaag gacatgcctt ccatgggttc tcaggcctac gacaaggcag cggatgcgca 781 gcaggacaga ctggaagggc ttttggaaga acggggccag atccgctacg aagacctgaa 841 acaggaagcg aacgataaga tcgaagaggc gcaggccgag atcgacgatg gctgggccaa 901 gatcgacgac ggaaaaagag agatcgccga cgcggagaga aaactggcag acgccgacag 961 ggaactgaag gacgcccgca aagagctcga cgacggctgg gcggaattga aggacgcgga 1021 gacggagctg gcagacgccc gcaaggaact ggatgacgcc gagatcgaac tggcggattc 1081 gcgcaaggaa ctggatgacg cgaaggcaga actggcggat gcccgccagg aactggatga 1141 cggctggaaa gaatacgagg acggcaaaaa agagtatgaa gacggcctgg cggaatacga 1201 aaaaggcatg agcgcctacc gcagcggccg cagagaagcc aacgaacagc tggccgcagc 1261 ctccaaacag ttggacgatg cccaggcgca gctaagcgaa acacgtaccc agctcgatgc 1321 agccgctgag cagaaaacga ccctcgagca gagcctgccg tacctggaag gggacaagct 1381 tgcggaggcg cagaccgcca tcgggaccat ttccgaacag ctggcctacg gagaagccgc 1441 ttacgctcag ggactgagcg aactggagag cggccgggag gcctacgagg cagcggaagc 1501 gtctgccaga gggcagcttc gctctgccaa gagaaaactg gataaagcca aagaagagct 1561 ggacgccgcg gcgctggagc tggaagatgc gctggcagag ctggaagacg gagaacagga 1621 atatgcagac ggtctcgccg aatacgaaga cggggagcag aaatacgcag acggcctcgc 1681 ggaatatgag gacggtctga aggaatatga agacggcgtc gcagaatacg aagacgcaaa 1741 gaaagagctg gaggacggag aagcagagta tcaggacgga ctcagagaat atcagacaaa 1801 gtctgccgat gcagcggtca ccatccggga cgccaaggcg gacatcgcac aggcggagat 1861 cgacctggaa gaagggcaga agaaggtcga cgacgccaga gaagaactgg cggatctgaa 1921 ggaaccttcc acctatgtcc tggggcgcga caagaatgcg ggatacgccg cactggagaa 1981 tgataccgct atcgtcaaag gcatcgcgaa ggtgtttccg ctgttcttct tcctcatcgc 2041 ggttctggta tgcatcacga cgatgacccg catggtggac gaacagagaa cggagaacgg 2101 cacgctcaaa gcgctgggat acggcgacgc tgccatcatc tcccgctatc tgatctattc 2161 aggcagcgcc tcgatccttg gctgctttgc cggtttcttc gccggctcga aattcatgcc 2221 ctttacgatc tggaagatct accgcatcat gtacgacatc gaccgtcccg tcgcgttcgt 2281 gctggactgg aagatgttcg gcatctgtgc cgggctctat ctgctctgtt cgctgggctc 2341 cacctggtat gtggcgcacg gggaactgaa ggagatggcg gcgcagctca tccgccccaa 2401 ggcaccggaa gcgggaaaac gcgttctcct cgaaaacgtt cctgccattt ggaaccgcct 2461 gagttttctg cgcaaggtct cgatccgcaa catcttcctg tataaaaagc gcatggtaat 2521 gatgatcatc ggcatcggag gctgcaccgc gctgctgctg acaggcttcg gcataagaga 2581 tacgatctcc ggcatcgtag actatcaata cgaggagatc tccctgtacg acggcgacgt 2641 atcgttcgcg gaggatatgg acgaagacgc acagcgggca ttccggaagg aatacggaga 2701 cctgatcgaa gatgccgtct ttctggctgc tgcgaagatg gatgtgagcg gcaaagccac 2761 ggaagaagcg aacgtcattt gctttgaaga gcctcccgag ggattcgtgg accttcacag 2821 cggagatacg aaactgccat ggccgcagga aggagaggcg gtgctcaact accgtctcgc 2881 gagggatctc ggcgtgaccg cgtgagatac catacgcatc gtggacagcg acatgcgcag 2941 cgtggatctg agggtcaccg gcgtgttcga taattacctg ttcgattacg tctacgtctc 3001 ccgcaatacc ctggagaacg cctggggcac cgtaccggag acgaagaacg cctacgtcga 3061 ttttaaagag gggatggagg tccatcaggc gtccgcagat ctgttggcgt cggacgacgt 3121 gctttctgtt tcgctggcgg cggatctgcg cagcaccatc ggcaatctgc tggaatccat 3181 ggacctcgtc gtgctgatcg tgctcgtgtg ttccggtgcg ctcgccttta tcgtcctgta 3241 caacctgacg aacatctcga tcacggagcg gcggcgggag atcgcgacgc tcaaggtgct 3301 cggcttcttc cagaacgaga cggcccagta cgtcttccgg gagaacctga tcctgaccgg 3361 catcgcctcg ctgttcggca ttccggcagg tctggcactg ctgcattacg tcatggcgca 3421 gatcgtcatc aagcagatgt atttcggctg ccgtcttgcg ccgctgtcct acgtctggtc 3481 cgttcttatc acgttcgcgt ttgccgtgct catcgacctg gcgctgcgcg taaagatcga 3541 ccggatcgac atggcggaat ccatgaaggc gatcgaataa tcccgcatgg cgccttgaca 3601 cttcataccg aaatgcaata aaatgaagtg tttttataag catattttgg aggtagtttt 3661 agtatgaaat acatgggcgt aaacgaactg cgcgagaagt tcctgaagtt ctgggagacc 3721 aaggaccatc tcagacacgc tagttattcc ctgatccctg aaaacgataa atccctgctg 3781 ctgatcgcag ccggcatggc accgttaaag ccttatttca gcggcgcgca ggttccgccc 3841 agaaagcgca tgaccacggc gcagaagtgc atccgcacga acgacatcga taacgtcgga 3901 cacaccgccc gccacgccac gttcttcgaa atgatgggca acttctcctt cggcgactat 3961 ttcaaagaag gcgccatcaa ctggggctgg gagttcatca cgtccccgga atggctggac 4021 atccccaagg aaaaggtctg ggccacgatc tatgaagatg acgatgaagc ctataacatc 4081 tggagagatc aggtcggcat gcccgcagag cgcatcgtgc gcctcggcaa ggaagataac 4141 ttctgggaga tcggcaccgg tccctgcgga ccctgcagcg aagtctacta cgacagaggc 4201 cccgaatacg gctgcggcaa gcccgactgc aaacccggct gcgactgcga ccgttacatg 4261 gagttctgga acttcgtatt tacccagttc gaccgccagg aggacggcag ctacgttcct 4321 ctggctcacc ccaatatcga taccggcatg ggtctggaga gaatggcctg catcatgcag 4381 ggcgtagact ccatctataa catcgacacc atgcacgaga tcctgcagga agtctgcaag 4441 ctgtccgggg tcaaatacca ggacggcgca gcgcccaccg acgtatcgct gcgcatcatc 4501 acggaccacg tccgcaccgt atccttcatg atcggcgacg gcatcctgcc cagcaacgag 4561 ggcagaggct acatcctgcg cagactgctg agaagagcgg cccgccacgg cagactgctg 4621 ggcatcaagg gcgcctttat caacgatgtc gcggagaagg tgttcgaaca gtacggcgaa 4681 gcttatcccg aactcatcga acgcaaggac tacatccgca agatcatcag catcgaagag 4741 gaaaagttcg accagaccgt cgaatccggc atgtccgttc tggaaggcta catggcggaa 4801 gccaaggcgg ccggcaaaac gcagctgtcc ggcgaacagg tctttaagct gtacgacacc 4861 tacggattcc ccatcgagct cacccaggag atcgcggaag agcagggcta taccgtggat 4921 gaggaaggct tccgcgctca catgcaggcg cagaaagatc aggccagagc tgccagaaaa 4981 gcagaggaca atgaaggctg gctggacgag agcgtcatgt tcaaggatta tccggcgacg 5041 gaatttacgg gctacgacag tctcgccatg gacgcgaagg tcctgggtct cgtgcgtggc 5101 atgaacgcgc tcaagagcgc aggagagggc gaagaagtcc gcatcgtttt agaccgcacc 5161 ccgttctatg cggaaggcgg cggccaggtg ggcgataccg gtctgctcga ggcggacgga 5221 tttaccgcag ccgtgaccga caccatcaag gtgggcaatg tctacgtcca taaggcagtc 5281 gtgaccgcgg gcgaagtctc ggtaggcgat accgttacgg cctgcgtgga tgccctcaga 5341 agacacgcca tcgccagaaa ccacaccgcg acccacctgc tgcagaaggc gctgcgcacc 5401 gttctgggtg accacgtcga acaggcgggc tccctcgtca acgaaaacga gctgcgcttc 5461 gactttacgc acttcgaagg catctccgcg gaagacctgg ccagagtaga ggatatcgtg 5521 aatgcggaga tcctgaagtt tacggatgtc gagaccaaag agatgcccat cgacgaagcc 5581 aagaagctgg gcgccatgat gctgttcggc gaaaagtacg gcgagaccgt ccgcgtcgta 5641 aacgttccgg acttctccat ggaattctgc ggcggcaccc acgttgccaa catcggtcag 5701 atcggctgcc tgcacatcgt ctccgaatcc ggcgtcgccg ccggcaccag acgcatcgtg 5761 gcggtcaccg gatctgccgt caacacgctg ctggcagagg aacaggcccg catcgctgcg 5821 gcagccgctt ccttaaagac caacgcagcc ggattggaaa agcgggcaga agacatggct 5881 gcggaactga aggccgtgaa gaaggaactg gaagaactga aggccaaggc agctcaggaa 5941 ggcgcaggag acctgctgaa ggaagcgaag gtcttcggta cggcccgcct catcgagcac 6001 acgttcgaag gcgccggcat cgaccagctg aggagcctgt ccgaccagat caaggcggcg 6061 gaaaagaacg tcgtgatggt atttgcggcg gtcaacgggg aaaaggccac gctgatggtc 6121 tccgtcaccg acgatctgac ggaaaagggc taccacgctg gcaacatgat caaggagatc 6181 gccaaggcgg caggcggagg cggcggcgga aaagccgaca tggcgcaggc cggcgcgaag 6241 gatctggcca agttacccga tgcgttcgct aaggcggaag aactgatggc agccaaggca 6301 aaataactgc agcgccttct tgagaattac acaaaacgtc tgtataatat aaaaggtgat 6361 tagagaatcg aacaggaggt aaaaagtgga gagaaaaacg atactgttca gcagtccgga 6421 aaaacccgag cagagaacga cggaagacat cctcaagact gtgtacgacg cactggagga 6481 gaagggttac aatgccatcg atcagatggt cggctacatt ctttccggcg atccctccta 6541 tattacgggt cacaacaacg ccagaaacct catccggcat atcgaacggg acgatctggt 6601 agaggaactt ctccggaatt tcctgaagaa ataatcggca tatcatcgca aagaaacaaa 6661 acaaagcgga ctttacaggt ccgcttgttt tggaatatgg ggacattttt atgaggatac 6721 tgggactgga tatcggggac aaaacgatcg gcgtcgccgt aagcgatccg ctgttcatct 6781 ccgcccaggg ggtgaccacg atcgaacgga tcggcgttaa gaaggatacg acgaaagtgc 6841 tggaatacgc gaaggaatac gaagccggca ccatcgtctc gggacttccc ctgatgcttt 6901 ctggcgaaga cagcccgcag acgcagaaag tgcgggaatt cgtggagaaa ctgcagaata 6961 aggcgcgaag cacggggatg aaactgcagt tcgtctttca ggacgagcgc tttaccacga 7021 aaatcgcaga agacgtgctg atcgctgcgg atatgcgcag agaaaagcgt aagactatca 7081 tcgaccgcca ggcagcggtc atcatcctgc aaagctacct ggatgccaac cggggaaaac 7141 tcacgttata ggaaaggaca agagcaagga aaacatgggt agactaggat ttttcttcaa 7201 catgaacacc tgcctgggct gcggagcctg ccaggtggcc tgtaaagacc tgcacggtct 7261 gcagcccggc gagttcttcc gccgcgtgga gaccatctcg gtcgaagcgg gcggtcagaa 7321 ggtgtacgcg cactactccg gcgcctgcaa ccactgtgaa gaggcaaact gtgtaaaagc 7381 ctgtcctaca ggcgccatgc acaaggcggc ggacggcacg gtcgtgcacg acgacaacct 7441 ctgcatgggc tgcggcagct gcatgtggaa ctgccccaac ggcgcagtct ctttctccct 7501 cacgaagggc gtagcgcaaa agtgtgatgc ctgcgccgag ctgagagaaa ggggatacga 7561 acctgcctgc tgcggtgcat gtccgaccag atcgctgaaa ttcggtgata tcgacgaact 7621 gcagaaagaa tacggcgttt ccgcagcgga gcggggtttc ctgcccatcg cggacatcac 7681 ggatccgaac ctgatcgtaa aactgccggc aaacgtagta aaagctctga agggaggcag 7741 cgcacatgca gaagatctat aaatacatca tcgtcggtgc cgggatcgct gcagtgagcg 7801 cggcagccgg catccgggag accgatccgg acggcgccat cctgatggta ggtgacgaag 7861 ccgttcccgc ctatagccgt cccatgctca cgaagacgcc gctccgctcc tacgaactgg 7921 gccgtaccat cgtctacgga cccgaatggt ataaagataa taagatcgac ctggtgctgg 7981 gcacgaaggt gaagggcatc gacaattcgt ctcgccttgt gaccctttcc aacggcgata 8041 cctttttcta caaccgtctg atctactcag ccggcgccaa cggatttgtg ccgcccatca 8101 agggcgccga tctgccggag gtcgtcgtca tccgccgtta tgaggacatc ctgaaggtca 8161 agcgcctgtc cgtgaacacc ggcaaagctg tcatcatcgg cggcggcgtc atcggcctgg 8221 aagcgggctt cgagctggcg cgctacggcc tggacgttac ggtgctggag gcgctgccca 8281 tgctcatgcc cagattcctg gacgaagact gcgcgcggat gctggagaga tccatccatt 8341 cgttcccggt ctataccggg gtgacgatcg aggagatcgc cggaaacgga cacgtggaaa 8401 gcgtacggct gcaggacggc agggaattcc cctgcgacct cgtcatcatg tccacgggcg 8461 taagggcaga taccgcgctg gcgcaggcgg caggcatcaa atgtgaccgc agcggcatcc 8521 tcatcaacga aaagtgtgag accagcgcca aggacatctt cgcctgcggc gactgtgcag 8581 cctacggcat caactggcag ctgtggtccc aggcgctgga acagggcagg gtggccggca 8641 tcaacgccgc tggaggcacc gcttccatac agcccacgga ttcttccatg atcatcaact 8701 cgccggaggt ctccatgttc tcctgcggcg acgtgggcaa ggacccgaat aaagtctata 8761 cgacggaagt cgacgacaac atgcagccgg acctgttcgc ggtcaacaag aaatttatcc 8821 gttcctacga aaagcgcttc tactgcggcg aaaagctggt gggcgccatc atcatcggca 8881 atctggcccg catgcaggaa ctgaaggagc agatcctggg gatcgctccc cgtgaggtat 8941 agaccatggc atttacgaac agcaagacct ttttatataa cgcgcacatc ctgaagtcgt 9001 tcttcgagga cctggagcgc tggagagagg agtgcgcctg cttcggcatc cgcagcacca 9061 tcgaggacca gcagtacgac gatctgttta aagggactga cgcggatgtg tacatcccca 9121 tgtgggcctc ggcctgcaag ggtcacggag acatcctgat cgaccggacg acctacgact 9181 gcatccgttt ctataaagcc tacggctacg aa // LOCUS sequence003 8597 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence003 VERSION sequence003 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..8597 /mol_type="genomic DNA" /organism="" /note="sequence003" CDS 240..1952 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLKSHEKYYSESGKRQVLVVDDEIINREMLGFMLASDYNVLYAED GEDALQKIRENSHTLSLVLLDLMMPKIDGFQLMEIMRKDPDLEHIPFIVLTSERSAEVA SLRGGASDFIAKPFEQPEVILARIQRTIELAEDKDIIQNTERDPLTSLFNREFFYRYVE QYDMHHPGQKMDAVALNINHFHLLNELYGWDYGDHVLSAIGNKVRELMAATGGIAGRMD ADSFLLYYPCGADYSAMREMLGKGLLEGKATNSNKVRIRIGVYTDVDRDVKIERRFDRA KQAADTIRSSYTKFVAFYDNSLREKELMEESLIESLDTAVAERQFQIFYQPKYDITGEK PVLCSAEALVRWQHPEYGMVSPGVFIPLFEDKGLIQKVDRYVWEEAAVQIRRWKEKFGV TLPVSVNVSRIDVYAPDFVSNFKKLVKENGLQPQDYYLEITESAYTEDSEQLLAVVGEL REEGFSVEMDDFGSGYSSLNMISTLPIDALKLDMNFIRNMHHKESKNNRIIELMIDIGR YLDVPVVAEGVETEDQVDLLRRMGCHIAQGYYFSKPVSAEAFETFIKEKLEQC" /locus_tag="LOCUS_0150" /note="WP_003439757.1 EAL domain-containing protein (Clostridioides difficile) [pid:32.4%, q_cov:75.1%, s_cov:57.5%, Eval:1.9e-71, partial hit]" /note="MGA_20" CDS 1946..2290 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLTIEKLKEFGADTEAGLTRCMNNEAFYFRLIGMAAKDPNFEKLE IALAMEEPDDAFEAAHALKGVLGNLALTPLFEPANEMCELLRSRTEMDYDPLLEQLMQA KSQLNALLAE" /locus_tag="LOCUS_0160" /note="MGA_21" CDS complement(2349..3239) /product="diacylglycerol kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003233894.1" /transl_table=11 /codon_start=1 /translation="MKKLLFIINPVAGKKHAGSSMYNVVKRFCSAGYLVTIAVTQYKGH GHELAMHAKEEGFDLVVCTGGDGTLNEVTSGIVDGQPIPFGYLPAGSTNDFARTLGIST IPLKATEHIIQEKPKTLDMGNFNDGKQHFIYIASFGAFTEVSYSASQTAKNRFGHMAYL YEGIKDMRHLKAYNVTVEADGDRTYKGRYIFGCVTNTRSIAGLIKLYDKKVDLNDGMFE VMLVKEPKDPIDFSNIILGLSTTVQGNEMFDYFRASDLTFTMDKKAPWTVDGEEAKADK KVHLTNMKEALTIYK" /locus_tag="LOCUS_0170" /EC_number="2.7.1.107" /note="WP_003233894.1 diacylglycerol kinase (Bacillus) [pid:32.6%, q_cov:92.9%, s_cov:90.1%, Eval:1.2e-32]" /note="MGA_22" CDS 3394..4497 /product="efflux RND transporter periplasmic adaptor subunit" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008762064.1" /transl_table=11 /codon_start=1 /translation="MDSENRENGTMQEKQDNRRSGAGRAVAILVALGLVAFFGYRVYQY LNRPEPEVPVESVNVMVEQAILEDIDQQAPITGRLEPVEEVAIVPLAQGQVTRVYVSVG DKVSKGQTLFTIDSSSVAAQLNQAKVGVDAAQSAYDRMQTLYNEGAVSAQDLESVKTQY LSAKESYNQVAEVISNYTVTSPITGYITSLSVSAGSIAGGSMAGSVANIDSLVVNTTVS ENMAAKIEVGDEVDVYIASVDRTFKGTVTTFSRIPSIGTLTYPLTITMEPDEALFAGMF AEVHMTSEAATNTVTVSSEAVIIKGGRSVVCVVDPATNIPTFREVSVGIDNGTRVQILE GLEEGETVAYSGQQFVTEGEAVTIVGE" /locus_tag="LOCUS_0180" /note="WP_008762064.1 efflux RND transporter periplasmic adaptor subunit (Bacteroides) [pid:27.6%, q_cov:84.2%, s_cov:89.9%, Eval:1.3e-21]" /note="MGA_23" CDS 4501..7650 /product="efflux RND transporter permease subunit" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011461050.1" /transl_table=11 /codon_start=1 /translation="MKFSLAKLTIKRPVSTIMVVLMVIVLGVSAFLDIPKDLMPEMELP YALVMTSYPNASPEEVESMVTVTVEQALAQVENLSDMISYSLENTSVVLIQFNFGTDMN FASLDMREKISLIEDYLPDTCSQPMVMKLNMNALPTMQVYVSADLPLEELNSIVEDNVV SYFERSSGVASVSVNGGLEEEISIVFSQENLTNYGLTLQTIAQILAAENINLPSGNVSR GDSKVIVRTMGKFTSAEELGNIPLMTSDYSKVRLADVATISQGAGKQESITRINGKTAV GIMITKQSDANTVKVSQALKKELARVQAKYPQLNFIVGYDAADFINASLSSVGRSAIIG AVLAVLVVFIFLRNVRSTMVIGISIPLCILLTFAVMNFRHITLNLVTLCSLAIAVGMIV DNSIVVLENIYSTRMKMGSAKEAAEYGTGEVFLAIVASTVTTVLVFLPIALTDGLASIM FGDFCLTIIIALLASLLVAVTVVPMLCSKLMQGNISTDYVRVGHVRYKYKLLPLFNRGL QNLISWYEGVIRRALKKRGRVLLVCFLVFGLSLGLLAMVGTELLPASDEGSINISVDVP YGTSLATTDKLMSQVEDYILQLPEVRYVSMNTSSISALSLGGGASFTVGLCSRTERDRT TDEVAKDIDNFAKGITGIDVSAASSSSIMGMFGDSDIAIYVMGKDLDKLEEVGHDIAAR ASHLDLVESAELDITEGSPEIKVLINRGTASFYGVTAYQLASGLSGALNGVTATNVSID GEDIAVKLSLSDYYADSIENMKQIVINGNYGTPVTVGQIASFEFDNSPANITRYNQSRY FIVNAAIQGDSLAAASEQVQAMLDAYPFPDGYSYEIQGLADTMAEMFGSLFKALIVAIA LVFLVLAAQFESMTMAFIVMMAIPFAMTGAFIAMFLTGTKMSLTSLLGLVLLVGTVVNN SILLVEFINQNKHSMGREEAMVAAGKQRLRPILMTTLTTIVGMIPLSLGYGEGGEILAP MGISIIGGLLTSTLLTLIVIPCMYKLVEERRDASAAKAEARAAEIAALEAKWAEEDAKG N" /locus_tag="LOCUS_0190" /note="WP_011461050.1 efflux RND transporter permease subunit (Desulfitobacterium hafniense) [pid:36.7%, q_cov:96.4%, s_cov:97.3%, Eval:7.8e-194]" /note="MGA_24" CDS 7652..8329 /product="L-fuculose-phosphate aldolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011017137.1" /transl_table=11 /codon_start=1 /translation="MLLEEKRKELVAIGLRAIREGLTTGTGGNFSVCDRESGLMCITPS GIPYVETTPEQIVVMDVQTGKIVEGDAVPSSECDMHRIFYKYRTDLDAVIHTHTTYAST YSCFRRPLPPIHYLAAFGGTHVNCAEYATYGTVELARNAFRAMEGVKAVLLANHGLLAG GKDLNEAYNITEELEFCCKMVCNAMAMEASGYKPVQLPQDEMDRMVERFKSYGKVHEKH EEI" /locus_tag="LOCUS_0200" /EC_number="4.1.2.17" /note="WP_011017137.1 L-fuculose-phosphate aldolase (Fusobacterium nucleatum) [pid:57.5%, q_cov:100.0%, s_cov:100.0%, Eval:8.9e-69]" /note="MGA_25" ORIGIN 1 cccatctgag agctctggtg cagcggaaga tcgaactggc gcaggcgcag ctgaaagacg 61 aggagaacgg cgttcccggg gtcaccatca gcgtaggcgt cgccttcccg gaccgggacg 121 atcctacgga agatatttac caggacgcgg ataccgccct ttacaaagtc aaaaatgcag 181 gccgcaacgg gctcgcgttt tatgaataga actctctttt tccaaaaagg ggcagaacca 241 tgctaaaaag tcacgaaaaa tactacagcg aatccggcaa acggcaggtg ctcgtggtag 301 atgacgagat catcaaccgc gagatgctgg gctttatgct ggcatcggat tataacgtcc 361 tgtatgcgga ggacggggaa gatgcgctgc agaagatccg ggagaactcc cacacgctct 421 cccttgtgct gttggacctg atgatgccga agatcgatgg tttccagttg atggagatca 481 tgcggaaaga tccggatctg gagcacatcc ccttcatcgt gctcacctcg gagcgttcgg 541 cagaagtcgc gagtctgcgc ggcggcgctt cggatttcat cgctaagcca ttcgaacagc 601 cggaagtcat cctggctcgc atccaacgca ccatcgagct ggcggaagac aaggacatca 661 ttcagaacac cgagcgcgat ccgctcacca gtttgttcaa ccgggagttc ttctaccgct 721 acgtggagca gtacgacatg caccacccgg gccagaagat ggacgctgta gccctgaata 781 tcaaccattt ccacctgctg aacgagctgt acggctggga ttacggcgat cacgtgctga 841 gcgccatcgg caacaaagtc cgggaactca tggcggccac cggcggcatc gcgggccgga 901 tggatgcgga cagttttctg ctgtattatc cctgcggcgc agattattcg gccatgcggg 961 agatgctggg gaaaggcctg ctggaaggga aggcgacgaa cagcaataag gtacgtatcc 1021 ggatcggcgt ctacacggac gtggacagag acgttaagat cgagcgtcgt ttcgaccgcg 1081 ccaagcaggc tgccgatacg atccgcagca gctatacgaa gttcgtcgct ttctacgaca 1141 actccctgcg ggaaaaggaa ctgatggagg agagcctgat cgaaagcctg gatacggctg 1201 tggcagagcg gcagttccag atcttctatc agccgaaata cgacattacg ggcgagaagc 1261 ccgtcctgtg cagcgccgaa gcgctggtgc gctggcagca cccggaatac ggcatggtga 1321 gtccgggcgt atttatcccg ctcttcgagg acaagggcct catccagaaa gtcgaccgtt 1381 acgtctggga ggaagcggca gtgcagatcc gccgctggaa ggaaaaattc ggggtcacgc 1441 ttcccgtgtc ggtaaacgta tcgcggatcg acgtctatgc gccggacttc gtgtcgaact 1501 ttaagaagct tgtaaaggag aacggtctcc agccccagga ttattatctg gagatcacgg 1561 aatccgctta cacggaagac tccgagcagc tgctggctgt ggtgggagaa ctccgggaag 1621 agggattctc cgtggagatg gacgacttcg ggtcgggcta ttcttctctc aacatgatct 1681 ccacgctgcc catcgacgcg ctcaagctgg atatgaactt catccgaaac atgcaccaca 1741 aggagtccaa gaacaaccgc atcatcgaac tgatgatcga tatcgggcgg tatctggatg 1801 ttccggtcgt cgccgaaggc gtagagacag aagatcaggt cgatctgctg cggcggatgg 1861 gctgccacat cgcgcaggga tactatttct cgaaacctgt atccgcggaa gcttttgaaa 1921 cgtttatcaa ggagaaactg gaacaatgct gacgatcgaa aagttgaaag aattcggtgc 1981 agacacggaa gcgggcttaa cgcgctgcat gaacaacgag gcgttctatt tccggctgat 2041 cggaatggcg gcgaaagacc ccaattttga aaagctggag atcgcgttgg ccatggaaga 2101 accagacgat gctttcgagg cggcgcacgc gctgaagggc gtgctgggca acctggctct 2161 tacgccgttg tttgagcctg ccaacgagat gtgcgaactg ctgcgcagcc gcaccgaaat 2221 ggattacgac ccgctgctgg aacagctgat gcaggcgaaa tcgcagctga acgcgcttct 2281 ggccgaatag gacagtacat caaaccaaaa gaaagacccg gcggtcgccg ggtctttgct 2341 gtttttgact atttgtagat cgtgagcgct tccttcatgt tggtgaggtg gaccttcttg 2401 tccgccttcg cttcttcgcc gtccacggtc cagggcgctt tcttgtccat cgtgaacgtc 2461 aggtcggacg cccggaaata gtcgaacatc tcgttgccct gcacggtggt cgagagaccc 2521 aggatgatgt tgctgaagtc gatggggtct ttgggctcct tgaccagcat gacttcgaac 2581 atgccgtcgt tcaggtccac cttcttgtcg taaagcttga tgaggcccgc gatggaccgg 2641 gtgttcgtga cgcatccgaa gatgtagcgg cctttgtagg tgcggtcgcc gtccgcctcg 2701 acggtgacgt tgtaggcctt cagatgccgc atgtccttaa tgccctcgta cagatacgcc 2761 atgtgtccga accggttctt ggcggtctgc gaggcgctgt aggagacttc cgtaaaggcg 2821 ccgaaagagg cgatgtagat gaaatgctgc ttgccgtcgt taaaattgcc catgtcgagc 2881 gtcttgggct tttcctggat gatatgctcc gtcgccttga gggggatggt ggagatgccc 2941 agtgttctgg caaagtcgtt cgtgctgcct gcggggaggt agccgaatgg gatgggctgg 3001 ccgtccacga tgccggatgt gacctcgttg agcgtgccgt cgccgccggt gcagaccacc 3061 aggtcgaagc cttcttcttt ggcgtgcatt gccagctcgt ggccgtgacc cttgtactgg 3121 gtgaccgcga tcgtcacgag atagcctgcg ctgcagaagc gttttacaac gttatacata 3181 gaagatcccg catgcttttt ccccgccacg ggattgatga taaacagcaa ttttttcata 3241 ggataccgtt cctttaaaac acttgaaatt ttaaggatta cacaccctgt ctagtatact 3301 cagttctcct tgcaaatgca agggctttgc tatattatta atggtgaata attatgccct 3361 tttcggggca ggaaaaggaa atatacaacg taaatggaca gcgaaaacag agaaaacgga 3421 accatgcagg aaaagcaaga caacaggaga tctggtgcag gccgggcagt cgcgatcctc 3481 gtcgccctcg gcctcgtcgc tttcttcgga tacagagtct atcaatacct gaaccggccg 3541 gaaccggagg taccggtcga gagcgtcaac gtcatggtgg agcaggcgat cctggaagat 3601 atcgaccagc aggcgcccat caccggccgt ctggagccgg tggaagaggt cgccatcgtg 3661 cctcttgcgc agggacaggt gacccgggtc tacgtcagcg tcggcgataa ggtatcgaag 3721 ggtcagacgc tgttcaccat cgacagttcc tccgtcgcgg cacagctcaa ccaggcaaaa 3781 gtaggggtcg atgcggcaca gtccgcctac gaccggatgc agacgctata caacgaaggc 3841 gccgtgtccg cccaggatct ggagtcggtc aagacccagt atctgtccgc caaggaatcc 3901 tataaccagg tggcggaagt catcagcaat tacacggtca cttcccccat cacgggctat 3961 atcacgagcc tctccgtctc cgccggcagc atcgcgggcg gcagcatggc ggggtccgtc 4021 gccaatatcg attctctcgt ggtcaacacc accgtgtccg aaaacatggc ggcgaagatc 4081 gaagtggggg acgaagtgga cgtttacatc gccagcgtcg accggacgtt caaaggcacc 4141 gttacgacgt tctcccgcat tcccagcata ggcacgctca cctatccgct caccatcacg 4201 atggaaccgg acgaagcgct gttcgccggc atgttcgcgg aagtgcacat gacgtccgag 4261 gcggcgacca acaccgttac ggtaagctcc gaagcggtca tcatcaaggg cggccgcagc 4321 gtcgtctgcg tcgttgaccc cgccacgaac atcccgacgt tccgggaggt gtccgtcggc 4381 atcgacaacg gcacccgcgt gcagatcctc gaggggctgg aagaagggga gaccgtcgcc 4441 tattccggcc agcagttcgt taccgaaggc gaagctgtga cgatcgtagg ggagtagtct 4501 atgaagtttt ctcttgcgaa actcacgata aagagacctg tctccaccat catggtggtg 4561 ttgatggtca tcgtcctggg cgtttccgcg ttcctggaca tcccgaagga cctgatgccg 4621 gagatggagc tcccgtacgc gctcgtcatg acgagctatc ccaacgcatc tcccgaggaa 4681 gtggagagca tggtgaccgt cacagtggag caggcgctcg cccaggtgga gaacctgagc 4741 gacatgatct cctattcgct cgagaatacc tctgtcgtgc tcatccagtt caatttcggc 4801 acggacatga atttcgcttc tctcgacatg cgggagaaga tctctctcat cgaagattat 4861 ctgccggaca cctgttcgca gcccatggtc atgaaactca acatgaacgc gctgcccacc 4921 atgcaggtgt acgtctctgc ggatctcccc ctggaggagc tgaactccat cgtggaagac 4981 aacgtcgtat cgtatttcga gcgctcttcc ggcgtcgctt ccgtttcggt caacggcggt 5041 ctggaggagg agatctccat cgtcttcagc caggagaatc ttacgaacta cggccttacg 5101 ctgcagacca tcgcccagat cctggcggca gagaacatca acctgccctc cggtaacgtc 5161 tcccggggcg acagcaaggt gatcgtccgc accatgggta agtttacgtc tgcagaagag 5221 ctgggcaaca tcccgctcat gacctcggat tacagcaagg tccgcctggc ggacgtcgcg 5281 accatcagcc agggcgccgg caagcaggag tccatcaccc ggatcaacgg caagaccgct 5341 gtgggcatca tgataacgaa gcagtccgac gccaacacgg taaaggtctc ccaggcgctg 5401 aagaaggaat tggcgcgcgt acaggcgaaa tatccccagc tgaacttcat cgtcggctac 5461 gacgcggcgg atttcatcaa cgcgtcctta agttccgtcg gccgctccgc catcatcggc 5521 gcggtcctgg cggtgctcgt cgtgttcatc ttcctgcgca acgtgcgcag caccatggtc 5581 atcggcatct cgatcccgct gtgcatcctg ctcacgttcg cggtcatgaa cttccgccac 5641 atcacgctca acctcgtaac gctgtgctcg ctggccatcg ctgtcggcat gatcgtcgac 5701 aactccatcg tcgtgctgga gaatatctat tcgacgcgca tgaagatggg aagcgctaaa 5761 gaagcggcgg aatacggcac gggagaggtc ttcctggcga tcgtggcgtc cacggtcacc 5821 acggtgctgg tattcctgcc catcgcgctg acggacggcc tcgccagcat catgttcggc 5881 gatttctgcc ttacgatcat catcgcgctg ctggcttcgc tgctggtggc ggtcaccgtc 5941 gtgcccatgc tctgcagcaa actgatgcag ggcaacataa gcacggatta tgtccgtgtc 6001 gggcacgtgc ggtataaata caagctgctg cccctgttca accgtggcct gcagaacctt 6061 atctcctggt atgaaggggt catccgcaga gcgctgaaga agcggggcag agtgctgctc 6121 gtctgcttcc tggtgttcgg tctgtccctg ggtcttctcg ccatggtggg cacggaactg 6181 ctgcccgctt ccgacgaagg ctccatcaat atctccgtgg atgttcccta cggcacgtcc 6241 ctggcgacga cggacaagct gatgtcccag gtggaggact acatcctgca gctgccggag 6301 gtgcggtacg tttcgatgaa tacgtccagc atctcggcgc tctccttggg aggcggtgcc 6361 agctttaccg taggtctgtg cagccgcacg gagcgggacc gcacgacgga tgaggtcgct 6421 aaggatatcg acaacttcgc gaagggcatt acgggcatcg acgtgagcgc agcctccagt 6481 tcctccatca tgggcatgtt cggcgattcc gatatcgcga tctacgtgat gggcaaggat 6541 ctggataaac tcgaggaagt cggccacgac atcgctgcca gagcgtctca tctggatctg 6601 gtcgaaagcg cggaactgga catcacggag ggaagccccg agatcaaggt gctcatcaac 6661 cggggcaccg cgagcttcta cggcgttacg gcctatcagt tggccagcgg tctgtccggc 6721 gcgctcaacg gcgtcaccgc cacgaacgta agcatcgacg gggaagatat cgcggtcaag 6781 ctctccttga gcgattacta cgccgattcc atcgagaaca tgaagcagat cgtcatcaac 6841 ggcaattacg gtacacccgt aacggtcgga cagatcgcca gcttcgagtt cgacaattcc 6901 ccggctaaca tcacgcgcta caaccagagc cgctacttta tcgtgaacgc agccatccag 6961 ggcgacagcc tggcggccgc atccgagcag gtgcaggcca tgctggatgc ctatccgttc 7021 ccggacggct attcctacga gatccagggc ctcgcggata cgatggcgga gatgttcggc 7081 agcctgttta aggcgctcat cgtggccatc gcactggtgt tcctcgtact ggcggcgcag 7141 ttcgaatcca tgaccatggc gttcatcgtc atgatggcga tccccttcgc catgaccggc 7201 gcctttatcg ccatgttcct caccggtacg aagatgtccc tcacgtcgct gctgggcctg 7261 gtgctgctgg tgggtactgt cgtcaacaac tccattctgc tggtggagtt catcaatcag 7321 aataaacatt ccatgggcag ggaagaggcc atggtcgctg ccggcaagca gaggctgcgc 7381 cccatcctga tgaccacgct caccaccatc gtgggcatga tcccgctgtc gctgggctac 7441 ggcgagggcg gcgagatcct ggcgcccatg ggcatctcca tcatcggcgg cctgcttaca 7501 tccacgctgc tcacactcat cgtcatcccg tgcatgtaca aactcgtgga ggagagaaga 7561 gatgcgagcg cggcgaaagc ggaggccaga gcggcggaga tcgctgcact cgaagccaag 7621 tgggccgaag aggatgcgaa aggaaactaa catgctctta gaagaaaaac gcaaagaact 7681 tgtcgctatc ggccttcggg ccatccggga gggccttacg acgggcaccg gcgggaattt 7741 ctccgtctgt gaccgcgaaa gcggcctcat gtgcatcacg ccttccggca ttccctacgt 7801 ggaaacgacg ccggaacaga tcgtcgtcat ggacgtgcag accggcaaga tcgtggaagg 7861 agatgccgtt ccctccagcg aatgcgacat gcaccgcatc ttttacaaat accgcacgga 7921 tctcgatgcg gtcatccata cgcacacgac ctacgcctcc acctacagct gcttccggag 7981 accgctgcct ccgatccatt acctggcggc tttcggcgga acgcacgtaa actgcgcgga 8041 atatgccacc tacggtaccg tggaactggc gagaaatgcg ttccgggcga tggaaggcgt 8101 aaaggcggtg cttctggcca atcacgggct gctcgccggc ggtaaggact taaacgaggc 8161 ctataacatt acggaagagc tcgaattctg ctgcaaaatg gtatgcaatg cgatggccat 8221 ggaagccagc ggatacaagc ccgtacagct cccccaggat gagatggacc gcatggtgga 8281 gcgctttaaa agctacggca aagtgcacga gaagcatgag gagatctaaa tgagacccaa 8341 agccttcgtc tccgcggaga tggactacga gatcgcaaaa cagctcgagg atgtgctgga 8401 catcacctat gactggggca acgccgtcct gagcgtcgag cagatgaagc atgcctgcgc 8461 ggataaagac atcatcatta cgagctacga tcccgttacg aaagacgtga tcgacgctgc 8521 gccgaactgc gggctcatcg tctgcacgcg ggccacgccc gtcaacgtgg ataccgccta 8581 cgccagggaa aagggca // LOCUS sequence004 7872 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence004 VERSION sequence004 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..7872 /mol_type="genomic DNA" /organism="" /note="sequence004" CDS complement(1260..2165) /product="DMT family transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000802592.1" /transl_table=11 /codon_start=1 /translation="MNRQKQADLVLVIITFFWGIANPVSDYVMNFWQPMQLNALRFVVA LAVSWAVMHKDLRGISKTTLRSGIFVGFLLSLIYLFAMYGIKNSASVTTFSFIVAMPVI INPIINLVFRRIVPQKKFLISLALSVGGLYLMTMKGGDFRIGLGEGLALLSATCYSIDL CFTDVMVARDDVDPKQLGLLQIGFGALFMSLISLVLDRGHALTWTPALFGWLLVLGVGS TAVAFIAQPVAQQYTTSNHVGVIFALEPVFSTLAAILFLHEIVSARAYVGAALMIAAVI LMNVDLKRKDKNDETDPQHL" /locus_tag="LOCUS_0210" /note="WP_000802592.1 DMT family transporter (Bacillus cereus) [pid:33.0%, q_cov:94.7%, s_cov:96.9%, Eval:2.7e-35]" /note="MGA_28" CDS complement(2173..3246) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAYTSKAKTPAEHPFRTIVKLLDSEALPRVLVCYGHEEFLVNWAE KFVKGKLIEPAAEALDFTVFSEDLDPYSIIAACETLPMLSKRKLVVVHDTDLFTQTPKD MKAEGVQILSEYLANVPETTMLLFTAEKVNKTKALYKNAVKAGVVYDFCPLDRQTLAGW IAKQLQNLGKNASRDDIFAYADKCGYLDKESGYTLYNVKNDVAKAAAFADAQTVTAKDF AACMQGEEETDAFAILDAAFSGQKGKALTILHNSVDAEQASKQDGVVLRFLGLLCSQLE IMLEARERGGRDGDPYSVASAMGANPYRIRKAMDASYRKKYSELKASLAAAYDIEKDFK SGQIDAYLALELFIAGL" /locus_tag="LOCUS_0220" /note="MGA_29" CDS complement(3263..5464) /product="DNA internalization-related competence protein ComEC/Rec2" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392112.1" /transl_table=11 /codon_start=1 /translation="MFCILFFCLGFLTMEAASAKMSPLLELSEETGSAVQSFEGLVVHA SFKTDRWDLMVRTAEEKVLVRLDAPEEARLAVCSLTGRICRFTGPVRRPDGRRNFGCFD YALYLKGRDVRCLCEVSRFRAEAGELRFRLLNALAVSKARFFDRIAPYMDREAFSLLAG LLFGEKGYLEEDVYVSFQRNGIAHVLAVSGLHVGLVYAVVLKLMQGRRNGKTTAASAIV LLCYICLSGFSVSVLRASFMIGLHLLSFHLHRRYDLVSAASLAACVFLGVNPYQLFDSG FQLSYMAAYSLGVALPRMQLKATELADRYKKGWIDDAGKLLLPCIAVQLGMTPLTLFHF LIFSPVSLLLNPFAVALAGLLLPAGLFLYLVQSFGISLATAAAAGPASAFAHLLLALND AGNALGGSFPMAAPPIGMLCLYYAVFFYWFSEGRAVLLRKGRQRSAALLCLAMTLSSCL LPFWFGLGELLPWQRPLRDVVFVDVGQGDCIHIASDGCHVLVDGGGSAMKNVGEGTLLP YLLKNGVSGLEMAVVTHPDQDHCKGIKELSQKMNIRTIVFPAVYENDISVTEGYRADRF VFAGRGDVIRMGDAVFRVLTPYKDGRVTARTEDRNETCIAGMLETKDLKVLLTADMTDQ TEQWLLADGSDVDADILKVAHHGSAYSSREDFVSAVSPRFAVISCGRNNSYGHPAERIT AMLAEMGVEMLRTDLSGAVGVTLRKDGSLKIEKAGRAVL" /locus_tag="LOCUS_0230" /note="WP_011392112.1 DNA internalization-related competence protein ComEC/Rec2 (Moorella thermoacetica) [pid:29.6%, q_cov:87.3%, s_cov:79.5%, Eval:1.1e-61]" /note="MGA_30" misc_feature complement(5679..>7872) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011393212.1:PBP1A family penicillin-binding protein" /note="WP_011393212.1 PBP1A family penicillin-binding protein (Moorella thermoacetica) [pid:33.6%, q_cov:56.0%, s_cov:44.2%, Eval:1.4e-50, partial hit]" /note="MGA_31" /locus_tag="LOCUS_0240" ORIGIN 1 actgtttgac ggagccgccc atcatgcaga caagtcctgc ggccgccatg ccgacgccgc 61 agccgatctc cgcctggcat ccccagcctc cgaaatagtc tgtctcggcc atgaagacgc 121 ccgccatgcc ggcagccaga aggcctttta cggcatcttc ccggccaagg catttgtctt 181 cgcacaggcc ctggatgacc ccgggcacga taccggaagc gcctcccgtc ggaatgcaga 241 cgatggtgcc ggaactgccc gcccattcca tgatggacag agacatctgc gccgccttgt 301 cgacgatgcc gccggcgatc ttctgcggac tgttttcgta gaatgctttt acctggggcg 361 ctttcggtcc gagcagctgg cgcagatcgt tgccttcttt atatccgttc ttctccgatg 421 ccaggatgac gtcccacagg ttttccgcct gggagatgac ctgctgctcc gtccagccgg 481 agatagaaca ttcgtaagcg actgcagcct ccgcgaacgt cttgccgctc tcttcgcacc 541 aggccagcaa ttccgcgggg gtctcgaata ccggcggtct gctgtctgag gtcacgaccg 601 tatgcgccgg tcttgcgtaa ccgaagtgcc gcaggccttc gatattttta aaagcatcca 661 gctgctcctc cgtgggagca tccgccagtt ttacgtcgta cagcagctta tccggcccct 721 cgcagatctt gatctcctcc gggtcgccgg cgatggtgag gatcgccttc accatgtcgt 781 ggcgccgcac ttcccccgca gggtctgtaa acagcagcac ctcgtgggta tagccgcccg 841 tgtgcatggg acagccgtcc gcggattcca ggtagaaccc gcctccgccc acggatgcgc 901 cgcagaaggt cattttccgg cccgtatcgg cattttccag cacgaggcgg acatattccc 961 ccggctctgc cggaaggtcc tcatagaagc cgtattcgat cgcgacgccc ctttccttcg 1021 cctcgtcgta ggcgtcgaag aaaccgggat ccgccgggct gtgacccaga agaccgaaca 1081 cgaacgccag gtcgctgcgc atgccgaaat atgtaaacgt aaacgagccc ttgtccgaca 1141 tctggatgga tgccttcgta atgggcaggc cgaagaactg ccggcagacc gacgcgatgc 1201 gcatggggcc tgcggtgttg gaactggagg gaccgggggt gaccggcgcc aatgcttcgt 1261 taaagatgct ggggatccgt ttcatcgttt ttgtcctttc ttttcaagtc tacattcata 1321 aggatgactg ccgcgatcat gagcgcagca cccacgtatg cccgcgcgga gacgatctcg 1381 tgcaggaaca ggatggctgc cagcgtggag aataccggtt ccagggcaaa gatgacgccc 1441 acgtggttcg aggtcgtata ctgctgcgcc accggctgtg cgatgaaggc gacagcggtc 1501 gatccgacgc caagcaccag cagccagcca aaaagcgcag gcgtccaggt aagcgcgtga 1561 ccccggtcca gcaccaggga gatgaggctc atgaacaatg cgccgaagcc gatctgcagc 1621 agacccagct gtttgggatc cacgtcgtcc cttgcgacca tcacgtccgt aaagcagaga 1681 tcgatggaat agcaggtggc ggacaggagc gccagtccct cccccagacc gatgcggaaa 1741 tcgccgccct tcatggtcat caggtagagc ccgccgacgg agagcgcgag actgatgagg 1801 aatttcttct gcggtacgat gcggcggaac accaggttga tgatgggatt gatgatgacc 1861 ggcatcgcta cgataaagct gaacgtcgtt acgctggcag aatttttgat gccgtacatg 1921 gcaaacagat agatgaggga aagcaaaaac cctacaaaaa taccgctgcg aagggtcgtt 1981 ttggagatcc cccgcagatc tttatgcatg acggcccagg agaccgccag ggcgaccacg 2041 aagcgcagcg cgttgagctg catgggctgc cagaaattca tgacgtaatc ggagaccgga 2101 ttggcgatcc cccagaaaaa cgtgatgatc accaggacca gatcggcctg tttctgtctg 2161 ttcatgtata tactataatc ctgcgataaa cagttccagc gccagatagg cgtcgatctg 2221 tccgctctta aaatcctttt cgatatcgta agccgctgcc agagaggctt tcagctcgga 2281 atactttttc cggtaactgg cgtccatcgc cttgcggatg cggtaggggt tggcgcccat 2341 ggcagaggcg acgctgtagg ggtcaccgtc ccggccgccc cgctccctcg cctccagcat 2401 gatctccagc tgggagcata gaagcccaag aaagcgcagc acgacgccgt cctgcttgct 2461 ggcctgctcc gcgtccacgc tgttgtggag gatcgtaagg gctttcccct tctgaccgga 2521 gaaggctgcg tccaggatgg cgaacgcgtc ggtctcctcc tcgccctgca tgcaggccgc 2581 gaagtccttc gccgtaacgg tctgcgcatc tgcgaaagcg gcggcctttg ccacgtcgtt 2641 tttcacgttg tacagcgtgt aaccggattc cttgtccaga tagccgcact tgtcggcgta 2701 ggcgaagatg tcgtcccggg acgcgttctt gccgagattc tgcagctgct tggcgatcca 2761 gccggccagc gtctggcggt ccagcgggca gaaatcgtag acgacgcccg ccttgacggc 2821 gttcttgtag agcgccttcg tcttgttcac cttttccgcg gtaaacagca gcatcgtggt 2881 ctccggcacg ttcgccagat actccgagag gatctgcacg ccttccgcct tcatatcctt 2941 gggcgtctgg gtaaagagat ccgtatcgtg cacgacgacg agtttgcgct tcgacagcat 3001 gggaagcgtc tcgcaggcgg cgatgatgct gtaggggtcc agatcttccg aaaagaccgt 3061 aaagtccagc gcttccgccg cgggctcgat cagtttgccc ttcacgaact tttccgccca 3121 gttcaccagg aactcttcgt gtccatagca caccaaaacg cggggcagcg cttcgctgtc 3181 cagcagtttt acgatcgtgc ggaacggatg ctccgccgga gttttcgctt tcgacgtgta 3241 tgccataggt ttatatagta tatcataaaa ccgccctgcc cgctttctcg atctttaggc 3301 tgccgtcttt tctgagggtg accccgacag cccccgaaag gtctgtccgc agcatctcca 3361 cgcccatctc cgccagcatg gccgtgatcc gctccgccgg atgcccgtag ctgttgttcc 3421 tgccgcagga gatgaccgca aaacgggggc ttacagcgct tacgaagtcc tctctgctcg 3481 aataggcgct gccgtgatgc gctaccttca ggatatctgc gtccacgtcc gaaccgtccg 3541 ccagcagcca ttgctccgtc tggtccgtca tatccgccgt aagaaggacc ttaaggtctt 3601 ttgtttccag catgccggcg atgcaggtct cgttgcggtc ctccgtccgt gcggtcaccc 3661 gtccgtcttt gtacggcgta agcacccgga acacggcatc tcccatgcgg atcacatcgc 3721 cccttcccgc aaagacgaag cggtctgccc ggtacccttc ggtaacggaa atatcgtttt 3781 cgtaaactgc cggaaacacg atggtgcgga tgttcatctt ctgcgacagc tcctttatcc 3841 ccttgcagtg gtcctggtcc ggatgggtaa cgacagccat ctccagcccg gacacgccgt 3901 ttttcaacag atacggcagc agcgtgccct cccctacgtt cttcatggcg ctgccgccgc 3961 cgtccaccag cacgtggcag ccgtccgagg cgatatggat gcagtccccc tgccccacgt 4021 cgacgaagac gacgtcccgc agaggccgct gccagggcag cagttcgcca aggccgaacc 4081 agaatggcag caggcagctc gagagggtca tggcgagaca aagcagcgcc gccgaccgct 4141 gccttccctt tcgcagcaaa acagcccggc cttccgagaa ccagtagaaa aatacggcgt 4201 aatacaggca gagcatgccg atgggaggtg ccgccatggg aaacgatccg cccagggcgt 4261 ttccggcgtc gttgagcgcc aaaagaagat gcgcaaaagc ggaagccggc cctgccgcgg 4321 ctgcagtcgc gagggatatg ccgaaactct gcacgaggta cagaaacaac cccgccggca 4381 gcagcagacc tgccagcgct acggcaaaag gattcaacag caggctgaca ggcgaaaaga 4441 tcaggaaatg aaacagcgta agcggcgtca tgcccagctg tacggcgatg cagggcaaca 4501 gaagtttgcc ggcgtcatcg atccatccct ttttataccg gtccgccagt tcggtcgcct 4561 tcagctgcat gcgtggcagc gccactccca ggctgtaagc cgccatatag gacaattgaa 4621 atccggaatc gaacagctgg tacgggttga ccccaagaaa gacacaggcg gcaagagagg 4681 ctgcgctcac gaggtcgtag cgccggtgca ggtggaacga gagcagatgc agtccgatca 4741 tgaaggaggc ccgaagcacg gagacggaga aaccggacag gcagatgtag caaagcagta 4801 cgatggccga ggccgccgta gtctttccgt tgcggcggcc ctgcatcagt ttcagtacga 4861 ccgcatacac gagccccacg tgaagtcccg ataccgccag aacgtgcgcg atgccgttgc 4921 gctgaaacga cacgtagacg tcctcctcca gatatccttt ttcgccgaac agcaggcccg 4981 ccagcagcga aaaggcttcc cggtccatat agggcgcgat gcggtcgaag aagcgcgctt 5041 tgctcaccgc caaagcattc agcagccgga agcgcagttc tcccgcctct gcgcgaaagc 5101 gggatacctc acagaggcag cggacatccc gccctttcag ataaagcgcg taatcgaagc 5161 agccgaaatt gcggcgtccg tccggtcttc gcacaggccc cgtaaagcgg cagatccgtc 5221 cggtcagaga acagacagcc agtctggctt cttccggtgc atccagccgc accagcacct 5281 tttcctccgc cgtccgcacc atcagatccc agcggtctgt cttgaaggaa gcgtggacga 5341 caagcccttc gaaggactgc actgcactac cggtctcctc tgacagttcc agcagcggac 5401 tcatctttgc cgaagcagct tccatcgtca gaaagcccag acagaagaac aggatgcaga 5461 acaacacaaa acggctccgc cgcattcccc ggaacataac aaataaggca cctatgcaga 5521 tgcataagtg ccttaccgaa agttccgtat aggctgccaa caggatgccg gctgcctgag 5581 aaaacgcaag ggccgtaaaa ggtcttcgca cggagcatcc gctcccgcat cctcaggcat 5641 tatagcaacg aatggtaata tctgtcaagt cctgtgtgct attcaccgcc gccctcgccg 5701 ctttcgcctc cggtctctcc gccttcagac ggagccggtt gcggttcagg ttccggcgcc 5761 ggctcgggag ctggttccgg ttccgaaggc tcggtcggtg caggttccgg attctcctct 5821 acaggaggct tgtactgcga cggatcggag atgcccggga tgtagtccgg gttgttggga 5881 tcgtattccg taatatcctc ctgcccgttg ttgttcgcat cgccttcagg agtctccggt 5941 tcttccggct catccggttc cacggaatcg taggggctct cgccgttgta cagcggggaa 6001 attggataag cggccggatt cggattgtga atcgggcagt agtagtccgg cgcgtccagt 6061 ttggcgtccg gttccgcatt cacgcctaag gagcgcagtc cgctctccac gaggatcttc 6121 tcccaggaac tgccgccggg acggacgatg ccgaccttcg tggcggtatg cgggcagtcc 6181 ggcgtggcca gatatccggt ctccgcgcag atggtgcact cgcggtggaa gtcctccgcg 6241 ccaccctgca ccgtgccttt gatgaagtac tcggagatcg tgtcgccgcc aacgccggtc 6301 atgccggagt acttgtcgac agtcgctctc acgatgtcgc cgcgcatctc gaactcttcg 6361 cgttcgtaca tgggtcccac gtctttcatg accttggccc acatcttggc cgcgataccg 6421 gagtattccc gcagggagat attgacgtcg ttgcccatcc agaccgtgcc ggtgagctgg 6481 ggcgtgagcc cgcagaacca caggtcgaag ttatcggatg tcgtacccgt cttgcctgcg 6541 gagggctggc tggagatctt cgcgttgctg gacagaccgt tcgttacagt cgtgcgcagc 6601 atatccagca tgatggacgc cacttcctcg gaaaggaccc ttcttgtgat gggttccttc 6661 tgcagaacga tgtcgccctt cttcgtggtc accgtcgtgt agaacgtcgg ttcggtgtag 6721 atgccgtagt tgccgaaggt ggcgtaggcg ccgcacatct ccagaggcga gatgcccttg 6781 gtcatgccgc ccagcgccag ggccgacgcg ttcatgtcgt tgacgtcgcc gttatggacg 6841 atgctggtga tgcccatggc ttcgagctga tccacgcacc actggggatc catctgcagg 6901 tagcactgga ctgccgtcgt gttgatggac tgctcgatgc agtaccgcat gttcttgatg 6961 ccccaatagc cggcgtacca gttcttgggc cagggtttgc cgcccatgac gacgggtctg 7021 tcgtccaaag gcatggcagc ggtaaacgga atgccgtcct tgcctgcctt gccgtcctgt 7081 ccagcctgca gcgcagtgct gtagatggag atcggcttaa tggaagaacc cggctgccgc 7141 ggcgccgttg ctctgttgta gagcagcttg ccttccacgt tgcgtccgcc gatcatgccc 7201 agcacgtagc cggtgcgatg gtccatgatg accatggcgg actggggctg gatcgtgggc 7261 ttgcgaagcg taaagtagtc ggacgtaagg taaaggcgtc cgtcttccag tctatggatg 7321 acgtcaggat gatcctcgaa gaacttggcg ctgatgatca tatcgccgtt gtcgtcgcgg 7381 gtcttgtatt cggaggccac ggcccagttt ccgccctcga tgctgtacag aagaccttcg 7441 ttcttctcgt acatgttctt gaactcgatg gtgtagtccg tgccgttgcc gctggtcgtc 7501 ttatagaaat tgaggcgttt gtccttcagc agcttgagat cgccgttgcc ctgccactcg 7561 aactcctcga gcggcatcac aaagtcgccg tcctcgtcga acatcacgct cttgctgtag 7621 agcatgatct tgccgttgtc gccgatgatg ttgccgctgc cgtccgtgcg gtagccgctg 7681 atggtgggcc agccggaatt gtccgcccag accgcttcca tgatctcctg gatctcgcgg 7741 ttcatggtcg tgttgatgtg cagaccgccg ttgtacagca tgcggtccgc ttcttcctcg 7801 gagaggccca gctcccgcat catgtcctcg cggacctgct ttacggcaca gtccgtgaaa 7861 taggacgtga cc // LOCUS sequence005 7867 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence005 VERSION sequence005 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..7867 /mol_type="genomic DNA" /organism="" /note="sequence005" CDS complement(876..1403) /product="nitroreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008765867.1" /transl_table=11 /codon_start=1 /translation="MENESIKTLLTRRSVRKYKPEHITEEEMEIILEAGKYAPTGKGTQ CTKFVVVRNKAVRDKLSEINAEILGANSDPFYGAPDLIAVFANSAATGTWIEDGSLAMG NLMNAAHAIGVASCWINRARQTFDSPEGRAMATAWGIPESYKGIGYCILGYADGDEPLP KPRKEDFVVYVD" /locus_tag="LOCUS_0250" /note="WP_008765867.1 nitroreductase (Bacteroides) [pid:36.0%, q_cov:88.6%, s_cov:88.4%, Eval:2.2e-22]" /note="MGA_33" CDS complement(1430..2494) /product="butyrate kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004454677.1" /transl_table=11 /codon_start=1 /translation="MERILVINPGSTSSKIAVYDGEQQVFLENINHPVEEIGVYPTTYD QLQYRIDAIAVTLQKAGIAADSFDCVMGRGGGIARLATGGYEVNQALLDSAKDHPLFDH VSNIGAALAYHFAQMSGCKAYIYDAVSAETLLPVAKITGLDGMERTSLCHVLNARAMSI RYAKEQGKKYEDMNLIVAHMGGGITVSAHCHGRIIDNVRDDGGPMSPTRCGAVNTMDVV DLCYSGKYTYEQMAKKVRGDAGLTNLLGTHNAREVERRIEEGDAYAKLVYDAMGFQVAK YAAMMIGSFTEPVDAVILTGGIAHSKMLTGTIKEHLEHTVKVVVMPGENEMEALAFGGL RILRGEEAANPAYE" /locus_tag="LOCUS_0260" /gene="buk" /EC_number="2.7.2.7" /note="WP_004454677.1 butyrate kinase (Clostridioides difficile) [pid:46.7%, q_cov:98.0%, s_cov:97.5%, Eval:1.2e-91]" /note="MGA_34" CDS complement(2494..3681) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKPSSTLSNTVQRRKDRFIKTFASRSGFVREQGIYEKLKGSGLV PTMLSAQDGTIETQYEEGTNFYEFFLAAGNDPAKQAACFELFFSWYRRYRELTNISIGE TDFRDFIVQGDSLMCLDLEHCRPGSAEEDVARLACMLALYPKGYTGAGLDSAKLFICVG SSYLNWHPETLAKAVPAAADGIEGSLGLKKHPGMALYLAAYFTTAGAVLAGGRSSRMHQ DKRQMEVDGRTMLEASTSLVAAMPQRMVSVAKGEDVQFPGFETICDEREDIGPLEGIVR CLRVSRQPWTLFLTCDMPLLTDKLLRLFLSYPKEDADVFLFEAGGRIQTFPLLLRTENA VRALQEALDKDERKVQDALMNRLKVRRIRAEDFKDFAPRMLWNINTPEDYQEITK" /locus_tag="LOCUS_0270" /note="WP_005817332.1 molybdenum cofactor guanylyltransferase (Desulfitobacterium hafniense) [pid:32.4%, q_cov:46.8%, s_cov:89.9%, Eval:2.4e-16, partial hit]" /note="MGA_35" CDS complement(3674..4234) /product="phosphoribosyltransferase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011016017.1" /transl_table=11 /codon_start=1 /translation="MKEYYEMQIAGLTRKLPICKLTQDLCIAGFVIFGDPDLTVAAAGE LVKRMPEHDYMITAEAKGIPLIHEMARQAGEKKYILARKAEKVYMRDVFHVTVNSITTR FQQTLYLDGADAALMKGKKILVVDDVISTGESLKAIEALVEAAGGTVCGRMTILAEGDA AKRDDIIYLEKLPMFDSEGEPLE" /locus_tag="LOCUS_0280" /note="WP_011016017.1 phosphoribosyltransferase family protein (Fusobacterium nucleatum) [pid:52.9%, q_cov:93.5%, s_cov:98.3%, Eval:7.2e-46]" /note="MGA_36" CDS complement(4295..4552) /product="TIGR03905 family TSCPD domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357396.1" /transl_table=11 /codon_start=1 /translation="MQYTYRTSGTCSRVINFDVTDGKVHDVSFIGGCDGNLKAIGKLVE GHDATEVIKLLKGNTCGYKNTSCGDQLALALEAALAQQAQ" /locus_tag="LOCUS_0290" /note="WP_003357396.1 TIGR03905 family TSCPD domain-containing protein (Clostridium) [pid:55.9%, q_cov:80.0%, s_cov:79.1%, Eval:7.5e-17]" /note="MGA_37" tRNA 4703..4790 /product="tRNA-Ser" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0010" /note="Aragorn_1" CDS complement(4847..6067) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEKMEELKEMRKKIHRTLTGPALPIDAVLDAVDVLVREMQSGVYS DLLGDYDLSNSPERLSITAKQMGRRTLLKRLEEELTPLKDTPELTRRRVPLGVLLHIAA GNTDVLPVFTVLEGLITGNINIVKLPSHDGGFTEKMVDILLHLEPRLSEYIYLVNAPSS DVDTLSYLAEMSNAVVVWGGDDAVRSIRRITEPDTKIFEWGHKLSFAYLSGDFMHWSVE NDLKGLARHIFRTQQLLTSSCQVIYLDTDDPAKQQQFCERFLPILENEFVTEEANDNVI SEGTLKRFTARTKERESLPGEKDYKADHCCLTACEDQALDGSGRFGHMLVKRLPQEQIV SVLSPYNGYLHTAGVLEAGTKIQELLIHAGVTRITRLADMSKYFDGEAHDGVFPLELYT KIVDIQK" /locus_tag="LOCUS_0300" /note="MGA_38" CDS 6176..6808 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MILYAAETILYLTFLGMDIFGLGNTTPLKFLSILLLTLSVLDFRE KTVTIALAFTAAADVFLLLLDRYYEAGILCFIAVQICYALRLQKETGGSFRPYLLSPLA GLAACSIRGFGLTEALAAAYIALFAVNLVRAAILAGSRQERKWLLFAAGLALFFCCDLC VGLHNLPGLGSAGLHRFANVAMWGFYLPGQCLIRASAYPAVRKETVL" /locus_tag="LOCUS_0310" /note="MGA_39" CDS 6805..7491 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKSKGFSCLLAILLALFAISASVSAPILCRPFYYAHIEALDMPEK TGWTAEQIREAFDDVMDFLLKGTEFRTGDLLWSESGKTHFADCKVLFHLDLWIFAVTGA LLLAVFWAFRRKKQRPARPAGHGPSFWAGVLILVLFGGFGAFAASDFDRAFTVFHKIFF PGKTNWVFDPRTDQIILVMPEEFFRNCAILIAALLALFVVLFFVLDKRVKISSVVDESG KNDRDQ" /locus_tag="LOCUS_0320" /note="WP_011101692.1 TIGR01906 family membrane protein (Lactiplantibacillus plantarum) [pid:31.6%, q_cov:59.6%, s_cov:55.4%, Eval:1.5e-10, partial hit]" /note="MGA_40" ORIGIN 1 gaaccagcgg atgttgcagt agagcatcgg cgtgtaaccg gattctttta cggtctcgca 61 gaacgcgatg gcgtggtctg tccgcgcctg ctgcgagagt tccgccgtcc ttgccgtcgc 121 gctggcggcg tcctcgatgt ccaggacgat gggccaggtc acgttatacg gccggatgtt 181 ctccataacg aactgcgcct cttccacggc ttcttccacg gagatggcct gggtcacgaa 241 atagacaccc accgcgatgc cgttctgcag cgcgccgcgg atgttgtcct cgaagcggtc 301 gtcctttacg agaagaccgc tctcgtagcc acggtagccg aggcggataa agacgaactt 361 gacgccgctc gccgccacct tctcccagtc gatgtctccc tgataggtgg acacgtcgat 421 gcccttgatg gaaacggtct ccccatccac ggcgtattcc acttctctcg gcgtttcgct 481 cacctccacc agattgctcc aatcgtaatc ggactgcgga agactgcggt cgatggacgc 541 gtactgaaac acgccccccg cgccccggta gacgatgaga ttcggcagca gatcctgcag 601 cagttcccag acggaagcgt cgttccggcc gaactcctgg atctctccca cggtatacga 661 tacgatctcg tcctgcggcg taagcacggt gtccggcttc gcggaaggct cggtctgccc 721 gccctgctgc gtgcagcctg tgagaaggct tgcgagaaga gcgatgcaga gtatgatagt 781 cacaaatttc ttcatgaggg tattgtatca tacccaaaga aaaaaaacag gcccgcaggg 841 agcctgtcac agaaaattaa cactctctta accgtttagt caacgtacac cacgaaatct 901 tcttttcggg gtttcggcag gggttcgtcc ccgtccgcgt agcccaggat gcagtagccg 961 atgcccttat agctctcggg aatgccccag gcggtcgcca tggctcttcc ctccgggctg 1021 tcgaacgtct gccgcgcccg gttgatccag caggacgcga cgccgatggc gtgggcggcg 1081 ttcatcaggt tgcccatcgc aagagagccg tcctcgatcc aggttccggt cgccgcgctg 1141 ttcgcgaata cggcgatcag atccggcgcg ccgtagaacg gatccgagtt cgcgcccagg 1201 atctccgcat tgatctccga cagtttgtcg cgcactgcct tgttgcgcac gacgacgaac 1261 ttcgtgcact gggtgccttt tccggtgggg gcatacttgc ccgcctccag gatgatctcc 1321 atctcctctt ccgtaatgtg ttccggcttg tatttgcgga cacttcttct cgtcagcaga 1381 gtcttgatgc tttcgttttc catgggtctc ctccttccga tccgggatgt tattcataag 1441 ccggattggc agcctcctcg ccccgcagga tgcgaagacc gccgaaagcg agcgcttcca 1501 tctcgttttc tcccggcatc acgacgactt ttaccgtatg ttccagatgt tccttgatgg 1561 ttccggtgag catcttcgaa tgggcgatgc cgcccgtcag gatgaccgcg tccacgggct 1621 ccgtaaaact gccgatcatc atggccgcgt atttcgcgac ctggaagccc atggcgtcgt 1681 acaccagttt cgcgtatgcg tccccttctt cgatgcgcct ctccacctct ctggcgttgt 1741 gcgtgcccag caggttcgta aggcccgcgt cgcctctcac ctttttcgcc atctgctcgt 1801 aggtgtattt tccgctgtag cagagatcca cgacgtccat ggtgttgacc gcgccgcagc 1861 gggtgggaga catggggccg ccgtcatctc ttacgttatc gatgatccgt ccatggcaat 1921 gggcagagac ggtaatgccg cctcccatat gcgcgacgat caggttcatg tcctcatatt 1981 ttttgccctg ctccttcgcg taccggatgc tcatggcgcg tgcgttgagc acgtggcaca 2041 ggctggtgcg ctccatgccg tcgagacctg tgatcttcgc gacgggcagc agggtttccg 2101 cgcttacggc gtcgtagatg taggccttgc agccgctcat ctgcgcaaag tgatacgcca 2161 gcgccgcgcc gatgttagat acgtggtcga acagcggatg gtctttggcg gagtccagca 2221 atgcctggtt cacttcgtag ccgccggtgg caagacgggc gatgccgccg ccccgtccca 2281 tgacgcagtc gaaggaatcc gctgcgatcc cggctttttg cagcgtgacc gcgatagcat 2341 cgatgcggta ctgcagctgg tcgtacgtcg tcggatagac gccgatctcc tcgacagggt 2401 ggtttatatt ttccagaaac acctgctgtt cgccatcgta gacggcgatc ttggacgaag 2461 tgcttccggg gttgatgaca agaatacgtt ccattatttc gtgatctcct gataatcctc 2521 gggggtattg atattccaaa gcatgcgggg cgcaaagtcc ttaaagtcct ccgcccggat 2581 ccgcctgact ttcagacggt tcatcagagc gtcctgcacc ttccgttcgt ccttgtccaa 2641 cgcttcctgc agcgctctta cggcgttctc cgtgcggagc agcagcggga aggtctgtat 2701 tctgccgccg gcctcaaaca ggaaaacgtc cgcgtcttcc ttcggatagc tcaggaacag 2761 gcgcagcagc ttatccgtca gcagaggcat gtcgcaggta aggaacaggg tccagggctg 2821 ccggctgacc cgcagacagc ggacgatgcc ctccagcggt ccgatatctt cccgttcgtc 2881 gcagatcgtt tcgaatccgg gaaactgcac atcctcgccc tttgcgacgg acaccatgcg 2941 ctgcggcatc gcggccacca gagacgtgga agcttcgagc atcgtacggc cgtccacctc 3001 catctggcgc ttgtcctgat gcatgcgcga cgatcttcca cccgccagga cagcgcctgc 3061 cgtcgtgaaa tacgccgcca gatagagcgc catgccggga tgtttcttta accccagcga 3121 accttctatg ccgtcggccg cggcggggac cgccttcgcc agcgtttcgg gatgccagtt 3181 cagataactg gagcctacgc agatgaagag ctttgcactg tcgagcccgg cacctgtata 3241 ccctttcgga tacagagcca gcatacaggc cagacgcgcg acatcttcct ctgcggagcc 3301 gggacggcaa tgctccagat ccaggcacat cagggaatct ccctgcacga taaagtcccg 3361 gaagtcagtc tccccgatgg agatattcgt cagttcccgg tatctgcggt accaggaaaa 3421 gaacagttca aaacacgcag cctgtttcgc cgggtcgttt ccggcggcga ggaagaattc 3481 gtagaaattc gttccctctt cgtactgcgt ttcgatcgtg ccgtcctgtg ccgacaacat 3541 cgtcggcaca agaccgcttc cttttaattt ttcgtagatc ccctgctccc ggacaaaacc 3601 gctgcgggag gcaaatgtct tgataaaccg gtctttgcgc ctctggacgg tgttgctcag 3661 agtcgaggac ggcttattca aggggttctc cttcgctgtc gaacatgggc agcttttcca 3721 ggtagatgat gtcgtcgcgc ttcgcggcgt caccctccgc caggatggtc atgcggccgc 3781 agaccgtgcc gccggcagct tccaccagag cttcgatcgc cttcagggat tcgccggtag 3841 agatgacgtc gtccacgacc aggatcttct tgcctttcat cagtgcggca tcggcgccgt 3901 cgaggtacag cgtctgctgg aaccgcgtcg taatggagtt gaccgttacg tggaacacgt 3961 ctctcatgta gaccttttcc gcttttctgg ccaggatgta cttcttttcg ccggcctggc 4021 gggccatctc gtggatgaga ggaatgccct tcgcttctgc agtgatcata tagtcgtgct 4081 ccggcattct cttgacgagt tctccggcag ctgcgaccgt aagatccgga tcgccgaaga 4141 tgacgaagcc tgcgatgcac agatcctgcg tcagcttgca aatggggagt ttgcgggtaa 4201 gacccgcgat ctgcatttcg taatactctt tcatggggta cctcgtttat aaatagaaaa 4261 ggacagcgaa agccgccctt gcctgtacgg tgctttactg cgcctgctgt gccagagcag 4321 cttcgagcgc cagcgcgagc tgatcgccgc aggatgtgtt cttgtagccg caggtgttgc 4381 ccttcagaag tttgatgact tccgtcgcgt cgtgaccttc cacgagcttg ccgatggcct 4441 tcaggttgcc gtcgcagccg ccgataaagg atacgtcgtg gactttgccg tccgttacgt 4501 cgaaattgat gacccgggag caggtcccgc tggttctgta ggtgtattgc atttggtgtt 4561 gcctttctta agtttatctg attttgccgc ctgttactgc acaaaaagta tacaccaaac 4621 agaaaacaaa ataaactgct tgctttttgt cgggcggtgt tataatatat ttgagcgaca 4681 taaaggaaac agaaattagc acggacgatt gaccgagtgg ctaaggagct cgcctggaaa 4741 gcgagtaggg ctgaaaggcc tcgtgggttc gagtcccatg tcgtccgcca atgcataaga 4801 cccacccttt gcgggtgggt cttgttttgt acgatgtgcg tatttgttac ttctggatat 4861 ccacgatctt cgtgtacagt tccagcggga agacgccgtc gtgagcctcg ccgtcgaaat 4921 acttggacat atccgccaga cgggtgatgc gcgtgacccc tgcatggatc agcagttcct 4981 ggatcttcgt gcccgcttcc agcacgcctg ccgtgtgcag gtagccgtta tagggagaca 5041 gcaccgatac gatctgttcc tgcggcagcc gctttaccag catgtgtccg aaccggccgg 5101 agccgtccag cgcctggtct tcgcaggccg ttaagcagca atggtccgcc ttgtagtcct 5161 tttcgcccgg cagcgactct ctctctttcg ttctggcggt aaaccgcttg agcgtgcctt 5221 ccgagatgac gttgtcgttc gcttcttccg ttacgaattc gttctccagg atcggcagga 5281 accgttcgca gaactgctgc tgtttcgccg ggtcatccgt atcgaggtag atcacctggc 5341 agctgctggt aaggagctgc tgcgtgcgga agatgtggcg ggcgagaccc ttcagatcgt 5401 tctccacgct ccagtgcata aagtcgccgg acagataggc gaagctcagt ttgtgacccc 5461 actcgaagat cttggtatcc ggttccgtga tgcgccggat cgaccggacg gcatcgtcgc 5521 cgccccagac gacgactgcg ttggacatct ccgccagata gcttaacgta tccacgtccg 5581 aagagggtgc gtttacaaga tagatgtatt cggaaagccg cggctcgaga tggagcagga 5641 tatccaccat cttttccgta aatccgccat cgtgggaggg aagcttaacg atgttgatgt 5701 tgcctgtgat gagcccttcc agcaccgtaa atacgggcag cacgtccgta ttgccggcgg 5761 caatgtgcag cagcacaccc agaggcactc tgcggcgggt gagttccggg gtatccttca 5821 gcggggtgag ttcctcctcc agccgcttca gcagcgttct tctgcccatc tgctttgccg 5881 tgatggacag tctttcgggg gaattcgaca ggtcgtaatc accgaggaga tcgctgtata 5941 cgccgctctg catctcccgg acgagcacgt ccaccgcgtc cagcaccgca tctatgggaa 6001 gcgccggacc cgtaagtgtc cggtgtatct ttttccgcat ttctttcagt tcttccatct 6061 tctccattcc tgcaacctcc tcgatccgac aggtaacgac agaactccga ttgttagttt 6121 cagtatacca aaaaaaatat gataaaatat agcaaaacgg aaaggacgcg atggaatgat 6181 cctctacgca gccgaaacaa ttttatacct gactttttta ggaatggata ttttcggtct 6241 tggaaacacg acgccgctaa aatttctatc cattttgtta ttgaccttat ctgttctcga 6301 tttcagagaa aaaacggtga ccatcgccct cgcatttacg gcagcagcgg acgtattttt 6361 gctgctgctc gaccggtatt acgaagccgg catcctctgt tttatcgccg tgcagatctg 6421 ctatgcgctg cgtctgcaaa aggagaccgg agggtccttc cgcccctatc tcctgtcccc 6481 attagccggg cttgccgcct gcagcatccg cgggtttggc ctgacggaag ccctggccgc 6541 cgcgtatatc gccctgtttg cggtcaacct cgtgcgcgcc gccattctgg caggcagcag 6601 gcaggaacgc aaatggctgc tgttcgccgc agggctcgcc ctgttcttct gctgcgatct 6661 ctgcgttggg ctgcataacc tgcccggact cggatccgca gggctgcacc gctttgcgaa 6721 cgtcgccatg tggggctttt atctgccggg tcagtgcctt atccgtgcgt cggcctatcc 6781 cgccgtcaga aaggaaacgg tcctatgaaa agcaaagggt tttcctgcct attagctatc 6841 ctgctcgcgc tgttcgccat cagcgcttcg gtctctgccc ccatcctctg ccggccgttt 6901 tactacgccc acatcgaagc gctcgatatg ccggaaaaga caggatggac agcggaacag 6961 atccgcgagg cgttcgacga cgtgatggat tttctgctga aagggacaga attccggacc 7021 ggcgatctcc tctggtccga atccggaaag acgcactttg cggactgcaa agtgctgttt 7081 cacctcgacc tttggatctt cgccgttaca ggcgcattgc ttctcgccgt cttttgggcg 7141 ttccgccgca aaaaacaaag acctgcccgt ccggcaggcc atgggccttc cttctgggca 7201 ggagttctta tcctcgtgtt attcggcgga ttcggcgcgt ttgcagccag cgatttcgac 7261 cgggcgttta ccgtatttca caagatcttc ttcccgggaa agacgaactg ggtgttcgat 7321 ccccgcaccg atcagatcat tctcgtgatg ccggaggaat tcttccgcaa ctgcgccatc 7381 ctcatcgcgg cgctcctggc actcttcgtc gtcctgtttt tcgtcctaga caaacgggtt 7441 aaaatatctt ccgtggttga cgaaagcggt aagaacgacc gagatcagta gcaccgccag 7501 tcccagcagc atcgcaccga agtcccacgc cgtaaatttg cggtagcggt accaggtgcg 7561 ctttttattt ttgccgaaac tgcgcagttc catggcattg gagatcacct cgatccggtc 7621 catgctggac aggatgagcg gcaccagcgt gccggatgca gtctttaagc gcgcgcccag 7681 agatgccttc ttcgacatct ccacgcccct cgcctgcagc gacagcgtaa tgtcgtggta 7741 ctcccgctgg atgtccggga tataccgcag cgccagcgcc acggagtagg cgatcttgta 7801 attcacgccg atgcggttga gggacgacgc gaattcgctc ggatccgtcg tcgtaacgaa 7861 caacagc // LOCUS sequence006 7866 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence006 VERSION sequence006 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..7866 /mol_type="genomic DNA" /organism="" /note="sequence006" CDS 267..1238 /product="PhoH family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861553.1" /transl_table=11 /codon_start=1 /translation="MSEIRINQDTDLGPRDVFGTLDTNLKAIEKDCGVEIAVRGDEIII NGEEAERAASVIEEMFKVSDAGQPLDEQKVNYILELSREGISYSQSALSKDVVCFTHKG KPLKAKTLGQKQYVDAVRKNDIVFGIGPAGTGKSYLAVAMAINALKNKEVEKIILARPA VEAGERLGFLPGDLQEKVDPYLRPLYDALYDILGRDAALRLKEKETIEVVPLAYMRGRT LDNSFIILDEAQNATKEQMKMFLTRMGFGSKVIVTGDVTQIDLPRGKRSGLVDAMHILN HVEGIAFCRLTDSDVVRHPLVRRIVNAYDRYLQKHPEWAQDE" /locus_tag="LOCUS_0330" /note="WP_011861553.1 PhoH family protein (Clostridioides difficile) [pid:55.9%, q_cov:95.7%, s_cov:91.4%, Eval:1.6e-92]" /note="MGA_43" CDS 1242..1697 /product="rRNA maturation RNase YbeY" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003430894.1" /transl_table=11 /codon_start=1 /translation="MYIYFDDEERVDKKTSAQMYAAAALCAREEDLDDDRLSLSVSFVD ADEIQRLNREYRDKDAVTDVLSFPQFDPYEYMQDWDEVALGDVVICEERARQQAEEYGH SYERELIYLFVHSCFHLLGYDHETEEEKKVMREKEEKVMTELDLRRG" /locus_tag="LOCUS_0340" /gene="ybeY" /note="WP_003430894.1 rRNA maturation RNase YbeY (Clostridioides difficile) [pid:51.3%, q_cov:76.8%, s_cov:75.8%, Eval:6.6e-26]" /note="MGA_44" CDS 1699..2082 /product="cytidine deaminase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583680.1" /transl_table=11 /codon_start=1 /translation="MRPTDKELFRMAVKASENAYVPFSNFHVGAALLTKDGQVYTGCNI ENSSYGATICAERTAMVKAVSEGVREFEAIAIAGNGGTSWPCGICRQFMFEFSEDMRVI SGENEDELKSYRLNELLLEGFKL" /locus_tag="LOCUS_0350" /gene="cdd" /EC_number="3.5.4.5" /note="WP_012583680.1 cytidine deaminase (Dictyoglomus turgidum) [pid:56.0%, q_cov:96.9%, s_cov:95.4%, Eval:1.7e-32]" /note="MGA_45" CDS 2079..3011 /product="GTPase Era" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003416645.1" /transl_table=11 /codon_start=1 /translation="MKSGFIGIIGRPNVGKSTLLNSILGEKIAITTEKPQTTRNTIRGI YTRREGEGEDREPACQMVFIDTPGIHKPKNKLGSYMTDTAVNTLKEVDVILFLVDSEFE GEGSGDAYILDLLKSNQTPKLLVINKIDKIDPDTFRRIYEYYEGLDLFDAIIGTNAKSG QNVDELLVTLEDLLAEGPMFFPEDMITDNPMRFLASEIIREKALLYLNDEVPHGVAVEI ERFEEQPGIANISAVIYCEKDSHKGIIIGRDGKKLKGIGKSARLEIEAFLGTKVFLELF VKVKKNWRQSDVMLGNFGYVASWKTDLHR" /locus_tag="LOCUS_0360" /gene="era" /note="WP_003416645.1 GTPase Era (Clostridioides difficile) [pid:53.0%, q_cov:96.5%, s_cov:98.3%, Eval:1.6e-83]" /note="MGA_46" CDS 3018..3758 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MVTDTEGLVLRQIKAANGRRMIVILTKRYGKISAGTSISEGGKNK TALALRPFTYGRYELFKARDSFSINGAETLQSFYAIGEDVDKYMAASYALELTDALAQE AEPQPALLGLIRDFLQLLDERKRAFGTLLIGFQMKALQIEGSAPQLDRCMRTGSREDLQ ALSIAEGGMLCGDYAKDLSADPLVFAVTPDQLSALRYMAAHPIGALKGIGLNEEAEKKL RRLFKAYYAYHLGIENLKSESLLI" /locus_tag="LOCUS_0370" /note="MGA_47" CDS 3786..4544 /product="DUF4342 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357722.1" /transl_table=11 /codon_start=1 /translation="MEITLEKIELVKDRTGVGYKEAKDALEKTDGSVVDAIILIEETID DSTKETEKKNVQILDTIKEAVRKGNVSKIVIKKDGDIVMNLPVNIGIIGTVLFPWAAIG GCIAALGTKCSIELVKEDGGVVNVSDKASKTFETVKDKGSVIYDEVKDKSGNLFETAKD KGGDLFEAAKGKSGDLFEAAKDKSGELFEAAKDKGGDLYEAARDKGGDLYEAAKDRFVK EKAPEAEETYAKKNDFDLSDLDLDGMEEDK" /locus_tag="LOCUS_0380" /note="WP_003357722.1 DUF4342 domain-containing protein (Clostridium) [pid:34.8%, q_cov:75.0%, s_cov:97.6%, Eval:5.4e-28]" /note="MGA_48" CDS 4566..5969 /product="glycine--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048370.1" /transl_table=11 /codon_start=1 /translation="MNKELTMDQIVALCKNRGFLYPGSEIYGGLANSWDYGPLGVEFKN NVKKAWWKKFVQESPYNVGLDAAILMNPQTWVASGHLASFSDPLMDCKACRARFRADKL IEDFAGANGIDLGGSVDGWSNQEMETFIAEHKIPCPECGKTDFTPIRQFNLMFKTFQGV TEDSKAELYLRPETAQGIFVNFKNVQRTSRKKVPFGICQIGKSFRNEITPGNFIFRIRE FEQMELEFFCQPGTDLEWFAYWKEYCRKFLESLSMNMDKLRLRDHSKEELSFYSRATTD FEYLFPFGWGELWGIADRTDYDLGRHQEVSGQNLEYIDPVTNERYLPYVIEPSLGADRV ALAFLCDAYDEEDLSKDGKTDSRTVMHFHPFLAPYKAAVLPLSKKLSEQAMAIYQDLSK YFSVDYDQSGSIGKLYRRQDEIGTPFCITVDFDTATDGCVTVRDRDTMEQVRMPISELR AYIEKAMEF" /locus_tag="LOCUS_0390" /EC_number="6.1.1.14" /note="WP_012048370.1 glycine--tRNA ligase (Clostridium botulinum) [pid:71.2%, q_cov:98.9%, s_cov:98.9%, Eval:4.7e-203]" /note="MGA_49" CDS 5969..6976 /product="asparaginase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010948559.1" /transl_table=11 /codon_start=1 /translation="MKKILILNTGGTIGMTRTEKGYMPDREYFRKALINMDSLRAPGMP AWDLAETEELLDSSNMTVRDWNEIAKILADAYDSYDGFVVLHGTDTMAYTSSALSFMLE ELDKPVILTGSQIPLCELRSDGRDNLISSMLIAAEGRVKEVCIYFGGKLLRGNRAMKYS ADGLLAFTSPNYPPLAEAGISIQYNTKAMLDPIKKPFRLQLLEEVPIGVLKVFPGIQFG LFESIMTESLKGIVIETFGAGNIPAGGDALLPIIRRAFENGSILTVCSQCPQGTVSLGT YETSSGLTSAGAVSGKDMTTEAAVAKLYYLFSKGYPKEGIKKLMECNLRGEMRD" /locus_tag="LOCUS_0400" /gene="ansA" /note="WP_010948559.1 asparaginase (Legionella pneumophila) [pid:49.2%, q_cov:99.4%, s_cov:99.1%, Eval:1.5e-85]" /note="MGA_50" ORIGIN 1 cgaaaatctg gaaagcgctc ttaagagatt caagcgttct tgcgccagag acggcgtcat 61 gtccgagctc cgtaagagag aacactatga aaagcccagc gtaaagcgga agaagaagtc 121 cgaagctgca cgcaagaagg cgaacaagag atactaatcc gatcaaagca aacctgagcc 181 gaagccgaaa agcttcggct ttgtgttttc aaagacaggc agtttatggt atcatatagg 241 ttgagtaatt atagggagga tcgtttttga gcgagatcag gatcaatcag gatacggatc 301 tgggcccgag ggacgtcttc ggtaccctgg ataccaactt aaaagcgata gaaaaggatt 361 gcggcgtgga gatcgccgtc cgcggcgatg agatcatcat caacggggaa gaagcggagc 421 gcgcagcgtc cgtcatcgag gagatgttta aagtctcgga tgcgggtcaa ccgctggacg 481 aacagaaggt gaactacatc ctggaactct cccgggaggg gatctcttat tcccagagcg 541 cgctgtccaa ggacgtggtg tgcttcaccc acaagggcaa acctctgaaa gcgaagacgc 601 tcggccagaa gcagtacgtg gacgcggtgc gtaagaacga catcgtgttc ggaatcggtc 661 ctgcgggtac cggcaagtcc tatctggcgg tcgccatggc catcaacgcc ttaaaaaaca 721 aggaagtgga gaagatcatc ctggccagac ctgccgtgga agcgggggag aggctcggtt 781 ttctgcccgg cgatctgcag gaaaaggtag atccctacct gcgtcctctg tacgatgcgc 841 tgtacgacat cttaggcaga gacgcagcgc tgcggttaaa ggagaaagag accatcgaag 901 tcgtgccgct tgcctacatg cgcggccgta cgctggacaa ttcctttatc atcctggacg 961 aggcgcagaa cgccacaaag gagcagatga agatgttcct cacccgtatg ggtttcggaa 1021 gcaaggtcat cgtaacgggc gacgtaacgc agatcgacct gccgagaggc aaacgctccg 1081 gcctcgtaga cgccatgcac atcctgaatc acgtggaagg catcgcgttc tgccggctca 1141 cggacagcga cgtggtgcgt catccgctgg tgcgccgcat cgtaaacgcc tacgacagat 1201 acctccagaa gcacccggaa tgggcgcagg acgaatagct catgtatatt tattttgacg 1261 acgaagaaag agtagataaa aagacatctg cacagatgta cgccgcggcg gcgttgtgcg 1321 caagagaaga agacctggac gacgacagat tgtccctgtc cgtttcgttt gtggatgcgg 1381 acgagatcca gcggctcaac cgggaatacc gggacaagga cgccgttacg gacgtgctgt 1441 cctttcccca gtttgacccc tacgaataca tgcaggactg ggacgaagtg gccctgggcg 1501 atgtggtcat ctgtgaagag cgggccaggc agcaggccga ggaatacggc cacagctacg 1561 aacgggagct gatctacctg ttcgtgcatt cctgcttcca tctgctgggc tacgaccacg 1621 agacggaaga agagaaaaag gtcatgcgcg agaaggaaga gaaggtcatg accgaactgg 1681 acctgaggag gggatagcat gagaccgaca gacaaagagc tattccgcat ggcggtcaag 1741 gcgtcggaaa acgcctacgt gccgttttcg aatttccatg tgggtgcggc gctgctcaca 1801 aaggacgggc aggtctatac cggctgcaac atcgaaaact cctcttacgg cgccacgatc 1861 tgcgccgagc ggacggccat ggtaaaggcc gtatcggaag gcgtacggga attcgaggcc 1921 attgcgatcg ccggcaacgg cggcaccagc tggccctgcg gcatctgccg gcagttcatg 1981 ttcgagtttt cggaagatat gcgggtcatc agcggagaaa atgaggacga actgaagtcc 2041 taccgcttaa acgaacttct cctggaggga tttaaactat gaagagcggt tttatcggca 2101 tcatcggcag acccaacgtg ggcaaatcca cgctgttgaa ctccatctta ggagaaaaga 2161 tcgccattac gacggaaaaa ccacagacga cgagaaatac catccgcggc atctacacga 2221 ggagggaggg cgaaggcgag gacagggaac cggcttgcca gatggtcttt atcgacacgc 2281 cgggcatcca taagcccaaa aataagctgg gcagctacat gacggacact gcggtgaata 2341 cgttgaagga agtagacgta atcctgtttc tcgtcgactc tgaattcgag ggcgagggca 2401 gcggcgacgc ttacatcctg gacctcttaa agtccaacca gacaccgaaa ctgctggtca 2461 tcaacaagat cgacaagatc gatccggata cattccgccg gatctacgag tattacgaag 2521 gtctggatct gttcgatgcc atcatcggca cgaacgccaa gagcgggcag aacgtggacg 2581 agttgctggt gaccctggaa gatctgctgg cggaaggacc catgttcttc cccgaagaca 2641 tgatcaccga caaccccatg cgtttcctgg cttcggagat catccgcgag aaggcgctgc 2701 tgtacctgaa cgacgaagtg cctcacggcg tggctgtcga gatcgagcgc ttcgaagagc 2761 agcccggcat cgcgaacatt tccgcggtca tctactgcga gaaggattcc cacaagggca 2821 tcatcatcgg cagagacggc aagaagctga agggcatcgg aaagtccgcc agactggaga 2881 tcgaagcatt cctgggcacg aaggtgttcc tggagctgtt cgtcaaggtc aagaagaact 2941 ggcgtcagag cgatgtaatg ctgggcaact tcggctacgt cgcgtcctgg aagacggacc 3001 tgcaccggta ggctgccatg gtaacggata ccgaaggtct ggtgctgcgg cagatcaaag 3061 cggcgaacgg ccggcgcatg atcgtcatcc tgacgaagcg ctacggcaag atctccgcgg 3121 gcacgtccat cagcgaaggc ggaaagaaca agacggcgct ggcgctgcgg cctttcacct 3181 atgggcgcta cgaattgttt aaagcccggg attccttcag catcaacggg gcggagacgc 3241 tgcagagctt ctacgccatc ggcgaggacg tggataaata catggcggca tcgtatgcgc 3301 tggaactgac ggacgccctg gcgcaggagg cagagccgca gccggcgctg ctggggctca 3361 tccgggactt cctgcagctg ctggacgaaa gaaagcgcgc gttcggaacg ctgctgatcg 3421 gctttcagat gaaggctttg cagatcgaag gcagcgcgcc gcagctggac cgctgcatga 3481 ggaccggaag cagggaagac ctgcaggcgc tcagcatcgc ggaaggcggc atgctctgcg 3541 gcgactacgc gaaggatctt tcagccgatc cgctggtgtt tgcggtcacg ccggaccagt 3601 tgtcggcctt gcgctacatg gcggcgcatc ccatcggcgc cctcaagggc atcggattga 3661 acgaggaagc ggagaagaaa ctccgcagac tctttaaggc atattatgcg tatcacctgg 3721 ggatagaaaa cctcaagagc gagagtttac tgatctagat cggcttttgc cggaaagggg 3781 aaactatgga aatcacactg gaaaagatcg aactggtaaa agacagaacg ggcgtcgggt 3841 ataaggaagc caaggacgct ctggagaaga ccgatggcag cgtcgtggac gcgatcatcc 3901 tgatcgaaga gaccatcgac gactccacga aggaaacgga aaagaaaaat gtccagatcc 3961 tggatacgat caaggaagcg gtccgcaagg gcaacgtgag caagatcgtc atcaagaagg 4021 atggcgacat cgtgatgaat ctgcctgtca acatcggcat catcggcacg gtcctgttcc 4081 cctgggctgc gatcggcggc tgcatcgcgg cgctgggcac caagtgcagc atcgaactcg 4141 ttaaggagga cggcggcgtc gtaaacgtgt ccgataaggc atcgaagacc ttcgagaccg 4201 taaaggacaa gggttccgtc atctacgacg aagtgaagga caagagcggc aatctgttcg 4261 agaccgcaaa ggacaagggc ggcgatctgt tcgaggcagc caagggcaag agcggagacc 4321 tgttcgaagc ggcgaaggat aagagcggcg aactgttcga agcagcgaag gataagggcg 4381 gcgatctcta tgaggcagcc agagacaagg gcggtgacct ctacgaggcg gcgaaggaca 4441 gattcgtcaa ggaaaaggct cccgaagcgg aagaaaccta cgcaaagaag aacgattttg 4501 acctttccga tctggatctg gacggaatgg aagaagataa atagaacaac aaataggaga 4561 acagcatgaa caaagaactg acgatggacc agatcgtagc gctctgcaag aacagaggat 4621 ttctgtatcc cggctccgag atctacggcg gactggcgaa ttcctgggac tatggtcccc 4681 tcggcgtgga attcaagaac aacgtaaaaa aggcgtggtg gaagaaattc gtccaggaaa 4741 gcccctataa cgtgggcctg gatgccgcca tcctgatgaa cccgcagacc tgggtggcat 4801 ccggccatct ggccagcttt tccgaccctc tgatggactg caaagcctgc cgcgccagat 4861 tccgtgcgga caagctcatc gaggactttg ccggcgcgaa cggcatcgac ctgggcggct 4921 ccgtggacgg ctggtccaac caggagatgg agacctttat cgcagaacat aagatccctt 4981 gccctgaatg cggcaagacc gactttaccc ccatccgtca gttcaacctg atgttcaaga 5041 cgttccaggg ggtcaccgag gattccaagg cggagctgta cctgcgcccc gaaacggccc 5101 agggcatctt cgtcaacttc aagaacgtgc agcgcacgag ccgcaagaag gtgcctttcg 5161 gcatctgcca gatcggcaag tccttccgca acgagatcac cccgggcaac ttcatcttcc 5221 gcatccgcga attcgaacag atggagctgg agttcttctg ccagcccggc acagaccttg 5281 aatggttcgc ctactggaaa gagtactgca gaaagttcct ggagagcctg tccatgaaca 5341 tggataagct gcgcctgcgc gaccactcca aggaggagct gtccttctac agccgcgcca 5401 ccacggactt cgagtatctg ttccccttcg gctggggcga actgtggggc atcgcagacc 5461 gtaccgacta cgacctggga cgccatcagg aagtttccgg ccagaacctg gaatacatcg 5521 atcccgttac caacgagcgc tatctgccct acgtcatcga accctctctg ggcgcagacc 5581 gcgtagcgct ggcattcctg tgcgacgcct atgacgagga agacctgagc aaggacggca 5641 agaccgacag ccgcaccgtc atgcacttcc atccgttcct ggcgccttat aaagccgctg 5701 tcctgccgct gtccaagaaa ctgtccgagc aggccatggc gatctatcag gatctgtcca 5761 agtacttctc cgtggattac gaccagtccg gcagcatcgg taagctgtac cgccgtcagg 5821 acgagatcgg tacgccgttc tgcatcaccg tggacttcga taccgccacg gacggctgcg 5881 ttacggtgcg tgaccgcgac accatggaac aggtccgcat gcccatcagt gagctgagag 5941 cctatatcga aaaggcaatg gagttctagt gaaaaagatc cttatcctga acacaggcgg 6001 caccatcggc atgacccgca cagagaaggg ctacatgccg gaccgggaat atttccgcaa 6061 agcgctgata aacatggatt ctctgcgcgc gccgggcatg ccggcctggg acctggcgga 6121 gacggaagaa ctgctggatt cttccaacat gaccgtgagg gattggaacg agatcgcgaa 6181 gatcctggcg gatgcctacg acagctacga cgggtttgtg gtgcttcacg gcaccgatac 6241 catggcgtac acgtcctcgg cgctgtcctt catgttggaa gaactggata aacccgtcat 6301 cctgacaggg agccagatcc ctctgtgcga actgcgcagc gacggcagag acaacctcat 6361 ctcctcgatg ctgatcgcag cggaagggcg ggtgaaggag gtctgcatct atttcggcgg 6421 aaagctgctg cggggcaacc gcgccatgaa gtattccgcg gatggactgc ttgcttttac 6481 gtctcccaac tatccgcctc tggcggaagc cggcatctcc atccaatata atacgaaggc 6541 gatgctggac ccgatcaaaa agccgttccg tctgcaattg ctggaggaag tgccgatcgg 6601 ggtactcaaa gtcttccccg gcatccagtt cggcctgttt gaatccatca tgacggagag 6661 cctgaagggg atcgtcatcg agaccttcgg cgcgggcaat atcccggcag ggggcgatgc 6721 gctgctgccc atcatccgca gagcgttcga gaacggcagc atccttacgg tatgctccca 6781 gtgtccccag ggcaccgttt cgctggggac ctacgagacc agcagcggtc tgacttccgc 6841 gggcgccgta tccggcaagg atatgacgac ggaagccgca gtcgccaaac tgtattatct 6901 cttctcgaaa gggtacccga aagaagggat caaaaagctg atggaatgca atctgcgggg 6961 ggagatgcgg gattgacccg ggtcatccaa acgaacctga gcaaggtgcg aaagcacctt 7021 gctttttgat tgcttgtgca aagaaaataa cgggaataat ggtaaaatat gcttgacaaa 7081 aactggatgt ttgctatgat aaaaatacac aaaatggtaa atgaggtaaa gtatgaatga 7141 attcagattg gcgctcgttc tgagcgacga agcgctggca tctgccctgg ccagggcgat 7201 cgccaaagaa taccgctatg tcctcgtgca catcggagaa tgggacgagg cggattatac 7261 gatacgggac ggttttctgg gcggccccgc accggtttgg gagatcgtcg accgggcgct 7321 tgcagccagc ggaaagactt tccatttcca aaggaggccc ggctcctgtc ctattacggc 7381 gtttaccgcc ggtggtgggg gcaggggcgt gaccctttgc tctgtcattt acagtgcgat 7441 cgccgccaaa ggagaaaaac gcagcgtgct gcagatcagt ttcgatcctt acgctccggg 7501 aacagaaccg gagcgtggca tgtatctgct cgaaaagatc ctggacggca gctcgcttcc 7561 cttgcagccg gcatgcagga aaatggaaga agggtattat gttccgtcgc agcagacggt 7621 aaataacgtc tttttcgaac tggatgccca gactgttgcc tcttttctgc agacagcgga 7681 agacagcgaa gaatgggacg agatcgtatt ggatgtcccc aggagctatc cccactggcg 7741 ggatgtcatg agcatgtgcg agaactgcgt ggtggtctat agccgccggg aagaccagcg 7801 gcttgccgac gacgcggcgt acgcagagct ctctctgctg gcggagcagc ggccggtcgg 7861 cgcttc // LOCUS sequence007 7296 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence007 VERSION sequence007 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..7296 /mol_type="genomic DNA" /organism="" /note="sequence007" CDS 192..1115 /product="glutaminase A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003417962.1" /transl_table=11 /codon_start=1 /translation="MESDQRIQEAVKTAYLRGKEVTGKGAVATYIPELGKARPEAVGLC IHTKDGKVFKAGDSGIRFTMQSVSKLLSLAMALEIRGYDTVFEHVGMEPSGVAFNSIVE LDTRDKPHNPLINAGAITVESLLIEYKQFEDMLDFARKVCLDPEITLNRQVYNSEMATC DRNRAIAYLLKSKNVIHTNVDTSIELYTKICSINVSAESLANFALVLANNGVNPHSGER LLKASTAQTVKAIMFTCGMYDGSGTFAVEVGIPTKSGVGGGLLSVVDKQMGIGVYGPAL DENGNSIAGITALQYLSKELNLHMFA" /locus_tag="LOCUS_0410" /gene="glsA" /EC_number="3.5.1.2" /note="WP_003417962.1 glutaminase A (Clostridioides difficile) [pid:49.0%, q_cov:93.8%, s_cov:94.8%, Eval:7.0e-71]" /note="MGA_53" CDS 1248..1835 /product="HD domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002679500.1" /transl_table=11 /codon_start=1 /translation="MQSDMVVAAAKQYIETLFAGNSGGHGTDHTLRVYRNAMAIAEGEI CDPDIVALAALLHDADDHKLFDTKDNANARAFLRTQGVPDEMADRICEAVNAVSFSQNR GRRPETIEGKIVQDADRLDAIGAIGVARTFAYGGEHGRSLDDSIAHFHEKLLLLKDEMN TGTGWRLAEEQHAFLLAFLAEYQKELGEVPQR" /locus_tag="LOCUS_0420" /note="WP_002679500.1 HD domain-containing protein (Treponema denticola) [pid:37.6%, q_cov:93.8%, s_cov:92.8%, Eval:2.1e-33]" /note="MGA_54" CDS 1832..2020 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRKWVHIAVTVFCMLVLSRFLVRLIDATVQIDSDIGMLALVLLLL NAAIGFASHKLYRTFKK" /locus_tag="LOCUS_0430" /note="MGA_55" CDS 2063..2395 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNQQPTQTTVYIGLNDSETGVQKFESQKYVSVLKNVCRMYKVAFS VQEIKGGYFHEDGRYTEENSLKLTLVDVPEQTVTELAKDLCAFFHQESVMVTFAPTKVV FIKETI" /locus_tag="LOCUS_0440" /note="MGA_56" CDS 2452..2928 /product="low molecular weight protein-tyrosine-phosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003546643.1" /transl_table=11 /codon_start=1 /translation="MVKVLFICHGNICRSVMAEFIFKDMVRKAGREDAFEIASRATSRE EIGNDMYPPAKRCLTAHGIPFERHFAAQVTRQACEDYDLLVCMDDWNLQNMQRMFGSDY AEKTVKLLDLTPLKRDVADPWYTGDFEQTYRDLVLGCEALLCGSPAPKQFLNNR" /locus_tag="LOCUS_0450" /note="WP_003546643.1 low molecular weight protein-tyrosine-phosphatase (Lactobacillus acidophilus) [pid:42.8%, q_cov:91.1%, s_cov:95.4%, Eval:2.0e-31]" /note="MGA_57" CDS 3047..4429 /product="electron transport complex subunit RsxC" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948145.1" /transl_table=11 /codon_start=1 /translation="MSSGKHLNGIHVNHCKNTAGQAIIPMTLPEKVYIPMSQHIGAPCQ PVVAVGDHVKVGQKIGDSEAFVCAPIHSSVSGEVTAINKAMSQMGRVDTIIEIVPDGKQ EIAETVVPPVITDKASFIKAVRESGVVGLGGATFPMSVKFNVKPPAKVDTFIVNGAECE PYITVDHQNMLTHAQEIVDGVKAVLHWLEIERAFIGIETNKPDAIKLFKDLLKDEKNIS VAELRQVYPQGAERVIIYETTGRHLIAGKLPADVGCIVSNVTSVLKMQQFLATGMPLVS KAMTVDGNAVADPKNVEVPIGTPLCDVIEFCGGTKADVRKIILGGPMMGRAIPKDEYGV MKGNSAILCFDETAGTQLPETACISCGRCVRGCPMNLMPTKLAKAWEHQDIDTLREYDV TTCMECGCCSYSCPARKQLSFEIKLAKTWVMTEDRKAAEKAKAEAEAAKAKEEEKKEGG DK" /locus_tag="LOCUS_0460" /gene="rsxC" /note="WP_011948145.1 electron transport complex subunit RsxC (Clostridium botulinum) [pid:43.3%, q_cov:92.6%, s_cov:97.7%, Eval:2.6e-97]" /note="MGA_58" CDS 4429..5397 /product="RnfABCDGE type electron transport complex subunit D" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948146.1" /transl_table=11 /codon_start=1 /translation="MSTKHTNLIVSSAPHVNNPVDTKSIMRDVVIALCPALLVAIYVFG ARALVLTAVCVAACVIFEGATRKILNRPQTIGDWSAVVTGVILAFNLPVTLPLWMAVIG CFAAIVIVKQVFGGLGQNFANPAIVGRIVLFIGFATPMTNWAVTSRMSSVIQSTSVDGV TGATPLGLLAAGKDVPSNLDMFLGTISGSMGEVSAIALLIGGCYLLWRKVITWEIPVAM LASIAVMALLMHQDPIFHIFAGGAMLGSIFMATDYVTSPITSKGKIIFGVGCGVITMLI RVFGSYPEGVSFAILLMNILTPHIDRWTRTHINGVDRKAVK" /locus_tag="LOCUS_0470" /note="WP_011948146.1 RnfABCDGE type electron transport complex subunit D (Clostridium botulinum) [pid:48.9%, q_cov:95.0%, s_cov:96.8%, Eval:2.6e-79]" /note="MGA_59" CDS 5400..5948 /product="RnfABCDGE type electron transport complex subunit G" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948147.1" /transl_table=11 /codon_start=1 /translation="MDKKAMLAPTIVLVCICLVASMLLAATYQITKPIIDDINIRMANE SRAEVLPEADGFTQLDVDLVDGVTEVYQADNGAGYVMTAAFKGFGGLVTVMTGMDADGV IQNIKVTDASNETPGLGSKTTLPDHTNKFQGVSGTITMDKAGEGTYIAPVTGASYSSKA VFNAVAAALAQYAEIGGAF" /locus_tag="LOCUS_0480" /note="WP_011948147.1 RnfABCDGE type electron transport complex subunit G (Clostridium botulinum) [pid:31.0%, q_cov:97.3%, s_cov:82.1%, Eval:1.8e-17]" /note="MGA_60" CDS 5948..6631 /product="electron transport complex subunit E" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005904084.1" /transl_table=11 /codon_start=1 /translation="MENKKSKLSIFTNGFIKENPILVLVLGTCPTLAVSTMASNGIGMG LCVTFVLFFSNIFISALKKVIPDQVRIPCYIVVIATFVSVLQMLLQAYLPDLNKSLGLY VPLIVVNCIILGRAEAFANKNSVVDSALDGLGMGLGYTCALTIMACIRELLGAGTIFGH VVTANLFSPMSIFVLAPGGFFTFGCIIAALNKLTKGRVKEKQAANKCLGCPGASVCSKV EEGGC" /locus_tag="LOCUS_0490" /note="WP_005904084.1 electron transport complex subunit E (Fusobacterium) [pid:53.7%, q_cov:89.4%, s_cov:99.0%, Eval:1.9e-58]" /note="MGA_61" CDS 6634..7227 /product="electron transport complex subunit RsxA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005904083.1" /transl_table=11 /codon_start=1 /translation="MKEMLMIIMAAVLANNYVLVRFLGICPFLGVSKKLDSAVGMSFAV IFVMVLATAATWPIQRLLLDPNGIGYMQTTVFILVIAALVQLIETFMKKSLPALHKSLG IYLPLITTNCAVLGVCTLNIDEGYTFIQSLMNSFGSGVGFLLAMFLFAGVRSKIEENDY PESFKGVASTLVAASILSVSFMGFSGMIDNIFGM" /locus_tag="LOCUS_0500" /gene="rsxA" /note="WP_005904083.1 electron transport complex subunit RsxA (Fusobacterium nucleatum) [pid:51.9%, q_cov:94.9%, s_cov:96.4%, Eval:3.0e-56]" /note="MGA_62" ORIGIN 1 acgacctggt tgccggcgcc aacatcgcag gcttcaagaa ggtcgcagaa gctatgatgg 61 agcagggctg cttctaagct tttcgatctt tcgaacagaa cacaaaaatt cccggagaaa 121 tccgggaatt ttttgttata atgttaacaa gagaatttat cgtcgcagcc gtaatggcga 181 aggagaaaag gatggaaagc gaccagagaa tccaggaagc ggtaaagact gcctacctga 241 gaggaaaaga agttaccgga aagggcgccg ttgcgaccta cattccggaa ttgggaaaag 301 cccggcccga ggccgtcggc ctctgtattc acaccaagga tggcaaagtc tttaaagctg 361 gagactccgg gatccgcttt acgatgcagt ccgtatccaa gctgctgtcg ctggcgatgg 421 cgctggagat ccggggctac gataccgtat tcgaacacgt gggcatggag ccttccggtg 481 ttgccttcaa ctccatcgtg gagctggaca cccgggataa gcctcacaat ccgctcatca 541 acgcgggtgc tattaccgtg gagagcttgc tcatcgaata caagcagttc gaagatatgc 601 tggatttcgc gcgcaaggta tgcctcgacc cggagatcac cctcaaccgc caggtctaca 661 actccgagat ggcgacctgc gaccgcaacc gggccatcgc ctatctgctg aagagcaaga 721 acgtcatcca tacgaacgtg gataccagca tcgagctgta cacgaagatc tgctccatca 781 acgtgtccgc cgaatctttg gcaaactttg cgctggttct ggccaataac ggggtcaacc 841 cccactccgg cgaacgcctg ctgaaggcca gcaccgccca gaccgtaaag gccatcatgt 901 tcacctgcgg catgtacgac ggttccggca cctttgccgt ggaagtcggc attcccacca 961 agtccggcgt cggcggaggc ctgctgtccg tcgtggacaa gcagatgggc atcggcgtct 1021 acggtccggc tctggacgag aacggcaact ccatcgcggg catcaccgcg ctgcagtacc 1081 tgtccaagga actcaacctg cacatgttcg cgtaacaaga gacattcttc agcccggaaa 1141 acagaagagg atagaataaa agggaacggc aagtggttgc cgttcctttt tgttatgcgg 1201 tatactgttt gcgtgccgga ccggtccggt gcagaaggag gcgcttcatg cagtcagata 1261 tggtagtggc agcggcaaaa cagtatatcg aaacactgtt tgccgggaat tccgggggtc 1321 acgggacgga ccatacgctg cgggtgtacc gcaacgcgat ggcgatcgcc gaaggcgaga 1381 tctgtgaccc ggatatcgtc gccctggctg cgctgctgca cgatgcggac gatcataaac 1441 tgttcgacac gaaagacaac gccaatgccc gggctttcct gaggacccaa ggcgtgccgg 1501 acgagatggc agaccgcatc tgcgaggcgg tcaatgcggt ctccttcagt cagaaccggg 1561 gcaggcggcc ggaaacgatc gagggaaaga tcgtgcagga tgcggaccgg ttggacgcga 1621 tcggcgccat cggagtcgcc cgcacctttg cctacggtgg agagcacggc cggtctctgg 1681 acgattctat cgctcatttt cacgagaagc tgctgctcct gaaggacgaa atgaacaccg 1741 ggaccggctg gcggctggcg gaagagcagc acgcgtttct cctggctttt ctggcggaat 1801 atcagaaaga actgggggag gtgccgcagc gatgagaaaa tgggtgcata tagccgtaac 1861 ggtcttctgc atgctcgtac tctcccgctt tctcgtgcgg ctgatcgacg ccaccgtgca 1921 gatcgacagc gatatcggaa tgctggcgct ggtgctgctc ctgctgaacg cggcgatcgg 1981 gttcgcgagt cataaactgt accgcacttt taagaagtag accggcatga ccgggaggaa 2041 ggatatattg cgagggagca gtatgaatca acaaccaacg caaacgacag tttatatcgg 2101 tttgaatgat tccgagaccg gcgtccagaa atttgagtcc caaaagtatg tttcggttct 2161 gaaaaacgta tgcaggatgt acaaagttgc cttttctgtt caggagatca aaggcggata 2221 tttccacgaa gacggcaggt atacggaaga aaacagttta aagctcacgc tggtggacgt 2281 tcccgaacag accgtcacgg aactggcgaa ggacctctgt gcctttttcc atcaggaaag 2341 tgttatggtc accttcgccc cgacaaaggt agtttttata aaagaaacga tctgatctcc 2401 cgcgctgccg tcaacggcgg gaaccggact ccggcaagga gagaataata gatggtgaaa 2461 gtactcttta tctgtcacgg caatatctgc cgcagcgtaa tggcggagtt tatttttaaa 2521 gatatggtcc gcaaggcggg cagggaagac gcgttcgaga tcgcatcccg ggcgacgagc 2581 cgggaggaga tcgggaacga catgtatccg ccggcgaagc gctgcctgac ggcccacggc 2641 attcccttcg agcggcattt cgccgctcag gtgacccggc aagcctgcga agactacgac 2701 ctgctggtct gcatggacga ctggaacctg cagaacatgc agcgcatgtt tggaagcgat 2761 tatgccgaaa agaccgtaaa actcctggat cttacgcctt taaagcgcga tgtggccgat 2821 ccctggtaca ccggcgactt cgagcagacc taccgcgacc tggtgctggg gtgcgaagcg 2881 ctgctctgcg ggtcacccgc gccgaaacag ttcctgaaca atcgctaaat ttacctcaat 2941 ctttccttga aatccctgac aatttgatat attctatact gtgcaggtct atggctgcag 3001 attttaacgt gtgccgagac ctgatagaaa aataaggaga aatagtatga gttcaggcaa 3061 acatctgaat ggcatccatg tgaaccattg taagaatact gccggacagg ccatcattcc 3121 gatgaccctc ccggaaaagg tttacattcc aatgagtcag cacataggtg ccccctgcca 3181 gcctgtcgtg gccgtcggcg accacgttaa ggttggccag aagatcggag acagcgaagc 3241 ctttgtatgc gctcctatcc acagcagcgt atccggcgaa gtgaccgcca tcaacaaggc 3301 catgtctcag atgggcagag tcgataccat tatcgagatc gtgcccgacg gcaagcagga 3361 gatcgcagag actgtcgttc cccccgtcat cacggataag gccagcttta tcaaggctgt 3421 ccgcgaatcc ggtgtcgtag gcctcggcgg cgctaccttc cccatgagcg tcaagttcaa 3481 cgtaaagccc cccgcaaagg tggatacctt catcgtgaac ggcgctgagt gcgaaccgta 3541 catcaccgtc gaccatcaga acatgctgac gcacgcccag gagatcgtgg acggcgttaa 3601 ggcagttctg cactggctgg agatcgaaag agccttcatc ggcatcgaga ccaacaagcc 3661 cgacgccatc aagctcttca aggacctcct gaaggacgaa aagaatatct ccgtggcgga 3721 gctgcgccag gtctatcccc agggcgcaga gcgtgtcatc atctacgaga ccaccggacg 3781 ccacctcatc gcaggcaagc tgcccgcaga tgtaggatgc atcgtatcca acgttacgtc 3841 cgttctcaag atgcagcagt tcctggccac cggcatgccc ctggtctcca aggccatgac 3901 ggtagacggc aacgccgtcg ctgaccccaa gaacgtggaa gtgcccattg gcaccccgct 3961 gtgcgacgtc atcgaattct gcggcggcac caaggccgac gtcagaaaga tcatcctggg 4021 cggaccgatg atgggccgcg ctatccccaa ggacgaatac ggcgtcatga agggcaacag 4081 cgccatcctg tgcttcgacg agactgcagg tacccagctg cccgagaccg cgtgcatcag 4141 ctgcggccgc tgcgtaagag gctgcccgat gaacctgatg cccaccaagc tggcgaaggc 4201 ttgggaacac caggatatcg atactctcag agagtacgac gttaccacct gtatggaatg 4261 cggatgctgc tcctactcct gcccggccag aaagcagctg agcttcgaga tcaagctcgc 4321 gaagacctgg gtcatgacgg aagacagaaa ggccgcagaa aaggccaagg ccgaagcaga 4381 agctgccaag gctaaggaag aagaaaagaa ggaaggagga gacaaataat gagtacgaaa 4441 cataccaatc tgatcgtatc ctccgctcct cacgtaaata acccggtcga taccaagagc 4501 atcatgagag acgtcgtgat cgctctgtgc ccggctctgc tggtcgcgat ctacgtcttc 4561 ggcgccagag ctctcgtgct caccgctgtc tgcgtagccg cctgcgtcat cttcgaaggc 4621 gctaccagaa agatcctcaa cagaccccag accatcggcg actggtccgc agtcgtcacc 4681 ggcgtcatcc tggcgttcaa cctgcccgta acgctgcccc tgtggatggc tgtcatcggc 4741 tgcttcgccg cgatcgtcat cgttaagcag gtcttcggcg gtctgggcca gaacttcgcg 4801 aaccccgcga tcgtcggccg tatcgtcctg ttcatcggtt tcgcaacgcc gatgaccaac 4861 tgggctgtta cctcccgcat gagctccgtc atccagagca cctctgtgga cggcgtcacc 4921 ggcgctaccc cgctgggtct gctggctgcc ggaaaagacg ttccctccaa cctggacatg 4981 ttcctgggca ccatcagcgg ttccatgggc gaagtttccg ccatcgcact gctgatcggc 5041 ggctgctacc tgctgtggag aaaggtcatc acctgggaga tccccgtggc gatgctcgca 5101 tccatcgcgg tcatggccct gctgatgcac caggatccga tcttccacat ctttgccggc 5161 ggcgccatgc tgggctccat cttcatggcg acggactacg ttacgtcccc catcaccagc 5221 aagggtaaga tcatcttcgg cgtcggctgc ggtgttatca ccatgctcat ccgcgtattc 5281 ggttcctatc ccgagggcgt ttccttcgcc atcctgctga tgaacatcct gaccccgcac 5341 atcgatcgct ggaccagaac gcacatcaac ggcgtagaca gaaaggcggt gaagtaggaa 5401 tggataagaa agccatgctg gctccgacta tcgtgctggt ctgcatctgc ctcgtagctt 5461 ccatgctgct ggctgctacc taccagatca cgaagcctat catcgacgat atcaatatcc 5521 gtatggccaa cgaatccaga gcggaagttc tgcccgaggc agacggcttt acgcagctgg 5581 acgtggacct cgtagacggc gttaccgaag tctatcaggc agacaacggc gcgggctacg 5641 ttatgactgc tgcttttaaa ggttttggcg gcctcgttac cgttatgacc ggtatggatg 5701 cggacggcgt catccagaac atcaaggtga cggacgcttc caacgagacc ccgggtctcg 5761 gctccaagac cacgctgccc gaccatacca acaagttcca gggcgtaagc ggcaccatta 5821 ccatggataa agcaggtgag ggtacctata tcgcacccgt taccggcgca agctattcct 5881 ctaaggctgt gttcaacgcg gtcgctgccg cgctggcgca gtatgcagag atcggaggtg 5941 ccttctaatg gaaaacaaga agagcaaact cagcatcttt accaacggtt ttattaaaga 6001 aaacccgatc ctggtcctgg tcctgggtac ctgccccacg ctggcagtat ccaccatggc 6061 ctccaacggc atcggcatgg gactgtgcgt aaccttcgta ctgttcttct ccaacatctt 6121 catttccgcg ttgaagaagg tcattcccga tcaggtccgc atcccgtgct acatcgtcgt 6181 tatcgcaacg ttcgtatccg tgctgcagat gctgctgcag gcgtacctgc ccgacctgaa 6241 taagtctctg ggtctgtacg tgcccctgat cgtagttaac tgcatcatcc tgggccgtgc 6301 ggaagcgttc gccaacaaga acagcgtcgt agactccgcg ctggacggtc tgggcatggg 6361 cctgggttac acctgcgcgc tcaccatcat ggcctgcatc cgcgaactgc tgggtgccgg 6421 aaccatcttc ggccacgtcg tgaccgcaaa cctgttcagc ccgatgtcca tcttcgtgct 6481 ggctcccggc ggcttcttca ccttcggctg catcatcgct gccctgaaca agctaaccaa 6541 gggaagagtc aaggaaaagc aggctgccaa caagtgcctg ggctgccccg gcgcatctgt 6601 ctgcagcaaa gttgaagagg gaggctgcta accatgaaag aaatgttaat gatcattatg 6661 gcagctgtcc ttgccaataa ctatgtactg gtccgcttcc tgggtatctg cccgttcctg 6721 ggtgtttcca agaagctgga ttccgcagtc ggcatgtcct tcgccgttat cttcgttatg 6781 gtactggcga ccgccgctac ctggcccatc cagcgcctgc tgctggaccc caacggcatc 6841 ggctacatgc agaccaccgt gttcatcctc gttatcgccg ctctggtaca gctgatcgag 6901 accttcatga agaagagcct gccggcactg cataagtccc tgggtatcta tcttcctctg 6961 atcaccacca actgcgccgt tctgggtgtc tgcaccctga acatcgacga gggatacacc 7021 ttcatccagt ccctgatgaa ctccttcggt tccggcgtcg gtttccttct cgccatgttc 7081 ctgttcgcag gcgtgcgcag caagatcgag gagaacgact atcccgagag cttcaagggc 7141 gttgcttcca ctctggttgc cgcttccatc ctgagcgtct ccttcatggg attctccggc 7201 atgatcgaca acatcttcgg tatgtaaggg agggatagaa gtatgttaac agcatctgct 7261 ttcgtaactc ccgtcgtact gacgatcgtt accggc // LOCUS sequence008 6915 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence008 VERSION sequence008 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6915 /mol_type="genomic DNA" /organism="" /note="sequence008" misc_feature <1..855 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_201626185.1:AMP-binding protein" /note="WP_201626185.1 AMP-binding protein (Fusobacterium canifelinum) [pid:38.7%, q_cov:93.3%, s_cov:30.3%, Eval:2.4e-38, partial hit]" /note="MGA_64" /locus_tag="LOCUS_0510" CDS 1014..2156 /product="exonuclease SbcCD subunit D" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011072763.1" /transl_table=11 /codon_start=1 /translation="MKFMHLADLHLGKRVNGFSMLDDQKYILKKILQIVDEEQPDAVLI AGDVYDKSMPSAEAVVLLDDFLCRLAKRKLQVLLIAGNHDSAERLAFGGRLLSESGVHI SPVYDGTVSCVTLTDAFGPVHFWLLPFVKPVHVRAFLPEEAAKIETYTDALAAAIEGMH ADFEERNVLVCHQFVTGAGRSESEELSVGGTDNVDGIVFDGFDYVALGHLHGPQNVGTE RIRYCGTPLKYSFSEKDHIKSVSVVTLGEKGSLEVRAVPLAPLRDLREVKGSYDEVVYR GNQEGQLRDDYMHVILTDEEDVPDALQKLRTVYPNLMKLDYDNTRTRTAAFFDEGAERE NKSEIELLDEFYEKQNGISLNDAQRKYSLSLLEKIKEELA" /locus_tag="LOCUS_0520" /note="WP_011072763.1 exonuclease SbcCD subunit D (Shewanella oneidensis) [pid:37.7%, q_cov:96.1%, s_cov:92.5%, Eval:1.1e-66]" /note="MGA_65" CDS 2153..4918 /product="SMC family ATPase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_013229784.1" /transl_table=11 /codon_start=1 /translation="MRPLQLKISGFGPYAGTQELDLEKLGRSGLYLITGDTGAGKTTIF DAICYALFGEASGNNREPAMLRSQYAAEDAPTEVELTFENAGKVYTVKRNPEYLRRKKR GEGFAKQIAGAELHYPDGRIETRTTAVTRAVEELLGVSKDQFSQIAMIAQGDFLKLLLA DTSARKEIFRSLFQTDLYRMFQDRVKQDYSALEKERDAAKLGVDLAAKGILCEEEDVLY TEAQKARAGGCLTEDRIALIESLCAQDERTLEALQIREKAAAENIQELAVLLEKCGQRK ELELEKKTAEKAVEDHRQNGPAVEQAVLQAEECAKNAEAWEQEASVLAVKLPDYDRLEA LRGQLGSLDRNMAELQKAITVQDEKIDTLKAETAALQEELQSLASAGENRAVLASRKEK LQQEIADLTSLQEELAALVPLRTGLKEAQDEYVAAESAMKAAADLALSYRSHFNREQAG IMAEQLEEGKPCPVCGSLSHPNKAVKAEDAPSEAQVEKAEQASQKAQKACSDASAAAAE AKAKLESAESAAEKRTAKLLEGCPLAQADLVLPEKAGEKQRSFDDISEALRQEEDNVRR KAELEEAKPAKETALKEAEERSSALKLQEREEKATAEGLKVQIEELSGSLAFESKKEAE SRIESLQDRAKQARDAVKKAAEAKTAWEKDLASRRSAVENLEKLLAGQPQLNEEALLQE KQKAEEENKAVQEQIRAAGHRLQVNRDIVSQIQNSADQLKKLDETWRWMDALRRTVTGQ LSGKEKVELEVWIQMTTFDRILRRANVHLMEMSSGMFELRRRETAENARSQSGLELDVN DHGSGSLRSVKTLSGGESFLASLSLALGLSEEIQANAGGVQLDCMFVDEGFGSLDEDTL QQAMKALGRLTEGNRLVGIISHVAELRRQIDRQIVVKKDPAGGSRAELQV" /locus_tag="LOCUS_0530" /note="WP_013229784.1 SMC family ATPase (Amycolatopsis mediterranei) [pid:26.5%, q_cov:99.3%, s_cov:99.4%, Eval:3.5e-73]" /note="MGA_66" CDS complement(4925..6313) /product="MATE family efflux transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005786787.1" /transl_table=11 /codon_start=1 /translation="MASQNQTKKGDFSQGSIPKTVLRMGIPIAMAEIVHVLYNVVDRIF IGHIPGVGTAALSGVGIAFPLISLVTAFANLCGTGGNPLCSMARGQGNNERAQKILETA FTMLLGFSAVLTVVLFLFARPFLAAMGGDAETLPYAVNYFRIYVAGTVFVLISLGMNPF INGMGFPKIGMGTVLIGAVLNIALDALLLFVFHMGVEGAAIATVISQFVSAVWVIRFLT GKKTLLRISRIHLDMEEVPRILKLGATGFMFKFSNSVAQTVVNLTLKTFGGAASTLYIG AFSIINSMREVISQPISGINGASVPVMSFNYGARNYDRVRKTIRFMIAAALIYNIAAWL VVFTHPEQLIRLFTADDVLVKTAIPCLHIYYAAYFMMSFQTGGQNTFVALNKPKYAVFF SMLRKLFLIVPLTIALPRLGFGVMGVFYAEMASQIIGASLCSITMYFRIYRRLPKENGQ PSAL" /locus_tag="LOCUS_0540" /note="WP_005786787.1 MATE family efflux transporter (Bacteroides) [pid:40.8%, q_cov:93.9%, s_cov:95.1%, Eval:1.1e-90]" /note="MGA_67" ORIGIN 1 atcaagaagc agggcaagga caagaccgtc gcgaaggtcc tgaagatcaa taagtatacg 61 aagaagatcg gtctcgatct ggtccccaaa tttatgggtc agatcctgga cgttttcggc 121 ggacagctcc gtacgatcat cgccggcggc gccgccatgg atccgatcat cacggatttc 181 ttctgcgacc tgggattccg cgccgtacag ggttacggcc tgacggaatg ttccccgatc 241 gcagcgctca acccggataa gagagaactg gccaaccccg cagccgcagg tcgcgtgctg 301 cccatgttcg acgccaagat cgtcgacgcc ggcgaggacg gcaacggcga gatctgcatc 361 aagggcgacc acgtaatgct gggctactac cagatgcccg aacagaccgc ggaagtcctg 421 gtggacggct ggtaccacac cggcgacctg ggctacatgg acgaaaaccg ctttatcttc 481 atcaccggcc gcaagaagaa cgtcatcatc acgtccaacg gcaagaacgt ctatccggag 541 gaactggaat acaagctgtc tctcagcaaa ttcgtgtccg aatccatggt ctgggcggac 601 gaagacgagc agggccacga cgtgcgcatc gtcgccacca tcattcccga aaaggaagaa 661 gtggaagcgg tcctgggcga aaacgctccc gcggacaagg tgctggaact gctgcagggc 721 gaagtggaca aactgaacga tcaggaaccg atcttcaagc agatcaagaa ggtcgtcctc 781 cgtaccgaac ccttcgtcaa gaacacatct gcaaagatca agcgcttcga agcggccaac 841 aagaaactga actaagaact tctgcgaagc ccggccatgt gccgggcttt ttctttacga 901 aaagtgcagg ccgctttggc acaacttcag gaatctggtg tttcaacggt ttcttcagaa 961 tgtgccgcag cagcctgcac tttttggtaa aataaaagca ggagggattc catatgaaat 1021 tcatgcattt ggccgatctt catctgggaa agcgcgtaaa cggtttttcc atgctggatg 1081 atcagaaata tattctgaaa aagatcctgc agatcgtaga cgaagagcag cccgatgctg 1141 tcctgatcgc aggcgatgta tacgataaat ccatgccttc tgccgaagcc gtcgttttat 1201 tggacgattt tttatgccgt ctggcaaagc ggaaactgca ggtccttctg atcgcgggga 1261 accacgattc cgcggaacgg ctggcttttg gcggacggct tctctcggaa agcggcgtgc 1321 acatttcacc ggtctacgat gggaccgttt cctgcgtgac cctgacagat gctttcgggc 1381 cggtgcattt ctggctgctt ccctttgtta aacctgtcca cgtgagagca tttctgccgg 1441 aagaggctgc aaagatcgag acgtatacgg atgcgctggc tgcggcgatc gaaggcatgc 1501 atgcggactt tgaagaacgc aacgtgctgg tctgccatca gttcgtaacg ggagctggcc 1561 gttccgagtc tgaggaactc tccgtcggcg gcacggataa cgtggatggg atcgttttcg 1621 acggatttga ctacgttgct ctgggtcacc tgcacgggcc gcaaaatgtg ggaacagaac 1681 ggatccgtta ctgcggaact cctttgaaat actctttttc ggaaaaggat cacattaagt 1741 ccgtttccgt cgtaacattg ggcgaaaagg gctctctcga ggtccgcgcc gttcctcttg 1801 cgccgcttcg cgacttgcgg gaagtgaagg gctcctacga tgaggtggtt taccggggaa 1861 atcaggaggg ccagctgcgg gatgactaca tgcacgtgat ccttacagat gaggaagacg 1921 tgccggacgc actgcaaaaa ctgcgcaccg tctatcccaa cctgatgaag ctggattacg 1981 acaatacccg cacacgcacg gcggcgttct tcgacgaagg ggcggaacgg gaaaacaaga 2041 gcgagatcga actgctggat gaattctatg aaaagcaaaa cggtatctcg ctcaacgatg 2101 cgcagaggaa gtacagtctg tcgctgctgg aaaagatcaa ggaggaactg gcatgaggcc 2161 tttacagtta aagatcagcg gattcggacc ttatgccggg acgcaggaac tggacctgga 2221 gaaactgggc cggagcgggc tgtatctgat caccggcgat accggtgcgg ggaagaccac 2281 gatcttcgat gcgatctgct atgcgctgtt cggcgaagct agcggaaaca accgggaacc 2341 cgccatgctg cgctcccaat atgcggcaga ggatgcgccg acggaggtgg aactcacctt 2401 cgaaaacgcc ggcaaggtct ataccgtaaa acgcaatccg gaatacctgc gccgcaaaaa 2461 gaggggcgag ggcttcgcaa agcagattgc aggagcggaa ctgcactacc cggacggacg 2521 catcgagacc aggaccaccg cggtgacccg cgcagtggag gaactgcttg gtgtttcgaa 2581 agaccagttc tcccagatcg ccatgatcgc ccagggcgat ttcttaaagc ttttgctggc 2641 agacacctct gcaagaaagg agatcttccg cagtctgttc cagacagatc tgtaccggat 2701 gttccaggac cgggtaaagc aagactattc tgcgttggaa aaggaacggg atgcggcgaa 2761 attgggcgta gatctggcgg caaaggggat cctctgcgag gaagaggacg tactgtacac 2821 agaagcgcag aaagccaggg caggcggatg tctgacggaa gaccggatcg cgttgatcga 2881 atccttatgc gcgcaggatg aaagaactct ggaagccttg cagatccggg aaaaagcggc 2941 tgccgaaaac attcaggagc tggctgtcct cctggaaaag tgcggccagc gcaaagaact 3001 ggaactggaa aagaagacgg cggaaaaggc ggtagaagac caccgccaga atggaccggc 3061 ggtggaacag gctgttctgc aggcggaaga atgcgccaaa aatgcggaag cgtgggaaca 3121 ggaagcctct gttcttgcgg tcaaactccc tgattacgat agactggaag ccctgcgggg 3181 acagctcgga tcgctggacc ggaacatggc agagctgcag aaagcaataa ccgtccagga 3241 cgaaaaaata gacacactga aggcagagac tgctgctctt caggaagaac tgcagtctct 3301 ggcttccgct ggagaaaaca gggctgtact cgcgtcccgg aaggaaaagc tgcagcagga 3361 gatcgcggat ctgacgagcc tccaggagga attagctgcg ctggtgccgc tgcggaccgg 3421 attgaaagag gcgcaggatg agtatgttgc ggcggaatcc gccatgaaag cggccgcaga 3481 tctggcttta tcctaccgca gtcactttaa cagggagcag gccggcatta tggcggaaca 3541 gctggaagag ggaaaaccct gtccggtatg cgggtcacta tcccatccca acaaggcggt 3601 gaaggcggaa gatgccccat cggaagcgca ggtagagaag gcggaacagg cttcgcagaa 3661 agcacaaaag gcctgcagcg acgcctctgc cgcagctgcc gaagccaagg cgaaactgga 3721 gtctgccgaa tctgctgcag aaaaacggac cgcaaaactg ctggaaggct gtcccctggc 3781 gcaggcggat cttgtactgc cggagaaggc cggagaaaaa caacggtctt tcgacgatat 3841 ttcagaggca ttgcggcagg aagaagacaa cgtgcggcgc aaagcggaac tggaggaagc 3901 aaagcctgcc aaagagacgg ctctgaaaga ggcggaggaa cggtcgtcgg ctttaaaact 3961 gcaggaaaga gaagagaaag cgacggcgga aggtctgaag gtccagatcg aagaactgtc 4021 ggggagtctg gcgttcgaga gcaaaaaaga ggcggaaagc cggatcgaat cgctgcaaga 4081 ccgggcgaag caggccaggg atgcggtaaa gaaagcagca gaagcgaaga cggcctggga 4141 gaaggatctt gcctcgcgcc ggagcgctgt ggaaaacctg gagaaactcc ttgccggtca 4201 gccgcagctg aacgaagaag cactcctgca ggaaaagcag aaggcggaag aagagaataa 4261 agcggtacag gagcagatcc gtgccgcggg tcaccggctg caggtcaacc gggacatcgt 4321 ttcgcagatc caaaacagcg cggatcagct gaaaaaactg gatgaaacat ggcggtggat 4381 ggatgccttg cggcgaaccg ttaccgggca gctatccggc aaggaaaagg tggaattgga 4441 agtctggatc cagatgacga ccttcgaccg catcctgcgc cgggccaacg tgcatctgat 4501 ggagatgtct tccgggatgt tcgagctgag gcgcagagaa acagcggaga atgcgcgcag 4561 ccagagcggt ctggaactgg acgtgaacga tcatggcagc ggcagtctgc gcagcgtaaa 4621 gacgctgtcc ggcggcgaat ccttcctggc atccctctcg ctggcactgg gtctttcgga 4681 agagatccag gcaaatgcgg gcggtgtgca gctggattgc atgttcgtag acgagggttt 4741 cggctcgctg gacgaagaca cgctccagca ggccatgaaa gcccttggaa ggctcacgga 4801 agggaaccgg ctcgtgggca tcatctccca cgttgcggag ctgcgccggc agatcgaccg 4861 gcagatcgtc gtaaaaaaag accctgccgg cggaagcagg gcggaactgc aggtgtagcg 4921 gatatcacag cgcagacggc tgcccatttt ccttgggcag tcttctgtat atgcggaaat 4981 acatggtgat cgagcagagg ctggcgccga tgatctggga tgccatttcc gcatagaaca 5041 cacccatgac gccgaatccc aggcggggca gcgcgatcgt gagcggcacg atcaggaaca 5101 gcttgcgcag catggagaag aacacggcgt atttcggctt gttgagcgcc acgaacgtgt 5161 tctgcccgcc ggtctgaaag ctcatcatga aataggcggc gtagtagata tgcaggcagg 5221 ggatcgcggt ctttacgagc acgtcgtccg ccgtaaacag gcggatgagc tgctccggat 5281 gcgtaaagac gaccagccag gccgctatgt tatagatgag agcagccgcg atcataaagc 5341 gtatcgtttt tcttacgcgg tcgtagttgc gggcgccgta gttgaagctc atgacgggaa 5401 cggacgcgcc gttgatgccg ctgatgggct gactgatgac ctcccgcatg gaattgatga 5461 tggagaacgc gccgatgtac agcgtgctcg cggcgccgcc gaatgtcttc agcgtaaggt 5521 tgacgacggt ctgggcgacg ctgttggaga acttgaacat aaacccggta gcgccgagtt 5581 tcaggatgcg ggggacttcc tccatgtcga gatggatccg ggagatgcgc agcagcgttt 5641 tctttccggt aaggaatcgg atgacccaca cagcgcttac gaactgggaa atgaccgtag 5701 cgatagcggc tccctcgacg cccatgtgga acacgaacaa aagcagggca tccagcgcga 5761 tattcagcac tgcaccgatc agcacggtgc ccatgccgat cttgggaaat cccatgccgt 5821 tgatgaaggg gttcatcccc agactgatga ggacgaatac ggtgcctgcg acgtagatgc 5881 ggaaatagtt gaccgcgtac ggcaatgttt cggcgtcacc gcccatggcg gcgaggaaag 5941 gcctggcgaa caggaacaat acgacggtaa ggacggcgct gaaccccagc agcatcgtga 6001 acgccgtctc caggatcttc tgggctcttt cgttgttgcc ctggccccgg gccatggaac 6061 acagcggatt gccgccggta ccgcagagat tggcaaatgc ggtcaccaaa gagatgagcg 6121 gaaacgcgat gccgacgccg gacagcgctg ccgttcccac gccggggatg tgtccgataa 6181 agatgcggtc caccacgttg tacagtacgt gcacgatctc cgccatcgcg atggggatcc 6241 ccatgcgcag gacggtcttc gggatgcttc cctgggaaaa atctcctttt ttcgtctggt 6301 tctgagaggc caaatctgtt actccgtttc agaaattgta tacagcttaa acattatagc 6361 acaactgtcc ctgagacgtg caattcttta caaaccacaa gatatagcgt acaatggaac 6421 cgtattgata gaactcttgt ggacagattg aactgtcggg agaattccta tgaaatgtcc 6481 gttttgtgaa gccccggata cgaaggtcat cgactcgaga cccacagaag agggccacgc 6541 catccgccgg cgcagagaat gcgagaagtg cggcaagcgc tttacgacgt acgagaaggt 6601 agaagaagtg ttcttcatgg tcgtcaagag agacggcagc cgcgaatcct tcgaccgcaa 6661 caaggtgctc aacggcatcg tccgtgcctg tgaaaagcgc cccgttacca tggaacagat 6721 ggaatccgtc gtgtccgagg tggaaagagg cctcaacaac atgatggaaa aggagatcag 6781 cagttccttc atcggcgagg tcgtcatgga gaaactgaag gatctggacg aggtcgccta 6841 cgtgcgcttt gcctcggtct accgtcagtt taaggacgtc aacaccttta tcgcagagat 6901 cgaaaaactg ctggg // LOCUS sequence009 6900 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence009 VERSION sequence009 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6900 /mol_type="genomic DNA" /organism="" /note="sequence009" CDS complement(523..1476) /product="alpha/beta hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003722331.1" /transl_table=11 /codon_start=1 /translation="MKKKTKIILTSVTAASVTSGLLAGLYATYRVAFHSPNGNQNDDFE YRFNDQTRPMSYKIFRMIGAMHAMEYERVSVESFDGHKLIGRYYEVSKGAPLCICVHGY RGTPARDFSGGARMLMEMGYNVLMPEQRATGESEGRAITFGMKEHKDCKSWIDYAIRRF GTGVKICLVGVSMGATTVLMSAVDGLPENVKGIAADCPFDSPVEIIKQVAWKDYHIPPF IAGPAAGMAALLYGHFRLGGLTASDGAAASQVPILLIHGEEDRFVPSYMSQRIAEANPQ MVTRVTFPGAGHGISYLADEEKYKKVTGDFLKRIFA" /locus_tag="LOCUS_0550" /note="WP_003722331.1 alpha/beta hydrolase (Listeria monocytogenes) [pid:32.9%, q_cov:98.4%, s_cov:99.1%, Eval:1.5e-36]" /note="MGA_70" CDS 1667..2371 /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011462143.1" /transl_table=11 /codon_start=1 /translation="MQPLLKAENITKTYKTGDVDVQALKGVSFTIEDGELIVVLGPSGS GKSTMLNILGGIETATSGNIFYEGEPLDWSDRNALSDYRRAHIGFVFQFYNLLPGLTAL ENIELSGELSQAPLDAKKLIGEVGLADRADHYPSRLSGGEQQRIAIARALCKNPDILLC DEPTGALDSKTGIQVLKLLWDFCREYHKTVVLITHNQSIAGIADRVIYVRDGLIEKIEA NPDPRDPEEVVW" /locus_tag="LOCUS_0560" /note="WP_011462143.1 ABC transporter ATP-binding protein (Desulfitobacterium hafniense) [pid:52.6%, q_cov:100.0%, s_cov:100.0%, Eval:3.8e-70]" /note="MGA_71" CDS 2371..4716 /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011090710.1" /transl_table=11 /codon_start=1 /translation="MRSFRKNVLRLALQNKASVLGSVLIIAIGIFVMVSMFDTLQNLTD QIFSYYERYEMADVFVTVRGIPLETLQRMDSIEGIAKADGKLSADVRMVCEGQTEIATV HLMGYREDAQINRMDLFGKTMTEETVFVGSRMAEAYGFSEGDSVSLILGGESYDFTYAG NIGAPDYVYAVSTESAMVPDGELYDMACISQERLAELLGMRGQVNELGFLLTPGYTFED VKYRLETALADYGVLSIVEKKDQTSYNMVNGEITELVSIGTILPLLFMAISIFMLYISL KKMIDHDQTLIGSMKAFGMRNSELVGAYLIEGCAIGLAGALLGWVLAIPFGMYMYDLYL NFFTLPVATFHNYWNTRLIGLAIALATAMGAVLLGVRRVLNITPAMAMKSRAPSVTKQS ILPRSWTARLGTFRKLGIRSMTRSPLRGLLIILAVAFPFALSPVLFSFSPIVDEMIDAY FGKVRTYDLQLAMASYSDPNDLGNAGLDLPFVTDAEGICQTPVQLKNDNLKEYSMLYGL QRGSKLWKVGDNEGNTFDPPESGIVLNERLAKKLHLQEGDVVGVNLTAYGNTWVDVPVR MVVTEIFGGSCYMDLGSFPRQLGVGASANTLLLSVQDGHVGDVKAAVRNTSMVPSIIDA EKITSSFAGMMDSMVMMVNMFAFFAVVAGFVLIHNISMINIRERFTELGTLEVLGATKK EIDGMLRDESILYFLGGIALGIPGSIGFKKLIEVLIISESYAIRMHVQPMAYVVSFAMC AGMMWLAWKQDTKLIRTIALTDILKERE" /locus_tag="LOCUS_0570" /note="WP_011090710.1 ABC transporter permease (Bradyrhizobium diazoefficiens) [pid:24.7%, q_cov:95.6%, s_cov:95.7%, Eval:1.5e-58]" /note="MGA_72" CDS 4720..6048 /product="HlyD family efflux transporter periplasmic adaptor subunit" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_015945389.1" /transl_table=11 /codon_start=1 /translation="MKQFGKKKIIACVAAAAVLAAAVLGGIAFQNGKSVAVEKAAAVRE AFEDTYTVSGNVSFGDSSMVISEVTGRVEETPVSLNQRVEAGDVLMRIDPSEYGYQRAQ AAAQSAGYSAQLSQAKISHLMTASPGEYLSNLQGGLTAAKDALSAAETQYNAAQQLYEA GGASKVELDSAKAAYDQAKQAYDTANAGYEKSSSVKDSLEKQGITEANINEQFYKSEEA QLGALISAQNTVVSHLDDLIAKCTITAPAAGTVAQLPLAGVTLASAGQVVCVVVPDGSS VTVEGDVLTSIAPYVKAGDPAEISLDLRGGKLVCSGRVSQVYDYAVEDVSPLGLKEYKV HVVVTPDDPSQLASMSGYEADLKLQLFRGSDVLTVPSEAVFESGGEYFVFTVRDGKAVK TAVEVGYQSPQKTVILSGLSEGDEIVARAETEGVYDGAAVRWK" /locus_tag="LOCUS_0580" /note="WP_015945389.1 HlyD family efflux transporter periplasmic adaptor subunit (Desulfitobacterium hafniense) [pid:28.1%, q_cov:95.5%, s_cov:90.0%, Eval:3.2e-28]" /note="MGA_73" ORIGIN 1 acggattcga aagagtgccg gagatcctgg cgaaaccttt ggacagcgag atccatccgt 61 ttgacccgaa ggagaccggc tacaattccg gctccacgga cgtgggcgac gtgggctatg 121 cgacgcccac cgtcaacatc aacgtggcga cggcctgcgt gggcaacgtg ggacacagct 181 ggcagaacgt ggcgttctcc aacagctcca tcggcgacaa gggcatgatg gtggcggcga 241 aggtgctggc gctggcgacg gtgcgcacga tggcgcagcc ggaactcatc gaaaaggcga 301 aggcagagct gctgcgcaag aacggcggca aatacacctg cccgctgccc gaatacgcgc 361 agccgcccat cgggaagtac taaaacaata aagtattaaa agcataataa gaagccggac 421 cggtatatcc tctcgggaca acactctgtt cgctgcgctc acgcgtttgc gattgcccct 481 cgaagatata ccggctccgg cttttttatc gctatttgca gtttatgcga aaattctctt 541 caggaaatct cccgtaactt tcttgtactt ttcttcgtcc gccagatagg agatgccgtg 601 gcctgcaccg gggaaggtga cccgggtgac catttgcgga ttcgcctctg ctattctctg 661 gctcatgtag gagggcacga agcggtcctc ctcgccgtgg atcagcagaa taggcacctg 721 agacgccgcc gcgccgtcgg atgccgtaag gccgcccagg cggaagtgtc cgtagagcag 781 cgccgccata ccggctgcag gacctgcgat gaagggtgga atgtggtaat ccttccaggc 841 cacctgcttg atgatctcca ccggagaatc gaaggggcag tctgctgcga tgcccttgac 901 gttctcgggc aggccgtcca cggcgctcat caatacggta gtcgcgccca tggagacgcc 961 caccaggcag atctttacgc cggtgccgaa gcggcggatc gcgtagtcga tccagctttt 1021 gcagtcctta tgttccttca tgccgaaggt gatggcgcgg ccttcgctct cgccggtcgc 1081 cctctgctcg ggcatcagca cgttgtatcc catctccatc agcatgcggg cgccgccgga 1141 aaagtctctg gcaggcgtac cgcggtagcc gtggacgcag atgcaaagag gcgcgccttt 1201 gctgacttcg tagtagcggc cgatgagttt atgcccgtcg aaggattcga cgctcacccg 1261 ctcgtattcc atggcgtgca tggcgccgat catgcggaag atcttgtagg acatcggccg 1321 ggtctgatcg ttaaagcggt attcgaaatc gtcgttctgg ttgccgttgg gcgagtggaa 1381 cgcgacgcgg tacgtagcat acaatcccgc aagaaggcct gaggtaacgg atgccgccgt 1441 aacggatgtt aagatgatct tggtcttttt cttcatgtcg ggtctccttc cgggacggtc 1501 cttcgcccct gtctttttca ttataccttg ttcgactttt gtctgcaatc tcttgaccaa 1561 aacagcgcaa agtgcaataa taggacagac ggttagcgta tgctaaccac aaatgtcaat 1621 atctcgccgg attccggcgt cgaaaggaat atagaggaac aaacctttgc agccgctgtt 1681 aaaagcagaa aatatcacga aaacatacaa gaccggagac gtggacgtac aggcattaaa 1741 aggggtgtct tttacgatcg aagacgggga actcatcgtc gttctgggcc cctccggttc 1801 cggaaaatcc accatgctca acatcctggg aggcatcgaa acggccacgt ccgggaatat 1861 tttttatgag ggcgagcccc tggattggag cgaccggaat gcgctgtccg attaccgcag 1921 ggcgcatatc ggcttcgttt ttcagttcta caatctgctg cccgggctca ccgccctgga 1981 aaacatcgag ctttccggcg aactttccca agccccactg gatgcgaaaa aactcatcgg 2041 ggaggtcggc ctggcagacc gtgcagacca ttatcccagc cgtctttccg gcggcgagca 2101 gcagcgcatc gccatcgcca gagccctttg caagaacccg gacatcctgc tgtgcgacga 2161 acctaccggc gccctggact ccaagaccgg catccaggtc ttaaaactgc tgtgggattt 2221 ctgccgggaa taccataaga ccgtggtcct catcacccac aaccagagca tcgccggcat 2281 cgccgaccgg gtgatctacg taagggatgg ccttatcgaa aagatcgaag cgaatccgga 2341 tcccagagat cccgaagagg tggtctggta atgcgcagtt tccgcaaaaa cgtgctgcgg 2401 ctggcgctgc agaacaaggc ctccgtcctg ggatccgtgc tgatcatcgc catcggcatc 2461 tttgtgatgg tctccatgtt cgatacgctg cagaatctga cggaccagat cttctcctac 2521 tacgagcgct acgagatggc agacgtattc gtgaccgtac ggggcattcc gctggagacc 2581 ctgcagcgca tggacagcat cgaaggcatc gcgaaagcag acggcaaact gtcggcggac 2641 gtgcgcatgg tctgcgaggg tcagacggag atcgcaacgg tgcatctgat gggataccgg 2701 gaggatgcac agatcaaccg catggacctg ttcggaaaga cgatgacgga ggagaccgtc 2761 ttcgtcggaa gccgcatggc cgaagcctac gggttttcgg aaggcgacag cgtgagcctg 2821 atcctcggcg gagaaagcta cgattttaca tatgcgggca atatcggtgc gccggattat 2881 gtgtatgccg tctccacgga gagcgccatg gtgccggatg gagagctgta cgacatggcc 2941 tgcatttccc aggagagact ggcggaactg ctgggcatgc gggggcaggt aaacgagctc 3001 ggctttctgc tgaccccggg atacaccttc gaggacgtga aataccggct ggaaacggcg 3061 ctggcggatt acggcgtgct ttccatcgtg gagaaaaaag accagaccag ctacaacatg 3121 gtaaacgggg agatcacgga actggtgtcc atcggcacca tcctccccct gctgtttatg 3181 gcgatctcca tctttatgct ctacatttcg ctcaagaaga tgatcgacca cgaccagacc 3241 ctcatcggca gcatgaaggc cttcggcatg agaaattccg agctggtggg cgcctacctg 3301 atcgagggct gcgccatcgg cctggcaggt gcactgctgg gctgggtcct ggctatcccc 3361 ttcggcatgt acatgtacga tctgtacctg aatttcttta cgctgccggt ggcgacgttc 3421 cataactatt ggaatacgag gcttatcggc cttgccatcg cgctggctac ggccatgggt 3481 gcggtgctgc tgggggtacg gcgggtgctg aacatcaccc cggccatggc catgaagtcc 3541 cgggcgcctt ccgtaacgaa acagtcgatc ctgccaaggt cctggacggc gcgtctgggg 3601 acattccgca agctgggcat ccgttccatg acccgcagcc ccctgcgggg gctgctcatc 3661 atcctggcag tcgcatttcc tttcgccctg tctccggtgc tgttctcctt ctcgcccatc 3721 gtggacgaga tgatcgacgc ctatttcggc aaggtgcgca cctacgatct gcagctggcc 3781 atggcctctt acagcgatcc caacgacctg ggaaacgccg ggctggatct gcctttcgtg 3841 acggatgcgg aagggatctg tcagacgccg gtgcagctga aaaacgacaa tctgaaggaa 3901 tactcgatgc tgtacggcct gcagcggggt tcgaagctct ggaaagtcgg cgacaacgaa 3961 ggcaatacct tcgatcctcc cgaaagcggc atcgtgctga acgagcgcct ggcgaagaag 4021 ctccatctgc aggaggggga cgttgtgggg gtcaacctga ccgcctacgg caacacctgg 4081 gtggacgtgc cggtgcgcat ggtcgtaacg gagatcttcg gcggcagctg ctatatggat 4141 ctgggcagct ttccccgcca gctcggcgtc ggggcatctg ccaacacgct gctgctgtcg 4201 gtgcaggacg gacacgtggg ggatgtaaag gctgcggtgc ggaataccag catggtacct 4261 tccattatcg atgcggaaaa gatcacttcc agctttgcgg gcatgatgga cagcatggtg 4321 atgatggtga acatgtttgc cttttttgcc gtggtggcgg ggttcgtgct tatccacaac 4381 atctccatga tcaacatccg ggagcggttt acggagctgg ggactctgga agtactgggg 4441 gcaacgaaaa aggagatcga cggcatgctg cgggacgaga gcatcctgta tttcctggga 4501 ggcatcgcgc tggggatccc cggcagcatc ggatttaaaa agctgatcga agtgctcatc 4561 atttcagaga gctacgccat caggatgcat gtgcagccga tggcttacgt ggtctcgttc 4621 gcgatgtgcg cgggcatgat gtggctggcc tggaagcagg atacgaaact catccgcacc 4681 atcgcgctga cggatatttt gaaggaaaga gaataggcaa tgaaacagtt cgggaagaaa 4741 aagatcatag cgtgcgtggc ggcggcagcc gtgctggcag ctgccgtatt ggggggcatc 4801 gccttccaaa acggaaagtc tgtggccgtg gagaaggcag cggcggtaag agaggcgttc 4861 gaagacacat acaccgtaag cggaaacgtc tctttcggcg attcttccat ggtcatctcc 4921 gaggtgacgg gacgggtcga ggagacgccg gtctccctca accagcgggt ggaagcggga 4981 gacgtgctga tgcgcatcga tccttcggag tacggatatc agcgggccca ggctgccgcg 5041 cagtccgccg gctactccgc ccagctttca caggcgaaga tcagccatct gatgacggct 5101 tcgccgggag aatatctttc caatctgcag ggcggcctga ccgcggcaaa ggatgctctc 5161 tccgcggcgg aaacgcagta caacgcagcg cagcagctgt acgaggcggg cggcgcatcc 5221 aaggtggaac tggacagcgc gaaggcggct tacgaccagg caaagcaggc ctacgatacg 5281 gcgaatgcgg gttacgaaaa aagcagcagc gtaaaggact cgctggaaaa acagggcatt 5341 acggaagcca acatcaacga gcagttctac aagagcgagg aggcccagct gggcgctctc 5401 atctccgccc agaataccgt ggtaagtcat ctggacgatc tgatcgccaa gtgcaccatc 5461 acggcgcctg cggcaggaac tgtggcgcag ctgccgctgg cgggggtcac gctggcaagc 5521 gccggccagg tcgtctgcgt cgtcgtgccg gacggcagca gcgtaacggt ggaaggggac 5581 gtgctgacca gcatcgcgcc ctatgtaaag gcgggtgacc ccgcggagat ctccctggat 5641 ctgcggggcg gaaagctcgt ctgcagcggc agagtgtccc aggtctacga ctatgccgtg 5701 gaagacgtat cgcccctggg gttgaaagaa tacaaggtgc atgtggtggt caccccggac 5761 gacccgtccc aactcgcctc catgagcggc tacgaagcgg atctgaagct gcagctgttc 5821 cgcggcagcg atgtgctgac cgtgccgtcc gaggcggtgt ttgagagcgg cggcgagtac 5881 ttcgtgttta cggtccggga cggaaaggcc gttaagacgg cggtcgaagt gggatatcag 5941 tcgccgcaga agaccgtcat cctctccggt ctgtccgagg gcgatgagat cgtcgcgcga 6001 gccgagaccg aaggcgtgta cgacggcgcg gccgtgcgtt ggaaatagcg ctttcgcttg 6061 acacttcagc gggtcaaagc gtacaatgaa atttaatatg gggcggaagg ccttataggt 6121 cttccgccgt ttgtttttaa ggagtttcga ctatggtaat gacaggcgcg cagatcctca 6181 tggagtgtct gctggagcaa ggcgttgaca cggtgttcgg gtatcccggc gggacgaacc 6241 tgaacgtcta cgacgaactg tacaagtatt ccgacaagat caagaactat ctgacgtccc 6301 acgaacaggg cgctgcccat gcggcggacg gctatgcccg gtccaccggc aaggtgggtg 6361 tatgtctggc tacgtccggc cccggagcta cgaacctgac gacgggtatt gcgacggctc 6421 atctggattc ctctcccgtg gtgttcatca cctgcaacgt gagcggcaat ctgttgggta 6481 aggatgcctt ccaggaggcg gacgtcgtgg gtattatgat gcccattacg aaatccacgt 6541 tcctcatcac ggacgtggag aaactggcgg ataccgtgcg cgaagccttc gcgttggctc 6601 gttccggacg gcccggcccg gttctgatcg acatcttaaa ggatgtgacc gccgccaaat 6661 gcgaatacga atatctgccc cgggagaagc acggcaccac cggttctttg gcagggcttt 6721 taaagagggc ccactcctcc agcctgcggc tgtttgagcc ggacaaggag gatgtggaca 6781 tcctggtgga catgatcgcc cagtccaaaa agcccatgct catctgcggc ggcggcgtca 6841 cgcgaagccg tgcccatgaa gaattccggg ccttcgcgag aaaactggat tccccggtcg // LOCUS sequence010 6372 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence010 VERSION sequence010 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6372 /mol_type="genomic DNA" /organism="" /note="sequence010" misc_feature <1..548 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002680483.1:Mrp/NBP35 family ATP-binding protein" /note="WP_002680483.1 Mrp/NBP35 family ATP-binding protein (Treponema denticola) [pid:62.2%, q_cov:99.4%, s_cov:65.2%, Eval:2.5e-64, partial hit]" /note="MGA_75" /locus_tag="LOCUS_0590" CDS 557..856 /product="ribosome assembly RNA-binding protein YhbY" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010941918.1" /transl_table=11 /codon_start=1 /translation="MLTGKQRAYLRGLAQELQPAVYVGKENLTAAVVTEMHDYLNAHEL LKVKIQEGSDLEAKACANEAAQRLGAEFVQAIGRRFVLYRKAQDPEKRKIVLPK" /locus_tag="LOCUS_0600" /gene="yhbY" /note="WP_010941918.1 ribosome assembly RNA-binding protein YhbY (Geobacter) [pid:46.5%, q_cov:100.0%, s_cov:98.0%, Eval:1.5e-17]" /note="MGA_76" CDS 892..1509 /product="MBL fold metallo-hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004082876.1" /transl_table=11 /codon_start=1 /translation="MRITYYGHSCFTLESQGFRVVVDPYRDYVPGYRALHLEADAVFCS HGHDDHAWVQAVTIRENAPADPFTVTEVAGFHDDAQGAKRGPNTMRIFEAEGLKAVHLG DIGCMPPEADLEKLKGADVCLVPVGGFYTIDAVQAKALMDILQPKIVIPMHFRLGDMGF AEIGTLDEFTKLYAPESVCFPGTNTLELTKETPAGVTVLQYM" /locus_tag="LOCUS_0610" /note="WP_004082876.1 MBL fold metallo-hydrolase (Thermotoga) [pid:39.9%, q_cov:85.9%, s_cov:87.0%, Eval:7.5e-29]" /note="MGA_77" CDS complement(1707..2693) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEQKSAKKKRIFDIIQIGNTSDTPSRVFDDVLIVMILVNIVMMFL QTFERFEPYMDIINVLEGITGLFFCVEYLLRLWTADLLYPEEKSMGAAAWRFAKSFDGV VLLLTILPFLPLAGFVVFRMLRVVRILRLFRVNQAFDSFNVITSVIYDKRNQIASSCFI IFILMMASSLCMYSVEHEVQPEAFKNAFSGIWWSMSTILTVGYGDISPITPLGQVMGII IAFLGVGAVAIPTGIISAGFVERYTEMQASSDPRDLNIQTVYIDFDSKWIGMTAKEIEN EFGVLILVVRRGMSKILPREDFRVMRGDALAVHILNITEWPEEPTGE" /locus_tag="LOCUS_0620" /note="WP_014207107.1 ion transporter (Acinetobacter pittii) [pid:28.9%, q_cov:68.9%, s_cov:69.4%, Eval:8.0e-28, partial hit]" /note="MGA_78" CDS 2828..3142 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSDPNKALTKEEQLDILNAFLTVSLEKARSRKPSAKAQLNTLKYS VTDLFRPIPEAEKAEWRSAVQALNGQGPMKLDEMFKAVVAKDKQMKEIEDEAPQAQPQA " /locus_tag="LOCUS_0630" /note="MGA_79" CDS complement(3155..3733) /product="XRE family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000391311.1" /transl_table=11 /codon_start=1 /translation="MNASDMNRVIPENLKNLRAERKLSLGEAAELTGVSKSMLGQIERG ESSPTIATLWKIATGLGVSFTALLESPDQEIEIVKETDMTPLLSDYGHFRLFPVVPAHK DRSFEILDLELDEDAISDSKPHAPGTEEFTFVYEGALEIVLGGEEKKSYVVEKDCLMHY RADQHHTYKNAFAGTTKALMVIHYSQRDL" /locus_tag="LOCUS_0640" /note="WP_000391311.1 XRE family transcriptional regulator (Bacillus) [pid:41.3%, q_cov:95.8%, s_cov:97.8%, Eval:3.9e-37]" /note="MGA_80" CDS complement(3739..4635) /product="glycyl-radical enzyme activating protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009896060.1" /transl_table=11 /codon_start=1 /translation="MAPSGYVMNLQPFSVNDGDGIRTTVFLAGCPLHCAWCANPEGCNQ TRKVGWHIRKCIGCGECAKVCPQGIGIDLNAEREKCIACGKCVEVCPQKARVLMVQKMD ADEVLKQVQTHRLFYSYSGGGITFSGGEACLQPEFLNYLTEQIYDMGYSMDIETCGVFD FEAVWPSLSRMDLIFMDLKHMDSAAHKRWTGAGNERILENMAKLAELPAEVVVRIPCIG GVNADEDNIRRSAAFVHRTLPKAHMELLPYHSFGIIKYEALGIPYDHPEFFRPSKEEME RLRGIVREEGVEVADFR" /locus_tag="LOCUS_0650" /note="WP_009896060.1 glycyl-radical enzyme activating protein (Clostridioides difficile) [pid:44.0%, q_cov:100.0%, s_cov:100.0%, Eval:2.3e-71]" /note="MGA_81" misc_feature complement(4636..>6372) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003438022.1:formate C-acetyltransferase/glycerol dehydratase family glycyl radical enzyme" /note="WP_003438022.1 formate C-acetyltransferase/glycerol dehydratase family glycyl radical enzyme (Clostridioides difficile) [pid:60.6%, q_cov:100.0%, s_cov:73.2%, Eval:1.5e-209, partial hit]" /note="MGA_82" /locus_tag="LOCUS_0660" ORIGIN 1 accagggcat cgttcccgtt aagaccgcga ccggcatcga cgtcatgtcc ctcaacctgc 61 tgatcgacaa cgagaccgat cccgtagtct ggagaggtcc catcatcgcg ggaaccgtga 121 agcagttctg gaccgacgtc atctgggaag acgaagatgt aatgtttatc gacatgccgc 181 caggaaccgg cgacgttacc cttaccgtgt tccagagcct tcccatcgac ggccttatca 241 tcgtcacatc tccccaggaa ctcgtcggca tgatcgtcga gaagtgcgtc aagatggcgc 301 agatgatgaa catccccgtg ctggccatgg tggagaacat gggctatgta gaatgcccgc 361 actgcggcga aaagatctat ccgttcggag aaagcagact cgcggacctg gcgaaggagt 421 atcacgtaaa ccttaccgct gcgcttccca tcgatcccaa gctggctgct gcctgcgaca 481 agggcgacat cgaagcattc gagggcaact ggctggacgg catcacggac gtcattcaga 541 atctgtaggt gatcttatgc ttaccggaaa acagagagcc tatctgagag ggctggcaca 601 ggaactgcag cccgccgtct acgtcggaaa agagaacctg accgctgcgg tggtcacgga 661 gatgcacgac tatctgaacg cccacgagct gctgaaggtg aagatccagg aaggatcgga 721 cctggaagcg aaggcttgcg ccaacgaagc ggcgcagcgc ctgggcgcgg aattcgtgca 781 ggccatcggc cgccgttttg tgctgtacag aaaagcacaa gatcccgaaa aaagaaagat 841 cgtactgccg aaataagcct gtcgaagcac cagcgtagga aggagacaaa aatgcgtatc 901 acttactatg gccattcctg ctttaccttg gaatcgcaag ggtttcgggt cgtggttgac 961 ccgtacaggg attatgtccc cggctaccgg gcgctgcatc tggaggcgga tgccgtcttc 1021 tgctcccacg gtcacgatga ccatgcctgg gtgcaggcgg taacgatacg cgaaaacgcg 1081 cctgcagacc cctttaccgt tacggaagtg gcagggttcc acgacgatgc gcagggcgcg 1141 aagcgcggac ccaacacgat gcgcatcttc gaggcggaag gcctgaaagc cgtccacctg 1201 ggcgacatcg gctgcatgcc gccggaagcg gatctggaga aactgaaggg cgcggatgtc 1261 tgcctggtgc ccgtgggcgg tttctacacc atcgatgcgg tgcaggccaa ggctctgatg 1321 gacatcctgc agccgaagat cgtcatcccc atgcatttcc gtttgggcga tatgggcttt 1381 gccgagatcg gcaccctgga cgaatttaca aaactctatg cgccggagag cgtctgcttc 1441 cccggcacga ataccctgga actgacgaaa gagacccctg caggggtcac cgtactgcaa 1501 tatatgtaga cattccaagc catacggagg tgttccatgt ccgagagcta ccaagacgtt 1561 cccttcagaa accgggaaga cctggaccgc tatgcggtcc gccggaatgc cgcacggtga 1621 aggatgcgat ctttttcctt cgaaaaagca gaagaaatgc aatatagaca tgaaaaaact 1681 cccggaagcg ctccgggagt ttgcttttat tcgccggtag gctcctccgg ccactccgta 1741 atgttgagga tgtgaacggc cagggcgtcg ccccgcatga cgcggaagtc ctccctggga 1801 aggatcttgg acatgcctct ccgcaccacc aggatcaaaa cgccgaattc attttcgatc 1861 tctttggcgg tcatgccgat ccatttactg tcgaaatcga tatagacggt ctggatgttg 1921 aggtctctgg ggtcggagct tgcctgcatc tccgtatagc gctccacgaa accggcggag 1981 atgatgccgg tggggatcgc cacggcgccg acgcctaaaa aggcgatgat gatgcccatc 2041 acctgaccca gcggcgtaat ggggctgatg tcgccgtagc ccacggtgag gatcgtggac 2101 atgctccacc agatgccgga aaaggcgttt ttaaaggctt ccggctgcac ctcatgctct 2161 acgctgtaca tgcagagcga cgaggccatc atcaggatga agatgataaa gcaggacgat 2221 gcgatctggt ttctcttgtc gtagatgacg gacgtgatga cgttaaagga atcgaaggcc 2281 tggttgaccc taaacagccg caggatgcgc accacccgca gcatgcggaa cactacgaag 2341 ccggccaggg gcaggaaggg caggatcgta agcagcagca cgacgccgtc gaaggacttc 2401 gcgaagcgcc aggctgcagc gcccatgctc ttttcctccg gatacagcag atctgccgtc 2461 caaagccgca gcaggtattc cacgcagaaa aacaggccgg ttatgccttc caggacgttg 2521 atgatgtcca tgtagggttc aaaccgctcg aaggtctgca ggaacatcat gacgatgttc 2581 accaggatca tcacgatgag cacgtcgtcg aacacgcggc tgggtgtgtc gctggtattg 2641 ccgatctgga tgatgtcgaa gatcctcttt ttctttgcag acttctgctc catagacgcc 2701 tcctgtctta tcgttataag tatacaacat ttgcgcaaat ttttttatcc gtgttggaca 2761 tttgctggac aaggccttgt tttaataaag gcagaattca tactggaaca actgggaaga 2821 cttaaaaatg tcagatccga acaaagccct cacaaaagaa gaacaactgg atatcttaaa 2881 cgccttttta accgtatcat tggagaaggc aaggagccga aagccatcgg cgaaggccca 2941 gctcaacacg ctgaaataca gcgttaccga cctgttccgt cccattccgg aggcggagaa 3001 ggcagagtgg cgctcggccg tgcaggcgct gaatggtcag ggaccgatga aactggacga 3061 aatgttcaag gcggtcgtcg ccaaggacaa gcagatgaag gagatcgagg acgaggcgcc 3121 ccaggctcag ccgcaagcat aaaaaagagg aaccctacag gtccctctgg gaataatgga 3181 tcaccatcaa tgccttcgta gttcctgcaa aggcattttt atatgtgtgg tgctggtccg 3241 ccctgtaatg catcaggcag tccttttcca ccacgtagct cttcttttcc tcgccgccca 3301 gcacgatctc cagggcccct tcgtagacga aggtaaactc ctcggtgccc ggggcgtggg 3361 gcttggaatc ggagatcgcg tcctcgtcca gctccagatc caggatctcg aaggaccggt 3421 ccttgtgggc aggtacgacg ggaaatagcc ggaagtggcc gtaatcggag agcagaggcg 3481 tcatgtccgt ctccttcacg atctcgatct cctggtccgg gctttccagc agggccgtaa 3541 aggacacgcc cagacccgtg gcgatcttcc agagcgtggc gatggtgggg ctggattcgc 3601 cccgctcgat ctgtcccagc atggacttgg agacgccggt gagttcggct gcctccccca 3661 ggctgagctt gcgctccgcg cgcaggtttt ttagattttc cgggatgacc cggttcatat 3721 ccgatgcgtt catagtcttt aacggaagtc cgcgacttcc acgccttcct cccggacgat 3781 gccccgcaga cgctccatct cctccttgga gggccggaaa aactccggat ggtcgtaggg 3841 gatgcccagg gcttcgtatt tgattatccc gaaggaatgg tagggcagca gctccatgtg 3901 ggctttgggc agggtgcggt gcacgaaggc cgcgctgcgg cggatgttgt cttcgtccgc 3961 gttgaccccg ccaatgcagg gaatgcggac aacgacctcc gccggcaatt ccgcaagctt 4021 tgccatgttc tccaggatgc gctcgttgcc ggcgccggtc cagcgcttat gggcagcgct 4081 gtccatgtgc tttaagtcca taaagatgag gtccatgcgc gaaagagagg gccacaccgc 4141 ctcgaaatcg aagacgccgc aggtctcgat gtccatggag tagcccatgt cgtagatctg 4201 ttccgtcagg tagttcagga attccggctg caggcaggct tctcctccgg agaaggtgat 4261 gccgcctccg ctgtaggaat agaacagccg gtgggtctgg acctgcttta acacctcgtc 4321 cgcatccatt ttctgcacca tcaggacccg ggctttctga ggacagacct ccacgcattt 4381 cccacaggca atgcacttct ctcgctccgc attcagatcg atgccgatgc cctgggggca 4441 gactttcgcg cattccccgc agccgatgca cttgcggatg tgccagccca cttttctggt 4501 ctggttgcag ccttcagggt tggcgcacca ggcgcagtgc aggggacagc ccgccagaaa 4561 caccgtggtc cggatgccgt ctccgtcgtt gactgagaac ggctgcaggt tcataacgta 4621 cccggaaggc gccatttaga aggcctcgtg ggcgtttctc gccatgatgg aatcctgcat 4681 ttccttggaa aggttcgtaa actgggcgga ataaccggct acccgcacca gcaggcttct 4741 gtatttctcg ggatgggcct gggcgtcctt cagcacctcg ttggaaatgg tgttgaactg 4801 gacgtggaag ccgcccagcg cgaagtagct ctgcagcatg gcacccaggt tggctctgcc 4861 gcgcttcgtc gccaccagat cgtggtttaa gcgcaggttg agcagggtgc cgccgctgtg 4921 cttttcgtgc tccatcttgg ccgcgctgcg cagggctgcc aggcaggtgg aggtgtcgga 4981 accggtgtag ggggatacgc cttcgttgat agggtcacag gcgtggcgtc cctcgggcgt 5041 cgcacccagc accttgccgg tgggcaggta gttggagatg cccatgaagg ccgttacgaa 5101 gtggttgccg tacagatcgt tgtaggaggt gacttcgtcg tagtagaagt ccgctagctg 5161 ccgcgcgatg ctgtccacgt agtcgatgtc attgccgtat ttcgggcagg ccagcgcctt 5221 ggcccgcagg tcttcgtatc cttcccagtt ggcgttgatg gcatcgatga tgtcggaaag 5281 cgtgcagacc ttgtcctcgt aaaccagctt cttgatgacg gccagggagt tggcggttac 5341 cgaaagaccg actcctgtaa acaccgggcc gatgctgtac ttggcgccgc cgtccaccag 5401 gtccgcgccg ttcttcatgc agtattcgtt gcaggcgctc atgaagggcc ggtggccgat 5461 ctctctgtgg atctcctggg ctgtgaccag agagatgacg ccctgcttta cgagatattt 5521 aaactgcttc ttccaggctt ccacgatctc ctcgtaggaa gcgaaggtct tcggatcctt 5581 ttcggggagg gagacctgct tgccggacag tctgctcttg ccttcgttga gggcgaattc 5641 cagggctgca gcgaaactga tgctggcagc ggacgtccac tcgaacgtct ttctggagtg 5701 gggcacgacg cagccgcagt tgttccagtc ccgggcgtcc ttgggggcgt agcccaggtt 5761 cgagagcatc tggtagcccg ttctgtcgcc gtggatggcg gggaagccgc agccggtgga 5821 gaccagctcg gtgaccgctt ccatgaattc gggcgggcag tccgggtgga tgcggcagct 5881 taaggtgggc tggtgggtca tacactcgcg ggtcgcctgg atcgccatgt aggagatggt 5941 gttggtggca tcggtgccgt ccaccttggt gccgcccacg gtgaggttct cgaaattcgt 6001 gtagccggca aagaaactgg cggtgttctt ggagatggtc caggcccact cggaatactt 6061 cagccacagg cactcgacga gttccagcgc ggtgtcgtag tcgatgcggc ctgcttcctc 6121 gtccgccttg tagtagggat acatgtactg gtcgaagcgg ccggggttcc aggccagggg 6181 attttctgcg atgatgccgc ccagctgcac gaaccagacg aactggatag cttctcggaa 6241 ggtcttgggc ggtttttcgg ggatgcgggc gcagatgtcc gcgatctctt ccagttcggc 6301 ctttctcttc gggtcagcct cggccttcgc catttcggcg gcctttgcgc tgtagcggcg 6361 gcccagtgcg at // LOCUS sequence011 6070 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence011 VERSION sequence011 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6070 /mol_type="genomic DNA" /organism="" /note="sequence011" CDS complement(72..1754) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSRTNDRKPTTFRRLVFQLSIRNMLVPVLVFVSVFLLGYNAYTQH VLVKRNADHCTAASRRMEALCRSYMDYLEGLAQSDLVDGPLSDGSGKEDLYADFYRFLN GQPYRGTFYLLDEDRDLLLSLSGDESSTSINSVRRLAARSEQDGYKAAEEKTIISISYT SNERLRAYTVAMPVLRDGEAEGYLAYRFYEQGLIEFLNAGRSPGLFVLTDRNGGIIAAN LDAAEDALDRFLPQISGEYNCTIGDEDFYIARQTVTGTTLELYTLSRQIFFINGGTLLM TAVILGLLVLSYLVYSQSLAKRMTEPVDELLEAIQQLKTGDFAPTESLTNLEEFRQLFD EYNGAIEQLDKLMETQQSLKIRQLEAQFNPHFLYNVLETLKYTIATDTEAAQDIVLRLS HLMRYAAKPAEQEVALGDDMVYIEDYLALQKQRFLDRLSYTLNVSEDARDAKIFRLLLQ PLVENSIKYGYVAKQRIHVDVDCRTEGSDLLMAVTDDGGGMTEERLAAVQKALDEGVNP GESLGLFNTHQMIRLKHGAPYGLSFENRPGEGLTVKVRMPYKR" /locus_tag="LOCUS_0670" /note="WP_000127990.1 sensor histidine kinase (Staphylococcus) [pid:28.0%, q_cov:50.4%, s_cov:55.6%, Eval:1.4e-34, partial hit]" /note="MGA_84" CDS complement(1778..3433) /product="iron ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005896074.1" /transl_table=11 /codon_start=1 /translation="MLRRRRQFDQWTVITLCIILVYIVFMIYPVLSLLLASLRDAETGA LSLKHFQKFFSKSYYMKAVVNSFKVSVSVTLCAVIVATPLAYIISTVKIKGSSWIRVFI LISSMSAPFIGSYSWILLLGRNGYITRFFQNYLGITTPTIYGLPGIVLVLTLALVPLVF SYVCGALKNTDKSLLEAARNLGSGNFKIIMTIVVPLIIPTILAAGILVFMKALSDFGTP SLIGEGFKTVPQLIYNEFLGDVAADNGFAAAISVMVVVFALLAFIIQRAVSNHLAFSMS AMYPIEPLPAYGIKNVLCHVYVYLYMLIALLPQICIWVTAFRKTKGLTFDEGYSLQSMK TAVSQMSVSIRNTLVFALSAAAIIVLIAVLVSYASVRRPNPLTNSLDVLTMTPYIVPGS ILGIAFVSAFSRQPLKLTGTALIIIIVLAVKRMPYTVRSSTAILHNIPESLEEASLNLG ASSMKTFTRITMPLMKNGIISGAIMSILSIITELSSSIMLYTGRTQTMTIAIYAQIIRG NYGLASALSLILSIFTILLVFLVFKITGNKELSY" /locus_tag="LOCUS_0680" /note="WP_005896074.1 iron ABC transporter permease (Fusobacterium nucleatum) [pid:45.7%, q_cov:99.6%, s_cov:99.6%, Eval:1.0e-143]" /note="MGA_85" CDS complement(3435..4514) /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005902588.1" /transl_table=11 /codon_start=1 /translation="MSVTITCTDIVKRFGDNTVIPGLNLEIKESEFFTLLGPSGCGKTT LLRMVAGFNSIEGGTISFNDKVINNIAPNKRNIGMVFQNYAIFPHMSVFKNVAYGLTNR KVSKAETERRVNDVLEKVKITHLRDRMPENMSGGQQQRIALARAMVIEPDVLLMDEPLS NLDAKLRLEMREVIRDLQKSVGITTIYVTHDQEEAMAVSDRIAVMKDGVIQQIGTPRSI YHRPTNVFVANFIGSTNIINGTLSGRTLTVEGYSAEVPAIKDAQPENTPVKVSVRPEEL LLAPADVKGITGSVTNSTFLGSQTHYLVNLDNGDEIKIIQESSETDYLSAGDRVNLTIN TAKVNVFSEDGETNLTRGE" /locus_tag="LOCUS_0690" /note="WP_005902588.1 ABC transporter ATP-binding protein (Fusobacterium nucleatum) [pid:57.5%, q_cov:99.7%, s_cov:96.8%, Eval:1.9e-113]" /note="MGA_86" CDS complement(4543..5610) /product="ABC transporter substrate-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005902589.1" /transl_table=11 /codon_start=1 /translation="MKRFLALLLALAMVFSLAACTSSNEPAAEPETETEGEATGEDPDT GKLVIYTSFTDAQMPLITDFEAQTGIKVEVITDGASALLKRVEAEKDAPYADIIIGGSK TIYGDYLDLFEEYVTPNDEFLAENHHVEYNKLTPYSADSILIMWNTNLIGDIEIKGFAD LLKPELKGKIAMADPAAASSAASALCLMAWVMGDHQSYFSDASIEYLTEFAKNLDGKLA AGSSACHKSCADGEYTCAVTFNSAVYNYINEGAPVSFCYPEEGVSPFSDVGAIIKGAAN MKSAKMFMDYITSKEVQSRMGAEMFSNPVRVDAELPDYMVAPDAIYESDEDPVLRAENM AELKEKWNDIWASVN" /locus_tag="LOCUS_0700" /note="WP_005902589.1 ABC transporter substrate-binding protein (Fusobacterium nucleatum) [pid:32.1%, q_cov:98.6%, s_cov:99.1%, Eval:3.7e-37]" /note="MGA_87" ORIGIN 1 ccagggaaac accgcccgca ggcctttgcg gatccgctct tcatcttcca caagcaaaac 61 tttgtacatg gtcacctctt gtaaggcatg cgaaccttta ctgtaagccc ctcgcccggc 121 cggttttcga aggacaggcc gtagggggcg ccgtgtttta agcgtatcat ctggtgcgtg 181 ttgaaaagcc ccaggctttc cccggggttg accccttcat ccagcgcctt ctgcaccgcc 241 gctagccgct cctccgtcat gccgccgccg tcgtccgtga ccgccatcag cagatcgctg 301 ccctccgtcc ggcagtccac gtccacgtgg atgcgctgct tcgctacata gccgtacttg 361 atggaattct ccaccagagg ctgcagcagc agacggaaga tcttggcgtc ccgggcgtct 421 tcggagacat tgagcgtata gctcagccgg tccaggaaac gctgtttctg cagcgccaga 481 tagtcttcga tatagaccat gtcgtcgccc agggcgacct cctgctccgc aggcttggcc 541 gcatagcgca tcagatggga cagccgcagc acgatgtcct gagccgcctc cgtatccgtc 601 gcgatggtat atttcagcgt ttccagcacg ttgtacagga aatgcgggtt aaactgggct 661 tccagctggc ggatcttcag gctctgctgg gtctccatca gcttgtccag ctgctcgatg 721 gcaccgttgt actcgtcgaa tagctgccgg aactcctcca gattcgtgag ggattccgtg 781 ggggcgaaat cgccggtctt cagttgctgg atggcctcca gcagttcgtc caccggctcc 841 gtcatccgct tcgccagcga ctgggaatag accaggtagc tgaggacgag cagaccgagg 901 atgaccgcgg tcatcagcag cgtgccgccg ttgatgaaaa agatctgccg cgacagggtg 961 tacagttcca gggtcgtacc ggtcacggtc tgccgggcga tgtagaaatc ctcgtccccg 1021 atggtgcagt tgtattcgcc ggagatctgc ggcagaaagc ggtccaaggc gtcctctgcc 1081 gcatccaggt ttgcggcgat aatgccgccg ttgcggtccg tgaggacgaa gaggccgggc 1141 gatctgccgg cgttcaggaa ttcgatcagg ccctgctcgt agaaccggta ggcaagatac 1201 ccttccgctt ctccatcccg cagcaccggc atcgccacgg tgtaggcccg caggcgctca 1261 ttggacgtgt aggagatgga gatgatggtc ttctcctccg ccgccttgta gccatcctgc 1321 tcgctgcggg cggccagtct gcgcacggaa ttgatgctgg tgctggactc gtcgccgctt 1381 aaggacagca gcagatcccg gtcctcatcc agcagataga aggtgccccg gtagggctgt 1441 ccgttcagga agcgatagaa gtccgcatac agatcctctt tgccgctgcc gtccgagagc 1501 ggtccgtcca ccagatccga ctgagccaga ccttccagat agtccatata gctgcggcag 1561 agcgcttcca tccgccggct tgccgccgtg cagtgatccg cgttgcgctt taccagcacg 1621 tgctgggtgt aggcgttata gcccaaaaga aaaaccgaca caaacacaag gaccggcacc 1681 agcatgtttc gaatggaaag ctggaatacc aatctccgga atgtcgtcgg ttttctgtcg 1741 ttcgtgcggg acatgctatc cctctggtct gaatccctta ataactgagt tccttattgc 1801 ctgttatctt aaacaccaag aagacaagca gtatcgtaaa gatagacaaa ataaggctca 1861 gcgcagacgc aagtccgtaa ttgccgcgga tgatctgcgc gtagatcgcg atcgtcattg 1921 tctgtgttct tccagtatac aacataatcg aggaagacag ttcggttatg atggaaagaa 1981 tactcatgat cgcgccggaa ataatgccgt tcttcatcag aggcatcgtg atccgggtaa 2041 aggtcttcat gctggaggcc cccaggttga gggacgcttc ctccagcgat tcagggatat 2101 tgtgcaggat cgccgtcgac gaacgcacgg tatagggcat acgttttacc gccagcacga 2161 taatgatgat cagcgcggtc ccggtcagct ttaagggctg gcgggagaag gcggaaacga 2221 atgcgatacc caggatcgag ccgggaacga tgtagggggt catcgtgagc acgtccaggg 2281 aattggtaag gggattgggc cggcgcaccg aggcgtagga taccagcacc gcgatgagca 2341 cgatgatggc agccgcagag agcgcgaaca ccagcgtgtt gcggatggag acgctcatct 2401 gggagacggc ggtcttcatg ctctgcaggg agtagccttc gtcgaaggtg aggcccttgg 2461 tcttgcggaa cgcggtgacc cagatgcaga tctggggcag cagcgcgatc agcatgtaca 2521 gatacacata cacgtggcac agcacgttct tgatgccgta ggccggcagg ggttcgatgg 2581 ggtacatggc gctcatggag aaggccaggt ggttggagac cgcccgctgg atgatgaacg 2641 ccagcaacgc gaagaccacg accatcacgg agatggcggc cgcgaagccg ttatccgccg 2701 caacgtctcc caagaactcg ttgtagatca gctggggcac ggtcttaaag ccttcgccga 2761 tgagggaagg cgtaccgaag tcggacagcg ccttcatgaa caccaggatg ccggccgcca 2821 ggatcgtcgg gatgatgagg ggcaccacga tggtcatgat gatcttaaag ttgcccgaac 2881 ccagatttct ggccgcttcg agcagcgatt tgtccgtatt cttgagggct ccgcacacgt 2941 aggagaacac cagcggcacc agcgccagcg taagcacgag cacgatgccc ggcagaccgt 3001 agatcgtcgg cgtcgtaatg cccagatagt tctggaagaa ccgcgtaata tagccgtttc 3061 tgcccagcag caggatccag gaatacgatc cgataaatgg agccgacatg ctcgagatga 3121 ggatgaatac gcggatccag gacgagccct tgatctttac ggtcgagatg atgtaggcaa 3181 gaggcgtcgc cacgatgacc gcgcacaggg tgacggagac cgacacctta aaggagttga 3241 ccaccgcctt catgtagtag ctcttgctga agaacttctg gaagtgcttc agggagagcg 3301 cgccggtctc ggcgtcccgc agggacgcca gcagcaggct taagaccggg tagatcatga 3361 agacgatata gaccaggatg atgcacagcg taatgactgt ccactggtcg aattgtctgc 3421 gccgtctcag catgctattc ccccctcgtc aggttggtct cgccgtcttc ggagaacacg 3481 ttcaccttcg ccgtgttgat ggtgaggttc acacggtcgc ctgcggacag atagtccgtc 3541 tcggaggatt cctgaatgat cttgatctcg tcgccgttgt ccaggttcac cagatagtgg 3601 gtctggctgc ccaggaacgt gctgttcgta acgcttccgg taatgccctt tacatccgcc 3661 ggtgccagga gcagttcctc cggccgcacg gagaccttga caggcgtatt ttccggctgc 3721 gcatctttga tcgcggggac ctccgcggaa tagccttcca cggtgagagt cctgccggaa 3781 agggtgccgt tgatgatgtt cgtggaacca atgaagttcg cgacgaacac gttcgtcggc 3841 cggtgataga tgctgcgggg cgtgccgatc tgctggatga cgccgtcctt catgacagcg 3901 atccggtcgg acacggccat ggcttcttcc tggtcgtggg tgacgtagat cgtggtgatg 3961 cccacgctct tctgcaggtc gcggatgacc tcccgcatct ccagacgcag cttggcgtcg 4021 aggttggaga gcggttcgtc catcagcagc acgtccggct cgatgaccat ggctcttgcc 4081 agcgcaatgc gctgctgctg gccgccggac atgttttcag gcatgcggtc gcgcaggtgg 4141 gtgatcttta ccttctccag cacgtcgttg acgcgccgct ccgtttcggc cttggagacc 4201 ttgcggttcg taagaccgta ggccacgttc ttgaacacgc tcatgtgcgg gaagatggcg 4261 tagttctgga agaccatgcc gatgttccgc ttgttgggtg cgatgttgtt gatgaccttg 4321 tcgttaaagg agatcgttcc gccttcgatg gaattgaacc ctgctaccat gcggagcaga 4381 gtcgttttac cacagcctga ggggccaagg agagtgaaaa attcactctc cttgatctct 4441 aaattcagac cgggtattac tgtgttgtca ccgaaccgct ttacgatatc ggtgcatgtg 4501 atcgtaacac tcattgtctg attcctttat tccggttgca aattagttga cggaagccca 4561 gatgtcgttc cacttttcct tcagctcggc catgttctcg gcgcggagca cgggatcttc 4621 atcggattcg tagatggcgt cgggagcgac catgtagtcg ggcagctcgg cgtctacgcg 4681 gacggggttg gagaacatct ccgcacccat tctggactgg acttccttgc tggtgatgta 4741 gtccatgaac atcttcgcgg acttcatgtt agcagcaccc ttaatgatgg cgcctacgtc 4801 ggagaacggg gaaacgcctt cttcgggata gcagaaggaa acgggagcgc cttcgttgat 4861 gtagttgtaa acggcgctgt tgaaggtgac ggcgcaggtg tattcgccgt ctgcgcagga 4921 cttgtggcaa gcggaggagc cggcggccag tttgccgtcc aggttcttcg cgaactcggt 4981 gaggtattcg atggaggcat cggagaagta gctctggtgg tcacccatga cccaggccat 5041 caggcacagg gcggaagctg cagaagaagc tgcagcgggg tctgccatcg cgatcttacc 5101 cttgagttcg ggcttgagca ggtctgcgaa tcccttgatc tcgatgtcgc cgatcaggtt 5161 ggtgttccac atgatcagga tggagtctgc agagtacggg gtgagcttgt tgtactcgac 5221 gtgatggttc tctgccagga attcgtcgtt gggggttaca tactcttcga acaggtccaa 5281 atagtcgcca tagatggtct tggaaccgcc gatgatgatg tccgcatagg gagcgtcctt 5341 ttcggcttcg actctcttca gcagagcaga ggcgccgtcg gtgatgactt cgaccttaat 5401 acccgtctgg gcttcgaagt cggtgatcag cggcatctga gcgtccgtga aggaggtgta 5461 gatgaccagc tttccggtat ccggatcttc gccggtagct tcgccttcgg tctcggtctc 5521 gggttcggct gcgggctcgt tggagctcgt gcaggctgcc agagagaaga ccatcgcgag 5581 agccagcagc agtgctaaga atctcttcat agattttctc ctttccataa gaaaacacac 5641 ttttgggcag cataatatac tgcctctgag gtaattataa aaaatcgtga ccttctccaa 5701 aacagagaaa atcacgattt tatggtagaa aacacaggtg aggcgctacg ccttttcccc 5761 gcaaaagcgg gcgaggatct gttccacgat aggatagtcc gcggcagccc agtccagttt 5821 gggcatgtcc ttgggggcca gccagcaatg gtctacatgt tctttccgga cgaaacgggg 5881 atcggtgacc cggcacaaaa acgtgtccat ggtgatctca aattcggggt aaatatggtg 5941 caccgtggcg aaatagtcat cttcggagat ctctatgtta aagtccattt cctcgcgcag 6001 ctcgcgcatc agagcctggg gcttcgtctc cccttcctcg atcttgccgc cggggaactc 6061 ccacttgagg // LOCUS sequence012 6053 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence012 VERSION sequence012 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6053 /mol_type="genomic DNA" /organism="" /note="sequence012" CDS 44..1177 /product="RNA polymerase sigma factor RpoD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_054935954.1" /transl_table=11 /codon_start=1 /translation="MNYDSESEKKAYEQLDQILERAKKSGSITFNEVDDAFADLDMTQT EKDAFYDKLEDSGIEVKPLDIVDDFDFESLEPDSEAELEELVEAAETDDLTDMPKGVTV DDPVRMYLKEIGKVPLLTADEEMDLAQRMEQGDEEAKKRLCEANLRLVVSIAKRYVGRG MLFLDLIQEGNLGLIKAVDKFDWRKGFKFSTYATWWIRQSITRSIADQARTIRIPVHMV ETINKQIRVTRQLLQELGRDPTPEEIAAEMEIPVEKVREISKIAQEPVSLETPIGEEED SHLGDFIPDEDVPSPADAAAFSMLKEQLDEVLSTLTDREQEVLRLRFGLDDGRQRTLEE VGQMFKVTRERIRQIEAKALRKLRHPNRSKRLRDYLE" /locus_tag="LOCUS_0710" /gene="rpoD" /note="WP_054935954.1 RNA polymerase sigma factor RpoD (Moorella) [pid:69.2%, q_cov:98.1%, s_cov:99.4%, Eval:3.9e-141]" /note="MGA_89" CDS 1182..1874 /product="class I SAM-dependent methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009889262.1" /transl_table=11 /codon_start=1 /translation="MTLSERLKTIAGLVLAGRPMADVGTDHGFLPLYCLQEELVPYAVL SDINEGPLQRAKETMASSGISSQHYDLRLGGGLSVLHPGEAATVVIAGMGGELIASILA EDAAVTDSIERFVLQPRSRSGHLRSWLWEHGWQIREESLARERGRLCQILCVEKGRQDP YAYPDIPESEHPLMIEFLDKELVNIRVVTENLCRSKDPSDLQTADCLRRKAETLEKRRE ELWRKSFS" /locus_tag="LOCUS_0720" /note="WP_009889262.1 class I SAM-dependent methyltransferase (Clostridioides difficile) [pid:34.9%, q_cov:97.4%, s_cov:99.1%, Eval:1.2e-31]" /note="MGA_90" CDS 1853..2623 /product="Nif3-like dinuclear metal center hexameric protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964615.1" /transl_table=11 /codon_start=1 /translation="MEKELFLNVLNDIAPLSLQEEWDNSGVQIAFGDREISRVLVALEV TKDVIREAKREHCDFILCHHPLLFHPVKCIEPEFTVGAYIQELIRADIGVYAAHTCFDK APGGNNDYLMKALGCAFPEELAGGIARIGRLDRPVSFDEFISDVNAACGYEGLKIQGDS RREVQTIALCTGAGGEYVYDAVKAGADVYISGDISHHDAQAAKDLGICLIDAGHYGTEW QFVPNMAAHLNADKRVTAEIVKSEAMRNPFEYTL" /locus_tag="LOCUS_0730" /note="WP_010964615.1 Nif3-like dinuclear metal center hexameric protein (Clostridium) [pid:31.0%, q_cov:96.5%, s_cov:96.3%, Eval:3.0e-34]" /note="MGA_91" CDS 3198..4394 /product="methionine gamma-lyase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003400106.1" /transl_table=11 /codon_start=1 /translation="MSKEHAMRTRLIHGDKHEMNPFGSLQMPIFQTSTYQFESTKQGAD RFAGKEPGYIYARLGSPSTTQIEEKLAILENTECAVATSSGMGAISSGTIPFLQKGDRL VADKALYGCTFELFSQQLPKWGIDVEFIDFADLSAVRKALRKKTKMTYCETIANPTMKV VDLEKICKIAHEKNPDCICVVDNTFATGLICKPHDLGADIVVHSATKYLNGHGDIIAGF VCCDSKYYPAVLTNGLKNITGSVPAPLNAFLLNRGLKTLPLRMKAHCENAMKVAKWLEE NKDIEAVYYPGLKSHPQYKIAKKELAMTGGMIAFEPKTAKIAEKMMNNVKLCTLAVSLG DCETLIEHPGSMTHSTYTEEEMIDAGFNKKLIRLSVGLEDPDDIIADLDQALKAALKK" /locus_tag="LOCUS_0740" /gene="megL" /EC_number="4.4.1.11" /note="WP_003400106.1 methionine gamma-lyase (Clostridium) [pid:53.6%, q_cov:95.0%, s_cov:94.8%, Eval:3.1e-112]" /note="MGA_92" CDS 4561..5001 /product="2-oxoacid:acceptor oxidoreductase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012582671.1" /transl_table=11 /codon_start=1 /translation="MGAPITAYNRISDKPIRVHSNIYDPDYVVVVDETLIEDIDVTAGL KEDGAIIINTAKSPEEIRPMLRGYKGRVCTIDARKVSLATLGKYFPNSPMLAATLKVTG LMDIDAFLKEMEKSYAHKFATKPEVIKGNMDALKMALEEVRG" /locus_tag="LOCUS_0750" /note="WP_012582671.1 2-oxoacid:acceptor oxidoreductase family protein (Dictyoglomus turgidum) [pid:46.9%, q_cov:99.3%, s_cov:75.3%, Eval:1.2e-34]" /note="MGA_93" CDS 5001..5306 /product="4Fe-4S binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012546290.1" /transl_table=11 /codon_start=1 /translation="MKTDISKQGLDVKWKDMTVGASIVCAGGAVDFMTGEWRVDTPKFI EDKCKQCLLCVPVCPDSCIPVVDGKRADFDFDHCKGCGICAKACPFGAIEMRRGEK" /locus_tag="LOCUS_0760" /note="WP_012546290.1 4Fe-4S binding protein (Thermodesulfovibrio) [pid:54.4%, q_cov:78.2%, s_cov:83.2%, Eval:9.8e-22]" /note="MGA_94" ORIGIN 1 cgaactgcag cggaaattta tcaaataagg ggaaggaaaa ggaatgaatt acgacagcga 61 aagcgaaaag aaagcttacg aacagttgga tcagatcctg gaaagagcca agaaatccgg 121 ctccatcacg ttcaacgaag tggacgacgc ctttgccgac ctggacatga cccagaccga 181 aaaggacgcg ttctacgaca agctggagga ttccggtatc gaagtaaagc cgctcgacat 241 cgtagacgac ttcgacttcg aatcgctcga accggacagc gaagcggaac tggaagaact 301 ggtggaagca gcggagacgg acgatctcac ggatatgccg aagggcgtga ccgtagacga 361 tcccgtccgc atgtacctga aggagatcgg caaggtgcct cttctgaccg cggacgagga 421 gatggatctg gcacagcgca tggagcaggg cgatgaagaa gccaagaagc gcctgtgcga 481 agccaacctg cgtctggttg tctccattgc caagcgctat gtaggccgcg gcatgctgtt 541 cctggacctc atccaggaag gcaatctcgg tctcatcaaa gcagtcgaca agttcgactg 601 gagaaaggga ttcaagttct ccacctatgc gacctggtgg atccgccagt ccatcacccg 661 gtccatcgcg gaccaggcac ggacgatccg tatcccggtg cacatggtag agaccatcaa 721 taagcagatc cgggtgaccc gtcagctgct gcaggagctg gggagagacc cgactccgga 781 agagatcgca gcggagatgg agattcccgt ggaaaaggtg cgcgagatct ccaagatcgc 841 gcaggaaccg gtctctctgg agactccgat cggcgaggag gaggattccc acctcggaga 901 ctttatcccc gacgaagacg tgccgtctcc tgcggacgca gcggcgttct ccatgttgaa 961 agagcagctg gacgaagtgc tttccacgct caccgacaga gagcaggaag tactgcgcct 1021 tcgtttcggc ctggacgacg gacgccagcg cacgctcgaa gaagtcggac agatgttcaa 1081 ggtcacccgc gaacgcatcc gtcagatcga agcgaaggcg ctgcgcaaac tccgccaccc 1141 caaccgcagc aagcgcctga gagattacct cgaatagatc catgacgctg agcgaacggc 1201 tgaaaaccat agcaggtctc gtgcttgcag gaagacccat ggccgacgta gggacggacc 1261 atgggtttct gcctctttat tgcctgcagg aagagctcgt gccttatgcg gtgctctccg 1321 atattaacga agggcctctg cagcgggcga aagagacgat ggcctcgtcc ggcatttctt 1381 cgcagcatta cgatcttcgc ctgggcggcg ggctttccgt cctgcatccg ggcgaagcag 1441 cgaccgtagt catcgccggc atgggaggcg aactcatcgc ttccattctg gcggaagatg 1501 ctgcggtcac ggacagcata gaacgcttcg tcctgcagcc acgcagcagg agcggacatc 1561 tccgcagctg gctctgggaa cacggctggc agatccgaga agaaagcctt gcgagagaac 1621 ggggcagatt gtgccagatc ctgtgcgtgg aaaaaggccg tcaggaccct tatgcctatc 1681 cggatatccc ggaatcggaa catccgttga tgatcgaatt cctggataag gaattggtta 1741 acataagagt tgttacagaa aatctctgcc gttccaaaga tccgtccgat ctgcagacgg 1801 cggactgttt gcgccgcaag gcggaaacgc tggagaaaag gagggaagaa ctatggagaa 1861 agagcttttc ctgaacgtcc tgaacgacat cgcgccgctg tctctgcaag aagaatggga 1921 caacagcggc gtgcagatcg ccttcggaga cagagaaatc tcccgcgtcc tcgtcgcgct 1981 tgaggtcacg aaagacgtca tccgcgaagc gaaacgggag cactgcgact tcatcctgtg 2041 tcatcatcct ctcctgttcc atcccgtaaa atgcatcgaa ccggagttta ccgtcggcgc 2101 atacatccag gaactcatcc gcgcggacat cggcgtctat gcggctcaca cctgcttcga 2161 caaagcgccg ggcggcaaca acgactacct gatgaaggca ctgggatgcg ccttcccgga 2221 ggaactggcc ggcggcatcg cccgtatcgg cagactggac cgtccggtct ctttcgacga 2281 attcatctcc gacgttaacg cggcgtgcgg ctatgaagga ctgaagatcc agggagactc 2341 ccgcagggaa gtgcagacga tcgcgctgtg caccggtgca ggcggggaat acgtctacga 2401 tgcggtgaag gcaggggcgg acgtctacat ctccggcgat atctcgcacc acgatgccca 2461 ggcggcgaaa gatctgggga tctgcctcat cgatgccggt cattacggca ccgaatggca 2521 gttcgtgccc aacatggctg cccatctgaa cgctgataaa cgggtcaccg cggagatcgt 2581 aaagtccgaa gccatgcgca acccgttcga gtatacgttg taacgaaaca attttataaa 2641 gatccatgag cagcccatgc ggtcgcgggc gcgctgcgaa aagcgcgcgt gaggaaagtc 2701 cgggctccat agggcaagga tgacagctaa cggctgccgg gggtgacccc agggaaagtg 2761 caacagaaaa caaccgcccg caagggtaag ggtgaaaagg cgaggtaaga gctcaccggg 2821 tctctggcaa cagcgaccgt ccgtgtaaac cccatccgga gcaagaccaa acagggaggc 2881 aggtgcatcc gtgcaaaccg cctgaaaggg ggctgcccgt cccttcccgg gaggtaggtc 2941 gcttgagtcc tctggcgaca gaggtcctag aaagatgatc gcttaataca gaacccggct 3001 tataggctgc tcatgatttt tacagagtcc gcaaggactc ttttttgaat ttcttaatta 3061 attttgatgg attacattaa aaaaacgata gattctctcc gcattttctg ttgtattgcg 3121 catttcatag ttttataatg aaaacgaagt tgtaaacatt tggctaatct tttttaacca 3181 aaaggaagga gttaacaatg agcaaagaac atgcaatgcg aacaagactg attcatggcg 3241 acaagcacga gatgaatccg ttcggatccc tccagatgcc tattttccag acatctacgt 3301 accagttcga gagtaccaaa cagggcgcag acagattcgc cggtaaggaa cccggttaca 3361 tctacgctcg tctgggcagc ccctccacca cgcagatcga agagaagctg gcgatcctgg 3421 agaacaccga gtgcgcagtt gctacctctt ccggcatggg cgctatctct tccggtacca 3481 ttcccttcct gcagaagggc gacagactgg tcgcagataa agctctgtac ggctgtacgt 3541 tcgaactgtt ctctcagcag cttccgaagt ggggaatcga tgtggaattc atcgatttcg 3601 ctgatttgag tgcagttcgc aaagctcttc gcaagaagac caagatgact tattgcgaga 3661 ccatcgccaa cccgaccatg aaggtcgtcg atctggagaa gatctgcaag atcgctcacg 3721 aaaagaaccc cgactgcatc tgcgtcgtcg ataacacctt cgctaccggt ctcatctgca 3781 agccccacga tctgggcgcc gacatcgtcg tacactccgc aaccaagtat ctgaacggcc 3841 acggcgacat cattgcgggc ttcgtctgct gcgacagcaa gtactatccc gccgtgctca 3901 ccaacggtct caagaacatc accggttccg tacccgctcc gctgaatgca ttcctgctca 3961 acagaggtct caagactctg cccctgagaa tgaaggcaca ctgcgagaac gccatgaagg 4021 tcgcgaagtg gctggaagaa aacaaggata tcgaagcggt ttactatccc ggtctgaagt 4081 ctcatccgca gtataagatc gcgaagaagg aactggccat gaccggcggc atgatcgctt 4141 tcgagccgaa gaccgccaag atcgcagaga agatgatgaa caatgtcaag ctctgcacgc 4201 tggcagtatc cctgggcgac tgcgagaccc tgatcgaaca tccgggcagc atgacccaca 4261 gcacctacac agaagaagaa atgatcgatg ccggcttcaa caagaagctc atccgtctct 4321 ccgtcggtct ggaagatccc gacgatatca tcgcagacct cgatcaggca ttgaaggctg 4381 ctttgaaaaa ataaataaca tatttctaca accggaggtt attacatgaa aggtttaact 4441 gaaatcagat ggcatggccg cggcggacaa ggcgccaaaa cggctgcgct cctcctggcg 4501 gacgtttgct tttccaccgg tgccgaagta cagggcttcc ctgaatacgg tcctgagaga 4561 atgggcgcgc ccattaccgc ttacaacaga ataagcgaca aaccgattcg ggtacattcc 4621 aacatctacg accccgacta tgtcgtggtc gtagatgaga cccttattga agacatcgat 4681 gttacagcag gtctgaagga agacggtgcc atcatcatca acacggcgaa gagccccgaa 4741 gagatccgtc ccatgctgag aggctataag ggcagagtat gcacgatcga tgcccgcaag 4801 gtatccctcg ctacgctggg taagtatttc cccaactccc cgatgctcgc agctaccctg 4861 aaggtcaccg ggctgatgga tatcgacgcg ttcctgaagg aaatggagaa gtcttatgct 4921 cataagttcg ccacgaagcc cgaggtcatc aagggcaaca tggatgctct gaagatggct 4981 ttagaggagg tgcgcggata atgaagacag atatttctaa gcagggactc gacgttaagt 5041 ggaaggatat gaccgttggc gcaagcatcg tttgcgcagg cggcgccgtg gatttcatga 5101 ccggcgaatg gagagtcgat accccgaaat tcatcgaaga taaatgcaag cagtgcctgc 5161 tttgcgttcc cgtttgcccc gacagctgca ttcccgttgt cgacggcaag agagccgatt 5221 tcgacttcga tcactgcaag ggctgcggca tttgcgccaa ggcttgcccc ttcggtgcga 5281 tcgaaatgag aaggggggaa aagtaagatg gcaaaacaga tccgtgaaag attatccggc 5341 aacgaagccg tcgcaaccgc gatccgtcag atcaatcctg acgtcatggc tgcattcccc 5401 atcactccgt ccaccgagat ccctcagttc gtaagctctt acgtagcaaa cggcctgatc 5461 gataccgaat tcgtacctgt agaatctgag cactccgcca tgtccgctac tatcggcgca 5521 tccgctgccg gtgcccgcgc catgaccgct acttcttccg caggtctggc actcatgtgg 5581 gaagagctgc acatcgcttc ttccgacaga ctgcccgtcg tactggctct ggtcaacaga 5641 gctctgtccg gccccatcaa catcaacgca gaccattccg acggcatggg cgccaaggac 5701 tgcggctgga tccagctgta ttccgaggac aaccaggaag cctatgacaa catgtgcatg 5761 gcattccgca tctccgaaaa ggtaaagctg cccgttatgg tatgccagga cggtttcatc 5821 acgtcccacg ccgttcagaa catcattctg aacgaagatc aggacgtaaa ggattttgtc 5881 ggcacctatc agcccgagga ttatctgctg aacgcggaga accccatggc tgccggtcct 5941 tattccgtca cccagtatta catggaagcc cgcagaggcg tcgctcaggc tatgagagac 6001 tccaaggaga ccatcatcgc cgtttccaag gaatacggtg aaaagttcgg cag // LOCUS sequence013 6045 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence013 VERSION sequence013 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..6045 /mol_type="genomic DNA" /organism="" /note="sequence013" CDS 336..2891 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MHFMKKNRLIPVNIILMLCILVFVSLYARHQSQADFDAKVVSFQN MTTAMEQVTENYLEGEQRICDVWAHYISSHDMTLEEAVRFIRASHVSVHAAAHVLYTDD GSMEGLSTRPRTGSDDDFGVSYQNLDLFPDLAQIGAVGESVHITRAYTSPVSGIQSIGF YNKLALVDPDTGLPREGIVVRVVPISELRSKWVFPQEEYQNAEFSMIDAAGNYIIKGES FKNSSFLEFYKSYNAVDAGTLDRLAGSIRKESGSFFMNNSRGESCLVAHTPVRASEDWS LLSYIPVKDIQPASVDWRLIGVVFAGLLTILLLDAAYMRAFNKRLQQAAEEADAANRAK TDFLSTMSHDIRTPMNAITGLTVIAEKNADDPEAVRENLRKIGLAGNHLLTLINDILDI SKVESGKLTLSPVTFSIAETAENLVNLSQPMVKEKQIDFNFRINRIKTEYLYADQLRLN QIFINLLSNAVKYTGPKGRVCIDLREEESSVPGCIRLVYQVSDTGIGMTKEFMETMYQP FSRQTDSRVNKVQGTGLGLAITKQMVDLMGGTIDCESEEGKGTAFTVTLDIPAAEKQLD EMDLNGANILIADDDDVLLETAKDALLQLGAAVETAESGETAYEKTMQRHREGRPFDVI ILDWRMPGSDGVDTIRRIRSEVGADIPILLISAYDWSDIEETAKEAGANGFISKPLFRS KLYEAIRGAMGTPSAAVEPEEDNSDLAGMHALIAEDNDINWEIIHALLAMYGIDSVRAE NGQVCVDMFREAGEDVYDLIFMDIQMPVMNGLEAARTIRGLQDVPQAASIPIIAMTANA FSEDIAECKKAGMNSHIAKPIDIKFVIKELRKVREGSYQ" /locus_tag="LOCUS_0770" /note="WP_196793289.1 PAS domain-containing hybrid sensor histidine kinase/response regulator (Oxalobacter formigenes) [pid:43.8%, q_cov:59.9%, s_cov:63.6%, Eval:1.7e-114, partial hit]" /note="MGA_97" CDS 2888..4204 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKQAKRYLCFALSLCLLFSLASCTSGSQPGEPAGPEEKPYEPALD PQTTGSVNVVGHYSNFEALESAFNRFAEFYPNVKMSYTYLDDYSNTLAAALTSEEAPDI FFMYPRMITGQAREDLLALAEDLSEDSLNIDLSSIRENLLQRDAEGHLPMVPVYCATYG MMVNEDLFAKEGIAIPETYADLISACDAFREAGYESPVMGYNQGSFFTFPLYYPYFCAQ ILSEGPESIEEVNGMGAAGGEHLRSTLELLDDFMNHGCADPELSKMMENDYQDVIMRFF EGNVPMMMASSNTVSGTQKRESQSEAFTASPFVYSFRPVPTTEEGGYFLTSVSMGFAVN QKSKNLDLTNEFMRFLVTTEQMNQVAADKRMVTPCKDMSLDSVYAAFGELPEDHVIYQY EIGISGDADSQVQKACWQLSNGLISIEDAVNGFGNLQDK" /locus_tag="LOCUS_0780" /note="MGA_98" CDS 4260..5873 /product="polysaccharide biosynthesis protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003425909.1" /transl_table=11 /codon_start=1 /translation="MDETNSKNKSFLKGAVILGLAGIIIKVLGAFFRIPLANIIGDDGM GYYQTAYPIYNLFLTLAIAGIPTAIARMVAERTALDRRYEAHRVFRVSFWLLFGTGVVT SAILFLGAGAITRAIKEPGAIYCMQAIAPALFFCPLMSSFRGYFQGLQDMTPTAVSQVV EQAFRVAIGLGLAVILLPKGLNIAAAGASFGATAGALFGFLGIGLVYLKRRKAILEEVS RDVRTDVESVGNIFKDILIIAVPITIGSAVLPVINTIDTAIVKTRLVSIGFDSDMARAL YGQLTGMAAPLLNFPQVLLQAVSMSIVPVVASAFKRQEMKFMHDNVNLAMRYASILSIP CAVGMSVLSTPIMLLFYPRVRESAASAGGCLQILAYGVIFLGMAHALNGILQGIGKQMI PVKNLCIGALVKICLTYLLTSIPALNVRGAAISTVAAYFTAAFLDFHAMKKHTGTRVDL KLTFGKPALCAAVMGVVVWAVYRICHGFLGNALSTVVAIGAGVVVYGILVLAVKAITLE EIERLPKGRKLANLLRRFRR" /locus_tag="LOCUS_0790" /note="WP_003425909.1 polysaccharide biosynthesis protein (Clostridioides difficile) [pid:43.0%, q_cov:99.1%, s_cov:99.1%, Eval:5.5e-118]" /note="MGA_99" ORIGIN 1 cgatacgttc gagcagttcg gctttcctct gatggaaaaa ctgggccgtc ccacgctgct 61 gtgcaacacg ctgcaggtgg ctccggacgg agagatcacc ggctttacca tgcgctgcgc 121 gcagagcaag ctcaccagcg ttaaggcgtt ccagtccatg ggctacgaga ccatcgctgc 181 tggcgattcc tataacgacc tgggcatgat ccgcgccagc aaggcgggca tcctgttccg 241 ggcgccggac aacgtaaagg cggaaaatcc ggacctcccc acctgcgaga cctacgaaga 301 gctgatggcc gcgatcaagg ctgcgctgta ataatatgca tttcatgaaa aagaatcgtc 361 tcattccggt caatatcata ctgatgctct gcatcctggt ctttgtctcg ctttatgcgc 421 ggcatcagag ccaggcggat tttgatgcaa aagtggtgtc gtttcagaat atgacgacgg 481 cgatggagca ggtgacggag aattacctgg agggtgagca gcgcatctgc gatgtctggg 541 cccattatat ctcctctcac gacatgacgc tggaggaggc tgtccgtttt atccgggcgt 601 ctcacgtttc cgtgcatgcg gctgcgcatg ttctctacac ggatgacggc agcatggaag 661 ggctctcgac ccggccgagg acgggaagcg acgacgattt cggggtgtcg tatcaaaatc 721 tcgatctttt cccggatctc gcgcagatcg gcgcggtggg agaatccgtc cacattacca 781 gagcgtatac cagcccggtg agcggcatac agtccatcgg gttctataat aaactcgctc 841 tcgttgaccc ggatacaggg ttgccgagag aagggattgt ggtccgtgtg gtgccgatct 901 cggaactgcg ttccaaatgg gtatttccgc aggaagaata ccagaatgcg gagttttcca 961 tgatcgatgc tgccggcaat tatatcatca agggcgaatc tttcaaaaac agcagtttcc 1021 ttgaattcta caaatcgtac aatgctgtag atgcgggaac gctggaccgg ctggccggtt 1081 ccatccgaaa ggaaagcggc tcctttttca tgaacaattc ccggggagaa tcctgtctgg 1141 tggcgcatac ccctgtccgc gcctctgaag actggagtct gctgagctat attcccgtaa 1201 aggacattca gcctgcgagc gtggattggc gcctgatcgg cgtggtcttt gcaggccttc 1261 tgacgatcct gctgctggat gccgcgtata tgcgtgcttt caataaaagg ctgcagcagg 1321 cggcggaaga agccgatgcc gcaaaccggg cgaaaacgga tttcctgtct acgatgtccc 1381 acgatatccg cacgccgatg aacgctatca ccggtcttac cgttatcgcg gagaagaatg 1441 cagatgatcc ggaagcggtc cgggagaatc ttcgcaagat cggtcttgcg ggaaaccatc 1501 tgctcacgct tatcaatgat attctggaca tctccaaagt ggagagcgga aaacttacgc 1561 tcagtcccgt caccttttcc atcgcagaaa cggcggagaa tctggtgaac ctttcccaac 1621 cgatggtgaa ggaaaagcag atcgatttca acttccgcat caaccggata aagacggaat 1681 atctgtatgc agatcagctg cggctcaacc agatcttcat caacctgctt tccaatgcag 1741 tcaagtatac gggccccaaa ggacgtgtct gcatcgatct gagggaagaa gaaagcagcg 1801 taccgggctg tatccgtctt gtatatcagg tgtcggatac cggtatcggc atgacgaagg 1861 aattcatgga aacgatgtat cagcctttct cccgccagac ggatagccgg gtcaataagg 1921 tgcagggcac cggcctgggt ctcgccatta cgaaacagat ggtggatctg atgggcggga 1981 ccatcgattg cgagagcgaa gaaggaaaag gtactgcgtt tactgttaca ctggatatcc 2041 ctgcagcgga aaaacagttg gacgagatgg acctgaacgg cgccaatatc ctgatcgcag 2101 acgacgatga tgtgctgctc gagaccgcga aggatgcgct gcttcagctc ggagctgctg 2161 tagaaacggc ggaaagcgga gagaccgcct atgaaaaaac gatgcaaagg catcgggaag 2221 gccggccgtt cgatgtgatc attctggatt ggcgcatgcc cggttcggat ggtgtggata 2281 ccattcgccg tatccggagc gaagtcgggg cagatattcc catcctgctg atctcggcct 2341 atgactggtc cgatatcgaa gagactgcaa aggaagccgg cgcaaacggg ttcatcagca 2401 aaccgctatt ccgttccaag ctgtacgaag cgatccgcgg cgctatgggg acgcccagtg 2461 ctgcagtgga accggaagaa gacaacagcg atctcgccgg gatgcatgcg ctgatcgcag 2521 aagataacga catcaattgg gaaatcatcc atgcactgct ggccatgtat ggtatagaca 2581 gcgtaagggc cgaaaatgga caggtctgcg tggatatgtt ccgggaagcc ggcgaggacg 2641 tttacgatct gatctttatg gatatccaaa tgcctgtcat gaacggcctg gaggctgccc 2701 gcaccattcg cggcctgcag gatgttcctc aggcggcgtc catccccatc atcgccatga 2761 cggcaaatgc cttttccgag gatatcgcgg aatgtaagaa ggcgggcatg aacagccaca 2821 tcgcaaaacc catcgatatc aaatttgtca taaaagaact gagaaaagtt cgggaaggat 2881 cttatcaatg aaacaggcca aacgatacct atgctttgca ttatccctgt gtctgctgtt 2941 ttctcttgcc agctgcacgt ccggcagcca gccgggggaa cctgccggac cggaagaaaa 3001 accgtacgag ccagccttgg atccgcagac gacaggctct gtaaacgtcg tagggcacta 3061 cagcaatttc gaggcgctgg agtctgcctt taaccgtttt gcagaattct atcccaatgt 3121 aaagatgtcc tatacatatc tggatgatta cagcaacacg ctggcggcgg cgctcaccag 3181 cgaggaagcc ccggatatct tctttatgta tccccggatg atcaccgggc aggcgcgtga 3241 ggatctcctg gcattggcgg aagatctttc cgaagactcc ctgaacatcg acttgtccag 3301 tattcgggag aatctgctgc agcgggatgc ggagggtcat ctgcccatgg tccccgtcta 3361 ctgtgcgacc tacggcatga tggtcaacga agatctcttt gcgaaggaag ggatcgccat 3421 acctgagacg tatgccgacc tgatctccgc ctgtgatgca ttccgggaag ccggttatga 3481 aagccctgtc atggggtata atcagggttc gttcttcacg ttccccctct attatccgta 3541 tttctgcgcg cagatcctgt cggaggggcc ggaatcgatc gaagaagtga acggtatggg 3601 cgctgccggc ggagagcatc tgcggtccac actggaactc cttgatgatt ttatgaacca 3661 tggctgtgca gaccccgaac tcagcaagat gatggaaaac gattatcagg acgttatcat 3721 gcgcttcttc gaagggaatg ttcctatgat gatggcttcc agcaataccg tatccgggac 3781 ccagaagcgg gagagtcagt ccgaagcgtt tacggcatcg ccgttcgtct acagcttccg 3841 gcccgttccc actacggaag agggcggcta ctttctgaca tcggtctcca tgggttttgc 3901 cgtgaatcag aagagtaaaa atctggacct gacgaacgaa ttcatgcgct tcctcgttac 3961 gacggagcag atgaatcagg ttgcggcgga taaacgcatg gtgacgccct gcaaagacat 4021 gtccctggac agcgtatatg cggcattcgg cgaacttccg gaagatcatg tgatctatca 4081 atatgagatc gggatctcgg gagatgccga ttcccaggtc caaaaagcct gctggcagct 4141 gagcaacggt ctgatctcca tcgaagatgc cgtgaacggc ttcgggaatc tgcaggacaa 4201 atagagcttt tcaagaaagg cggtttccgc ctttcttttt tatgctataa tgaatcatta 4261 tggacgaaac aaacagcaaa aacaaaagct ttttaaaggg cgccgtcatc ctcggcctcg 4321 ccggcatcat catcaaggtg ctgggggcct ttttccgcat cccgctggcc aacatcatcg 4381 gcgacgacgg gatggggtat taccagacgg cgtatccgat ctataatctg tttctgaccc 4441 tggccatcgc cggcattccc acggccatcg cccgtatggt ggccgaaagg accgccctgg 4501 accgccgcta cgaggctcac agggtatttc gcgtatcgtt ctggctgctg ttcggcaccg 4561 gcgtcgtcac gagcgccatc ctgtttttag gggcgggcgc cattacccgc gccatcaagg 4621 agccgggggc gatctactgc atgcaggcca ttgcgccggc gctgttcttc tgcccgctca 4681 tgagctcgtt ccgcggctat ttccaggggc ttcaggacat gacccccaca gctgtctccc 4741 aggtcgtgga gcaggcgttc cgggtggcga ttggcctcgg tcttgcggtc atcctgttgc 4801 ccaaagggct gaacatcgcc gcggcaggcg cttctttcgg cgctacggcg ggtgcgctgt 4861 tcggcttttt aggcatcggc ctcgtgtatc taaagcgcag aaaggcgatc ctcgaagaag 4921 tatcgcgcga cgtgcgcacc gacgtggaga gcgtcggcaa tatctttaaa gacattctga 4981 tcatcgcggt gcccatcacc atcgggtctg cggtcttacc ggtcatcaac accatcgaca 5041 ccgccatcgt caagacgcgg ctcgtctcca tcggtttcga ttccgacatg gcgagagcgc 5101 tatacggcca gcttacgggc atggcggcgc cgttgctcaa cttcccccag gtgctgctgc 5161 aggcggtctc catgagcatc gtgcccgtgg tcgcctccgc ctttaagcgc caggagatga 5221 agttcatgca cgacaacgtg aatctggcga tgcgctatgc gtctatcctc agcattccct 5281 gcgccgtcgg catgagcgtg ctgtccaccc ccatcatgct gctgttctac cccagagtgc 5341 gggagagcgc agcttcggcg ggcggctgcc tgcagatctt ggcctatggg gtcattttct 5401 taggcatggc ccacgccctc aatggcattc tgcagggcat cggcaaacaa atgatcccgg 5461 taaagaacct gtgcatcggc gctctcgtaa agatctgtct tacgtacctg cttacgagca 5521 ttccagcgct caacgtaaga ggcgccgcca tcagcaccgt ggctgcgtat tttacggctg 5581 ccttcctgga tttccacgcc atgaagaagc ataccggcac gagagtggat ctgaaactga 5641 cgttcggtaa gcctgcgctc tgcgcggctg tgatgggtgt cgtcgtatgg gccgtctacc 5701 ggatctgcca cggtttcctg gggaacgctc tcagcactgt ggtcgccatc ggcgccggcg 5761 tcgtcgttta cggtattttg gttctggcgg taaaggccat taccctcgaa gagatagaaa 5821 ggctgccaaa gggcaggaaa ctggcgaacc tgctgcggcg cttcaggaga taacatgtac 5881 gaagaactgt ttaaactatc gaatacagac gcggaagcct tcgcgcggct gcagcgggtc 5941 atcgagatcc tgcgcgcccc cggcggctgc ccctgggacc gcgctcagac ccacgaaagt 6001 cttacccggg gcatggtgga ggaggcctac gaagtcgtgc aggcc // LOCUS sequence014 5876 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence014 VERSION sequence014 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5876 /mol_type="genomic DNA" /organism="" /note="sequence014" CDS complement(1813..3753) /product="DNA topoisomerase (ATP-hydrolyzing) subunit B" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003434229.1" /transl_table=11 /codon_start=1 /translation="MSAEDIKQTGGSGNYDASQIQVLEGLDPVRKRPGMYIGTTGPRGL HHCVYEIVDNSVDEALAGYCNNIQVTIHEDNSVEVLDNGRGMPVDEHPKMHKPAMEVIM TVLHAGGKFGGGGYKVSGGLHGVGASVVNALSDFMQVESMRGGKIYRQTYSRGKKTSEV EVVGDCGRQTGCRVIFHPDQEIFEEIEFSYNTLESHLRETAFLNKGIKITLTDERGEKK KKAVYHYEGGIKEYVKFQNANKEPIHPDIIYYEFKKKDQEVEVAMQYTDSYTETILSYA NNINTVEGGTHLVGFKSALTRAVNDYAKKAKLMKDNDEPLTGEDIREGLTAIISVKLTE PQFEGQTKTKLGNTEMRGFVETVTSENVFAFLEENPAQAKPIIEKCLKAFRAREAARKA RDLTRRKTALDNTSLPGKLADCSEKDPALSEIFIVEGDSAGGSAKEGRDRKRQAILPLR GKILNVEKARLDRMLNSDTIRDMITAFGCGIGSEFNIEKLRYHKIIIMTDADVDGAHIR TLLLTLFFRYMPKLIEEGYVYAAQPPLFRVKSGKEIWYTYSDKEQEKLLAELASQGKTK PEIQRYKGLGEMDATQLWETTMDYNTRTLIQITIDDFAAADQIFTTLMGDKVPPRRKFI EENAEYAKLDV" /locus_tag="LOCUS_0800" /gene="gyrB" /EC_number="5.6.2.2" /note="WP_003434229.1 DNA topoisomerase (ATP-hydrolyzing) subunit B (Clostridioides difficile) [pid:64.5%, q_cov:97.8%, s_cov:99.4%, Eval:2.4e-235]" /note="MGA_102" CDS 4142..5488 /product="chromosomal replication initiator protein DnaA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011947895.1" /transl_table=11 /codon_start=1 /translation="MTKTELKEKWNVVLDLLYTSMERLKVDTFFRPLTPVKLSEKKETI YLKTAGSKSSVYQNSINNHKEFLSEALIKAFGKEYKLEIVDAEPPDDDDEGGSPIPEEK DYGFNPRYTFESFVQGPNNQLALAACLAIADKGYVKEYNPLFLYSGPGLGKTHLMHAVG QYIIKHFPKKRVMYVSSEAFTNELVTSIQEKSTDKFRNKYRKVDVLLFDDVQFISGKAA TQEELFHTFNDLYNARKQIIFTSDKPPQELVGIPDRLTSRFGQGLSVDINPPEYETRFA ILKNLAILSNVEVTPEIEDMLDLIAQNVTTNIRDLEGAFTRVHASSQLLGSPMNKDLAK MVLTDIFKNTKTKEITPDIIKKEVSKYFGVKVSDMESANRSKDVAFPRQIAIYLIREHT NYSLPQMGKLFGGRDHTTIRHSYEKIAEEIKKDKDLQETIETIYRQIEG" /locus_tag="LOCUS_0810" /gene="dnaA" /note="WP_011947895.1 chromosomal replication initiator protein DnaA (Clostridium botulinum) [pid:41.5%, q_cov:98.9%, s_cov:98.9%, Eval:5.4e-100]" /note="MGA_103" ORIGIN 1 cgcctggatg cgttctctct gcagcaggtt gaggaagttg accgccggcg tgcccttggc 61 ctgtctgttg gcctcgggga tctcgtacgc cttgatctta tacgccttgc ccatgctggt 121 gaagaacatc agattgtcgt gggtggacgt ggtgatgagg tgcttcacga agtcgttctc 181 tctggtggtg aggcccgtaa tgcccttgcc gccccgcttc tgcgtgcggt aggtgtcctc 241 ggagactctc ttcaggtagc ccaggtggga gacggtgatg accacattct cctcttcgat 301 gagctcggat tcgtccactt cctcctcgtc cgcgatgatc tcggtgcgtc tgtcgtcgcc 361 ccacttgttc ttgatctcgg tgagttcgtc cttgaccacg cccatcagca gcttttcgtc 421 cgccagcagg ctcttgtagt aggcgatctt ctttaagagt tcctgatatt ccgcctcgat 481 cttgtcgcgc tccagaccct gcagtctctt cagctgcatg tccaggatgg cctgggcctg 541 gatctgggac agaccgaact tcttcatcag ctgttctctg gcgtcatcgt agctttcgcg 601 gatcgtcttg atgatctcgt cgatgtggtc cagcgcgatg cggtaaccct ccaaaatatg 661 ggctctcgcc tcggccttgg caaggtcgaa cttcgtccgt ctggtgagga cttccttctg 721 atgcttgatg tattcggtta agatgtcgtg gatgttcagc agctggggcc ggccgtttac 781 cagcgcgatc atgatgatgg aaacgttggt ctccagctcc gtgtgcttgt acagccggtt 841 gagcatcacc ttcgggttga cgtccttctt cagctcgata acgacccgca cttcgccctt 901 ggaggactcg tcgcggatgt cccggatgcc gtccagcttc ttgtcgcgca cgagctccgc 961 gatgtgggag atcatggcgg ccttgttgac cccatagggg atctcgtgga agatgatgga 1021 ggtgatgcct ctcgcgcctt cttcgataac gcccttcgct ctgagtttta ccttgccctg 1081 accggtgcgg taggcttcct tgatggcggt cttgccgacg atggtggcac ccgtcgggaa 1141 gtccggtccc ttgatgatct tgatgagggt ctccacgtcc gcgttcggat cgtcgatgag 1201 cttgatggtg ccgtcgatga cctcgcggag gttatggggc gggatggcgg tggccatgcc 1261 gaccgcgatg ccattggcgc cgttgaccag cagattgggg aaacgggcgg gcagcaccac 1321 gggttctttt tcttcgccgt cgtagttgtc gacgaagtct acggtatcct tgtcgatgtc 1381 ccggagcatc tccagggcaa agggagccat gcgggcttca gtgtaacggg aagcggccgc 1441 gccgtcgccg tccatggaac cgaagttgcc gtggccgtcc acgaggcggt agcgcatgtt 1501 ccagggctgg gccaggcgca ccatggcgtc gtagatggat gcatcgccgt gggggtggta 1561 tttacccatg acttcgccca cgatacgggc ggacttttta tggggtttgt ccggcgtgat 1621 gcccagggca tccaggccgt acagaatgcg gcggtggacc ggcttaaggc cgtcccgcac 1681 gtcgggaagc gctcttgcaa cgattacgct catggagtaa tcgatgtagg aggtcttcat 1741 ttcttcgtat atctcgtgct gtaagatctt tctgtcttcg gtaagatccg gcatgttctc 1801 tcctccttcc tcttatacgt ccagttttgc gtattccgcg ttttcttcga tgaattttct 1861 tctggggggc accttatcgc ccatcaacgt cgtaaagatc tggtcggcgg ccgcgaagtc 1921 gtcgatggtg atctggatga gcgtacgggt gttgtaatcc atggtggtct cccacagctg 1981 ggtggcgtcc atttcgccca gacctttgta acgctggatc tccggcttcg tcttgccctg 2041 ggacgccagc tccgccagca gcttctcctg ctccttgtcg gaataggtgt accagatctc 2101 cttgccggat ttgacccgga acaaaggcgg ctgcgccgcg taaacatagc cctcttcgat 2161 gagcttcggc atgtagcgga agaacagcgt gagaagcagc gtgcggatat gagcgccgtc 2221 cacgtcggca tcggtcatga tgatgatctt gtggtagcgc agtttttcga tgttgaattc 2281 ggagccgatg ccgcagccga acgccgtgat catgtcgcgg atggtgtcgg agttgagcat 2341 gcggtccagg cgggccttct ccacgttgag gatcttgccg cgcagcggca ggatggcctg 2401 gcgctttctg tctctgcctt ccttggcgga gccgcctgcg gagtcaccct ctacgatgaa 2461 gatctcggac agagccggat ccttttcgga gcagtccgcc agcttgccgg gcagcgaggt 2521 gttgtccagc gcggtcttgc ggcgggtaag gtctctcgcc tttctggccg cttctctggc 2581 gcggaacgcc tttaagcact tttcgatgat gggcttggcc tgggccgggt tttcctccag 2641 gaaagcgaac acgttctcgg aggttacggt ctcgacaaag cctctcatct cggtgttgcc 2701 cagtttggtc ttggtctgac cctcgaactg gggctccgtg agctttacgg aaatgatggc 2761 cgtaaggcct tcgcggatat cttcgccggt gagaggctca tcgttgtcct tcatcagctt 2821 cgccttcttg gcatagtcgt tgaccgctct cgtaagcgcc gatttgaagc cgaccagatg 2881 cgtgccgccc tccacggtgt tgatgttgtt ggcataggaa aggatggtct cggtatacga 2941 atccgtatac tgcatggcca cttccacttc ctggtccttc ttcttgaact cgtagtagat 3001 gatgtcggga tggatgggtt ccttgttggc attctggaac ttgacgtatt ccttgatgcc 3061 gccttcgtaa tgatagacgg cttttttctt cttctctccc ctctcatccg tgagggtgat 3121 cttgatgccc ttgttcagga acgcggtctc ccgcagatgg gattccagcg tgttgtagga 3181 gaattcgatc tcctcgaaga tctcctggtc cgggtggaag atgacccggc aaccggtctg 3241 ccgtccgcag tcgccgacga cttccacttc gctggtcttc ttaccccggg aataggtctg 3301 gcggtagatc ttgccgccgc gcatgctctc cacctgcata aagtcggaga gcgcgttgac 3361 gacggatgcg cctacgccgt gcagaccgcc ggataccttg tatcctccgc cgccgaactt 3421 gccgccggcg tgcagcaccg tcatgatgac ttccatggcg ggtttatgca tcttgggatg 3481 ctcgtccacc ggcatgcctc tgccgttgtc cagcacctct acgctgttgt cttcgtggat 3541 ggtgacctga atattattgc aatagcccgc cagcgcttcg tccacggagt tgtccacgat 3601 ctcgtagaca cagtgatgaa gtcctctggg gccggtcgta ccaatataca tgcccgggcg 3661 ttttctgacc gggtcaagac cttccagcac ctggatctgc gacgcgtcgt aattgccgct 3721 tcctccggtc tgtttgatgt cttctgcaga cataaaaatt tcccccttat aaacattttt 3781 tctaagcttc tttaactttt ttataatagc acgattttct gcatatttca acgagaaggc 3841 cgaaaatcgc ccgaaattgc gattttacta taaatttaca ggaacatatg tttattatct 3901 ttcatttctt atataatata ttggtattac ggatgaaaaa aattttttcc gcacctttta 3961 tcactaaatc ttgtggtttt gcaaaaatgg gataaagtta tccacaacat gtgtaaaacc 4021 tgtggataac ttgacctgac tgtattcttc ccctctctat tcctgtggaa aactactttg 4081 tgatataatc ggtatcgccc atacatatgg tgttcaatac tagctatagg aatggtttga 4141 aatgacaaaa acagagctga aagaaaaatg gaacgtcgtg ctggatctgc tctacaccag 4201 catggaacgg ttaaaagtgg atacgttctt ccgcccgctg accccggtca aactgagcga 4261 aaagaaggag accatctacc tgaagaccgc cggatccaaa agcagcgtct atcaaaatag 4321 catcaacaat cacaaggagt ttctttccga agcgctgatc aaggccttcg ggaaagaata 4381 taagttggag atcgtcgacg cggagccgcc cgatgatgat gacgaaggcg gcagcccgat 4441 cccggaagaa aaggattacg ggttcaaccc cagatatacc ttcgaaagct ttgtgcaggg 4501 tcccaacaac cagctggcgc tggccgcctg cctcgccatc gcggataagg gatacgtaaa 4561 agagtacaac cccctcttcc tttacagcgg tcccggtctg gggaaaaccc acctgatgca 4621 cgctgtggga cagtatatta ttaagcattt cccgaaaaag cgcgtcatgt acgtctcctc 4681 ggaggctttc accaacgagc tggtgacgtc cattcaggaa aagagcaccg acaaattccg 4741 caacaagtac agaaaagtgg acgttctgct gttcgacgac gtgcagttta tctcgggaaa 4801 ggccgcgacc caggaggagc tgttccatac gttcaacgat ctgtacaacg cgagaaagca 4861 gatcatcttt acgtcggata agcctcccca ggaactggtg ggcatcccgg acaggctaac 4921 aagccgtttt ggacaggggc tttccgtgga tatcaatccg ccggaatacg aaacgaggtt 4981 tgccatcctg aaaaatctgg ctatcctctc caacgtggaa gtaacgccgg agatcgaaga 5041 tatgctggat ctgatcgccc agaacgtaac gacgaacatc cgcgacctgg aaggcgcctt 5101 tacgagagtg catgcttcgt cacagctgct ggggtcaccg atgaacaaag acctggcaaa 5161 gatggtcctt acggatatct ttaagaatac gaagacgaaa gagataacgc cggatatcat 5221 caagaaagaa gtttccaaat acttcggcgt aaaggtgtcg gacatggaaa gcgccaaccg 5281 ttccaaggac gttgcatttc caaggcagat cgccatctat ctcatccggg agcacacgaa 5341 ctattccctg ccccagatgg gaaagctgtt cggcggcaga gaccatacga cgatacggca 5401 cagctacgaa aaaatagcgg aagagatcaa aaaagataag gatctgcagg agacgatcga 5461 gacgatctac cgtcagatcg aaggatgatt ttccacagga tgtgtaaaac agggacttac 5521 ttttccacag cttttccatt ccgcgtccgc ttttctttca acggatgaga acggttatcc 5581 cccttttcca cagcctctat tactaaagct actaaaaata ctggaagaat ataaggagag 5641 ctcgcatgaa attcacatgt tctcagggcg ctttaacgag agcgctgaat acggtatcca 5701 aagcggtttc catccgtacg acgatcccca ttctcaaagg tatccttctt actgtcaaag 5761 gaaatgaact taccgttacg gcatcggatc tggacctttc catcgaaacg aagatggaag 5821 tacaggcagc ggaagaagga agcgccgtcg tttcctccaa actgttctcc gagatc // LOCUS sequence015 5855 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence015 VERSION sequence015 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5855 /mol_type="genomic DNA" /organism="" /note="sequence015" CDS complement(1012..1638) /product="histidine phosphatase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005903719.1" /transl_table=11 /codon_start=1 /translation="MKLLLIRHPQTEALKQRIIYGRTESPLTKEGSESIAWAADRLKTI DLAALYCSPQQRAKLLAEGIAAVHPELSLRIDERICELHCGIYEQMTFEEAVAVDAEDA NKFLYEFGFHRPKGGENFEDVKARTGPFLADLAAEAEKEGYGERPIAVVSHAMAIRSMI AHMTGFGLNDIWHIEIQPTGILEFDYQPEHKFGRLISMTGPASLI" /locus_tag="LOCUS_0820" /note="WP_005903719.1 histidine phosphatase family protein (Fusobacterium nucleatum) [pid:27.8%, q_cov:89.9%, s_cov:92.7%, Eval:5.6e-11]" /note="MGA_106" CDS complement(1635..2567) /product="DMT family transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963403.1" /transl_table=11 /codon_start=1 /translation="MKNKKMLGNILLTLTALIWGTAFVGQRVGMESIEPITFGAARMAL AAVAVGIVALIVIKKERANPSSAYSLKSPEEQKAYNRNTVVGGICCGIFLCAASSFQQM GIVYTTAGKAGFITAMYMLLVPIINFLFFKKKNTWLVWLAVLVGVCGMYLLCMTEGFSL TRGDTLVCICAVLFALHILCCDHFVQLGNPIGISAIQFATTSVISWVIAFIAEEPTWAK IVSAAIPILYCGLMSGGLGYTLQIVAQKFTDPTIASLLMSLESVFAVLAGALLLNERMT GRELLGCVIMFAAIVMVQIPLPEKKKENA" /locus_tag="LOCUS_0830" /note="WP_010963403.1 DMT family transporter (Clostridium) [pid:40.9%, q_cov:99.4%, s_cov:97.4%, Eval:1.8e-58]" /note="MGA_107" CDS complement(2584..3300) /product="DUF554 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011462325.1" /transl_table=11 /codon_start=1 /translation="MLGIFTGTIVNALTVVIGTAVGCVFKGEKLKRIGERVFQGFGLFT VMLGISGAIDLPQPLFMLASLIIGTAIGELADLDDKFNRLANWLQSKFAKEGDTGFANG FISGTLLFCVGSMTIMGALQSGLSNQHTIYYTKSVLDGFSACMFAMGSGMGVGFASLAV LIYQGALVALSSLLAPIMTEEILAVSTAVGSLSVLGLGLNMLGITKLKVANFLPAMFVP IVYQIIMVLFHLGSAL" /locus_tag="LOCUS_0840" /note="WP_011462325.1 DUF554 domain-containing protein (Desulfitobacterium hafniense) [pid:39.0%, q_cov:93.7%, s_cov:97.4%, Eval:1.5e-45]" /note="MGA_108" CDS complement(3318..5090) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNLCGFTMSFTTAGIHGLYAVMACFMWFVSLAFSLEYMHHYKHKP MYYAFLLATFGATAGVFLSADLLTTFVFFEVMSFTSYVLVIHDESKGAMRAGETYLAVA VIGGMVMLMGLFLLYDLTGTLKIAELPDACAPYAGSGRLYAAAICMLVGFGAKAGLFPL HIWLPKAHPVAPAPASALLSGILTKAGIYGMLIICCSMLAGDEHWAAAILALGAVTMFL GAFLALLSGNLKKTLACSSVSQIGFITTGIGIACLTNNLSEMASKGTVLHMVNHSLIKL LLFSCAGVVYMNLHKLALSDVRGWGRNKPLLGLYFAIGALTISGVPGTSGYISKTLLHE SIVEVIEELEHAGESIFLLKGLEWVFLISGGLTFAYMSRLFFCLFIRKNRAEEVQKRYN NKMHPYMNVLSACVIALPAIAMLCIGAVYWQHHYYTWTNLKGSLTSLAIGGLLCLLLKG RDLKELKFDLEDRVYRPLLLGVCVPLLGGVAKMLSAAGDVAAGLCVALMRTIAQALAGV IEGIMTRLNKGLLRQIQPHEERFSPMDWLRGRPIAQRWQEIRMDVLDSANSLSFGLLMA ILGLCVFLIYLVRN" /locus_tag="LOCUS_0850" /note="WP_048066018.1 proton-conducting transporter membrane subunit (Methanosarcina acetivorans) [pid:29.4%, q_cov:68.1%, s_cov:77.0%, Eval:4.5e-44, partial hit]" /note="MGA_109" misc_feature complement(5133..>5855) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_064242829.1:monovalent cation/H+ antiporter subunit D family protein" /note="WP_064242829.1 monovalent cation/H+ antiporter subunit D family protein (Ensifer glycinis) [pid:35.6%, q_cov:97.1%, s_cov:46.6%, Eval:9.7e-32, partial hit]" /note="MGA_110" /locus_tag="LOCUS_0860" ORIGIN 1 gcgtcgacgc cgtagcgctc ggcaagcaga tagggatcgg cgacgttgcc cttggacttg 61 gacatcttgc cgccgtcgat cagcagccag ccgtggccga gaacgtgctg cggaatgggt 121 tcgtcgatgc tcatcagcat ggcaggccag atgatggagt ggaatcttac gatctccttg 181 cctaccaggt ggtagtccac cggccagtac ttctcgtaga gttcggtgct ttcgccgttt 241 acgggaggat agcccagcgc ggtgatgtaa ttggtgagcg catccagcca gacgtagatg 301 acgtgctttt cgtcgatggg cacggggatg ccccagtcga agctgctgcg ggagatgcac 361 aggtcttcca ggccggcgtc gatgaacgcg agcatctcgt tgacgcgggt ctggggctgc 421 aggaagtcgg tcgtcgtaaa cagctctctc agcttgtccg cgtacttgga aagcttaaag 481 aagtaggctt cttccttggc tctgccgatc tttctgccgc agtccgggca gatgccgtcg 541 ggcgcctggg tgtcggtcca gaacgattcg cagtcggtgc agtaccagcc ttcgtaagcg 601 gatttataga tatcgccctt cgcgtacatg cggcggaaga cctcctgcac gcggacggtg 661 tgccgcggct ccgtcgtacg gataaagtcg tcgtaggaga tctccatggt cgcccagagc 721 ttcttgatgc ccgcgacgac gcggtccacg tattcctggg gggtgacccc ggcagcctgc 781 gccttcttct ggatcttctg gccgtgttca tccgtgccgg tcaggaagcg cacgtcgtaa 841 ccctgcagtc tcttaaagcg ggccatcgcg tccgccatga cggtgcagta ggtgtggccg 901 atgtgcaggt tgtcgctggg gtagtagatc ggcgtggtga tgtagaatgt cttgctgttg 961 tctttcatgt ttcctccttg tccgcacaaa tgggtgcgga tctaaagtat tttatatcag 1021 ggatgccggg ccggtcatgc tgatgagcct gccgaacttg tgttccggct gataatcaaa 1081 ttcgaggatc cccgtgggct ggatctcgat atgccagata tcgttgagtc caaagcccgt 1141 catgtgggcg atcatgctgc ggatggccat cgcgtgagag accactgcta tgggtctctc 1201 gccgtatccc tccttctccg cttctgcggc caggtccgcc aggaagggac cggtccgtgc 1261 ctttacgtct tcgaaattct cgccgccttt cggccggtgg aatccgaatt catacagaaa 1321 tttgttggcg tcctccgcgt cgaccgcgac ggcctcttcg aaggtcatct gctcgtagat 1381 gccgcagtgc agctcgcaga tgcgttcgtc gatgcgcaga gacaattccg ggtggacggc 1441 tgcgatgcct tccgccagca gcttcgcccg ctgctggggg ctgcagtaca gcgcggccag 1501 gtcgatcgtc tttaagcgat ccgccgccca ggcgatgctt tcgctgccct ctttcgtgag 1561 gggcgattcc gtgcgcccgt atatgatcct ttgttttaac gcctccgtct ggggatggcg 1621 tatcagtagt aatttcatgc gttttctttc ttcttttccg gcagcgggat ctgcaccatg 1681 acgatcgccg caaacatgat gacgcagccc agcagctctc tgccggtcat gcgttcgttc 1741 aggagcagcg cgccggccag caccgcgaag acggattcca ggctcatcag cagcgacgcg 1801 atggtcggat ccgtaaactt ctgcgctacg atctgcagcg tatagcccag gccgccggac 1861 atgaggccgc agtacagaat ggggatggcg gcagatacga tcttggccca ggtgggttct 1921 tcggcgataa aggcgatgac ccaggagatg accgaggtgg tcgcaaactg gatcgcggag 1981 atcccgatgg gattgcccag ctgcacgaag tggtcgcagc acaggatgtg cagcgcgaac 2041 agcacggcgc agatgcagac gagcgtgtcg cctctcgtga gggagaagcc ttccgtcatg 2101 cagagcaggt acatgccgca tacgcccacc aggacggcca gccataccag ccacgtgttc 2161 tttttcttga agaacaggaa attgatgatg gggaccagca gcatgtacat ggcggtgata 2221 aagcccgcct tgcctgcggt ggtatagacg atgcccatct gctggaacga actcgccgca 2281 cagaggaaga tgccgcagca gatgccgccg acgaccgtat tgcggttata tgccttctgt 2341 tcctctggac tcttcaggct gtacgccgag gacggatttg cccgctcctt cttgatgacg 2401 atgagggcga cgatccccac ggcgacggca gccagcgcca tgcgggccgc accgaacgta 2461 atgggttcga tgctctccat tccgacccgc tgacccacga aagccgtgcc ccagatgagg 2521 gccgtgaggg tgagcaggat gtttccgagc attttcttgt tcttcatgtt accttatatc 2581 cttttacagc gccgatccca gatggaacag caccatgatg atctgataga cgatgggcac 2641 gaacatcgcc ggcaggaagt tggcgacctt cagtttcgta atgcccagca tgttgaggcc 2701 gaggcccagg accgaaaggc ttcccaccgc cgtgctcacc gccaggatct cttccgtcat 2761 gatcggagcc agcaggctgg acagcgccac cagcgcgccc tgatagatca ggaccgcaag 2821 ggaggcaaat ccgacgccca tgccggaacc catggcgaac atgcacgcgg agaatccgtc 2881 cagcacgctc ttggtgtagt agatcgtgtg ctgattcgac aggccggact gcagcgcgcc 2941 catgatggtc atggagccca cgcagaacag cagcgtgccg gagataaagc cgttggcaaa 3001 gcccgtgtcg ccctctttgg cgaacttgct ctgcagccag ttggccagcc ggttgaactt 3061 atcgtccagg tccgccagtt cgccgatagc cgtcccgatg atgagggatg ccagcataaa 3121 cagcggctgc ggcagatcga tggcgccgga aatgcccagc atcaccgtaa agagaccgaa 3181 gccctggaag acccgttctc cgatccgttt cagtttttct cctttaaaaa cgcacccgac 3241 tgcggtgccg atgaccacag tcagcgcgtt gacgatcgtt cctgtaaaga ttccgagcat 3301 gtcttgctat attgccttta gttcctaacc agataaatga ggaagacgca cagtcccagg 3361 atggccatca gcaggccgaa gctcagggag ttggcggagt ccagcacgtc catgcggatc 3421 tcctgccagc gctgcgcgat gggacgtccc cgcagccagt ccatggggga gaaacgctcc 3481 tcgtggggct ggatctgccg cagcaggccc ttgttgagcc gggtcatgat gccctcgatg 3541 acccccgcca gcgcctgcgc gatcgtgcgc ataagcgcaa cgcagagccc cgcagcaacg 3601 tcgcccgcag cggagagcat cttcgcgacg ccgcccagca gcggaacgca cacgccgagc 3661 agcagcggcc ggtagacccg gtcttccaga tcgaatttca gttcctttag atctctgccc 3721 tttaagagca ggcacagcag cccgccgatg gcgagagacg taaggctccc cttcagattc 3781 gtccaggtgt agtaatggtg ctgccagtac acggcgccga tgcagagcat ggcgatggcc 3841 ggcagcgcga tgacgcacgc gctcaggacg ttcatatagg gatgcatttt attattatat 3901 ctcttttgta cctcttctgc acggttcttt cgaataaaca ggcagaaaaa caggcgcgac 3961 atgtaggcaa acgtaaggcc gccggagatg aggaacaccc attccagccc cttgagcagg 4021 aagatggatt cgcccgcgtg ctccagttct tcgatcacct cgacgatgct ctcgtgcagc 4081 agcgtcttgg aaatgtagcc gctggtgccg ggcacgccgg agatcgtcag ggcgccgatg 4141 gcgaaataga ggcctaaaag cggcttgttc cggccccagc cccgcacgtc ggacagagcc 4201 agtttgtgca ggttcatgta gacgacgccc gcgcaggaga acagcagcag tttgatgagg 4261 gaatggttga ccatgtgcag caccgtgccc ttggaggcca tctcgctcag gttgttcgtg 4321 aggcaggcga tgccgatgcc ggtggtgata aagccgatct gcgacacgga ggagcaggcc 4381 agcgtcttct tcaggttgcc cgacagcagc gccaggaaag cgccgaggaa catcgtgacc 4441 gcacccagcg ccaggatggc tgccgcccag tgttcgtccc ccgccagcat actgcagcag 4501 atgatgagca tgccgtagat gccggccttc gtgaggatgc cggaaagcag cgcagatgcc 4561 ggggcgggtg ccaccggatg cgctttgggc agccagatgt gcagcgggaa gagaccggct 4621 ttggcgccga agcccacaag catgcagatg gcggcagcgt acagcctgcc ggagcccgca 4681 taaggcgcgc aggcgtccgg aagttccgcg atcttcaggg tcccggtcag atcgtacagc 4741 aggaacaggc ccatcagcat caccatgccg ccgatgacgg cgaccgccag ataggtctcg 4801 ccggcccgca tggcgccttt cgactcgtcg tggatgacga gcacgtagga cgtaaacgac 4861 atgacttcga agaacacgaa ggtcgtaagc aagtctgccg acaggaacac gcccgccgtc 4921 gcgccgaagg tggccagcag gaaggcgtag tacatcggct tgtgcttgta gtgatgcatg 4981 tattccaggg aaaaggcaag ggaaacgaac cacatgaagc aagccatgac agcgtagagc 5041 ccatggatgc ctgcggtcgt aaaactcatg gtgaatccgc aaaggttcat gcagttttcc 5101 tcctttcccg aaatttcagt gtcgaatgtc tgttacagcc ccggaaatgc cgccgggaca 5161 acgccgccga taaaggcctg cagggcgccg gggaagcagc ccaggagcac gatggctgtg 5221 gtcaggacca ccaggggaac ggtcatatac cagttggctt cccgcacgct ctttaaggac 5281 cagggttcga agtccgccgg cgggaaatag gcccgcacgc agatcgtcag cagataggcc 5341 gccgtaaaga cggcggagac gagcagcgct gcgacccctg cataagccag ggcagacccc 5401 tgcgccagcg ccgcttctgc gatggcgtat ttgcttaaaa agccgcacag gggcggaatg 5461 cccgtaaggg ctaaagacgc gatcgtaaac gtggcgaaac ttaccggcat agccctgccg 5521 aagccccgca gatccgtcac gtagatgcgg ccgctctggt gcatcacggt accggccacg 5581 aagaacagca cgatcttcat caagccgtgg aacatcatgt ggagcagccc tgccgtaagc 5641 cctgacgggg tcaccagcag gaacgcgaac acgatgtacg acaggttcga gaccgtggaa 5701 taggccagcc gctttttaaa gtggatctcc ttccaggcca tcaccgtgcc gtagatgatg 5761 gtgaacgcgg agaacgccag cccgactttc tgcacgaagc tgccggaaag atagcccgcg 5821 tcgtaggtga aatagaccac ccgtccgatg gcgaa // LOCUS sequence016 5660 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence016 VERSION sequence016 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5660 /mol_type="genomic DNA" /organism="" /note="sequence016" misc_feature <1..514 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010920519.1:methionine ABC transporter ATP-binding protein" /note="WP_010920519.1 methionine ABC transporter ATP-binding protein (Caulobacter vibrioides) [pid:39.3%, q_cov:88.2%, s_cov:44.9%, Eval:3.2e-23, partial hit]" /note="MGA_111" /locus_tag="LOCUS_0870" CDS 504..1205 /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005459160.1" /transl_table=11 /codon_start=1 /translation="MFSNVFTPEQIEAAALCLKTEIPFAIWETLYITVLSTLLACVLGL PLGVLLVAGEKDGVRPLPSWLLHLLNGLINLLRSVPFLILMIMVFPLSRLLIGTAVGTK ATIVPLVVAAFPYIARLVEGNLRELDAGVIEAAQSMGATPWQIITKVMIPESVPGLLNS FTLALTTILGYSAMSGIIGGGGLGKIAINYGYYRYQYLIMYLAVILLVVLVQVFQSAGT KAVAKADKRLK" /locus_tag="LOCUS_0880" /note="WP_005459160.1 ABC transporter permease (Vibrio) [pid:44.9%, q_cov:88.8%, s_cov:91.6%, Eval:1.8e-48]" /note="MGA_112" CDS 1277..1546 /product="30S ribosomal protein S20" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009890686.1" /transl_table=11 /codon_start=1 /translation="MANIKSAKKRIGVIEKKTAINRRVKNSLKGIIKGFERAVATGDID TAKEKLALAEKKLMKAAAKGTIHKNAASRKVSRLTKAFNKAKAE" /locus_tag="LOCUS_0890" /gene="rpsT" /note="WP_009890686.1 30S ribosomal protein S20 (Clostridioides) [pid:52.3%, q_cov:98.9%, s_cov:100.0%, Eval:8.7e-18]" /note="MGA_113" CDS complement(1647..1997) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MQLIASRLKYLRDREEESQKQVAEALDIKLSTYKSYETARRRIPV DILRNAALHYEVTMDFIIGITDIPYSINKEDEEIMRKYYSLKEENQLRIQERIMTFYET EHPPKTLKDKNK" /locus_tag="LOCUS_0900" /note="MGA_114" CDS 2189..4000 /product="translation elongation factor 4" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003416556.1" /transl_table=11 /codon_start=1 /translation="MKDQQQFIRNFCIIAHIDHGKSTLADRLLENTGSVAQRDMKEQFL DNMDLERERGITIKLQTSRLVYKAKDGNEYIFNLIDTPGHVDFNYEVSRSLAACEGAVL VVDATQGVEAQTLANVYLALDEDLEIVPVINKIDLASARPDEAKQEIEDVIGLDASDAP LISAKEGINIEGVLEAIVEKVPAPNGDPEAPLKALIFDSYYDNYKGVVIYTRVFDGVLK AGDKIKMMNTGAVYDVTEVGVNAPYQTPVKELSAGSVGYVCASIKQVRDARVGDTITLA DRPAKEHLPGYKKVQPMVYCGIYPTPDEKYENVKDCLEKLQVNDAAFVFEPETSQALGY GFRCGFLGLLHMEIIVERLEREFDLEIITTSPSVIYKVVMHDGSEVMIENPSNLPNPTE YDHIEEPMVKATIMLPKDYVGSIMALCQDRRGNMTHMEYITEDRVALHYDMPLNEVIYD FFDALKSKTRGYGSLDYEFDRYERSNLVKLDILLNKEIVDAFSMIVHESKAYGRARFVC EKLKEVIPMHQFEVPIQAAIGQKVIARETVKAYRKDVLAKCYGGDISRKKKLLEKQKEG KKRMRQFGTVEVPQEAFTAVLKYDDNK" /locus_tag="LOCUS_0910" /gene="lepA" /EC_number="3.6.5.n1" /note="WP_003416556.1 translation elongation factor 4 (Clostridioides) [pid:73.2%, q_cov:99.7%, s_cov:100.0%, Eval:1.9e-255]" /note="MGA_115" CDS 3984..5234 /product="radical SAM family heme chaperone HemW" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392119.1" /transl_table=11 /codon_start=1 /translation="MTTTNKDGRILLTKHREDYLAENAQSSLKPLGLYLHIPFCVRKCN YCDFVSFPEQSGDVIEAYVGRLCEDIAAAGETYGSRYHVDTVFIGGGTPSLLTPQQLQR ILQAVDDAFLVGCEFAQNCGAGLKGCDGLEISMESNPGTFDAEKLRAFIDAGVNRLSIG VQSLDDDVLKRLGRIHDAGTALRAMRAAKSLNLNYNVDLMLGIPGQTLAVWEDTLKRTI AEEPKHISFYSLQLEMGTPFYRDFKEGRLTLPEWSENREMYHRALEVLKDAGYQHYEIS NAAIPGYECRHNLKYWTMQDYLGLGMAAHSFLAGRRCFTTSDLKEYLAGPAEAVWEESE PWDRKTDFVFTELRLIDGFKKEEYQNMFGCAFEDDFGPAYRNLLQEGRMEEKDGRVRLT PAGLDETNPVMEELLNV" /locus_tag="LOCUS_0920" /gene="hemW" /note="WP_011392119.1 radical SAM family heme chaperone HemW (Moorella thermoacetica) [pid:41.8%, q_cov:90.6%, s_cov:94.8%, Eval:3.3e-72]" /note="MGA_116" ORIGIN 1 cgaggcgact tccgcgcttg accccagcac cacccgccag atcctcagcc tcatcaagga 61 catcaacgcg aagaccggca tcaccgtggt ggtgatcacc caccagatga gcgtcgtgga 121 agagatctgc gaccacgtgg cgatcctgga cggcggcaga gtggcggagc agggacccgt 181 ttccagagtc ctgtcctccc cgcgttccga cgccggcaag cgtctggtct tcccgggccg 241 gacggacgag cgcatttcca tctccggcag agaccggcgc cttcgcatca tcttccggga 301 atccgccgcg accagtcttc ctctggtggc gacgatggca aaggaaaagg gcatcatcgc 361 cacggtgctc gaagccaata cccgcaaact gtccggagac gtatacggaa cgacgctcat 421 cggcctaccc gaaaacgatc tctacgaggc agcgaaattt ctgagttctt ttgaaaacgt 481 aagcgtagag gaggtgcccg ccgatgttca gtaacgtgtt tacccccgag cagatcgaag 541 cggcagctct ctgcctgaaa acggagatcc cgttcgcgat ctgggagacc ctgtacatta 601 ccgtattgtc cacgctgctg gcctgcgttc tgggcctgcc cctgggcgtg ctgctggtag 661 caggggagaa ggacggcgta agaccgctgc cttcctggct gctgcacctg ttgaacggtc 721 tcatcaacct gctgcggtcc gtaccgttcc tcattctgat gatcatggtg ttccctctgt 781 cccgcctgct catcggcacg gcggtcggaa caaaggccac catcgtaccg ctggtcgtcg 841 cagcgttccc ctatatcgcg cggctcgtgg agggcaatct gcgggagctg gatgcagggg 901 tcatcgaagc ggcccagtcc atgggcgcca cgccctggca gatcattacg aaggtgatga 961 tcccggagag cgtgcccggt cttttgaaca gctttacgct ggcgctgacg accatcctcg 1021 gctactccgc catgagcggc atcatcggtg ggggaggcct cggcaagatc gccatcaact 1081 acggctacta ccgctatcag tacctgatca tgtatctggc ggtcatcctc ttagtcgtgc 1141 tcgtacaggt gttccagagc gccggaacga aagcggtggc aaaggccgat aaaagattaa 1201 aatagcgctt gcaattccgc aaaatgccct gtatactcta ctggtgatat tttgtaaagt 1261 ggggtgaatc aaagaaatgg caaatatcaa atctgctaag aagagaatcg gtgttatcga 1321 aaagaagact gcgatcaaca gacgcgtcaa gaacagcctg aagggcatca tcaagggctt 1381 cgaaagagct gtcgccactg gcgatatcga taccgccaag gaaaagttag cactggcaga 1441 aaagaaactg atgaaggctg ccgctaaggg aaccatccat aagaacgcag cttccagaaa 1501 ggtttcgaga ctgaccaagg ccttcaacaa ggctaaggcc gagtaatctc acccgtcccc 1561 acacgcgcat aagttaaatg cgataaaagc ccggagtgtc tcccgggctt tttcctttgg 1621 ctcatattcc gtaaaggcct aaggccttac ttgtttttat cttttaacgt tttaggcgga 1681 tgttccgtct cgtagaacgt catgatgcgt tcctggatgc gcagctggtt ctcttcttta 1741 agagaatagt atttccgcat gatctcttcg tcctctttat tgatcgagta gggaatatcc 1801 gttatgccga tgatgaaatc catcgtcacc tcgtagtgca gcgccgcgtt gcgcaggatg 1861 tccacgggga tccttctgcg cgccgtctcg tagctcttat acgtggacag cttgatgtcc 1921 agggcttctg ctacctgttt ctgtgattct tcctctctgt ctctcagata tttcagtctc 1981 gaagcgatca gttgcatggg aagcgctcct ttctgtctca ttttagcgag agaaaagtta 2041 catatcgtaa ccaggatgcg ctattgttca aaaaggtgtc ataatgcaac tatttcgtgg 2101 ccggggaatg tgatcctaag ataaacggac ggacagccgc tgattatggt ataattattc 2161 tgtatatttg tgagaaaagg aaagcaacat gaaagatcaa cagcaattca tccgcaattt 2221 ctgcattata gcacatatcg atcacggcaa gagcacgttg gcagaccgcc tgctggagaa 2281 taccggcagc gtagcccagc gcgacatgaa ggagcagttc ctggacaaca tggatctgga 2341 acgggagcgc ggcattacga tcaagctcca gaccagccgt ctcgtgtata aagccaagga 2401 cggaaacgaa tatatcttca acctgatcga taccccgggc cacgtggact tcaactacga 2461 ggtctcccgc agcctcgcgg cctgcgaagg cgctgttctc gtcgttgacg ccacccaggg 2521 cgtggaagcg cagactctgg cgaacgtgta tctggctctc gatgaagatc tggagatcgt 2581 gccggtcatc aacaagatcg acctcgcttc cgcccgcccg gacgaagcga agcaggagat 2641 cgaagacgtt atcggtctgg acgcctccga tgcgcccctc atctccgcga aggagggcat 2701 caacatcgaa ggcgtgctgg aagccatcgt ggagaaggtc cctgcgccta acggtgaccc 2761 ggaagcgcct ctcaaggctc tgatcttcga ttcctactac gataattaca agggcgtcgt 2821 catctatacc cgcgtgttcg acggcgtttt gaaagccggc gacaagatca agatgatgaa 2881 caccggcgcc gtgtacgatg tgacggaagt cggggtcaac gccccgtatc agaccccggt 2941 aaaggagctt tccgccggat ctgtaggcta cgtctgcgcc tccatcaaac aggtgcgcga 3001 cgcccgggtc ggcgatacca ttacactggc ggaccgcccc gcgaaggagc atctgcccgg 3061 ctacaagaaa gtgcagccca tggtgtactg cggcatctat ccgacgccgg acgaaaagta 3121 cgagaacgta aaggactgtc tggaaaaact gcaggtgaac gacgctgcgt tcgtctttga 3181 accggagacg tcccaggcgc tgggatacgg cttccgctgc ggtttcctgg gcctgctgca 3241 catggagatc atcgtcgaac ggctggagcg ggagttcgac ctggagatca ttacgacgtc 3301 gccttccgtt atctacaaag ttgtgatgca cgacggctcg gaagtgatga tcgaaaaccc 3361 gtccaatctg cccaatccca cggaatacga ccacatcgag gaaccgatgg tgaaggcgac 3421 catcatgctg cccaaggatt acgtcgggtc catcatggcg ctgtgccagg accgccgggg 3481 caacatgacc cacatggaat acatcacgga ggaccgggtg gcgctgcatt acgacatgcc 3541 gctgaacgag gtcatctacg actttttcga cgccctcaag tccaagacga gagggtatgg 3601 ctccctggac tacgaattcg accgctatga gcgctccaac ctcgtaaaat tggacatcct 3661 gctgaacaag gagatcgtgg acgccttctc catgatcgtc cacgaaagca aagcctacgg 3721 cagagcccgt ttcgtgtgcg aaaaactgaa ggaggtcatc cccatgcacc agttcgaggt 3781 gccgatccag gctgcaatcg gacagaaggt gatcgcgcgg gagaccgtaa aagcctaccg 3841 caaagacgtg ttggccaagt gctacggcgg cgatatctcc aggaagaaga aactgctgga 3901 aaagcagaag gaaggcaaga agcgcatgcg ccagttcggt acggtggaag tgccgcagga 3961 ggcgtttacg gcggtgctga agtatgacga caacaaataa ggacggcagg atcctgctga 4021 caaagcacag agaggattat ctcgccgaaa atgcgcagtc ttcgttaaag ccgctggggc 4081 tctatctgca tatcccgttc tgcgtgcgca agtgcaatta ttgcgatttc gtgtcgttcc 4141 cggagcagag cggagacgtg atcgaggcct atgtcggaag gctttgtgag gatatcgcgg 4201 cagcgggcga aacgtatgga agccgctacc acgtcgacac cgtctttatc ggcggcggca 4261 cgccgtcgct tttgaccccg cagcagctgc agcgtatcct gcaggctgtg gatgatgcgt 4321 ttctcgtcgg ctgtgaattt gcgcaaaact gcggggcagg cttgaagggt tgtgacgggt 4381 tggagatctc catggagtcc aatccgggta ccttcgatgc agagaaactg agggcgttca 4441 tcgatgcagg ggtcaaccgg ctgagcatcg gcgtacagag cctggacgac gacgttctga 4501 aacggctcgg ccgcatccac gatgccggca cggccttgag ggccatgcgg gcagcaaaat 4561 cgctcaacct gaattacaac gtagacctga tgcttggtat ccccggccag accttagcgg 4621 tctgggagga tacgctgaag cgcacgatcg cggaggaacc gaagcacatc tcattctaca 4681 gcctgcagct ggagatgggc acgccgttct accgcgattt taaggaaggg cggcttactt 4741 tgccggaatg gagtgagaac cgggagatgt accaccgggc gctggaggtc ttaaaagacg 4801 ccggctacca gcattacgag atctccaatg cggccatccc gggttacgaa tgccggcaca 4861 acctgaagta ctggaccatg caggactacc tgggccttgg catggcggcc cacagctttc 4921 tggcagggcg caggtgtttt acgacgtcgg atctgaagga atatctggca ggccctgcgg 4981 aagctgtttg ggaagaaagc gagccttggg accggaaaac ggacttcgtg tttacggaac 5041 tccgcctgat cgacgggttc aaaaaagaag aatatcaaaa catgttcggc tgcgcgttcg 5101 aggatgactt cgggcccgct taccgaaatc ttttgcagga agggcggatg gaggaaaaag 5161 acggccgtgt acggctcaca cccgccggcc tggacgaaac gaatcctgtg atggaggaat 5221 tgctgaatgt ctaaatacgt gatggcgctg gatgcaggca ccacgagcaa ccgctgcatc 5281 atcttcgacc gcgagggcaa tcagatcgcg gtgtcgcaga aggaattcaa acagatctat 5341 ccccatcccg gctgggtgga gcacgacccg atggagatct gggcgaccca gctgggcgtg 5401 gcgcaggaag ccatcctgat ggcccgcacg gaggccaagg agatcgctgc gatcggcatc 5461 accaatcaga gagagacgac gatcgtctgg gataaaaaca cggggcttcc cgtctacaac 5521 gccatcgtgt ggcagtgccg ccggaccgcg gattactgcg agaccctgga gaaggattac 5581 gaggacatga tccgcgaaaa gaccggtctg aaggtcgacg cctacttctc cggcaccaag 5641 atccgctgga tcctggaaaa // LOCUS sequence017 5581 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence017 VERSION sequence017 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5581 /mol_type="genomic DNA" /organism="" /note="sequence017" CDS complement(1254..2240) /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963501.1" /transl_table=11 /codon_start=1 /translation="MKKYILKRVLLSILILFFVTLIIYTLIRCLPTSYIENIARQKSMQ PGSKSYEEWMEQLSAMYNLDTGILTGFFRWWGQMLRGNFGDSWVYTIPVTEEFNKTIWL SFVMGLITMFFEIIIAVPLGIIAATKQYSKTDYTISVIALAGISLPTFFFASLLKLVFS VKLGWFDLFGLVGRNYEQLDSFHQFLDKANHLVLPCVTLIVISIGGLMRYTRTNMLEVL NSDYIRTARAKGLSERKVIYHHAFRNTLIPLVTIIGGSLPGLFSGALITETLYAIPGIG YASYKAMVGGDIPFSMFYLTFLAILTLLGNLISDILYAVVDPRVRIS" /locus_tag="LOCUS_0930" /note="WP_010963501.1 ABC transporter permease (Clostridium) [pid:42.2%, q_cov:99.7%, s_cov:99.4%, Eval:5.7e-66]" /note="MGA_119" CDS complement(2348..4630) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDKLRKVLALMLALAMIFGLAACTSGGSGEQGGTDEPETNETPLV VGYSPFSSKFSPFFSETAYDQDVYAMTQISLLNSDRMGAVVEKGIEGTTIPYNGTDYTY YGPADVEITQNADGTVYYDFTLRDDLTFSDGTPITIDDVIFSYYVLCDPTYDGSSTLFA QPIEGMQEYRSGMDTLFNLLVEAGEDNTDYTFWDEATQTAFWADLNQAGEAFAQEIVDY CVDAGYATNVAEAASAWGFDGLAEDATAADFFALLCEDYGWDLASMSSTESAGSSLFDL MEGYDNYTVGVVTGNSADHISGIQKTGDYSMRVVMSQFDATAIYNLGVSIAPLHYYGDP AQFDYDNNQFGFPKGDLSLVRAKTTEPMGAGPYKFIKFENGVVYFEANESYYLGAPKTK YVNFQECMSDDDKLNGVITGTIDITDPSFSTDVIDAIEQANGGELSGAKIETNTVDNLG YGYIGISADIMNVGGKENKASDASKALRKAFGTIFSVYRDVAVDSYYGDRATVINYPIS NTSWAAPQSTDDGYKLAFSVDVDGNDIYTSDMSAEDKYAAAKQAALGFFEAAGYTVEDG KCVAAPEGAALEYEVWIPADGTGDHPSFMILTESRDALAELGINLVIRDLSNSSDLWTG LEAGSVPMWCAAWGATADPDMYQIYYADVEGGGAHAGGSNYMYDIADADLDQMILDARM SADQTYRKAMYKACLDTIIDWAVEIPVYQRQNAIIFSAERVNLDTVTPDITTFYGWMSE IQNTELK" /locus_tag="LOCUS_0940" /note="WP_000730661.1 ABC transporter substrate-binding protein (Bacillus cereus group) [pid:25.2%, q_cov:54.9%, s_cov:61.2%, Eval:9.2e-16, partial hit]" /note="MGA_120" ORIGIN 1 aattcctgct ctcttaagga caggatctgt ccgcggatca tgcgggcgac gcccggccag 61 gacaggaagc ccaggatgag catcaggtac atcatacgga cggtcgggtc gaccatctgc 121 gcatccatcg cagcgcctaa gatgatgagg ataggcgtgg acgggatgca gtagaagata 181 tccacgatac gcatgatgag gttatccacc cagccgccga agtagccgga gataccgccc 241 aggataacac ccagcaggtt tgcgatcagc tcgacgataa agccgatgat gagggaaact 301 ctgccgccgt acatcagacg ggtgagcatg tccatgccgt tgcggtccgt gcccagccag 361 tgttccttgc tgggcgccgc ataggtgtcg tacacctggc tctcgcggga ctgcttaacg 421 gtgtacttgt gggacgccgc attgtattcg atgacgtaat cggattcgac gccgtcggga 481 tcggtgaaat agaagtcctt atcgccggtc tccagcgctt ccaggagctg ttccttgaag 541 tctctcgtca ggaacacgtc gctcatcaga ggctgtacaa cgtagcggga gatgtagccg 601 atctcggtgc tgccttgggt cacgatgccg ttttcgtcca gatcgtagtc ggtgccgtct 661 acggtaaagc tggtctcccc tgtcgcatct gcgctgagag cttcgcggag gaaggtgtag 721 cttgccttga aggacggatc gctctcggag aacacgttct tgaaggcgag accgatctcg 781 gtgccgttcg ccagttttac gatgtagaag tcttcgccta cgggttccat cacgtaattg 841 acgcccttga aggagaactc attgacgcct ttctgcgtcg cgagcaccat ctgagcctgg 901 atgatggagg tgaattcctg gccgtcagcc acagcatagc ggaattccgt gttttcgatg 961 gcggagcagt actccttgct cagagaatcc acgcggtaga agcgctggtc ctgggagtag 1021 ggagagatga tgcctccgat aaaggagaac acgaacatga agatcaggat gaccaggccg 1081 accatggcga tgcggttgcg gaagaaccgc ttggcgacca tggcgcccgg ggacagaact 1141 ttaacgcgtc tgtcgtcgtt taaggaatac tgaggttcct tcttttctgc agtctcggct 1201 tccgcctgct gcacgtcttt cttgatctcg tcagacatgt cagaacctcc ttcctaagaa 1261 atacgcacgc gcggatccac gacggcatac aggatatccg agatgaggtt acctaatagc 1321 gtgaggatcg cgaggaacgt caggtagaac atggagaacg gaatgtctcc gcccaccatg 1381 gctttatacg aagcatagcc gatgccgggg atcgcataca gcgtctcggt gatgagagcg 1441 ccggagaaca ggccgggcag gctgccgccg atgatggtga ccagcggaat gagcgtattg 1501 cggaacgcat gatgatagat gaccttccgt tcggaaaggc cctttgctct cgcagtacgg 1561 atatagtccg aattcaggac ttccagcatg ttcgtacggg tgtagcgcat cagaccgccg 1621 atgctgatca cgataagggt gacgcagggc agcaccagat ggttcgcctt gtccaggaac 1681 tggtggaagc tgtccagctg ctcgtagttt ctgcctacga ggccgaacag gtcgaaccag 1741 cccagtttga ccgagaatac cagcttaaga agcgatgcga agaagaatgt aggcaaagaa 1801 atgcccgcca atgcgataac gctgatggtg tagtctgtct tgctgtattg cttcgtagcg 1861 gcgatgatgc cgagaggcac ggcgatgatg atttcgaaaa acatggtgat caggcccatg 1921 acgaagctca gccagatggt cttgttgaac tcctcggtaa cggggatcgt gtagacccag 1981 ctgtcgccga agttgccgcg gagcatctga ccccaccagc ggaagaagcc ggtcaggatg 2041 cctgtatcca gattgtacat ggccgatagc tgttccatcc attcctcata gctcttggag 2101 ccgggctgca tggacttctg ccgcgcgatg ttttcgatgt acgacgtggg cagacagcgg 2161 atcagcgtgt agataatgag agtgacgaag aaaagtatga ggatcgacag caatactctc 2221 ttcaaaatat actttttcac gggggttcct ccgtattcca gaataatagt tgtgccagca 2281 atgcagaggg gatcgctccc ctcgcactgc tggcgcaatg acaagccttt gtaaagcttt 2341 cagccgatta cttcagctcg gtgttctgga tctcgctcat ccagccatag aaggtggtga 2401 tgtcgggagt aacggtatcc aggttgactc tctcagcaga gaagatgatc gcgttctgtc 2461 tctgatagac agggatctcg acggcccagt cgataatggt atcgaggcag gccttgtaca 2521 tagccttacg ataggtctgg tctgcagaca ttctggcatc caggatcatc tggtcgaggt 2581 ctgcgtccgc gatatcgtac atgtagttgg agccgccagc gtgtgcgccg ccgccttcca 2641 cgtcagcata gtagatctga tacatgtcgg ggtcagccgt tgcgccccaa gctgcgcacc 2701 acatgggtac ggagccagct tccagaccgg tccacagatc ggaggagttg gagaggtcgc 2761 ggatgaccag gttgatgccc agttcagcca gagcatctct ggattcggtg aggatcatga 2821 aggaggggtg atcgccggta ccgtcggcgg ggatccaaac ttcatattcc agagcagcgc 2881 cttcgggtgc tgctacgcac ttgccgtctt ccacagtgta gcctgcagct tcgaagaagc 2941 ccagagcagc ctgcttggca gcagcgtact tgtcctcagc ggacatgtcg gaggtgtaga 3001 tgtcgttgcc gtctacgtcg acggagaacg ccagcttata accgtcgtcg gtggactggg 3061 gtgcagccca ggacgtgttg gagatcgggt agttgatgac agtagctctg tctccatagt 3121 aggagtcgac tgctacgtct ctgtagacgc tgaagatggt gccgaaggcc tttctcagag 3181 ccttggaagc atcggaagcc ttgttttcct tgccgccgac gttcatgatg tctgcagaga 3241 taccgatgta gccgtagccc aggttgtcaa cggtgttggt ctcgatctta gcgccggaca 3301 gttcgccgcc gttagcctgc tcgatggcgt cgatgacgtc ggtggagaag gacggatcgg 3361 tgatgtcgat ggtgccggtg ataacgccgt tcagcttgtc gtcatcggac atgcattcct 3421 ggaagttgac gtacttggtc ttcggagcgc cgaggtagta gctttcgttc gcttcgaagt 3481 agacaacgcc gttttcaaac ttgatgaact tgtaggggcc tgcacccatg ggttccgtgg 3541 tcttcgctct tacgagggag aggtcgccct tggggaaacc gaactggttg ttgtcgtagt 3601 cgaactgtgc gggatcgccg tagtagtgca gcggtgcgat ggaaacgccg aggttgtaga 3661 tcgcggtcgc atcgaactga gacatgacaa cgcgcatgga gtaatcgccg gtcttctgga 3721 taccggagat gtgatctgcg gagttaccgg taacgacacc aacggtgtag ttgtcgtaac 3781 cttccatcag gtcgaacagg gagctgcctg cggattcggt gctggacatg gaagccagat 3841 cccatccgta gtcttcgcac agcagagcga agaagtcagc agcggtagcg tcttctgcca 3901 ggccgtcaaa gccccatgcg gaagcagctt ctgcaacgtt ggtggcatag cctgcatcta 3961 cgcagtaatc aacgatctcc tgcgcgaagg cttcgccagc ctggttcagg tctgcccaga 4021 aagcggtctg agtcgcttcg tcccagaagg tgtagtcggt gttgtcttcg ccagcttcta 4081 cgagcaggtt gaacagagta tccataccgc ttctgtattc ctgcatgcct tcgatgggct 4141 gtgcaaacag cgtggaagaa ccatcatagg tcgggtcgca cagaacatag taggagaaga 4201 tgacgtcatc gatcgtgatg ggggtgccat cggagaaggt gaggtcgtct ctcagggtga 4261 aatcgtaata aacggttcca tctgcgttct gggtgatctc tacgtctgcc ggtccatagt 4321 aggtgtaatc cgttccgttg taggggatcg tcgtgccttc gatacctttt tcgacgacag 4381 cgcccatacg gtcggagttc agcagactga tctgggtcat tgcgtagaca tcctggtcgt 4441 acgcggtttc actgaagaac ggagagaact tgctggagaa cggagaatat cctactacca 4501 gaggagtttc attcgtctcg ggctcgtctg ttccgccctg ttcgccggag ccgccgctgg 4561 tgcatgcagc caggccaaag atcatggcca gagccagcat cagtgcgagc acctttctta 4621 gtttgtccat tgtttgtttt cctcctaaat agaaatgata caatacagtt agagttattg 4681 taccacagac acaagagcaa gtaaacaaag agtggaaatt ccttttcatt tttacacaag 4741 ttacggtaca atagaggcag ttcaaaccta tcgatcggag gaaaccatgg tcaaagaagt 4801 caatcccaag atacacgtaa acgagacgga ctaccctgtt tcgggtcaca cctgcgatga 4861 cccggagaag aaaaagctcg tcctgaaact cgcgcgcatg atcacggaca acatcccccg 4921 caagctgccc ggcggcatga aggaaaacca tatggatttc tggatcctgg accggctgct 4981 tacgaaggaa gaagtcaagt ttatgctcag cttcgaaaag cgccgcttcg gtcttacgac 5041 gcccgagctc gcaaagcgca acggcatgac ggaagaacag gcgcagaaga tcatcgatca 5101 cctgctgtgg atcggcatcc tggaacagaa ccgggacaat gccgaccagc atatccagta 5161 ctggatcccg aaatgggtcg taggatccgg cgaatatatg gtagaacacc ccaccctcac 5221 cgatacgaat ccggaagtgg ccacgatgtt caacctggcg ccccaggaac ctctggaact 5281 ggcggcaaag ctcatcccgc cgggaggcgc cggcatcggt atgcacgtca tcccggtgga 5341 ggaagccatc gacggggcat cccgctccgt ttccgtcgaa catctgtccc actggctgca 5401 taaatacgat aaattctgca ccatggtctg cgcctgccgc aaagcccagc gtgtgcgggg 5461 cgaaggcgtc gtagacatcg aaggctatat gtgcattggc gtcggagaca tcgcggaatt 5521 cctcgtggaa tccggcaagg atgcccacta catcacccgc gaagaggcca tggagatcat 5581 c // LOCUS sequence018 5541 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence018 VERSION sequence018 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5541 /mol_type="genomic DNA" /organism="" /note="sequence018" misc_feature <1..1634 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010966138.1:ATP-dependent RecD-like DNA helicase" /note="WP_010966138.1 ATP-dependent RecD-like DNA helicase (Clostridium) [pid:44.1%, q_cov:98.5%, s_cov:72.1%, Eval:9.0e-124, partial hit]" /note="MGA_122" /locus_tag="LOCUS_0950" CDS 1621..2352 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDWNNFLKDSGKAALAAVFPENIYCICCGDVTDPDSRSGLCLRCS EKLPWAFENPFRSYMDEFAFDDVWPCVRYGSYARKIMNGLKNGGQSYMAENVGQMLAER VQLEWDMPDLFVAVPSHRSKMQKRGYNQSELLAEAVAKRLKLPYQKGLLEKTRATASMR MADGRTRRSMLEDSFAVSSRFASLVPGKKVCLVDDVTTTGSTADACARALKAAGAAKVV LLVFGASSGYKKVEENGAAEP" /locus_tag="LOCUS_0960" /note="WP_027480036.1 ComF family protein (Deinococcus radiodurans) [pid:37.5%, q_cov:69.1%, s_cov:77.7%, Eval:3.4e-16, partial hit]" /note="MGA_123" CDS 2632..3441 /product="diadenylate cyclase CdaA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_106007069.1" /transl_table=11 /codon_start=1 /translation="MEFSDVIDVLIVAVIAYYVIRYVRSTRAAQLVYGLAIVLGVYLLS DVANLYTLNWLLKNLLSVGLIALVVVFQPELRRALEFLGRGRFTTRGFSLEKEKYNANI DILLRAIDYFAARKEGALIVVEHETALQDVADTGTMLDAQLTEPLIENIFYKGSPLHDG AVILRGNRILAAGCVLPLTENPNLSKDLGTRHRAGIGMTEVSDALVLIVSEETGIISMA KDGNLSRFLDLKAVEKALLNLYISKKPDITAVPRAGFSIFRKGGSDE" /locus_tag="LOCUS_0970" /gene="cdaA" /EC_number="2.7.7.85" /note="WP_106007069.1 diadenylate cyclase CdaA (Moorella) [pid:48.7%, q_cov:85.9%, s_cov:83.8%, Eval:1.1e-53]" /note="MGA_124" CDS 3434..4657 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNRDEIINRVAAIVLAIVLWVYVISVVNPPTTVTVRQVPVTLLNQ EYLDDSKLAIAGDGKYTVDVDLSGKRKDLILGPSDLSATADLSGLTPGQNYITVRVTSP SNTTVESIRTEKIQVYVDNLVSVAKPVVLDVANVPSDTEFTVLDLSQEQILVSGAKSLV DMVDHLTVHVDAGGLSVDEATEQQYALTPMDVEGNVVKAVKLESPFVSMSSTLYTVKSV PLYTRVDGAPGYGLELLSSSIPSTVSIKGTLLDLAKVNYVDAQPLDITDITTNTELPVV PILPDGISLASNNGDMTASFTLSDQASMQMEADSASIVLEYLPEGFTAAAEGEPFTMQV TVKGPVETIANLTADMFSYYVDLSAIEEAGEYDLPIVSGTTVGDSLEVVIEPAALHVLV EAITPEEE" /locus_tag="LOCUS_0980" /note="WP_011393730.1 CdaR family protein (Moorella thermoacetica) [pid:24.4%, q_cov:68.6%, s_cov:88.0%, Eval:6.4e-12, partial hit]" /note="MGA_125" ORIGIN 1 agacgctggg tttcgaccgg gagagtccgt tccggatccg ggcgggcttc ctgttctgca 61 tggaaaacct ggcggcggaa ggggatacct atgcgcctaa gcgcgaattt atcgagcgct 121 gtgcggaatt cctggacgtc tcccgcgaaa aagtcgaaga agccatggtg gaactggcga 181 tcggcggccg cgtgttcgcg gaagtgctgg acggcgaaga gatcctgcag ctctggcgtt 241 tccggcgggc ggagcagaag gtggcggcaa agctctttct gctgtgcaat acgccgctgt 301 cccacgtcac cgctgacgcg gaaaaactca ttcgcgccgg cgaaaaggaa agcggcatcg 361 aactgtctcc tctgcagaag gctgccgtgc tcacgtcgct gcaaaacggc gtatccgtca 421 tcaccggcgg tccgggcacg ggtaaaacga ccatcatcaa cacgatccta aagatcttaa 481 atgcatccgg cgtaaaaaca gcgttggcgg cacctacggg acgggctgcc aagcgcatga 541 cggagaccac cggtgaagag gccagcacca tccaccgcct gctggagtat tactattccg 601 aagagggcga cgagatgcgt ttcggcaaga cggaggaaga cccgctggac tacgactgca 661 tcatcatcga cgagatgtcc atggtggata tcctgctgat ggagggactt ctggcagcgg 721 taaagcccgg cacgcggctc atcctggtgg gtgacgccga ccagcttccc agcgtcggcg 781 caggcaacgt gctgcgcgac atcttagcct ccgagacggt gcaggccgtg cgcctgaagg 841 acatcttccg ccaggcggcg gagagcctca tcgtcgtaaa cgcgcaccgg atcaaccggg 901 gcgaatatcc cagctacaac gaaaagggga aggatttctt cttcctggag cgctaccgtg 961 aaccggagat ccgtgacacg atccgcgacc tgcttacgac gcggctcccc gcttactata 1021 aagactgcga tccccaggcg gacatccagg tgcttacgcc cacgaaaaag ggcatgctgg 1081 gcagcgtgga gctcaacaag ctgctgcagt ccgtgctcaa tccgcccggt ccgggcaaac 1141 acgaaaagca gttcggcgag cgcatctacc gggagggcga caaggtgatg cagaacaaga 1201 acgactacct gcttacctgg aaggatctgc gcgtttttac cgagggcagc ggcgtgttca 1261 acggcgatct gggggtcatc cgcacggtgg ataacgacat gggcatcgtg agcgtcgtgt 1321 tcgatgggta ccgcctggcg acctacgatt tctctaacct ggacgagatc gagacggcgt 1381 tcgccatgac ggtgcacaag agccagggct cggaattccc tgtggtggtc atgccggcgg 1441 cgcggtttgc gcccatgctg gcgacccgca acctgctcta tacggcggtg acccgcgcaa 1501 agaagggcgc cgtcctggtc ggcctgcccc aggcggtgaa cgccatggtg gacaacaacg 1561 ccatcgcggt gcgccattcc ggcctgaagg cgaggctcgt aaatctgtgg ggatttgcgg 1621 atggattgga ataacttttt aaaggactcg ggaaaggctg cgcttgctgc ggtctttccc 1681 gaaaatattt actgcatctg ctgcggcgac gtaacggatc cggacagcag gagcggtctg 1741 tgccttcgct gcagcgaaaa gctgccctgg gcgttcgaaa acccgttccg ctcctatatg 1801 gacgagtttg ctttcgacga tgtctggccc tgcgtgcgct acggttcgta tgcccgcaag 1861 atcatgaacg gcttaaagaa cggcggacag agctatatgg cggagaatgt cggacagatg 1921 ctggccgaac gggtgcagct cgaatgggac atgcccgatc tgtttgtggc cgtgccatcc 1981 cacaggagca agatgcagaa gcgcggctac aaccagtcgg aactgctggc ggaagcggtc 2041 gcaaagcgcc ttaaactacc gtatcagaag gggctgctgg agaagacccg cgccacggct 2101 tccatgcgca tggcggacgg ccgcacccgg cgcagcatgc tcgaggacag cttcgccgtt 2161 tcctcccgct ttgcctcgct ggtgccgggg aaaaaggtgt gcctggtgga cgacgttacg 2221 acgacaggca gcacagcgga cgcctgcgca agggccctga aggctgcggg ggcggcaaag 2281 gtggtgctgc tcgtgttcgg cgccagcagc ggctataaaa aagtggaaga aaatggtgca 2341 gcggaaccat aaaattgcac atcagaccgc tacatatggt ataatataaa gtcagaaaag 2401 tgttcccggg tctgcggttg caagtccagg ccagctatgg gcaaagggat ccacgtaagc 2461 cgtcagcaaa gatctgcggt gatcatggca tagcttagaa gtaagtcctc gggaaaatcc 2521 cggtaaaggc aagtgtgggg tcaaagaccg ggtcagccgg agatgctttt ctgaatctgg 2581 ttggaaaaag ggggaatcat gcaggatagg ataatgagca tcatatcggt cttggaattt 2641 tccgatgtga tcgacgtact catcgtggcg gtcatcgcct attacgtcat ccgctacgtc 2701 cgttccacgc gggcggcgca gctggtgtac ggcctcgcca tcgtgctggg cgtgtatctg 2761 ctctccgacg tcgcaaatct ctatacgctc aactggctgc tcaagaacct gctcagcgtc 2821 ggacttatcg cgctggtggt cgtgttccag ccggagcttc gccgtgccct ggaattcctc 2881 ggacgcggcc ggtttacgac ccgcgggttc tctctcgaaa aagaaaagta caacgcgaat 2941 atcgacatcc tgctccgcgc catcgattac tttgccgccc gcaaagaggg cgcgctcatc 3001 gtcgtggagc acgaaacggc gctgcaggac gtggcggata ccggcaccat gctggacgca 3061 cagctgacgg agccgctgat cgagaacatc ttctataaag gttcgcccct ccacgacggc 3121 gctgttatcc tgcgcggcaa ccgcatcctg gcggcaggct gcgtgcttcc gcttacggaa 3181 aacccgaacc tcagcaaaga tctgggcacg cgccacaggg caggcatcgg catgacggaa 3241 gtgtccgacg cgctggtgct catcgtctcc gaagagactg gcatcatctc catggcgaag 3301 gacggcaatt tgtcgcgctt cctggatctg aaagccgtgg agaaggcgct gctcaatctg 3361 tatatcagca agaagccgga catcaccgcg gtgccgcggg caggcttcag catcttccgg 3421 aaaggaggca gcgatgaata gagatgagat catcaaccgg gtcgctgcca tcgttttggc 3481 gatcgtcctg tgggtctatg tcatcagcgt ggtcaatccg ccgacgacgg taacggtgcg 3541 gcaggtgccg gtgaccctgc tcaatcagga atatctggat gattcgaaac tggccatcgc 3601 cggggacggc aagtatacgg tggacgtgga tctgtcgggc aagcgcaagg acctcatcct 3661 gggaccctca gacctgagcg ctacggccga cctcagcggc cttacgccgg gccagaatta 3721 tattactgtg cgggtcacct cccccagcaa cacgaccgtg gagagcatcc gcaccgagaa 3781 gatccaggtg tacgtggaca acctggtgag cgtggcgaag cctgtggtgc tggatgtggc 3841 gaatgtcccc tccgacacgg agttcaccgt gctggacctc agccaggagc agatcctggt 3901 ctccggcgcc aagagcctcg tggatatggt ggatcacctc accgtgcacg tggatgccgg 3961 cggactgtcg gtggatgagg cgacggagca gcaatatgcg cttaccccga tggatgtgga 4021 aggaaacgtc gtaaaggcgg taaaactgga gagtccgttc gtttcgatgt cctccacgct 4081 ctataccgtc aagagcgtgc ccctttatac gcgggtggac ggcgctcccg gctacggcct 4141 ggaactgctc agttccagca ttccctctac ggtaagcatc aagggaacgt tgctcgatct 4201 ggcgaaggtc aactatgtcg acgcccagcc gctggatatc acggatataa cgacgaatac 4261 ggaactgccg gtcgtcccca ttttgccaga cggcatctcg ctcgcttcga acaacggcga 4321 catgacggcc agctttacgc tgtcggatca ggccagcatg cagatggagg cggacagcgc 4381 ttcgatcgtt ctggaatacc tgccggaagg ctttacggcg gctgccgagg gagaaccgtt 4441 taccatgcag gtcaccgtca aaggtcccgt ggaaacgatc gcgaacctta cggcggatat 4501 gttctcctat tacgtggatc tgtccgcgat cgaagaggcg ggcgaatacg atctgcccat 4561 cgtttccggc acgacggtcg gagactccct ggaagtggtc atagaaccgg ctgcgctcca 4621 cgttctcgtg gaggcgatca cgccggaaga agaatagagt tcagaaagga aacagactat 4681 gggaaagtat tttggaacag atggattcag aggaaacgct aacgtagatc ttacagcgat 4741 ccatgccttc aagatcggac ttttccttgg gtggtactac gcgaaagacc cgaagatgaa 4801 acatgccgaa ggctataaag cgaacatcgt cctcggcaag gatacccggc tttccagcta 4861 tatgttcgaa gacgcgctgt ccgcgggcct cgcagcctcc ggcgcagacg tctatatgct 4921 gcacgtaaca tcgacgccca gcgttgccta cgttacgaga acgggagatt tcgactgcgg 4981 catcatgatc tccgccagcc acaatccgtt ccacgacaat ggcatcaagc tcatcaacga 5041 gaacggcgaa aagatgccgg acgacgttat cgcagacgtg gaagcctatc tggacggcgt 5101 atataagccc gaagggttcg aaggcgagac ctgggacgtg cctcttgcca ccggcagcga 5161 tatcggccag gtgatcgact attccgccgg ccgcaaccgc tacatcggct atctcatctc 5221 ccttgccacc acgtcctata aaggcaagtg gatcggattg gattgctcca acggcagcac 5281 atggcagatc gcccgcagcg tattcgacgc gctgggcgcc aagactttcg tcatcaacga 5341 cagacccgac ggcacgaata tcaacatggg ctgcggctcc acccacattg aagggctgca 5401 gaagctcgta aaggaaaacc gtctggactg cggcttcgcc ttcgacggtg acgccgacag 5461 atgcctcgcc gtggacgaaa acggcgatgt cgtgaatggc gacgagatca tgtacatgtg 5521 cgctaaatat atgaaggaaa a // LOCUS sequence019 5524 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence019 VERSION sequence019 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5524 /mol_type="genomic DNA" /organism="" /note="sequence019" misc_feature <1..583 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011057322.1:site-specific DNA-methyltransferase" /note="WP_011057322.1 site-specific DNA-methyltransferase (Thermosynechococcus vestitus) [pid:36.4%, q_cov:99.5%, s_cov:53.5%, Eval:1.3e-24, partial hit]" /note="MGA_127" /locus_tag="LOCUS_0990" CDS complement(580..1173) /product="lysine exporter LysO family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010868489.1" /transl_table=11 /codon_start=1 /translation="MMILILLVVLVAGFVSGRLGLFAFLAPLESEAVIYVLYAMVFAIS VGIGAQYRDGEGERLSFKALLYSVTTIAGSLLAAYLMSIVLPVSAKDALICASGMGWYS LSTGLVYTYSPSLSVATFVYCVSREVLSIFIMPLLIKKFRRPEVVAVGGTATIQSSVAC AAVTGDNTIVLYGLLVGTVISMLVPVLISFFMGI" /locus_tag="LOCUS_1000" /note="WP_010868489.1 lysine exporter LysO family protein (Pyrococcus abyssi) [pid:27.5%, q_cov:95.4%, s_cov:93.4%, Eval:2.9e-19]" /note="MGA_128" CDS complement(1170..1478) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKILLIYILIMGAGIALGYKTRFSSKSRTRDFFQKGCLLIILFLL GHQLGANEEVANSMTSMGLTGLLLCLAAMAGSFVVVLLLRIALEGRKSARSGEEEQR" /locus_tag="LOCUS_1010" /note="MGA_129" CDS complement(1499..2593) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="METNRTIRAIDLTKEFDEFEELSVISFGSGANPNQSMYRWLFDED PYDPASGNLMFVMRDMDAGGKMIASDGLIPFDLQLGSRTVRAAHSVKSMTHPDYKRQGI FRTMTQNSLDRGKENGVQLVLGFANKNSYPAYQKFGWTTIFPREVYVFPSDISRKVAAK TKSKLLGKLGNIAFRIVSDAKRAELHAAKRFTVQNFDKVPPEAAQLWEKYKDKYENLIV RDATYLHWRYDERPDRSYETLLLSGEEGPVGYLILRQSVANGKPMVCVAENFTDPDNTE YIGALAETLIAYCRRCRTAYAVVCSSLYGKYDEVFRRYGFVPQKGQGNIVIIKALDPTI SEAELAGAEHWHMSQGDGESELDL" /locus_tag="LOCUS_1020" /note="MGA_130" CDS complement(2662..4494) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRTTRKLITLIAALALLFTSVVPAFAADFTDLEGHWSKTFMERLV EKGIMAGYADKTVKPDKTLTAAEAFVMLANLYDLNDEAKAEIHKDFGEAVEKNADSKVK WAYPQLEICLAAEIFTESELKNITLTAEMPKQNLAVYMVRAIRKADDAAKLNDAKLDYK DAADITSKCLGSIALLTDMKVVSGDTNGNFTPKASVTRAVFATMLCNILDYLDKENIKL QIDDYLGLDSAEGILSSVSNTGIVVRGFDGIYHSFARDAELKTTVNGSAKTLSSSYAGD YIKVQSKEGKALIAAITEETNVSYKQGKLGTVASNTASIKLTDLATGASDSYVLSKAKI KQDGKEISFADLTKGAFLTLKVEKGTVTEVTSDTKEYTISGAVGIVSYDTIVTMTLKES ETAEAILYMDLADMPTIKRGSLSITVDRLSSSEEINARIKGGEVTRITTEGKDANASGV LTIITRTITDTTWTIKGDDGTSVTYAIDSAAAAFSGETAIKLDTINPGDEVSVIVTSGV ITEVNLKKSASPASDKLSAEILAVDPTNRVLTVLKEGKLTYINCKKAASILNSETGKTL SFSALAAGDMIVAYGSYTDSTNFAATSIVIELKH" /locus_tag="LOCUS_1030" /note="WP_113034874.1 DUF4838 domain-containing protein (Paenibacillus contaminans) [pid:25.8%, q_cov:30.5%, s_cov:10.2%, Eval:4.8e-12, partial hit]" /note="MGA_131" tRNA complement(4696..4772) /product="tRNA-Val" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0020" /note="Aragorn_2" ORIGIN 1 ccgtctgctg aaggacagcg gcaccatcgc cgtacatctg gactggcacg cggtacatta 61 cgtgaaggtg atgatggacg gcatcttcgg catgaacaat ttcctgaacg agatcatctg 121 ggcgtataag tccggcggcg cgacaggccg gcggttcgcc cgcaaacacg atacgatcct 181 ggtgtacgcg aagacagacg actattattt ccgtacgcag aaggagcggt cctacaaccg 241 ggacaacaag ccctatcatt ttaagggcgt ggaggaattt caggacgaag agggaaaatg 301 gtataccatg gtcaataaaa aagacgtcct cttcgtggat atggtgggaa ggacgtcttc 361 agaaagaacg gattatgcga cgcagaaacc ccaggcctta ctggacatcc tgctggagag 421 cctgtgcccg gagaacggtc tctgtgcaga ctttttcgcc ggttccggca cgctgggcgc 481 ctgcgcgctg gagagcggca gggaatgcct gctgtgcgat tccagcaggg aagcagtcga 541 tacgatcctg gaccggctgg ggatgtttgt gagggaagtt tagatcccca taaagaaact 601 gatcaggaca ggaacgagca tggaaatgac cgttcccacg agaagaccgt agagcacgat 661 cgtgttgtcg ccggtaacag cggcgcaggc aacactggat tgaatggtag cggttccgcc 721 gacggcaacg acttccggac ggcggaattt ttttatgagc agaggcatga tgaagatgga 781 caacacttcc cggcttacgc agtagacgaa ggtcgcgacg gagagggaag ggctgtaggt 841 gtagacgaga cccgtggaca gggagtacca gcccatgccg gaagcgcaga tgagagcatc 901 tttcgcggag accggcagaa cgatagacat aaggtatgct gccagcagag accctgcgat 961 cgtcgtgacg gaatacagaa gcgccttgaa agagagccgt tctccttcgc catcccggta 1021 ttgggcaccg atgccgacgg agatcgcaaa gaccatggcg tagagcacgt agatgacagc 1081 ttccgattcg aggggcgcaa gaaacgcgaa aagcccgagc ctgccggaga cgaatcctgc 1141 gacgagaact acgagaagga taagtatcat catctctgct cctcctcgcc gctgcgggcc 1201 gattttcggc cttccagggc tattctgagc agaaggacca ccacaaaaga acccgccatg 1261 gcagccagac agagcagcag gcctgtaaga cccatagacg tcatggaatt ggcgacttcc 1321 tcgttcgcgc ccagctggtg acccaacaga aacagaatga tgagcagaca gcctttctgg 1381 aaaaagtcgc gcgttctgct cttggaagaa aagcgcgtct tatagcccag cgcgatgccg 1441 gctcccataa tgaggatgta gatcagcagg atcttcatag acgtcttttc ctttgctgtt 1501 acagatccag ttcgctctca ccgtcgccct ggctcatgtg ccaatgctcg gcacctgcca 1561 gctccgcctc ggagatggtg gggtcaagcg cttttatgat gacgatattg ccctggccct 1621 tttgcggcac gaaaccgtaa cggcggaaca cttcgtcgta ttttccgtac agggaactgc 1681 agaccacggc gtaggcggtc ctgcaccggc ggcagtaggc gatgagggtc tccgccagcg 1741 caccgatata ctccgtattg tccgggtcgg tgaagttctc tgcgacgcag accatgggct 1801 tgccgttcgc gacgctctgc cgcaggatga ggtagccgac gggaccttct tccccggaca 1861 gcagcagcgt ctcataggac cggtccggtc tttcgtcgta gcgccaatgc agataggtgg 1921 cgtctctcac gatgaggttt tcgtatttat ccttgtactt ttcccagagc tgcgccgctt 1981 cgggcggtac tttatcgaag ttctgcacag taaagcgctt tgcggcgtgc agttcggcgc 2041 gcttagcatc cgaaacgatg cggaacgcga tattgcccag ttttcccaat agtttgctct 2101 tcgtctttgc cgcgactttt ctgctgatat ccgacggaaa gacgtagact tcccgcggga 2161 agatcgtcgt ccagccgaat ttctgatagg cggggtagga gttcttattc gcgaaaccca 2221 gcacgagctg tacgccgttt tccttgccgc ggtccaggga attctgcgtc atggtgcgga 2281 agatgccctg gcgtttatag tccggatggg tcatggactt gacggaatgc gcagcgcgga 2341 ccgtgcggct gccgagctgc agatcgaagg ggatgagccc gtcagaagcg atcattttgc 2401 cgccggcatc catgtcgcgc atgacgaaca tcaggttgcc gcttgcggga tcgtagggat 2461 cttcgtcgaa cagccaccgg tacatggact ggttggggtt ggctccggat ccgaacgaga 2521 tcacgctgag ctcttcgaat tcgtcgaatt cttttgtaag gtcgatcgcc cggatcgttc 2581 tgttggtttc catgaaagta ccatgatatg agaaggccgc ccggcagggc cggacggctc 2641 ttctgaaaac aagtgtgtaa actagtgctt taattcgatg acgatggacg tcgctgcaaa 2701 gttcgtggaa tcggtgtagg aaccgtaggc cacgatcatg tcgccggctg cgagcgcgga 2761 gaagcttaag gtcttgccgg tctcgctgtt gaggatggaa gccgctttct tgcagttgat 2821 gtaggtgagt ttgccttcct tgagcacggt gagcacacgg ttcgtcgggt cgacggccag 2881 gatctcggcg ctcaacttat cggaagcggg ggaggcggac ttcttcaggt tgacctcggt 2941 aatgacgccg gaggtaacga tgacggaaac ttcgtcgccc gggttgatgg tatcgagctt 3001 gatggccgtc tcgccgctga aggctgccgc cgcgctatcg atcgcgtagg tgacgctggt 3061 accgtcgtcg cccttgatgg tccacgtggt atccgtgatg gtgcgggtga tgatggtgag 3121 cacgccgctg gcattggcat ctttgccttc cgtcgtgatg cgggtaactt cgccgccctt 3181 gatgcgggca ttgatctctt cgctggagct caggcggtcg acggtgatac tcagggagcc 3241 acgtttaatg gtgggcatat cagccagatc catgtagagg atggcttcag ccgtttcgct 3301 ttccttgagg gtcatcgtga cgatcgtgtc gtagctgact atgccgacag caccggagat 3361 cgtgtattcc ttcgtatcgg aggtgacttc cgtgacggtg cctttttcga ccttcagcgt 3421 gaggaatgcg cctttagtga ggtctgcgaa gctgatctcc ttgccgtcct gcttgatctt 3481 tgccttgctg agcacgtagg agtcggaggc gccggtggcc agatccgtca gcttgatgga 3541 agcggtattg gaggctacgg tgccgagctt gccctgttta taggaaacgt tggtctcttc 3601 cgtgatggct gcgatgagcg ctttgccttc cttggactgg accttgatat aatcgcctgc 3661 ataggaggag gaaagggtct tggcgctgcc gttgaccgtg gtcttcagtt cggcatctct 3721 tgcaaagctg tggtagatgc catcgaatcc gcgtacgacg atgccggtgt tggaaacgga 3781 ggaaagaatg ccttctgcgg aatccagtcc gagataatcg tcgatctgca gcttgatgtt 3841 ttccttatcc aggtaatcga ggatattgca gagcatggtg gcaaacaccg ctctcgtgac 3901 gcttgccttc ggcgtaaagt tgccgttcgt atcgccgctc accaccttca tgtcggtgag 3961 aagcgcgatg ctgcccaggc acttggacgt gatgtccgct gcgtctttat aatccagttt 4021 cgcatcgttc agcttggctg cgtcgtccgc cttgcggatc gcacgcacca tatagacagc 4081 cagattctgc ttcggcatct ccgcagtgag cgtgatgttc ttcagctcgg attcggtaaa 4141 gatctccgcc gcaaggcaga tctcgagctg cggataagcc catttgactt tgctgtccgc 4201 gttcttttcg acggcttctc caaaatcttt gtggatctcc gccttggctt cgtcgttcag 4261 gtcgtacagg ttggccagca tgacgaacgc ttccgctgcc gtaagcgtct tatccggctt 4321 tacggtcttg tccgcgtatc ctgccatgat gcctttttcg accagtcttt ccataaaggt 4381 cttggaccag tgaccctcca gatcggtgaa gtcagccgcg aaagcgggga cgacagaagt 4441 gaagagcagg gccagtgctg cgatgagcgt gatgagtttt ctcgtagtgc gcatagtggc 4501 ttcctcctta tgcaaataga tctctaatta caatctattc tattatatat cacattacag 4561 gatagtgtat atttttttga aaatttttgc ggaaaaacac aagaagtggt ggtctttgcg 4621 gttaacagaa gtttgttata cgacgatctg cagagaaaag gaaagacccg ggctgctttg 4681 cagtccgggt ctcgttggtg cgccatacag gactcgaacc tgtgacctcc tgcacgtcaa 4741 gcaggcgctc taaccaactg agctaatgtc gcgtatttga agtcaacaca aatatattag 4801 cgcaacagaa acagaaaagc aaggactttt tcccgaaaag agaaaaagtc ctgtatttca 4861 gctatttcga cagttcgatg gggatgcagc tgaagtctgt tccggtcacc gcccagggcg 4921 tttcgacgtc gaggacgaga tagagcgtgc cggccgccgc gtccagataa tacttctggg 4981 tgtggttaag accagggaag gcggtgaccc gcacaccagc cggcgccgcg ccttccgggg 5041 gaccgaacgt gtcctcgtcc tgatagaccg tgtccgcgtt ctgacgcagg tattgcccgg 5101 tctgcccgtc cagcgaagcg agcggggcga aagccgagat cagaacgtct ttccccgttg 5161 ccgggtcgat gttcatggtc tcgcatacgt tgaagaacag cgtctgcgtt ttgccgtctt 5221 ttcctgcggg cacttcgcag tccatgctgc aggtgaagac gatggagagc aggtcgctgc 5281 tggatgcggt cacgcgggtg tagacggtct tgtagcggca gctttcgggc gcaaggccgg 5341 ctgccttata ggtctcgatc ccctgaagat cgggaagata ggcggggtcg cagaggcggt 5401 ccagcttgct gcggatccgt tcgtttaccg ccttttccac gttgctgtcg gcaaatccgc 5461 gaacttcggc tcccatggca tagatgcggt catcttcctg atagacgctg tatgccacgg 5521 cgag // LOCUS sequence020 5471 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence020 VERSION sequence020 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5471 /mol_type="genomic DNA" /organism="" /note="sequence020" CDS 117..1253 /product="alanine racemase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963814.1" /transl_table=11 /codon_start=1 /translation="MEKWMNRPAWVEIDLRKFDSNVKLIKSRIAPGAQMLAVVKADCYG HNMRECYKVLKENDIHNFGIASISEGIELRSYGDPTDRVVLFALVPPLFVEAVCDYNIV TLVQNLEYAKALSGEAVKRGITMEVMGCVDTGMGRIGYQWDDPAVVDELAEAASYPGLK MIGIFSHLSCEDFEDKYWSDLQHQRFEGVRKALEERGVDMSLSSLANSPATSHRPQLHY GLVRPGGSLFGRYQNCCVELPGIQPVMSIKANIVQLKSVPDNFSISYERSGRTSRPSKI ATLGLGFADGLVRYWGAGRGKVIVNGCFAPTIGNMCMDQFMIDVTDVPDVKVGDECILV GSDGKLEIRIEEMGSVCSTLGNEITCGMPIRLPYKFIR" /locus_tag="LOCUS_1040" /gene="alr" /EC_number="5.1.1.1" /note="WP_010963814.1 alanine racemase (Clostridium) [pid:34.5%, q_cov:98.4%, s_cov:95.9%, Eval:1.1e-58]" /note="MGA_133" CDS 1260..2531 /product="voltage-gated chloride channel family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011037141.1" /transl_table=11 /codon_start=1 /translation="MKPIHKRLRIDPNLRVDSELRDKLSYRSVDVLQWCVYAVVVGIIC GTIATAFGMVIDAATEARKTYDWFVWLMPLAGVCIVALYHAAGITKPMGTNRVLLAVKE EEGVAIRMAPLIYVSSMLTHLTGGSSGREGAALQIGGSIANFIGRQFKLSHLDLRTITM CGMAAGFSGLFGTPLAAGIFAMEVAEGSLHYAVLFPCLLSSIVARVTAETFGVPATSFT VTGYPDLTLRTTAAALVFGVLCALLSILFVETLHCIDWTYAHYLKNPYLRIIVAGLIVA TATTLLGTRDYNGAGTEVIVRALQGEAEPLAFLFKILFTALTLEAGFKGGEIVPTFFIG ATFGCVAAPLLGLDPSFAAALGMTGLFCGVTNCPVASILLSFELFGGDSLVLFALCCSV SYMLSGHYSLYTVQRLEQDKFHLE" /locus_tag="LOCUS_1050" /note="WP_011037141.1 voltage-gated chloride channel family protein (Xanthomonas campestris) [pid:37.2%, q_cov:92.9%, s_cov:89.8%, Eval:2.8e-74]" /note="MGA_134" CDS 2560..3045 /product="tRNA adenosine(34) deaminase TadA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002287154.1" /transl_table=11 /codon_start=1 /translation="METHEEYMRIAIEEAKIAASLGESPIGAVIVQDGKVVGRGHNTTE TAKDPTCHAEMNAIRDAARNLGGWRLPHCSMYVTLEPCSMCAGAIVLARIEQLYIGTAD PKSGACGSLRNIVSDERLNHRVEVHTGVLQEECSGLLKDFFKQLRKKKNKTPEEQQV" /locus_tag="LOCUS_1060" /gene="tadA" /EC_number="3.5.4.33" /note="WP_002287154.1 tRNA adenosine(34) deaminase TadA (Enterococcus) [pid:50.6%, q_cov:95.7%, s_cov:90.1%, Eval:4.9e-44]" /note="MGA_135" CDS 3042..3953 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRKRFPALLMAVLIVLASASLAFASGLEIVDISPADGSKGYQPAN MAVKIHFSEDMMDEDAIAANAGKFLIQDAEGTEQPYDIVYNADKYPNELWLVLQGDLQP DSEYTVTIEPGVVSSSGSTLADGMTTTFFTRNTRTDGLISMGLMVVLMVAMFGMTARAA RKQQEEEDPRAAEKAIEDSLNPYKIAKQKGISVEEAQAIVAKEKDKLEKKKAKAEADRI KREEIKAEERRKMEEELEFFGTDDSELKKELREEGIYLVKAPKSIKEAGGRIPRSVRQH NEAKRKKAAEKLKRAQRNKKKK" /locus_tag="LOCUS_1070" /note="MGA_136" tRNA 3990..4064 /product="tRNA-Arg" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0030" /note="Aragorn_3" CDS 4425..4985 /product="DUF3793 family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002681044.1" /transl_table=11 /codon_start=1 /translation="MSEETLVAHCSPVLAGLKTANMFNVECSDAQILCLQLRDLNLRLG PKGVRILPLRFSSSRALLYLYRPSRLQKDLQDETAVEILKNYGYPQNSKGGCLGHLFRR LRSSDTFPHEIGLFLGYPPKDVKGFIEEGPRCAKCTGCWQVYGDEEKALKTFERYRKCT EVYCAQVSCGKSLERLTVKEKAN" /locus_tag="LOCUS_1080" /note="WP_002681044.1 DUF3793 family protein (Treponema denticola) [pid:33.2%, q_cov:93.5%, s_cov:93.3%, Eval:3.7e-18]" /note="MGA_137" CDS 5007..5189 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSKIAVVYWSGTGNTEAMANAVFEGAKSKDPEAKLFTAAEFGPDQ MDNFEACKALGAALA" /locus_tag="LOCUS_1090" /note="WP_002666607.1 flavodoxin (Treponema denticola) [pid:50.8%, q_cov:95.0%, s_cov:42.1%, Eval:9.6e-12, partial hit]" /note="MGA_138" ORIGIN 1 gcgccggtca ccaatgcgat ttttgccatg ggaaacctcc gatctcattg aaatcctacc 61 acttaaaaga tatactaaaa ctgtaattta cgcaatcgac gggaaaggag caggcgatgg 121 aaaagtggat gaaccggccg gcatgggtcg agatcgatct cagaaagttc gacagcaacg 181 taaaactcat caagtccagg atcgcgccgg gagcgcagat gctggcggtg gtcaaagcgg 241 actgctacgg ccacaacatg cgggagtgct acaaggtgct gaaggaaaac gacatccata 301 atttcggcat cgcctccatc tccgagggca tcgaactgcg cagctacggc gatcccaccg 361 accgcgtggt gctgtttgcg ctggtgccgc ccctcttcgt cgaggccgtc tgcgactaca 421 acatcgtgac cctcgtccag aacctggaat acgcgaaagc cctgtcgggc gaagccgtta 481 aacggggcat caccatggaa gtcatgggct gcgtcgatac cggcatgggc cgcatcggct 541 atcagtggga cgaccccgct gtggtggacg aactggcgga agcagcaagc tatcccggcc 601 tcaagatgat cggcatcttc tcgcacctgt cctgcgaaga cttcgaggat aaatactgga 661 gcgatctgca gcaccagcgc ttcgaagggg tgcgcaaggc cctggaagag agaggcgtgg 721 acatgtccct gtcctcgctg gcgaactctc ctgcgacctc ccaccggccg cagctgcact 781 acggtctggt ccgtcccggc ggaagcctgt tcggccgcta ccagaactgc tgcgtggaat 841 tgcccggcat ccagcccgtc atgtccatca aggcgaacat cgtgcagctg aagagcgttc 901 ccgataactt ctccatcagc tacgagagaa gcggacgtac cagccggccc tccaagatcg 961 cgacgctggg cctcggcttt gccgacgggc tcgtgcgcta ctggggcgcc ggacgcggta 1021 aagtcatcgt caacggctgc tttgcgccca ccatcggcaa catgtgcatg gaccagttca 1081 tgatcgacgt tacggacgtg cccgacgtaa aggtcggcga cgaatgcatc ctcgtcggct 1141 ccgacggcaa gctggagatc cgcatcgagg agatgggaag cgtctgcagc accctgggca 1201 acgagatcac ctgcggcatg ccgatccgcc ttccctataa attcatcaga taagtacgaa 1261 tgaaacctat ccacaaacgg ctccgcatcg acccgaacct gcgggtcgac agcgagctgc 1321 gagacaagtt atcctaccgg tccgtagacg tgctgcaatg gtgcgtctac gctgttgttg 1381 tgggcatcat atgcggcacg atcgccacgg ccttcggcat ggtgatcgac gcagcgacgg 1441 aagccagaaa gacctacgac tggttcgtgt ggctcatgcc cctggccggc gtctgcatcg 1501 tggcgctgta ccacgctgcg ggtattacga agcccatggg caccaaccgg gtgctgctgg 1561 cggtcaagga ggaggagggc gtagccatcc gcatggcgcc cctcatctac gtttcctcca 1621 tgctcaccca ccttacaggc ggttcttccg gcagagaggg ggctgccctg cagatcggcg 1681 gctccatcgc caattttatc ggccggcagt tcaaactcag ccatctggac ctgcgcacca 1741 tcacgatgtg cggcatggcg gcgggcttct ccggtctgtt cggcacgccc ctggcggcgg 1801 gcatcttcgc tatggaggtg gcggaagggt cgctgcacta cgcggtgctg ttcccctgtt 1861 tgctgtcgtc cattgtggcg cgggtcacag ccgagacctt cggcgttccg gcgacatcct 1921 ttaccgtgac gggctatccg gacctgaccc tgcgcaccac tgcggcggct ctggtgttcg 1981 gcgtgctgtg cgcgctgctg tccatcctgt tcgtggaaac gctgcactgc atcgactgga 2041 cctacgcgca ttacctgaaa aatccgtatc tgcgcatcat cgttgcaggc ctgatcgttg 2101 cgaccgccac tacgctgctg ggcacccggg attacaacgg ggccggcacc gaggtgatcg 2161 tgcgggcgct gcagggggaa gcagagccgc tggcgtttct gtttaagatc ctgtttaccg 2221 cgcttacgct ggaggcgggc tttaaaggcg gcgagatcgt gcccacgttc tttatcggcg 2281 ccacgttcgg ctgcgtggcg gcgcctctcc tggggcttga tcccagcttc gctgcagccc 2341 tcggcatgac cgggctgttc tgcggggtca cgaactgtcc cgtggccagc atcctgctgt 2401 ccttcgagct gttcggcggc gacagcctcg tgctgttcgc cctctgctgc agcgtttcgt 2461 acatgctgtc cggccattac agcctgtata ccgtgcagcg gctggagcag gataagttcc 2521 accttgaata gaccctttgg tttatgataa aataacaaaa tggaaactca cgaagagtac 2581 atgcgcatag ccatcgaaga ggcgaagatc gcggcgtctt tgggggaatc tcccatcggt 2641 gccgtcatcg tgcaggacgg gaaagtcgtt ggacggggtc acaacaccac ggagacggcg 2701 aaagacccca cctgccacgc cgagatgaac gccatccgcg atgccgctcg gaatttaggg 2761 ggctggcggc tgccgcactg cagcatgtac gtgaccctgg agccctgcag catgtgcgcc 2821 ggcgccatcg tgctggcccg catcgagcag ctctacatcg gcaccgcgga tccgaaatcc 2881 ggtgcctgcg gatctcttcg caacatcgta tccgacgaaa gactcaacca ccgggtggaa 2941 gtccacacgg gggtcttaca ggaagaatgc agcggccttt taaaggactt cttcaaacag 3001 ctgcgcaaga aaaagaacaa aaccccggag gaacaacaag tatgagaaaa agattccctg 3061 ccctgctgat ggcagtcctc atcgtcctgg cgtccgccag tctggcgttc gcgtcgggcc 3121 tggagatcgt cgatatctcg ccggccgacg gcagcaaggg ctaccagccg gccaacatgg 3181 cagttaagat ccacttttcc gaagacatga tggacgaaga tgccatcgcg gccaatgcgg 3241 gcaaattcct gatccaggat gcggaaggca ccgagcagcc ctacgacatc gtctacaacg 3301 cggacaagta tcccaacgaa ctgtggctcg ttctgcaggg cgatctgcag ccggattctg 3361 aatacaccgt aacgatcgaa cccggcgtcg taagcagttc cggcagcacg ctggccgatg 3421 gcatgacgac gacgttcttc accagaaaca cccgcaccga cggcctcatc tccatgggcc 3481 tgatggtggt gctgatggtg gccatgttcg gcatgaccgc aagagccgcc agaaagcagc 3541 aggaagagga agatccgaga gccgcagaaa aggcgatcga agacagcctc aatccctata 3601 agatcgcgaa gcagaagggc atctccgtag aggaggccca ggcgatcgta gccaaggaaa 3661 aggataaact ggagaagaag aaggccaagg ccgaagcgga ccgcatcaag cgcgaagaga 3721 taaaggccga agagcgcaga aagatggaag aagagctgga gttcttcggc acggacgatt 3781 ccgaactgaa gaaggagctc agagaggaag gcatctacct cgtcaaggcg cccaagtcca 3841 tcaaggaagc gggcggccgc atccccagaa gcgtgcgcca gcacaacgag gcgaagcgca 3901 agaaggctgc ggagaagctg aagagagcgc agcgcaataa gaaaaagaag taaaagaaac 3961 gggctggctt tgcggccggc ccgcgttatg ccctcatagt taaatggata taacggaggt 4021 ttcctaaacc tttgttcgtg gttcgattcc gcgtgggggt gccagtgaag gatgatcctg 4081 ggaagggtca tcctttttta tgtttttgtt ttatatttcg cctcggggtc ctgtcaccca 4141 acacatcctc atcttcgctc attcgcttgg ccgcgacggg agcagactcg gatgtcgcgg 4201 cgcccgctca atcgctcgat gagcctcttt gggtgccacc cctcggcgta aggtttaaca 4261 ttttttttaa aaagccttga caagatgttg gagatagtgt ttaatgaaag agaagttagc 4321 aatggctaac taattatttg gggaaatggt tagttgccac taactcaagg aacgtattag 4381 cacagatcgg gttttttatt ctccttattc ccgaaaagaa cgctatgtcc gaagaaacat 4441 tggtagcaca ttgctcgccg gtactggcgg gactgaaaac tgcaaacatg ttcaacgtgg 4501 aatgcagcga cgcgcaaatc ctttgcctcc agctgagaga tctcaatctc cggctggggc 4561 ctaagggcgt ccgcatcctt ccgctccggt tttccagcag cagggctctg ctgtatctgt 4621 accggcccag ccggctgcag aaggatctgc aggacgagac cgcagtggag atcctgaaaa 4681 actacggata tccgcagaat agcaagggcg gatgtctggg tcacctgttc cggcggctgc 4741 gcagcagcga tacgtttcct cacgagatcg gattgttttt aggctatccg cctaaagacg 4801 tgaagggctt tatcgaagaa ggcccccggt gtgcgaaatg caccggttgc tggcaggtct 4861 acggggacga ggaaaaggcc ttaaagacat ttgaacgata cagaaagtgc acggaagtgt 4921 actgcgcaca ggtctcctgc ggcaagagcc tggagaggct caccgtaaag gaaaaggcaa 4981 attaagaaaa gaaaggctgg taacacatga gcaagatcgc agtggtttat tggagcggca 5041 cgggcaacac cgaggcaatg gcaaacgccg tctttgaagg cgccaagagc aaggatcccg 5101 aagccaagct gtttacggcg gctgaattcg gcccggacca gatggataac ttcgaagcct 5161 gcaaagcgct gggtgctgct ctggcataaa cgtcatctga atagcctgcc tccgagggct 5221 aaccatacta aaaatatcag ttaaaccgta aaagacccgc cggatcggcg ggtctttgcg 5281 ttgcgtattt gtattttaca attttacagc ttcgtcgcga tgggcgccac gctgtgcttg 5341 ttcttgagcg tggacaggat gacgttcgtc tgggtgtgct taatgctttc gacgctcttg 5401 atcttgttca tcagttgctc taaggtcgcg gtgttcttcg tcgtgatctt cagaacgtag 5461 tcgtattcgc c // LOCUS sequence021 5459 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence021 VERSION sequence021 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5459 /mol_type="genomic DNA" /organism="" /note="sequence021" CDS 251..910 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKGPVITKDCVKTLLDGKFIKVYDLQYAEGKHYYDASRRAAEDLA AVKTDEEFRDMLPDAVSCCVILRCPGEEPRLLLSYEYRYPCGRFLLSPPAGLIDPEEKG HPDALIRTAVREIAEETGLLIGPSDRVEVIDPCLFSSPGMTDECNAMVCAVVDAPDLSS LNQNGAVGTEQFDGFLLVTKKEAEDILRSGRDPQGIFYSVFTWIVLAWFAGGFWER" /locus_tag="LOCUS_1100" /note="MGA_141" CDS 916..2163 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKGQEEFMDLRPKHKCIIALLLLVSFVLLCGCTEVRAQADVTEEA AGSGAAPHIAVMIEGDNISRVMSSMTLREKIGQLFIIRPDTLGGSVQNLTKEGMALYTS YPAGGFCLFARNIADPQQLKSFTSQLHGLGDRFQPLLTIDEEGGPVVRIVANSRFDVPR FPAMGKLTAAGDPPEVRRLASFECSKAIGTYLKEYGFDLDFAPVADVNTNPHNPVIGTR AYSNDPLTAADLVGAACAGLHEGGSGSCLKHWPGHGDTKTDTHKGRASTAKTWEEILDC EAIPFRAGIDAGTDMVMVSHIAAPAVTGSDEPASLSHVLITEKLRRELGYEGVVITDAL DMGAVSHYYSPGEAAVQAFLAGADILLMPSDYFEAFDAMVAAVNDGTIPKERLDESVRR ILQLRLSLAALSQNSM" /locus_tag="LOCUS_1110" /note="WP_011028566.1 glycoside hydrolase family 3 protein (Streptomyces) [pid:36.7%, q_cov:87.5%, s_cov:60.3%, Eval:3.3e-56, partial hit]" /note="MGA_142" CDS 2274..3647 /product="NAD(P)/FAD-dependent oxidoreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048439.1" /transl_table=11 /codon_start=1 /translation="MDYDVIIIGAGPGGIFTAYELLQAQKGLKIGVFELGGPLNERKCP IDGVKVKSCVRCKTCSIMSGFGGAGAFSDGKYNITNDFGGTLYEYIGKQRALDLMHYVD KINCENGGGGTTLYSTANSDFKTQCLRNDLHLMDAQVRHLGTDINYVVLQNLYDKLKDG VDFHFRSRVSTVAKTEDGYEIDVDGQKFSAPYCVVSAGRSGSKWMEDVCGDLGLATKSN RVDIGVRVELQADIFKHITDELYESKIVYRTKQYQDLVRTFCMNPKGAVVNENTNGIVT VNGHSYEDPALQTNNTNFALLVAKHFTEPFKDSNGYGESIAKLSNMLGGGVIVQRFGDL VRGRRSVEKRIRESFLTPTLEATPGDLALVIPKRILDDIVEMIYALDKIAPGTANDDTL LYGVEVKFYNMEVELNSDLETSLPGLFVIGDGSGVTHSLSHASASGVHVARVLLDRIE" /locus_tag="LOCUS_1120" /note="WP_012048439.1 NAD(P)/FAD-dependent oxidoreductase (Clostridium botulinum) [pid:64.0%, q_cov:99.1%, s_cov:98.3%, Eval:3.2e-172]" /note="MGA_143" CDS 3651..4151 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEHVRLNKTAFYLLSFTWGLPTTLAGCLTAAVLRLTGKHPQRFGW CWYFEVGSHWGGCSMGPFFFKQKEPSRHICIHESGHAIQNCWFGFFMPFLVSIPSSIRY RVHRYKRRRHRPLPPYDAIWFEGQATRLGRMYFAPSGDDHVFYETQEQKTDTEPEETQP EER" /locus_tag="LOCUS_1130" /note="MGA_144" CDS 4081..4782 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFFTKRKSRRQIQNLRKLSRKNVDLGKFVKDFYVEKGLAYISCNV SGYNDIIDRYSVKGYEWVEESFARFVEENAIYIPPEYPIVLEICGHRFTEAQKTTIEET ILDYYALKMGDVQMSIQANNRRILFMFLLVAVFAVILYLVTMFPGIPKVLSEAVFVLFW MALWDASEFFFVDGRDLQEDKLEAAQLASMAVTFFDKFEDGPAEPEVVQQIMEEMEEEV ILPSTQWEQEE" /locus_tag="LOCUS_1140" /note="MGA_145" ORIGIN 1 cctggaccag cactatgaga agcacggcat cgacatgggc tttgaaaatg cgcagctgta 61 cgaagaatct gcgaacctgg tgatccacca tccggacgtt ctgcacaaga tcgaaaagga 121 agacggggac acctgcttct atctggagga gacgaatgaa ttcgtcgtgc tgtccaagga 181 cggctacatc cgcacgtact tctggccgga ttccgggaaa aagtattacg ataagcaata 241 gaggcgcaag atgaagggtc ccgtcattac aaaagactgc gtaaagacgc tgctggacgg 301 taagttcatc aaggtctacg acctgcagta tgcggaagga aagcattatt acgatgccag 361 cagaagggcg gcggaggatc tggccgcggt caaaacggac gaggaattcc gggacatgct 421 gccggacgcc gtaagctgct gcgtcattct gcgctgcccc ggcgaagagc cccggctgct 481 gctttcctac gaataccgct acccctgcgg ccggtttctt ctgagtccgc ctgcgggatt 541 gatcgatccg gaagagaaag ggcatccgga cgcgctcatc cgcacggcgg tgcgggagat 601 cgcggaggaa acgggtcttc tgatcggacc ttccgatcgc gtagaagtca tcgacccctg 661 tctgttcagt tctcccggca tgacggatga atgcaacgcc atggtctgcg ccgtggtgga 721 tgcgccggat ctgtcgtccc tcaaccagaa cggcgcggtc ggaacagaac agttcgacgg 781 ttttctgctg gtcacgaaga aagaggcgga ggacatcctc cgcagcggca gagatccgca 841 ggggatcttc tattccgtgt ttacctggat cgtgctggcc tggtttgccg gcgggttctg 901 ggagagatag ctgctttgaa gggtcaggaa gagtttatgg atcttcgtcc gaaacacaaa 961 tgcatcatag ccttgctcct tctcgtcagt tttgtgctgc tctgcggctg cacggaggtg 1021 cgcgcgcagg cggatgtaac ggaagaggcg gcaggcagcg gcgctgcgcc tcacattgcg 1081 gtgatgatcg aaggagataa cataagcaga gttatgtctt ctatgacgct tcgggaaaag 1141 atcggacagc tgttcatcat ccggccggac acgctgggcg gatcggtgca gaaccttaca 1201 aaagagggta tggcgctcta tacgtcgtac ccggccggcg gtttctgtct gtttgcacgg 1261 aacatcgcag atccccagca gctgaagtcc tttacgtcgc agctgcacgg tctcggagac 1321 cggttccagc cccttttgac gatcgatgag gaaggcggtc ctgtcgttcg catcgtagca 1381 aacagccggt tcgacgtgcc gcgttttccc gccatgggaa aactgaccgc agcgggagat 1441 cctcctgaag tgcgccgtct cgcatccttc gaatgcagca aggccatcgg gacctatctg 1501 aaggaatacg gattcgatct ggatttcgcg cctgtcgcgg acgtcaacac caatccccat 1561 aatcccgtca tcggcacgcg ggcgtacagc aacgaccccc tgacggcagc ggacctagta 1621 ggcgctgcct gcgcaggcct gcacgaaggc ggttccggca gctgtttaaa gcattggccg 1681 ggtcatggcg acacgaagac ggatacccac aaaggccggg cttccaccgc aaagacctgg 1741 gaggagatcc tggactgcga agcgatcccg ttccgggccg gtatcgacgc cgggacggat 1801 atggtcatgg tgtctcacat cgcggcgccc gccgtcaccg gcagcgatga gcctgccagt 1861 ctctcccacg ttctgatcac ggaaaaactc agacgggagc tggggtacga aggtgtcgtc 1921 atcaccgacg ccttggatat gggcgcggtt tcccattact acagcccggg cgaagcggcc 1981 gtgcaggcct tcctcgccgg cgctgatatc ctgctgatgc cttcggacta tttcgaagcg 2041 ttcgacgcga tggtcgcggc tgtcaatgac gggacgatcc cgaaggaaag actggacgaa 2101 agcgtgcggc gcatcctgca gctgcggctt tctctcgccg cattgtcgca aaattccatg 2161 taatatgata aaatgaaaca ggaaacagca gacggacaag accgcaaaga cacggcttgc 2221 ctgatgtttt gttgatttaa gaaaaaaatt cacaggagag gaatatcaga taaatggatt 2281 atgacgtgat catcatcggg gcgggccctg gcggtatctt tacagcttat gaactgctcc 2341 aggcgcaaaa aggtcttaag atcggcgttt tcgaactggg cggaccttta aacgagagaa 2401 aatgccccat cgacggggtc aaggtaaagt cctgcgtgcg ctgcaagacc tgctccatca 2461 tgagcggttt cggcggcgcc ggcgcgttct ccgacggcaa gtacaacatt acgaacgatt 2521 tcggcggcac gctgtacgaa tacatcggaa agcagcgggc attggacctg atgcattacg 2581 tggacaagat caactgcgag aacggcgggg gcggcacgac gctgtactcc accgccaact 2641 ccgatttcaa gacgcagtgc ctgcgcaacg acctgcatct gatggacgcc caggtgcgcc 2701 atctgggcac ggacatcaat tacgtcgtgc tgcagaatct gtacgacaag ctgaaggacg 2761 gcgtggattt ccatttccgc agccgcgtct ccaccgtcgc caagacagaa gacggctacg 2821 agatcgatgt ggacggtcag aaattttcgg cgccttactg cgtcgtatct gccggccgca 2881 gcggcagcaa gtggatggag gatgtctgcg gagatctggg gcttgccacc aagtccaacc 2941 gcgtggacat cggcgtccgc gtggagctgc aggcggatat ctttaagcac atcacggacg 3001 aactgtacga gagcaagatc gtctaccgta cgaagcagta tcaggatctc gtgcgcacgt 3061 tctgcatgaa tccgaagggc gccgtggtaa acgagaacac gaacggcatc gttacggtaa 3121 acggccacag ctacgaagat cccgcgctgc agacgaacaa cacgaacttc gctctgctgg 3181 tggcgaagca tttcacggag ccgttcaaag attccaacgg ctatggcgaa agcatcgcca 3241 aactgtccaa catgctgggc ggcggcgtta tcgtacagcg cttcggcgat ctggtaagag 3301 ggcgccgttc cgtggaaaag cgaatccggg agagtttcct tacgccgacg ctggaagcga 3361 cgccgggcga tctggcgctg gtcatcccca agcgcatctt agacgacatc gtggagatga 3421 tctacgcgct ggacaagatc gcgccgggca cggccaacga cgacacgctg ctgtacggcg 3481 tggaagtcaa gttctacaac atggaagtgg agctcaacag cgatctggag acctcgcttc 3541 ccggcctgtt cgtcatcggc gacggctcgg gggtcaccca ttcgctgtcc cacgcgtccg 3601 ccagcggcgt gcacgtggcg agagtgctgc tcgaccgcat cgagtaaact gtggaacacg 3661 tacggctgaa taaaactgca ttttacctgc tgtcctttac ctggggactg cccacgacgc 3721 tggcgggctg cctgacggcc gccgtgctgc gcctgacggg aaaacatcct cagcgtttcg 3781 gatggtgctg gtatttcgag gtagggtcac actggggcgg ctgcagcatg ggtccgttct 3841 tctttaagca gaaggagccc agcaggcata tctgcatcca cgagagcgga cacgccatcc 3901 agaactgctg gttcggcttt tttatgccgt tcctcgtatc gatcccctcg tccatacggt 3961 accgcgtcca ccggtataaa agaagacgcc acagaccgct gccgccctac gatgccatct 4021 ggttcgaagg gcaggccacg agactcggca gaatgtattt cgccccgtca ggagacgacc 4081 atgtttttta cgaaacgcaa gagcagaaga cagatacaga acctgaggaa actcagccgg 4141 aagaacgttg acctcgggaa gttcgtcaag gatttctacg tagagaaagg cctcgcctat 4201 atctcctgca acgtatctgg gtacaacgac atcatcgacc gctattccgt aaagggctac 4261 gagtgggtcg aagagtcctt cgcgcgcttc gtggaggaga acgcgatcta catcccgccg 4321 gaatatccca tcgtgctgga gatctgcggt caccgcttta ccgaggcgca gaagaccacg 4381 atcgaagaga cgatcctgga ttattatgcc ctgaagatgg gcgacgtaca gatgtccatc 4441 caggccaaca accggcgcat tcttttcatg ttcctgctgg tggcggtttt tgccgtcatc 4501 ctgtatctgg taacgatgtt ccccggcatt ccaaaggtcc tgtccgaagc ggtgttcgtg 4561 ctgttctgga tggcgctgtg ggacgcctcg gagttcttct tcgtggatgg aagagatctg 4621 caggaagata aactggaagc cgcacagttg gccagcatgg ccgtcacatt cttcgacaag 4681 ttcgaagacg gtccggcaga gccggaagtg gtgcagcaga tcatggagga gatggaagag 4741 gaggtcattc tgccgtcaac gcaatgggag caggaggagt gaccccgaaa gaggtaaacc 4801 atgcgtaaac acccggacag gcatacatac ctgaccgaaa cccccatacc gaaactcatc 4861 cccgcactgg ccgtgccgac catcatcagc atgctggtga cgggtattta taattccgcc 4921 gacacatatt tcgtcggccg catctccacc caggcaacgg ctgccgtcgg cctggtcttt 4981 tccgtgatgg cgatcatcca ggcgttcggc ttcttctgcg gtcagggctc cggcaactat 5041 ttgtcccggc tgctgggcgc ggggaagaaa caggaagcga acgaggtggc gatcaccggc 5101 tttctgatgg ctttggtgat cggactgctg atcgccgcgc tgggcaactg gcaggcggag 5161 cgcctcgcgg actggatcgg cgccacggac acgtcacggg cagataccat cgcctatatg 5221 cggatcatcc tgatgggcgc gcccttcatg acctgccagt tcgtcatcaa caaccagctg 5281 cgtttccagg gcagcgccat gtacgccatg atcggtctga tgtgcggcgc ggtcgtcaat 5341 atcattctgg accccgtcct gatctttggg ttcgacctgg gcatccgggg cgcagcgctt 5401 gccacggtgg cggggcaggc gatcagcttt ttcgcgcttc tcatcggcag cagaaaagg // LOCUS sequence022 5432 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence022 VERSION sequence022 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5432 /mol_type="genomic DNA" /organism="" /note="sequence022" CDS 570..740 /product="4Fe-4S binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963626.1" /transl_table=11 /codon_start=1 /translation="MAYVIGDACISCGACADNCPVEAISQGDGKYEIDAEKCIECGACA DNCPVEAPHQA" /locus_tag="LOCUS_1150" /note="WP_010963626.1 4Fe-4S binding protein (Clostridium) [pid:67.3%, q_cov:98.2%, s_cov:98.2%, Eval:9.6e-17]" /note="MGA_148" CDS complement(792..1430) /product="redox-sensing transcriptional repressor Rex" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966000.1" /transl_table=11 /codon_start=1 /translation="MKQEGKISSAVIRRLPRYLRALEDLESSGTERISSGELSKLIGYT ASQIRQDLNHFGGFGQQGYGYNVKDLKAEIGKILGLGQKYKMVIVGSGRLGQAINSFIS SYSENFCVTSLFDVKEDLIGKEKSGVLIRDFADLEDYLKNNPTDIGVITVTKESAQNAC DKLMAGGVDGIWNFAPIDLENTGSTPVENVHLSDNLHSLVYYINHPEQI" /locus_tag="LOCUS_1160" /note="WP_010966000.1 redox-sensing transcriptional repressor Rex (Clostridium acetobutylicum) [pid:49.5%, q_cov:95.3%, s_cov:94.4%, Eval:6.3e-50]" /note="MGA_149" CDS 1526..3388 /product="ABC-F family ATP-binding cassette domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048250.1" /transl_table=11 /codon_start=1 /translation="MSILTASKLNKSFGIETVLEDVTFHVNAGDRVGIVGANGAGKSTL MRILAGELQPDSGELYFEKGASIGYLKQRDHFPDGGTVQEEVSKAATEKQKEAFEERHG YSYDKGLKGILRSLAFTDDYLDKPVGTLSGGERTRLAMASLLLQEPDLLLLDEPTNHLD IGTLKWLEGYLKGYRGTLVIISHDRYFLDKLATRIFEIEHCHLKAYDGNYTTFKEKKQL QYEQDLRHYEQMKAEVARQEEIIRRFKEHNTEHLVKRAQSREKRLAMLDMPDKPTFFRE KLKIRFDEKLKSGQDVLQAEDLAMSFTGPEGVKHLFSGVNMDIKKGDRICMVGPNGVGK TTLLKIILGELDPDSGWLKLGQNVVCGYYDQEQKLLDPEKTVLDEVHSTYIKYDQVELR KLLGRLGFYGDDVFKQVKDLAGGEKAKLSLLKLMMTGANFLILDEPTNHLDIAAKEVFE DALLDFPGTLLIVSHDRYLLQKIPTAIYELKPEGITVYLGSYDYYEQKSSSVTSGKAYL ETLAKGANPADAQKLLSKEERTLLRQKEKEEAAAKRKRERQLQAAEETVSEAENRVTEL ENRLCLPEIYSDPEKAREVNSELLAAREGLEKAYEDWMELQEEA" /locus_tag="LOCUS_1170" /note="WP_012048250.1 ABC-F family ATP-binding cassette domain-containing protein (Clostridium botulinum) [pid:39.2%, q_cov:99.7%, s_cov:100.0%, Eval:1.4e-139]" /note="MGA_150" CDS 3475..3705 /product="acyl carrier protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003419132.1" /transl_table=11 /codon_start=1 /translation="MVFDKVREIIAEQLDVDTEEITLDTNLIKDLEADSLDAVEIIMAL EDEYDIEIPDEVAEEFATVGDIVKCVEDYIS" /locus_tag="LOCUS_1180" /gene="acpP" /note="WP_003419132.1 acyl carrier protein (Bacteria) [pid:69.0%, q_cov:93.4%, s_cov:95.9%, Eval:1.1e-20]" /note="MGA_151" CDS complement(3746..4663) /product="DMT family transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861204.1" /transl_table=11 /codon_start=1 /translation="MDPKRSATRGYIEVFLAGALWGCIGPFMQGMSNMGAGSGLISLMR QGFGTLMMIPVVLIACKGIKPLKVDRKSLFVLLLMGLLSEAVFNLCYSACVARLGVAAA AVLLYTAPIFVMILSRILYAEQITSRKVLAIVLNLAGCALTVTNGEFSAEDLAAAGILF GVLAGFFYATITIFGKYVSGSVNPYVTCFYNFLFGTGFLILFTRPWTMDLSFFDAKFCL LGAGIGLFGTVLPYIFYMTGLTHPVEASKVPVVASVETVVAAVLGAVLFREAVGPAKIL GILLVFVSVAVINSGGKKAKEENA" /locus_tag="LOCUS_1190" /note="WP_011861204.1 DMT family transporter (Clostridioides difficile) [pid:30.9%, q_cov:93.4%, s_cov:90.1%, Eval:4.2e-36]" /note="MGA_152" CDS complement(4663..5208) /product="ECF transporter S component" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583215.1" /transl_table=11 /codon_start=1 /translation="MENVSTKTNTMAKLGILAAISVVLVAIVHFPLIPAASFLEYDPAD VPILLGTFALGPAAGLLLTITASVIQGVTVSAASSWYGIVMHIIATGTYVLVAGNIYRQ NKTKKQAILALLCGTLAMAAVMVPANLFITPVFMGAPREVVAGMIPTAILPFNLLKAGI NSVITFVLYKRVSPLLHR" /locus_tag="LOCUS_1200" /note="WP_012583215.1 ECF transporter S component (Dictyoglomus turgidum) [pid:39.2%, q_cov:84.5%, s_cov:84.2%, Eval:1.2e-29]" /note="MGA_153" ORIGIN 1 gatgatgtgg gtgccgtcct ccttgcgctc cttcgatgcc ttcgttcgct gcgccggcgt 61 cgtaatgtcc tcgatgtgga tgatgcgcga cggcttcggc aggccaaggc gctctgcgat 121 cttttccacc atgtcgtcgg atgtgcccag gatgaggatg ctgtcgggct tcgtacggcg 181 gatggcagcg cggacctggg cgcagtggtc gttgtccatg aacagcgcgg tcttgaccgc 241 cccgatccgg gtctcctgct ttttggcgga gttgcccgca gcgatgctgc tgccgtagat 301 gtacagcccg tcgtcgatga tcgccgggat atgcatgcgg ccgcacagtt cgcccgcgtt 361 atagcttttt cctgttccgc tcttgccgga aagtccgtag atcttcatgg ggtcacccgc 421 taatggagtt agccgttgct attatttcgc gctcttgaca attctgttac aaataaagat 481 tatgccattg aaaaacggag aaagaatgct atactgtcat tgtgccaaag ggcacagatg 541 acgtcattct acaaaaggag gaaaaaaaca tggcatatgt aattggtgat gcttgcatca 601 gctgcggcgc ttgcgcagat aactgccccg tagaagctat ctcccaggga gacggcaagt 661 acgagatcga cgctgaaaag tgcatcgagt gcggtgcttg cgcagataac tgccccgtag 721 aagcccccca tcaggcataa ggcaaggaaa taacagccgt ttctttcgag aaacggctgt 781 ttttttatgc tttagatctg ttcgggatga ttgatgtagt acacgaggct gtgcaggttg 841 tccgagagat gaacgttctc caccggcgta ctgcccgtgt tctccagatc gatgggtgcg 901 aagttccaga tgccgtccac cccgcccgcc atcagtttgt cgcaggcgtt ctgggcgctt 961 tctttcgtta cggtgatgac cccgatatcc gtggggttgt tcttcagata gtcctccaga 1021 tctgcgaaat cccggatgag gacgccgctt ttttctttgc cgatcaggtc ttccttcacg 1081 tcgaacaggg acgttacgca gaagttttcg ctgtaggagc tgataaagct gttgatcgcc 1141 tggcccagac ggccgctccc cacgatgacc attttgtatt tttgccccag gcccaggatc 1201 tttccgatct ccgccttcag gtcttttacg ttgtagccgt agccctgctg gccgaatccg 1261 ccgaaatggt tgagatcctg ccggatctga gaagctgtat atccgataag ttttgagagc 1321 tcgccggagg agatgcgttc cgtaccgctg ctttcaagat cctccagggc ccgtaaatat 1381 ctgggtagtc ttctgatgac cgccgatgag atctttcctt cttgtttcat atattatcct 1441 ttcatggttt taaacacacc ttgttaattt tatcactaac agaggatttg ttacaacact 1501 ttctttatgg taaaatagca gagttatgag catcctaacg gcgtcaaaac tgaataagag 1561 cttcgggatc gagaccgttc tggaagatgt caccttccac gtaaacgcgg gcgaccgcgt 1621 cggcatcgtc ggcgccaacg gcgcgggcaa gagcacgctg atgcgcatcc tcgcgggcga 1681 actgcagccg gacagcggcg aactttactt tgaaaaaggc gccagcatcg gctatttaaa 1741 gcagcgcgac cacttccccg acggcggcac cgtgcaggag gaagtttcga aagccgcaac 1801 ggaaaagcag aaagaagcct ttgaagagcg tcacggatac agctacgaca agggtctgaa 1861 gggcatcctg cgcagcctcg cttttacgga cgactacctg gacaagccgg tgggtaccct 1921 ctccggcggc gaacgcaccc ggctggccat ggcttccctg ctgctgcagg agccggatct 1981 gctgctcctg gatgagccga cgaaccacct ggacatcggc acgctcaagt ggctggaagg 2041 ctatctgaag ggctaccgcg gcacgctcgt catcatctcc cacgaccggt atttcctgga 2101 caaactggcg acccgcatct tcgagatcga gcactgtcat ttaaaggcct acgacggcaa 2161 ctacacgacg ttcaaagaga agaagcagct gcagtacgaa caggatctgc gccactacga 2221 gcagatgaag gcggaagtcg caaggcagga agagatcatc cggcgcttta aggagcacaa 2281 cacggagcat ctcgtaaagc gcgcccagtc cagggaaaag cggcttgcca tgctggacat 2341 gccggacaag cctaccttct tccgcgaaaa gctgaagatc cgcttcgacg aaaagctcaa 2401 gagcggacag gacgtgctgc aggcggagga cctggcgatg tcctttaccg gcccggaggg 2461 cgtaaagcac ctgttttccg gggtcaacat ggacatcaaa aaaggcgacc gcatctgcat 2521 ggtcggtccc aacggcgtcg gcaagacgac gcttttaaag atcatcctcg gcgaactgga 2581 tccggacagc ggatggttaa agctgggtca gaacgtcgtg tgcggctact acgaccagga 2641 gcagaagctc ctcgatccgg agaagaccgt gctggacgaa gtccattcca cctatatcaa 2701 gtacgaccag gtggagctgc gcaagctgtt gggacggctg ggtttctacg gagacgacgt 2761 ctttaagcag gtgaaggatc tggcgggcgg cgaaaaagcc aagctgtcgc tgctcaaact 2821 gatgatgacc ggcgcaaatt tcctcatcct ggacgagccc acgaaccacc tcgacatcgc 2881 ggcgaaggaa gtgttcgagg atgccctgct ggacttcccc ggcacgcttc tcatcgtgtc 2941 tcacgaccgc tatctgctgc agaagatccc cacggcgatc tacgagctca agcccgaggg 3001 cataacggtc tacctgggaa gctacgatta ctacgagcag aaatcctcct cggtgacctc 3061 cggcaaagcc tatctggaga cccttgcgaa aggcgccaat cccgcggatg cacagaagct 3121 gctgtccaag gaagagcgca cgctgctgcg tcagaaggag aaagaggaag ccgccgcgaa 3181 gagaaagcgg gagaggcagc tccaggcggc ggaggaaacg gtctcagagg ccgaaaatcg 3241 ggtcacagag cttgagaacc ggctttgcct gccggaaata tactccgacc cggaaaaggc 3301 cagagaagtc aattctgagc ttctggcggc cagagaaggt ctggagaaag cttatgaaga 3361 ctggatggaa ctgcaggaag aagcgtaaaa acttcttgca tacggttcca catatattat 3421 aatttaggtg tgttacatag tgcgggacgt cccgtgcgtt caacggaggg aaaaatggta 3481 tttgacaaag tacgcgaaat cattgcagag cagcttgacg tagatacaga agagatcacg 3541 ctggatacga acctgatcaa ggatctggaa gcggattctc tggatgccgt cgagatcatc 3601 atggcgctgg aagatgagta cgacatcgag atccccgacg aagttgcgga agaattcgcg 3661 actgttggcg atatcgtcaa gtgcgtagaa gattacatca gctaagcaga aaaaacgacc 3721 gcggagcctg ggctccgcgg tttttttatg cgttttcttc cttcgctttt ttgccgccgc 3781 tgttgatgac ggctaccgat acgaacacca aaaggatgcc gaggatcttg gccggtccca 3841 ctgcttcccg gaacaggaca gcgcccagga cagctgccac gaccgtttcc acggaagcga 3901 cgacgggcac cttagacgct tccaccggat gggtaagccc cgtcatgtag aaaatgtagg 3961 ggagcaccgt gccgaacagg ccgatgcctg cgcccagcag gcaaaatttc gcgtcgaaga 4021 aggaaagatc catcgtccag ggccgagtaa aaagaataag aaatccggtg ccgaacagga 4081 aattgtagaa acaggtaacg taaggattta cgctgccgga tacgtatttt ccgaagatcg 4141 tgatggtcgc gtagaaaaaa cctgccagaa cgccgaacag aatgccggcg gcagccagat 4201 cttccgcgga aaattccccg ttggtgacgg tcagggcaca ccctgccaga ttcagcacga 4261 tggccagcac cttgcgggaa gtgatctgct ccgcatagag gatacgggag aggatcatga 4321 caaagatcgg cgccgtatac agcaggaccg ccgcagcggc aactcccaga cgggcaacgc 4381 aggcggagta gcacaggttg aagaccgcct ccgaaagcag gcccatcaat agcaggacaa 4441 acaggctttt gcggtccact ttcagcggtt ttattccttt gcaggcgatg aggaccacgg 4501 ggatcatcat cagcgtgccg aaaccctgac gcatcaggga gatgaggccg gagccggcgc 4561 ccatgttgga catgccctgc ataaaggggc cgatgcaccc ccagagggca ccggccagaa 4621 aaacttcgat atatcctctt gttgcagatc ttttcgggtc cattatctat gcagcagcgg 4681 gctgactctc ttatacagta cgaacgtgat gacggaattg atgcctgcct tcagcagatt 4741 gaagggaagg atcgctgtgg ggatcatgcc ggcaacgacc tcccgaggcg ctcccatgaa 4801 gaccggcgta atgaacaggt tggcggggac catgacggct gccatggcca gcgtgccgca 4861 aagcagcgcc agaatcgcct gcttcttggt cttattctgc cggtagatgt tgccggcgac 4921 cagcacgtag gtgccggtgg cgatgatgtg catcacgatg ccgtaccagc tgctggctgc 4981 gctcacggtg accccctgaa taacgctggc ggtgatggtg agcagcagtc ccgcggcggg 5041 tcctaaggcg aaggtgccca gcaggatggg gacatccgcc ggatcgtact ccaggaacga 5101 tgccgccggg atgagcggga agtggacgat ggccaccaga acgacggaga tcgccgccag 5161 gatgccgagt ttcgccatgg tgttggtctt tgtgcttacg ttttccatag attcctcctt 5221 gaaacgttga aaaagttagg ttcggaatct gtcaggcaat aaaaatgccg ctgcatcgct 5281 gcagggcaaa caaaagaaag aatcgtttct tccatccgga ctataccgtc ggtaccggat 5341 tcgcaccggt tctgcctttc ggctcgcgga cttgcggctt tcgccgatca ccgccggtgg 5401 ggaattgcac cccgccctga aacagatcta ca // LOCUS sequence023 5378 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence023 VERSION sequence023 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5378 /mol_type="genomic DNA" /organism="" /note="sequence023" CDS 359..1744 /product="electron transport complex subunit RsxC" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948145.1" /transl_table=11 /codon_start=1 /translation="MSSGKHLNGIHVNHCKNTAGQAIIPMTLPEKVYIPMSQHIGAPCQ PVVAVGDHVKVGQKIGDSEAFVCAPIHSSVSGDVTAINKAMSQMGRIDTIIEIVPDGKQ EIAETVVPPVITDKASFIKAVRESGVVGLGGATFPMSVKFNVKPPAKVDTFIVNGAECE PYITVDHQNMLTHAQEIIDGVKAVLSWLEIERAFIGIETNKPDAIKLFKDLLKDEKNIS VAELRQVYPQGAERVIIYETTGRHLIAGKLPADVGCIVSNVTSVLKMQQFLATGMPLVS KAMTVDGNAVANPQNVEVPIGTPLCDVIEFCGGTKAEVKKIVLGGPMMGRAIPKDEYGV MKGNSAILCFDETAGTQLPDTACISCGRCVRGCPMNLMPTKLAKAWERQDIDTLREYDV TTCMECGCCSYSCPARKQLSFEIKLAKTWVMGEDRKAAEKAKAEAEAAKAKEEAEKKEG GEK" /locus_tag="LOCUS_1210" /gene="rsxC" /note="WP_011948145.1 electron transport complex subunit RsxC (Clostridium botulinum) [pid:42.6%, q_cov:92.4%, s_cov:97.7%, Eval:2.2e-96]" /note="MGA_155" CDS 1744..2715 /product="RnfABCDGE type electron transport complex subunit D" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948146.1" /transl_table=11 /codon_start=1 /translation="MSTKHTNLIVSSAPHVNNPVDTRSIMRDVVIALCPALLVSIYVFG ARALIMTAVCVAACVIFEGCTRKLLNRPQTIGDWSAVVTGVILAFNLPVTLPIWMAIIG CFVAIVIVKQVFGGLGENFANPAIVGRIVLFIGFATPMTNWAVTSRMSSVIRENAADAV TGATPLGLLASGKPVPSNLDMFLGTINGSMGEISAIALLIGGCYLLWRKVITWEIPVAF LGSMVVMAVLMHQDPVFHIFAGGAMLGSIFMATDYVTSPITGKGKIIFGIGCGVLTMLI RVFGSYPEGVSFAILLMNILTPHIDRWTRTHINGVDRKAVKK" /locus_tag="LOCUS_1220" /note="WP_011948146.1 RnfABCDGE type electron transport complex subunit D (Clostridium botulinum) [pid:47.5%, q_cov:94.7%, s_cov:96.8%, Eval:1.9e-77]" /note="MGA_156" CDS 2715..3269 /product="RnfABCDGE type electron transport complex subunit G" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948147.1" /transl_table=11 /codon_start=1 /translation="MTDKKEMLAPSIVLVCICLVASMLLAATYQITKPIIDNLAIQMAN ESRAEVLPEADGFSPMDVDLVDGVTEVYKADNGAGYVMTATFKGFGGPVTVMTGMDADG VIQNVKVTDASNETPGLGSKTTLPDHTGKFQGISGAITMDKESTEGTYVAPVTGASYSS KAVFNAVSAALAQYAQIGGSF" /locus_tag="LOCUS_1230" /note="WP_011948147.1 RnfABCDGE type electron transport complex subunit G (Clostridium botulinum) [pid:32.6%, q_cov:95.1%, s_cov:80.7%, Eval:1.1e-19]" /note="MGA_157" CDS 3269..3952 /product="electron transport complex subunit E" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005904084.1" /transl_table=11 /codon_start=1 /translation="MDNKKSKLSIFTNGFIKENPILVLVLGTCPTLAVSTQASNGIGMG LCVTFVLTFSNIFISALKKIIPDKVRIPCYIVVISTFVTVLQLLLQAYLPDLNKSLGLY VPLIVVNCIILGRAEAFANKNSVVDSALDGLGMGLGYTCALTIMACIRELLGAGTLFGK VITANLFSPMSIFVLAPGGFFTFGCIIAALNKLTKGKREKKQKENKCLGCGNADGCPAA EEGGC" /locus_tag="LOCUS_1240" /note="WP_005904084.1 electron transport complex subunit E (Fusobacterium) [pid:51.7%, q_cov:89.4%, s_cov:99.0%, Eval:5.1e-56]" /note="MGA_158" CDS 3955..4548 /product="electron transport complex subunit RsxA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005904083.1" /transl_table=11 /codon_start=1 /translation="MKEMLMIIMAAVLANNYVLVRFLGICPFLGVSKKLDSAVGMSVAV IFVMVLATAATWPIQHLLLDPNGIGYMQTTVFILVIAALVQLIETFMKKSIPSLHKSLG IYLPLITTNCAVLGVCVLNIDEGYTFIQSIMNAFGSGVGFLLAMFLFAGVRSKIEDNDY PESFKGIASTLVAASILSVSFMGFSGMIDNIFGM" /locus_tag="LOCUS_1250" /gene="rsxA" /note="WP_005904083.1 electron transport complex subunit RsxA (Fusobacterium nucleatum) [pid:51.9%, q_cov:94.9%, s_cov:96.4%, Eval:1.4e-56]" /note="MGA_159" ORIGIN 1 cgcctgcgag gactacgatc ttctgatctg catggacgag tggaatatcc agagcatgca 61 ccgcatgttc ggtcatgatt tcgacgcgaa actgtcgaaa ctgctggacc acacgccctt 121 aaagcgcgac gtggccgacc cctggtacac cggcgacttc gagcagacct acgaggacgt 181 ggtgctgggc tgcgaagcgc tgctgaaaga gcccgggatc tgcccgccga acattcgtta 241 aattgcctac aatctttcct tgaaattcca tacaatttga tatattctat actgtgcagg 301 tctatgctgc gttttttgac gtgtgccaag acccggtaga aaaataagga gaaatagtat 361 gagttcaggc aaacatctga atggcatcca tgtgaaccat tgcaagaaca ctgccggcca 421 ggccatcatc ccgatgaccc tgccggaaaa ggtttacatt ccaatgagtc agcacatagg 481 tgccccctgc cagcctgtcg tggccgtagg cgaccacgtt aaggttggcc agaagatcgg 541 agacagcgaa gccttcgtat gcgcgcccat ccacagcagc gtatccggcg acgtcacggc 601 catcaacaag gccatgtctc agatgggcag gatcgacacc atcatcgaga tcgtgcccga 661 cggcaagcag gagatcgcag agactgtcgt gccccccgtc atcacggata aggccagctt 721 catcaaggct gtccgcgaat ccggcgtggt aggcctcggc ggcgctacgt tccccatgag 781 cgtcaagttc aacgtaaagc cccccgcaaa ggtggacacc ttcatcgtga acggcgcgga 841 atgcgagccc tacatcaccg tcgaccacca gaatatgctc acccacgccc aggagatcat 901 cgacggcgtc aaggcagttc tgtcgtggct ggagatcgaa agagcgttca tcggcatcga 961 gacgaacaag cccgacgcga tcaagctctt caaggacctc ctgaaggacg aaaagaacat 1021 ttccgtcgcg gaactgcgcc aggtctatcc gcagggcgca gaacgcgtca tcatctatga 1081 gacgaccggc cgccatctga tcgcaggcaa gctgcccgca gacgtgggat gcatcgtatc 1141 caacgttacg tccgttctca agatgcagca gttcctggcc accggcatgc cgctggtatc 1201 caaggccatg actgtcgacg gcaacgccgt cgctaacccc cagaacgtgg aagtgcccat 1261 cggcaccccg ctgtgcgacg tcatcgaatt ctgcggcggc accaaagcgg aagtcaagaa 1321 gatcgttctg ggcggaccga tgatgggccg cgccatcccc aaggatgaat acggcgtcat 1381 gaagggcaac agcgccatcc tgtgcttcga cgagaccgca ggcacccagc tgcccgacac 1441 cgcatgcatc agctgcggcc gctgcgtacg cggctgcccg atgaacctga tgcccaccaa 1501 gctggcaaag gcctgggaac gccaggacat cgacactctg agagagtacg acgtcaccac 1561 ctgtatggaa tgcggctgct gctcttactc ctgcccggca agaaaacagc tgagcttcga 1621 gatcaagctc gcgaagacct gggtcatggg agaagacaga aaggctgcgg aaaaggccaa 1681 ggccgaggcg gaagccgcca aggctaagga agaagcagaa aagaaggaag gaggagaaaa 1741 gtaatgagca ccaagcacac aaatctgatc gtatcctccg ctcctcacgt caataacccg 1801 gtcgatacca ggagcatcat gagagacgtc gtgatcgctc tctgcccggc gcttctcgtc 1861 tccatctacg tattcggagc aagagcgctc atcatgaccg ctgtctgcgt cgcagcctgc 1921 gttatcttcg aaggctgcac cagaaagctt ctgaacagac cccagaccat cggcgactgg 1981 tccgcagtcg ttaccggcgt catcctcgcc ttcaacctgc ctgtcaccct gccgatctgg 2041 atggccatca tcggctgctt cgtggcgatc gtcatcgtca agcaggtatt cggcggcctg 2101 ggcgaaaact ttgcgaatcc cgcgatcgta ggacgtatcg tcctgttcat cggcttcgcg 2161 accccgatga ccaactgggc agtcacttcc cgcatgagct ctgtcatccg cgagaacgct 2221 gccgacgccg tcaccggcgc caccccgctg ggactgcttg cttccggcaa gcccgttccc 2281 tccaacctgg acatgttcct gggaaccatc aacggctcca tgggcgagat ctccgcgatc 2341 gctctgctga tcggcggctg ctacctgctc tggagaaagg tcatcacctg ggagatcccc 2401 gtggcattcc tgggttccat ggtcgtcatg gcagtcctga tgcaccagga tcccgtcttc 2461 catatctttg caggcggcgc gatgctcggt tccatcttca tggcgaccga ctacgtcacg 2521 tccccgatca ccggcaaggg taagatcatc ttcggcatcg gctgcggcgt tctgaccatg 2581 ctcatccgcg tattcgggtc ctatcccgag ggcgtatcct tcgccatcct gctgatgaac 2641 atcctcaccc cgcacatcga tcgctggacg agaacgcaca tcaacggcgt ggacagaaag 2701 gcggtgaaga agtaatgact gataagaaag aaatgctggc tccgtccatc gttctggtct 2761 gcatctgcct cgtagcttcc atgctgctcg ccgcgaccta tcagatcacg aagcctatca 2821 tcgataatct cgccatccag atggcgaacg aatccagagc ggaagtcctt cccgaagcgg 2881 acggtttctc cccgatggac gtcgacctgg ttgacggcgt cacggaagtc tacaaggccg 2941 acaacggcgc aggctatgtc atgactgcca ccttcaaggg attcggcggc cccgtcactg 3001 ttatgaccgg tatggacgcg gacggcgtca tccagaacgt taaggtcacg gacgcttcca 3061 acgaaacgcc gggcctgggc tccaagacca cgctgcccga tcatacgggt aaattccagg 3121 gcatcagcgg cgccatcacc atggataagg aatccacgga aggcacctac gttgcgcctg 3181 tcaccggtgc aagttattcc tccaaggcag tgttcaacgc ggtcagcgct gcgctcgccc 3241 agtatgcaca gatcggaggg agcttctaat ggataacaag aagagcaaac tgagtatctt 3301 cacaaacgga tttatcaagg agaacccgat cctggtcctc gttctgggca cctgccccac 3361 gctggcagtt tccacccagg cgtccaacgg tatcggcatg ggcctgtgcg tcacgttcgt 3421 actgaccttc tccaatatct ttatctccgc gctgaagaag atcattcccg ataaagtgcg 3481 tatcccgtgc tacatcgtgg tcatttccac cttcgttacc gtcctgcagc tgctgctgca 3541 ggcatacctg cccgacctga acaagtctct gggcctgtac gtgcctctga tcgtggtcaa 3601 ctgcatcatc cttggccgcg cggaagcatt tgccaacaag aacagcgtcg tagactccgc 3661 tctggacggt ctcggcatgg gcctgggcta tacctgcgcc ctcaccatca tggcctgcat 3721 ccgcgagctg ctgggcgccg gaacgctgtt cggcaaagtg atcactgcca acctcttcag 3781 cccgatgtcc atcttcgtgc tggctcccgg cggcttcttc accttcggct gcatcatcgc 3841 cgcgctgaac aagctgacca agggcaagag agaaaagaag cagaaggaaa acaagtgcct 3901 gggatgcggc aatgcagatg gctgccctgc cgctgaggaa ggaggttgct gattatgaaa 3961 gaaatgttaa tgatcatcat ggcagcagtc cttgccaata actacgtcct ggtgcgcttc 4021 ctgggcatct gcccgttcct gggcgtttcc aagaaactgg actctgccgt cggtatgtcc 4081 gtagccgtta tcttcgtcat ggtcctggca actgccgcga cctggcccat ccagcacctg 4141 ctgctggacc cgaacggcat cggctacatg cagaccactg tgttcattct ggtcatcgcc 4201 gcgctggtac agctcatcga gacctttatg aagaaatcga tcccctcgct gcataagtcg 4261 ctgggtatct atcttccgct gatcaccacg aactgcgctg ttctgggtgt ctgcgttctg 4321 aacatcgacg aaggttacac cttcatccag tccatcatga acgctttcgg ttccggcgtc 4381 ggcttcctgc tcgccatgtt cctgttcgca ggcgtgcgca gcaagatcga agacaacgat 4441 tatcccgaga gcttcaaggg catcgcgtcc actctggttg ccgcatccat cctgagcgtc 4501 tccttcatgg gattctccgg catgatcgac aacatcttcg gcatgtaaag gaggatagaa 4561 agtatgttaa ctgcatctgc ttttgtaact cctgtcctgc tgaccgttat caccggcctg 4621 atcgcaggcg ttctgctcac catcgccgcg aagatcttcg cggttcccgt ggacgagacc 4681 caggtgaaga tccgcgaatg cttgccaggc gcgaactgcg gcgcctgcgg ctacgtaggc 4741 tgcgacgact atgctgcggc tctggcgaag gaccatacca ttgcacctaa taagtgcgtt 4801 cccggcggcg ccggcgctgc tgtaggcatt gcggcagttc tgggcgtaga agccggcgcg 4861 accgaagaaa gagtcgcgaa agtcatgtgc tccggcacct gcgacaatac gtcccccgaa 4921 atggactatc agggctacaa gtcctgcgcc gccgtcaaga atttcttcgg cggccccggc 4981 acctgcaagt tcggctgcat cggtctgggc gactgcgtca aggcctgcaa attcgacgcc 5041 atccatgtgg aagacggcgt agcgaaggta gaccgcgaca agtgcgtcgc ctgcggcgcc 5101 tgcgcgaaca cctgcccgca gaagatcatc gacatcctgc cgaaggccag ccgcgtcacc 5161 gtcgactgct ccagcaagga tatgggcaag ttcgtcacga aggcctgcaa agttggctgc 5221 atcggctgca agatgtgcga aaagacctgt aagttcgacg cgatccatgt cgtggacaac 5281 cttgcaaaga tcgatcccga gaagtgcaag aactgcggca tgtgcgccaa ggcctgcccg 5341 cgcaagatca tcacggtcat tccgcgcccc ggccagaa // LOCUS sequence024 5376 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence024 VERSION sequence024 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5376 /mol_type="genomic DNA" /organism="" /note="sequence024" misc_feature <1..933 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011861083.1:RluA family pseudouridine synthase" /note="WP_011861083.1 RluA family pseudouridine synthase (Clostridioides difficile) [pid:38.2%, q_cov:97.1%, s_cov:92.7%, Eval:1.5e-57]" /note="MGA_161" /locus_tag="LOCUS_1260" CDS 917..1978 /product="membrane protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393376.1" /transl_table=11 /codon_start=1 /translation="MNTNNKPLSVLRIGLIYTGCLVGAGFASGREAWQFFGVFGKWGYA GVIVATLLYIGVGLMTVDIAHRKNTADISALINPIDNKALNTFVGVMMCFFLLVAYVAL TAAGGALLESKTGLSHAAGSLLICLLCIITALGGFSSISDKAGKISPVLVVGTLVLGIY LIATHTDAVSHLEPHRTSKVASHWLTAVIGYVGYNASAAVPVLGQCAMHSDSRKRSENG AILGGIILGTCTLILFLSTSTDPALSGQSSFPMMDLCERVFPALGKVYAVLLLLAIFMT QTTVFYGFTTKLGNRKNSKAIAWAVGLAGYVCSLYGYYNFVANIVPIVGYVSLAFFGLE IINLIKVKRKQSF" /locus_tag="LOCUS_1270" /note="WP_011393376.1 membrane protein (Moorella thermoacetica) [pid:28.2%, q_cov:94.3%, s_cov:87.3%, Eval:1.2e-32]" /note="MGA_162" CDS 1997..4675 /product="valine--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861890.1" /transl_table=11 /codon_start=1 /translation="MENNLAKNYKPKDFEDRIYAMWEENGAFVPDENAPKDPYTVMMPP PNITGQLHMGHALDQSLQDVLIRYKRMQGHKTLWLPGTDHASIATEVKVVDKLREEEGK TKEEIGREAFLERAWAWKKQYGGRINEQIRRLGSSCDWNRERFTMDEGCNKAVKEHFIN LYNKGLIYKGARLINWCPVCGSALSDIEVEHVDHNGSYWYFRYPGADGSEGIVVATSRP ETMFADTAVAVHPSDERYKDMVGKKVILPLVGREIPVIADEYPDPEKGTGAVKITPSAD PNDFEVGLRHGLEMIECIDEKAKMTAAAGKYEGMDRYECRKAWVADLEAAGYLVKVEKM VIPAGECYRCHTVVEPRISEQWFVKMKPLAEPAIEAVRTGKTKFVPERFDKTYYHWMED IKDWCISRQLWWGHRIPAYYCEECGEMVVAKEEPSVCPKCGGTHFHQDEDVLDTWFSSA LWPFSTLGWPENTEDLKKYYPTSTLVTGYDIIFFWVARMIFSGVEVMKETPFEYVLIHG LVRDAQGRKMSKSLGNGIDPLEVIDTYGADALRFMLLSGISPGSDIRYQVEKVEGARNF ANKLWNASRFAIMNIKDEEGNFLPIASEEDAKLQAEDRWILQTINDALPEINQNMERFE FALAAQKIYELIWGEFCDWYIELIKPRLYGEDEADKASARYCLVKCLKSLLKLLHPFMP FITEEIWSFLPKDADAKQFLMLEGWPEYDASMNYAEDKAVLNLSMDIIRAIRGIRHEAE ALPSRKLHAVILAEADQEKLAKAGERYIKTLGNLEGLDFIASKEALPEETMSAALPGLE VYVPLDDLMDYEAEYARLTKEKERLTKEVARVTNQLANEKFVSRAPAHVIQAERDKLAG YQDMLEKTLARIPVVEKKLNK" /locus_tag="LOCUS_1280" /EC_number="6.1.1.9" /note="WP_011861890.1 valine--tRNA ligase (Clostridioides difficile) [pid:55.9%, q_cov:99.8%, s_cov:99.9%, Eval:0.0e+00]" /note="MGA_163" ORIGIN 1 ctctacgtaa aggaagtgct gcagcgccgc ttttcccttt cttcccggct catgcggaag 61 atcaaggtgt cggggcagat cgtcctggat gaccaaaagg cgcggctccg ggacaaggga 121 cgtcccgggc aggtccttac ggtttctttc cccgaggaaa gcagttactt cgaccccgag 181 aacatcccac tggacgtggt ctacgaggac gacgacctgc tcgtcgtaaa caagcagccg 241 ttcctcgtgg tgcatcccac gaagaattac cagagcggca cgctggccaa cgcgctggcc 301 taccgtctgc aggagcgggg cgaatcctgg aagatccgct tcatcaaccg gctggaccgc 361 gatacgtccg gtctggtgcg ggtggccaag aacggccatg cccaggatgc ggtgagcgcc 421 cagatggagc aggggaccac agaaaagaaa tacctggcgc tggtgcacgg cttgttcgaa 481 gaaacagaag gccgcatcga tgcgccgatc gataaggatc cggaccataa ggcacgccgc 541 atggtgcgcg aagacggcta cccgtcggtg accctctaca aggtcctgga cagctggaac 601 gtgccggatc tcggcccgga ttttacgccc tggcagggcg caaagcgcat cgacggctac 661 agcctggtgg aacttacgct gctgaccggc cgcacccatc agatccgggt gcacctcacg 721 catctcggtc accccatcgc gggagacgaa ctctatggac agctgttcgg ctacgaagcc 781 ggaacggatg tcttgaaccg ccaggcgctg catgcctaca gcctgcggct gaaacagcct 841 ctgacgggcg gacccataca tttgcaaaca ccgatgccgg acgacataaa ggcctgcatc 901 gaaaggatag aacactttga acacgaacaa taaaccttta agcgtactgc ggatcggcct 961 tatctacacg ggctgccttg tgggcgccgg atttgcttcc ggacgggaag cctggcagtt 1021 cttcggcgta ttcgggaaat ggggttatgc cggggtcatc gttgccacgc tgctgtatat 1081 cggcgtcgga ctgatgacgg tcgacatcgc ccaccgcaag aacacggccg atatctccgc 1141 tctcatcaat cccatagaca acaaagcgct gaatacattc gtcggcgtta tgatgtgctt 1201 ctttctgctt gtggcttacg tagctcttac ggcggcaggg ggagcactgc tggaaagcaa 1261 gacgggcctc agccacgccg ccggaagtct gctcatctgc ctgctgtgca tcatcaccgc 1321 actgggcggc ttctccagca tatccgataa ggcaggcaag atctctccgg tcctggtcgt 1381 cggcacactg gtgcttggca tctatctgat cgccacgcat acggatgcgg tatcgcacct 1441 ggaacctcac cggaccagca aggtggccag tcattggctc accgcggtca tcggctacgt 1501 gggctataac gcatcggcag ccgttcccgt tctgggacag tgcgccatgc actcggattc 1561 ccgcaaaaga agcgagaacg gggcgatcct gggaggcatc atcctgggca cctgcacgct 1621 cattctgttc ctgtcgacct cgacagatcc ggcgctgagc ggccagagca gctttccgat 1681 gatggatctc tgcgaacggg tgttccccgc gctgggcaag gtctacgccg tattgctgct 1741 gctggcgatc ttcatgaccc agacaacagt gttttacggg tttacgacga aactgggaaa 1801 ccgcaaaaac agcaaggcga tcgcctgggc tgtaggtctg gcgggctatg tctgctcgct 1861 gtacggctac tataatttcg tcgcaaacat cgtgcccatc gtcggctacg taagcctcgc 1921 gttcttcgga ctggagatca taaacctgat caaagtgaaa agaaaacaat cgttttaaca 1981 tacagagagg atagccatgg aaaacaatct cgctaaaaac tacaagccaa aggatttcga 2041 agaccgcatc tatgcgatgt gggaggaaaa cggcgccttt gttccggatg aaaacgcgcc 2101 taaggatcct tacaccgtca tgatgccgcc gcccaacatc acgggacagc tgcacatggg 2161 tcacgcgctg gaccagtccc tgcaggacgt cctcatccgt tacaagagga tgcagggcca 2221 caagacgctg tggctgccgg gtacggacca cgcctccatc gccacggaag tcaaagtcgt 2281 ggacaaactg agagaagaag agggcaagac caaggaagag atcggccgcg aggccttcct 2341 ggagagagcc tgggcatgga agaagcagta cggaggccgc atcaacgagc agatccgccg 2401 gctgggctct tcctgcgact ggaaccggga acggtttacc atggacgaag gctgcaacaa 2461 ggccgtaaag gaacacttca tcaacctgta caacaagggg ctcatctata agggcgcgcg 2521 cctcatcaac tggtgcccgg tctgcggttc cgccctgtcc gacatcgaag tcgaacacgt 2581 ggaccataac ggcagctact ggtacttccg ctatcccggt gcagacggca gcgaaggcat 2641 cgtcgtcgca acttcccgtc ccgagaccat gtttgcggat accgcagtag ccgtccatcc 2701 ctccgatgag cgctacaagg acatggtggg caagaaggtc atcctgcctc tcgtaggcag 2761 agagatcccc gtcatcgcgg acgaatatcc cgatccggaa aagggtaccg gcgccgttaa 2821 gatcacgccg tctgcggacc ccaacgactt cgaagtcggt ctgcgccacg gtctggagat 2881 gatcgagtgc atcgacgaaa aggcgaagat gaccgctgcc gccggcaaat acgagggcat 2941 ggaccgctac gagtgccgca aggcctgggt cgccgacctg gaggctgcag gctacctcgt 3001 caaggtggaa aagatggtga tccccgcagg ggaatgctac cgctgccata ccgtcgtgga 3061 accgcgcatc tccgaacagt ggttcgtcaa gatgaagccg ctggcggaac ccgccatcga 3121 agcggtccgc accggcaaga ccaagttcgt gcccgagcgt ttcgataaga cgtattatca 3181 ctggatggaa gacatcaagg actggtgcat ctcccgtcag ctctggtggg gtcaccggat 3241 cccggcctat tactgcgaag aatgcggcga gatggtcgtg gccaaggaag aaccctctgt 3301 ctgcccgaag tgcggcggca cgcattttca tcaggatgaa gacgtgctgg atacctggtt 3361 ctcctccgcg ctgtggccgt tctccacgct gggctggccc gaaaatacgg aggatctgaa 3421 gaagtactat cccaccagca ccctggtgac cggctacgac atcatcttct tctgggtcgc 3481 gagaatgatc ttctccggcg tggaagtcat gaaggaaacg cccttcgaat acgtgctcat 3541 ccacggtctg gtgcgcgacg cccagggccg caagatgtcc aagtctttgg gcaacggcat 3601 cgatcctctg gaagtcatcg acacctacgg cgccgacgcg ctgcggttta tgctgctgtc 3661 cggcatctcc ccgggaagcg acatccgcta ccaggtggag aaggtggaag gcgccagaaa 3721 cttcgccaat aagctctgga atgccagccg cttcgccatc atgaacatca aggacgaaga 3781 aggaaacttc ctgcccatcg cttctgaaga agatgccaag ctgcaggcgg aggatagatg 3841 gatcctgcag accatcaacg acgcgctgcc cgagatcaac cagaacatgg aacgcttcga 3901 gttcgcgctg gccgcccaga agatctacga gctcatctgg ggcgagttct gcgactggta 3961 catcgaactc atcaagccca gactgtacgg cgaagacgaa gcggataagg caagcgcccg 4021 ttactgcctc gtcaagtgcc tcaagagcct gctcaagctg ctgcacccgt tcatgccgtt 4081 cattacggaa gagatctgga gcttcctgcc caaggatgca gacgcaaagc agttcctgat 4141 gctggaaggc tggcccgaat atgatgcttc catgaactac gccgaagaca aggctgtctt 4201 aaacctgtcc atggacatca tccgcgccat ccgcggcatc cgccacgaag cggaagcgct 4261 gccctccaga aagctgcatg cggtcatcct ggcggaagcc gatcaggaga agctggcaaa 4321 ggccggtgaa cgctacatca agaccctggg caacctggaa ggtctggact ttatcgcttc 4381 caaggaagcg ctgcccgaag agaccatgtc cgcggcgctg cccggtctgg aagtctatgt 4441 accgctggac gatctgatgg attacgaggc ggaatacgca cgtctgacga aggagaagga 4501 gagactcacg aaggaagttg cgcgggtcac caaccagctg gccaacgaga agttcgtctc 4561 cagagcgcct gctcacgtca tccaggcgga gcgcgacaag ctggcaggct accaggatat 4621 gctggaaaag acgctggcga gaattcccgt cgtggagaag aaactgaaca aatagcgata 4681 acgaggaccg tcttcgggcg gtcctttttt gcaggaagag gaaaacagca atgatcgcag 4741 atctgaaaaa atacgatcag aagtacgttc tgatcaagga tatctatggg gagactcata 4801 ccggtcttgc gcgctatgaa aacgccgact ttttggagtg cgaatggggc ggcgaaggag 4861 atggtctgtt tatcgaggac ttcctgatct acaacgatca gatcgcttcc atcgaagaga 4921 cggtcgtgca cggcacggcg gagttatgga cggagcagct catcctgcgc aaagcccgtc 4981 cggaggatgc agaggaactg catcactatc tgggacggga tccggaattc tcgcgctatt 5041 ccggatggaa cccgtacgcg accctggaaa tggcacagga gacggtgcgc aggtttatcg 5101 aaggctatgg ggaagaacat ttctattcct ggatcatgga tgtagatgat gtcgtggtgg 5161 gaacggtcgg cgcctacgac tatgcggacg gcaggatcga ggtgggtgta agcgtcgtaa 5221 agggctggca gggccgtggt tttgcgaccg aggcgctgcg taaggtgctg gtctacctga 5281 cggaaaacga aggcatcccc tgtgtaacgg cctggtgcgc ggcagacaat acaggatcgc 5341 gccgtgcgat ggaaaaggcc ggcatgcagc tcgtcc // LOCUS sequence025 5250 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence025 VERSION sequence025 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5250 /mol_type="genomic DNA" /organism="" /note="sequence025" misc_feature <1..888 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011391759.1:polysaccharide pyruvyl transferase CsaB" /note="WP_011391759.1 polysaccharide pyruvyl transferase CsaB (Moorella thermoacetica) [pid:33.2%, q_cov:88.5%, s_cov:71.0%, Eval:1.3e-34, partial hit]" /note="MGA_165" /locus_tag="LOCUS_1290" CDS 885..2039 /product="glycosyltransferase family 1 protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011038780.1" /transl_table=11 /codon_start=1 /translation="MRKILCLSTSNYYPFPTRKQNIMNRMTDCTILYVDPPVTLIAPLK DPKARERLSLYKEGPKQALPNLKVYAQPPVLPFFNKRRDINERNQKKLAKYLAKILREN DFGDDFWIWCYSPTSCDVIAPLAKEMGLEPASLWKRTVYDCVDRHSAYPGHIDPKVVDE MEEDLARSCGCVFATAQGLYERLKAFNENTHLIPNGCAFELFHTAADMEKEGISPHFGF VGMLQECLDYDCIRAVAEAFPDGKVTLIGRTLPGVDMTWTDNYPNVEMKGLVPQRELPG YIKDFDVCLNVFADNDLSRDVSPLKFYEYLATGKPVVSTLVPLQVLDYVDCIYLAETPD EFVTRCREALEEGPDSPKRTERIEAARRNSWDEKVAEMKEILAW" /locus_tag="LOCUS_1300" /note="WP_011038780.1 glycosyltransferase family 1 protein (Xanthomonas campestris) [pid:28.6%, q_cov:99.2%, s_cov:91.4%, Eval:8.5e-27]" /note="MGA_166" CDS 2070..2603 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKIINEKGKLFGLINVVDLIVLLLVIAVIGVLATKLLGNRVTEAV VQKVDCYAQVRIIGAHPTLVEEVQRQNLVGQRMVAGSVYIDGTIEDVWLEDYKVQVQTD DGRIVTATDPDKKDIIFAIKFPIAKDTPNPKLGSQEVRAGRTLIVKTQTFETSGTIRYV QIGEYDPPEAFQKP" /locus_tag="LOCUS_1310" /note="MGA_167" CDS 2610..4247 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTEIVKNSLVIRFIVCVYEGLRRFWRSSLLGRGWKGWHESWLQSN TKVHWENWCGMDDPAEHSVYAKFLRTLEKLLQKVGEWLRCSLFYRIVIAVRDWYFRISE GSRILSAVNRVPLRRWLFVAFALYLPIEYALRDVLQISILASVWEEVFLMAGVALVLWR TMLKQSDGFRRATALETALLLYMAVGLLLMMLNRPFPGIAWAGYRAQVEYILWFFILLR LIDDEQDAKTLLFGFAAVVLVLALHGIYQYIAAVPIPDSWVTKTEAGVRTRVFSLTGSP NIFGSLLLMAAPTAAAGIYYFKNGWMKFLSLCATGVICLSILFTFSRGSWVGLIVAIVL FSLFMDKRLIGLMGIAMAGVVALVPSITSRLTYLMTPEYKVASEVGGRALRWETGRALL HENSPWLGFGLGRFGGAVAMNNQVLDKTDEFEYFYMDNYYLKTLVEMGYLGIIFYIVAL IAFAVMALRAIHACNQGRAYGLADDALTRNDGNLKCLAAGLFAGMAGVLVHCYFENIFE EPYMMAYFWGLAACLQRLGAVSKERSRT" /locus_tag="LOCUS_1320" /note="WP_015158974.1 IctB family putative bicarbonate transporter (Chamaesiphon minutus) [pid:23.8%, q_cov:48.4%, s_cov:57.5%, Eval:4.9e-13, partial hit]" /note="MGA_168" ORIGIN 1 aagaccagcc tgttcgtgtc cggcggcggc acgctcatcc aggacgttac gtcctcgcgg 61 tcgctgtatt tctacctgtt tacactgctg gcggcgaaac tgtccggcag caaggtcgtc 121 atgtacggct gcggcatcgg ccccatccac ggcaatgcca accgcagata tacgggccgg 181 gtgctcaaca aggcggcgga catcatcacg ctgcgcgatt ccatctccat gcagctgctg 241 caggatatcg gggtcacgaa accggagatc atcctgtcag cggacccgac ggtcaatctg 301 cctgcggtta gccgcgatgt ggtggaggag gcgttccgtc tggacgatat ccccgccggt 361 acgcccaaga tcgccttctg cctgcgcagc tgggacgaat tcacgaatta cgaagcggtc 421 gcaaaggcgg cggaccacgc ctgggagaag cacggcttac ttcccgtatt cctgcccatg 481 gaatacccga gagacgtggc gatcggcgaa aagatcggcg gcatggtctc cgtgccccac 541 gcggtctgca gcaggcggca cagcgtcgaa gagctgcggg gcatgctctc ctccatggaa 601 gtcgtatgcg gcatgcgtct gcactctctc atcttcgctt cggcaggcgg tacgcccatc 661 gtgggcatct cctacgacgt taaggtggac agctttatcc gggacagcgg cgccaaacgc 721 tgcatccagc tgaaggatct gtcggaggaa cagcttaccg cctatatcga cgaagcggtc 781 gcaggcggca gaagccacgg caacgaaacg aaactgcgtc tgcaggcaat ggaactcaaa 841 aacggtgagg cagcggagaa actcctcacc ggaaaggcgg catcatgaga aagatcctct 901 gtctttcgac ttcgaactat tatccgtttc ccacgcggaa acagaacatc atgaaccgga 961 tgacggactg caccatcctg tacgtcgatc cgccggtcac ccttatcgct cccctcaagg 1021 acccgaaagc cagggaacgg ctttccctgt ataaagaagg gcccaagcag gctctgccga 1081 acctgaaggt ctacgcccag cctccggtgc tgccgttctt caacaagcgc cgggacatca 1141 acgagcgcaa tcagaagaaa ctggcgaagt atctggcgaa gatcctgcgc gaaaacgatt 1201 tcggcgacga tttctggatc tggtgctaca gtcccaccag ctgcgatgtc atcgccccgc 1261 tggcaaaaga gatgggcttg gaacctgcct cgttatggaa acgcacggtg tacgactgcg 1321 tggaccggca ctccgcttat ccgggtcaca tcgatccgaa agtggtcgat gaaatggagg 1381 aagacctggc caggagctgc ggctgcgtct tcgcgacggc acagggcctg tatgagcggc 1441 tgaaggcgtt caacgagaat actcacctca tccccaacgg ctgcgccttc gaactgtttc 1501 acacggctgc ggacatggag aaggagggca tttcgcctca cttcggtttc gtcggcatgc 1561 tgcaggaatg cctggactac gactgtatcc gggcggtagc cgaggcgttc ccggacggaa 1621 aggtgaccct cataggccgc acgctgccgg gcgtcgacat gacctggacg gataactacc 1681 ccaacgtgga gatgaagggc ctcgttcccc agcgggaact gcccgggtat atcaaggatt 1741 tcgacgtttg cctcaacgta tttgcggata acgacctgtc ccgggacgta agtccgctga 1801 agttctacga atatctcgcc accggaaagc ccgtggtgag caccctcgtg ccgctgcagg 1861 tgctggatta cgtagactgc atctatctgg cggagacgcc ggatgaattc gtgacgcgct 1921 gccgggaagc tctggaagaa gggccggaca gccccaaacg gacggagcgc atcgaagccg 1981 cccgccgcaa ttcctgggac gaaaaagtgg cggaaatgaa ggagatcctg gcctggtaag 2041 gcctcaatcg aaacataaag gagaaagtga tgaagatcat caacgaaaaa ggaaagctgt 2101 tcgggctcat caacgtcgtg gacctcatcg tgctgctgct ggtcatcgct gtcatcggcg 2161 tgctggcgac aaagctgctg ggcaaccgcg taacggaagc cgtcgtgcag aaagtggact 2221 gctacgccca ggtgcgcatc atcggcgccc atcccaccct ggtggaggaa gtgcagcgcc 2281 agaatctggt cggccagcgc atggtggcgg gcagcgtcta catcgacggg acgatcgagg 2341 acgtctggct ggaggactat aaggtccagg tgcagacgga cgacggccgc atcgtgaccg 2401 ccacagaccc cgacaagaag gacatcatct ttgcgatcaa gttccccatc gccaaggaca 2461 cgccgaaccc caagctgggc agccaggaag tccgcgcggg cagaacgctc atcgtaaaga 2521 cccagacctt cgagaccagc ggcaccatcc gctacgtgca gatcggcgaa tacgatcccc 2581 ccgaggcgtt ccagaagccc tgatgaccta tgactgagat cgtaaaaaac agtctcgtca 2641 tccgcttcat cgtctgcgtt tacgagggat tgcggcgctt ctggcgcagc agtctgctgg 2701 gcagaggatg gaaaggctgg cacgagagct ggttacaatc gaatacgaaa gtccattggg 2761 agaactggtg cggcatggat gaccctgcgg aacattccgt gtacgcgaag ttcctgcgca 2821 ccctggagaa actgctgcag aaggtggggg aatggctgcg ctgcagcctg ttctaccgca 2881 tcgtcattgc tgtgcgggat tggtatttcc gcatcagcga aggcagccgc attttgtcgg 2941 cggtcaaccg ggtgcccctg cgccgctggt tgttcgtggc cttcgccctg tatcttccca 3001 tcgaatacgc gctgcgggat gtgctgcaga tcagcatcct ggcgtcggtc tgggaggaag 3061 tgttcctgat ggccggcgtc gccctggtgc tttggcggac aatgctgaaa cagtcagacg 3121 gattccggcg ggctacagcc ctggaaaccg cgcttctgct ctacatggcc gtcggactgc 3181 tgctgatgat gctcaaccgg ccgttccccg gcatcgcctg ggcgggatac cgggcccagg 3241 tggaatacat cctctggttc ttcatcctgc tgcggctgat cgacgatgag caggacgcga 3301 agacgctgct cttcggcttt gccgccgtcg tgcttgtgct ggcgctgcac ggcatctatc 3361 agtatatcgc cgccgtgccc attccggatt cctgggtcac taagaccgag gccggcgtgc 3421 gcacccgggt cttctccctg acgggaagcc ccaacatctt cggatcgctg ctgctgatgg 3481 cggctcccac cgctgcggca ggcatctact atttcaagaa tggatggatg aagttcctgt 3541 cgctgtgcgc gacgggcgtc atctgcctgt ccattctctt tacgttttcc cggggctcct 3601 gggtcggact catcgtcgcg atcgtgctgt tctccctgtt tatggacaag cgcctcatcg 3661 ggctgatggg gatcgccatg gccggggtgg tggcgctggt gccgtccatc acgagtcgcc 3721 ttacctatct gatgaccccg gaatacaagg tcgcctcgga agtgggcggc agagccctcc 3781 gctgggagac cgggcgggcg ctgctccacg agaattcccc ctggctgggc ttcggcctgg 3841 gccgtttcgg cggtgccgtc gccatgaaca accaggtgct ggacaagacc gacgagttcg 3901 aatactttta catggacaat tattacctca aaacccttgt ggaaatgggg tatttgggca 3961 taatattcta tatagtcgct ctgatcgctt ttgcggtcat ggcgctccgg gccatccatg 4021 cctgcaatca gggcagagcg tacggcctgg cggacgatgc gctcacgcgc aatgacggca 4081 atctgaagtg cctggcagca ggcctgtttg ccggcatggc gggcgtcctc gtccactgct 4141 attttgaaaa tatcttcgaa gagccataca tgatggctta tttctggggc ctcgccgcct 4201 gtctgcagcg gctgggcgcc gtcagcaagg aaaggagcag aacgtgaagg tttgcgttat 4261 cgggctcggc tacatcggcc tgcccaccgc cgccatgttt gccaacgcag gacacgaggt 4321 cctgggcgta gataaaaagc ctcagatcgt ggaggcgctc aacagaggag agatcatcat 4381 cgaggagaac ggcctggcgg aattcatcaa ggccgtcgtg gacaaggggc atctgcgtgc 4441 cgcgcttgac cccgagacaa gcgatgccta catcatctcc gtccccacgc ccatcacgga 4501 ggacaagaag gcggatatgc gctttgtgga aagcgccacc cgcagcgtcg ttcctctgct 4561 gaagaagggc gatctcgtca tcctggaatc cacgtccccc gtgggcaccg tggacagcct 4621 gatgctgccc atcctggagg agagcggctt aaaggcggga agggacttcg gtctggggca 4681 ttcccctgag cgggtcatcc ccggcaagat cctgtacgag ttggtgcaca actcccgcat 4741 cgccggcggc atcgataagg aatctgccca tcgcatcgca gaactgtaca agagcttcgt 4801 ggagggcgag atctacgaga ccgacgcccg caccgcggag atgtgcaaat tgtccgagaa 4861 tacgttccgg gacgtcaaca tcgctttcgc caacgagctg gcgaagatct gcgaagatca 4921 gggcataaac gtctgggaac tcatcgagat ctgcaacaag catccgagag tcaacatcca 4981 ccagcccggc cccggcgtgg gcggccactg catcgcagtc gatccctggt ttatcgtgga 5041 gaaagagccg ggtctggcgc agatcatccg caaatcccgg gagaccaacg attccatgcc 5101 cggctacgtc gcaaagcggg cggaggagat cctgacaggt gtggcggatc cgaagatctg 5161 catcctcggc gccacctata aacccgacgt ggacgacatg cgcgaaagcc ccatcctgca 5221 cctggtggac gagctccggg cgaagggcat // LOCUS sequence026 5223 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence026 VERSION sequence026 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5223 /mol_type="genomic DNA" /organism="" /note="sequence026" CDS complement(974..2620) /product="endonuclease MutS2" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011015882.1" /transl_table=11 /codon_start=1 /translation="MSTAYKPPLSKTATRQVVGFAYVWDEIGPHTPYGAKLKRDFKPYM PGDEDDLRGHLQDMALLADQICADEKTVSAVLNDLCELKEIGLSVSNSAAQTLSVPELF NIKSFLVHTRKIRLLMHEKMGKAPKRYALRDTTELLDIMDPTGEYMDTFFVYDAFSETL AAYRSESRDIEREIRRAKKGIREQLQREHHFMMTPKFELSVPRSDKALLELAESLPELE RTSEDYMNVIFEIKPNDEIFAIEQRQRELNGLIEEEEQVVCRQLSLQIAEHAEELTANC GAIGRMDLDMAKCLYAKSHDCTAPVVCQEHTIHIEDGRNLQVEDALKAQRRSYIPVSID LADGVTAITGANMGGKTISLKMVTQCCLLMQYAMYVPAKRMEAGLSNYIHVLIGDSQNV QRGLSSFGSEMEELKEMLDNAQDRSLLMIDEIASGTNPAEGFALTKSFMKYFSTKPYIT IITTHFDHAASGEEVHNLQVRGLSGADFGKLARELSTANRRQRIEILGKYMDYRLIPVD TVGEVPRDALNIAKILGIYDEIIDEARTYLI" /locus_tag="LOCUS_1330" /note="WP_011015882.1 endonuclease MutS2 (Fusobacterium nucleatum) [pid:29.3%, q_cov:95.3%, s_cov:95.1%, Eval:1.3e-53]" /note="MGA_171" CDS complement(2617..3654) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGFIADIQKKYKTVSIVGMAKNAGKTTALNYLLEEAYDEGLRMGV TSTGRDGETSDLVFETDKPKVYLFEDTIVTVPEQLFGLAETSLEILKRTSCRTALGQVL LCRVARSGYVQIAGPGSIMEHKKLCAQMFEQGIDMIIIDGAIDRKSIADPATSDAIILS TGAVISRRIKNVVEETVHVVSVYKSPLVEDEKLRAILEKEDRDVFRILTIDKDYNVAQV PVRTALGAGPIVNDAIGEDTRFVYIPGAITERILDHISPAKLKQVTIVLPNPTKVFVGA TRWQQLRKMGLHVQVLENIEVAAVTVNPFSPHGYSFDRDELLNAVKEALPGLPVVDVRV GGLDL" /locus_tag="LOCUS_1340" /note="MGA_172" CDS complement(3739..4995) /product="lysine 2,3-aminomutase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005902971.1" /transl_table=11 /codon_start=1 /translation="MARYFKDIELWKDVTEEQWNDWHWQVANRVTTVEDLKKVVNLTEQ EEADIREVAKNFRMGITPYYASLMDPDDPRCPVRMQAVPVIAENHRSDADMLDPLHEDE DSPAPGLTHRYPDRVLFLITDQCSMYCRHCTRRRLAGETDGARSLEDIDKCIEYIRKTP VVRDVLLSGGDALLVEDDVLEYIIKKLREIPHVEIVRIGSRTPVVCPMRITEDLCNMLK KYHPIWLNTHFNNPKEITEYSKKACARLADAGIPLGNQSVLLRGVNDCPHIMRELVQKL VQMRVRPYYIYQCDLSLGIEHFRTPVSAGIEIIEALRGHTSGYAVPTFVIDAPGGGGKT PVMPQYVISQSPGKYVLRNYEGVITTYTEPTNLPKLPCTCDYCTGKKKYEYEGVEGLHR GQRLAMEPQDLLRHRRNKK" /locus_tag="LOCUS_1350" /gene="ablA" /EC_number="5.4.3.2" /note="WP_005902971.1 lysine 2,3-aminomutase (Fusobacterium nucleatum) [pid:69.5%, q_cov:98.1%, s_cov:96.2%, Eval:1.5e-168]" /note="MGA_173" ORIGIN 1 cttcgatggc atcgtcggtc gtcaggtagt tatcttcgcc ggagttgaag ataatgccgc 61 agtagccgat gatgactctg gagaagaact ggtctacaat ggttctctgc atgttgatgt 121 cgcggaacag aatgccgtac agggcgtcgt tgagcatgac gtccagacgt tccagagcac 181 ccatggctgc gatctcgggc atgcacagac cggaggagta gttgcacagg cggatgtatc 241 tgccgatgtc ttcgccgact ctgtccagtc tctctctcat gatgcggaag ttttcctggg 301 ttgcataggt accgccgaaa ccttcggtgg tggcgccgta gggaacgtag tccagcaggg 361 actgtgcagt cgttctgatt acggcgatga tatctgcgcc ctggcgggct gcagcttctg 421 cctggttgac gtcttcgtag atgttgccgg tcgcaacgat gacatacaga tacggcttct 481 ttccttcgcc aatcgtcgcc aggtattctt ctctcttagc cgtctgcttg cggatctttg 541 caagtgcttc ttctacgtac ggctcgatgg ccttgcgggc ctcctccatg gaaacgggtt 601 ctaatttcat cagatccagc tgacccagag aaactgcctc ggcaatttcc tggggcgtct 661 tgcccgtttt aatgatcgcg ttgcccatcc agtaggcaat gcccttcgga agaccgccgc 721 cgtccttgat cgcgtctaca agaacattgg gaagaggtct ttcgacgtcg tccacgccgt 781 ctacgcccag aagtctcaga acggttcttt cggtagagac ggtagtgtgc gcgttgatga 841 actcctgcat gctttctgcg atgttcttag catggtttct tgcgctcgcg atgacgtttt 901 ggtccaaatt cagtttgctt gtcatcctta ttctccttca atatgttaaa taattaacta 961 tgcaaccaac gtattatatc aaataagtac gggcctcgtc tataatttca tcgtaaattc 1021 ccagtatttt tgcgatattt aaggcgtccc gaggcacttc tcccacggta tctacgggaa 1081 tcagacgata atccatgtat tttcccagga tctcgatgcg ctgccggcgg ttcgcagtgg 1141 atagttctct cgccagcttt ccgaaatcgg cgccggacag gcccctcacc tgcagattgt 1201 gcacttcttc gccggaggcg gcgtggtcga agtgcgtcgt aatgatggtg atatagggct 1261 tcgtcgaaaa atacttcata aagctcttcg taagagcgaa cccttccgcc ggattcgtgc 1321 cggaggcgat ctcgtcgatc atcagaagcg agcggtcctg ggcgttgtcc agcatctcct 1381 tcagttcctc catctcgctg ccgaaactgg agaggccccg ctgcacgttc tgggaatcgc 1441 cgatcagcac gtggatgtag ttggaaagcc ccgcttccat gcgcttcgca ggcacgtaca 1501 tcgcgtactg catcagcagg cagcactggg tgaccatctt caagctgatg gtcttgccgc 1561 ccatgttggc gccggtaatg gcggtgaccc cgtcagcgag gtcgatgctt acggggatgt 1621 agctgcggcg ctgcgctttg agggcatctt ccacctgaag atttctgccg tcttcgatat 1681 ggatcgtatg ctcctggcag acgacgggcg ccgtgcagtc gtggcttttg gcgtacaggc 1741 acttcgccat gtccagatcc atgcggccga tggcaccgca gttggcggtc agttcttcgg 1801 catgctctgc gatctgcagg gacagctgcc ggcagacgac ctgctcctcc tcttcgatga 1861 gcccgttcag ctctctctgc cgctgttcga tggcgaagat ctcgtcgttt ggtttgatct 1921 cgaagatgac gttcatgtaa tcttcgctgg tgcgctccag ctcgggcagg ctttccgcca 1981 gctccagcag cgccttgtcg gaccggggca cggacagctc gaatttcggg gtcatcataa 2041 aatgatgctc gcgctgcagc tgctcgcgga tacccttctt cgcccgtctt atctcccgtt 2101 cgatgtcgcg gctctcgctg cggtaggcgg ccaacgtttc ggaaaacgca tcgtacacga 2161 agaacgtgtc catgtattcg ccggtgggat ccatgatgtc cagcagctcc gtcgtgtctc 2221 tgagggcgta gcgcttcggc gccttgccca tcttttcgtg catcagcaga cgaatcttgc 2281 gggtgtgcac gaggaagctc ttgatgttga agagctcggg cacgctgagg gtctgagccg 2341 cgctgttgga aacagacaga ccgatctcct tcagctcgca cagatcgttc agcacggcgc 2401 ttacggtctt ttcgtccgcg cagatctggt cggccagcag tgccatatcc tgcaggtgac 2461 cccgcagatc gtcctcgtct ccgggcatgt agggtttaaa gtcccgtttc agcttggcac 2521 cgtagggcgt atggggcccg atctcgtccc agacgtaggc aaatcctacg acctggcggg 2581 tcgcggtctt ggaaagaggc ggtttatagg cagtgctcac agatccagtc ctcctactct 2641 tacgtccacg acgggaaggc cgggcagggc ttccttgacg gcgttcagca gctcgtcgcg 2701 gtcaaagctg tagccgtggg gcgagaacgg gttgaccgtt acagcggcca cctcgatgtt 2761 ctccagcacc tgcacgtgca gtcccatttt tctcagctgc tgccagcgcg tagcgcccac 2821 gaagaccttc gtcgggttgg gcagaacgat ggtcacctgc ttgagcttgg cagggctgat 2881 atggtccagg atacgttcgg tgatggcacc cggaatatac acgaaacggg tgtcttcgcc 2941 gatggcatcg tttacgatag gacctgcgcc cagcgcggtg cggaccggca cctgggcaac 3001 gttatagtct ttatcgatcg tcaggatgcg gaagacgtcc cggtcttcct tttccaggat 3061 ggcgcgcagc ttttcgtcct ctacgagggg gctcttgtag acgctcacca cgtggacggt 3121 ctcctccacc acgttcttga tccggcggga aatgaccgcg ccggtggaca ggatgatggc 3181 atcggaggtg gcggggtccg cgatggattt gcggtcgatg gcgccgtcga tgatgatcat 3241 gtcgataccc tgttcgaaca tctgggcgca cagtttcttg tgctccatga tgctgcccgg 3301 acccgcgatc tgcacgtaac cgcttctggc gacccggcac aggagcacct ggcccagcgc 3361 cgtgcggcag ctcgtgcgtt tgaggatctc gaggctcgtc tccgcaaggc cgaacagctg 3421 ctcgggaacg gtgacgatgg tgtcttcgaa cagatagacc ttcggcttat ccgtttcgaa 3481 caccaggtcg ctcgtctcgc cgtcgcggcc tgtggaggtc acccccatgc gcaggccttc 3541 gtcgtaagct tcttcgagaa gatagttgag cgccgtcgtc tttccggcat ttttggccat 3601 gccgacgatg gaaacggtct tgtatttttt ctggatatcg gcgataaagc ccataaaaac 3661 tcctgatact tattggaaaa caaagggcgg aaatgatttc cgccctctgc tggatagttg 3721 ttgctgaaaa cgcaggaact acttcttgtt tcttctgtgt ctgagcagat cctggggttc 3781 catagccagt ctctggcctc tgtggagacc ttcgacgcct tcgtattcgt acttcttctt 3841 gccggtgcag tagtcgcagg tgcaaggcag cttcggcaga ttggtcggct cggtgtaagt 3901 cgtgataacg ccttcgtagt tgcgcagaac gtactttccg gggctctggg agataacgta 3961 ctggggcatg acaggagtct tgccgccacc gcccggggcg tcgataacga acgtcggaac 4021 agcgtagccg gaagtgtggc cgcgcagagc ttcgatgatc tcgatacctg cggaaacggg 4081 ggttctgaag tgttcgatgc ccagggacag gtcgcactga tagatgtagt acggtctgac 4141 tctcatctgg accagcttct ggaccagttc tctcatgatg tgcgggcagt cgttgacgcc 4201 gcgcagcagt acggactggt taccgagggg gataccggcg tcagcaagtc ttgcgcaagc 4261 cttcttggag tactcggtga tctccttggg gttgttgaag tgggtgttca gccagatggg 4321 gtgatacttc ttcagcatgt tgcacagatc ttccgtaata cgcatcgggc atacgacggg 4381 agttctggag ccgatacgga cgatctccac gtgggggatc tctctcagct tcttgatgat 4441 gtattcgagg acgtcatctt ccaccagaag agcgtcgccg ccggagagca gaacgtctct 4501 gacaacgggg gtctttctga tgtactcgat gcacttatcg atatcttcca gggaacgggc 4561 gccgtccgtt tcgccagcca gtcttcttct ggtgcagtgt ctgcagtaca tggagcactg 4621 gtcggtgatc aggaacagaa ctctgtccgg atatctgtgg gtgaggccgg gagccgggga 4681 gtcttcatct tcgtgaagcg ggtccagcat gtccgcatcg cttctgtggt tctcagcgat 4741 aacgggaaca gcctgcattc tgaccgggca acggggatcg tccggatcca tcagggaagc 4801 atagtacggg gtgatgccca tacggaagtt cttagcgact tcgcggatgt ctgcttcttc 4861 ctgttcggtg aggttaacta ccttcttcag gtcttcaacc gtggtaactc tgttcgctac 4921 ctgccaatgc cagtcgttcc actgctcttc ggtaacgtcc ttccacagtt cgatgtcctt 4981 gaaatagcgt gccataaata atttctcctt attctatgcg cgtttgctat acggaattat 5041 gcgtacattt cttcgaacag cttgcggatg ccttcgtgtt ctctcaggac ctgcagcgtg 5101 atctcagcgt gacccttagc atagccgttg cccatgatca tggtgacgtc cttgcctacg 5161 ccttcagcgc ccagggcagc cttggtgaag ctggtcgcca tggagaagaa gtaaacggtg 5221 ccc // LOCUS sequence027 5214 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence027 VERSION sequence027 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5214 /mol_type="genomic DNA" /organism="" /note="sequence027" CDS complement(616..1602) /product="2-C-methyl-D-erythritol 4-phosphate cytidylyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012546162.1" /transl_table=11 /codon_start=1 /translation="MDAFSVVAAAVPAEDMAYCRDLFDRYGLPGVALTAGGATRQESVY NALKSLPQDVDAVLVHDAARPFVDEGVIRGVLDALETASAAVPCVHPKSTIRTQSETLD RNALYEVQTPQGFDRKLLEEAFRYAQETGFSGTDEAGVFEHYGKGGPVRITEGSYANYK ITTPEDLPVNIRTGNGYDVHRLVPGRKLMLGCCEIPYEKGLLGHSDADVVAHAIADALL GAAALGDIGRHFPDSDPAYEGMSGTEILQRTAEILKQNGFAIGNVDATLVAQKPKIAPY AQTMMENTAKALDVPVSAVSIKATTEEGLGFTGDGSAMACLATATVK" /locus_tag="LOCUS_1360" /gene="ispD" /EC_number="2.7.7.60" /note="WP_012546162.1 2-C-methyl-D-erythritol 4-phosphate cytidylyltransferase (Thermodesulfovibrio) [pid:42.7%, q_cov:89.0%, s_cov:79.6%, Eval:1.8e-56]" /note="MGA_176" CDS complement(1747..2859) /product="PIN/TRAM domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860623.1" /transl_table=11 /codon_start=1 /translation="MLNKVFRIVVCLSGALVGYGITTFSARPEILGDAWGMTPGQKVLW ICTGTAFFAFIFDFLFGFFRKRGEKIMETVDSRLKKVPATEIAASSIGLVVGFVIAFLI SQIINEIQILRAMNLNVVISLALYLFFGAVGVTVGRRLNSDLGKPLFSSITSKEPTAKS KAKNAGASPKILDTSVIIDGRIADILKTGFIEGNIIIPDFVLVELRHIADSSDSLKRNR GRRGLDILNRIQSDYGIEIYDTTAEKSLEEIPEVDVKLLKLAQIMKGMVVTNDFNLNKV ATITGIGVLNINELANTLKPVVLPGEEMQVFLVKEGKENNQGVGYLDDGTMIVVEDGKK FIGQTINVAVTSVLQTSAGRMIFVKPAPIL" /locus_tag="LOCUS_1370" /note="WP_011860623.1 PIN/TRAM domain-containing protein (Clostridioides difficile) [pid:50.8%, q_cov:98.9%, s_cov:99.5%, Eval:1.8e-87]" /note="MGA_177" CDS complement(2929..3402) /product="CarD family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005810219.1" /transl_table=11 /codon_start=1 /translation="MFSIGDKVVYPMHGAGTIQNIEEKEVLGETRAYYILRIPYGNLQV MVPVKGSDAAGLRPIVSEEEVSGVLDVLAAESTPMDENWNRRYRENMDKLRSGDPAKVA EVIRNLMRVERAKRLSTGEKKLLANARQILASEIVLVRGVAEKDAMDMIDSAV" /locus_tag="LOCUS_1380" /note="WP_005810219.1 CarD family transcriptional regulator (Desulfitobacterium) [pid:53.6%, q_cov:97.5%, s_cov:96.8%, Eval:3.6e-41]" /note="MGA_178" CDS complement(3441..4850) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRFRLTAYFIIFALILMGMLWFFQTVFLEQYYESEMEKKIQTAVS SLSLQYSVSETLDLESYLQEIGTISNANDMYFFIEAEDESFNISSTDQGSAGRYYYGRS GVDLARERLLANNGEPVTFKISNQTGEVVTQVYAAKVDSQYRPNVRFYAFAPLTPMGPA VGILAKQLLTVTAISLVVAGILALYISSRIARPITGITKQAAELAEGHYDVEFEGSSYR EINDLAGTLNTTAEALSKTDQLQRDLMANVSHDLRTPITMVRSYAEMIRDLSGDNPEKR NEHLGVIIEESDRLNTLVNDILTLSRIQAGVETMKMEPVDLQKCAESILATYRVLEEQE GFTISLETLDEPVLVNADEHRMQQVLSNLISNAVRYSGDRKEVTVAFSRKKKMLRCEVR DKGIGIAPEDIENIWNRYERASSRGHRSKGGTGLGLSITKEILERHDAKYGVESTLGEG SIFWFELPAID" /locus_tag="LOCUS_1390" /note="WP_015261871.1 HAMP domain-containing sensor histidine kinase (Desulfitobacterium dichloroeliminans) [pid:33.8%, q_cov:62.3%, s_cov:61.3%, Eval:2.1e-46, partial hit]" /note="MGA_179" ORIGIN 1 cggtatccgc ctccacgggc ctgtacttta tgccgcagcg gtcgaacaca ttgcagtaag 61 cgtcgtagtt cagctgatag gacttgtcca ggccttccgt atcccggtcg aagctgtagt 121 tatccttcat gacgaactcg cggctgcgga tgagcccgaa acggggacgc gcttcgtctc 181 tgtatttgtt ctggatctga tacagctgca ccggaagctg gcggtaggac gtgatgttct 241 ggcgggcgat gtccgtaaag acctcctcgt gagtgggtcc cagacagaac tctctgccgt 301 cgcggttctt gatgcgccac agctcgggtc cgtaggccgt ccagcggccg gattcctgcc 361 acagttcggc gggttccaga atgctgggct tgatctcctg ggcgccgatg gcgtccatct 421 cttcgcgcac gatgttctcg atcttgcgca gcgtgcgggc gccgaggggc agataggcgt 481 aaacgcctgc cacctgtttg cggatgaatc cggcgcgcag cagcaggata tggctggcga 541 tctccgcttc cgcgggaact tcccgcagcg tatacagata catgttcgat gctctcataa 601 gggtgtattt cctttctatt tgacagtcgc ggtcgccagg cacgccatgg cgctgccgtc 661 gccggtaaag cccagacctt cttcggtcgt ggctttgatg gacacggcag agacgggcac 721 gtctaacgct ttcgcggtgt tttccatcat ggtctgcgcg tagggcgcga tcttcggctt 781 ctgcgcgacg agcgtggcat ccacgttgcc gatggcgaag ccgttttgtt ttaagatctc 841 tgcggtcctt tgcaggatct cggttccgga catcccctca taagcggggt cgctatccgg 901 gaaatgccgg ccgatgtcgc ctagggctgc ggcgcctagc aaggcgtcgg cgatggcgtg 961 ggcgaccacg tccgcgtcgc tgtgacccag caaacccttc tcgtaaggga tctcgcagca 1021 gcccagcatg agttttcttc cggggacgag ccggtgtacg tcgtagccgt ttcctgtgcg 1081 gatgttcacg ggcagatcct ccggagtcgt gatcttatag ttcgcgtaag agccttcggt 1141 gatccggaca ggcccgcctt tgccgtagtg ttcgaagacg cccgcttcgt ccgtaccgga 1201 gaacccggtc tcctgcgcat agcggaaggc ttcctccagg agtttccggt cgaagccctg 1261 gggcgtctgc acctcgtaca gagcgttccg gtccagtgtc tcggactgcg ttctgatggt 1321 gcttttcggg tgcacgcagg ggacggcggc agaagccgtt tccagcgcat ccagcacgcc 1381 gcggatgacc ccctcatcca caaagggacg cgccgcgtcg tgcacgagca cggcatccac 1441 atcctgcggc aggctcttca gcgcgttgta cacgctctcc tgacgggtgg caccgccggc 1501 tgtgagggcc acgccgggga ggccgtagcg gtcgaacagg tcccggcagt aggccatatc 1561 ctccgccggc accgcagccg caacgacgga aaacgcatcc atagcacaaa aagccctggc 1621 ggctttcacc aagaccggag catctcccag aaggcggtat tgctttggaa cgccgccgcc 1681 cattcggctt cccgaaccgg cggcggctaa aagtactgcg gtattcttgc ctgtcataga 1741 tgctgactac aggatgggag cgggctttac gaagatcatg cggccggcag aagtctgcag 1801 cacgctcgta acggccacgt tgatggtctg gccgataaat ttcttaccgt cttcgaccac 1861 gatcatggtg ccgtcgtcca ggtagcccac gccctggttg ttttccttgc cctccttgac 1921 gaggaagacc tgcatttcct cgccgggcag caccaccggt tttaaggtat tggcgagttc 1981 gttgatgttg agcacgccga tgcccgtaat ggtggcgacc ttgtttaagt taaagtcgtt 2041 cgtaacgacc atgcccttca tgatctgggc gagttttaaa agctttacgt ccacctccgg 2101 gatctcctcc agggatttct ccgcggtggt gtcgtagatc tcaatgccgt agtcgctttg 2161 gatacggttg aggatatcca gccccctgcg tccgcggttg cgcttgagcg aatccgagga 2221 atccgcgatg tggcgcagct cgacgagcac aaaatcgggg atgatgatat tgccttcgat 2281 aaagcctgtc ttgaggatgt ctgcaatacg accgtcgatg atgacgctgg tatccagtat 2341 ctttggcgaa gctccggcgt tctttgcctt gcttttcgcc gtcggttctt tgctggtaat 2401 ggaggagaac agcggttttc cgaggtctga attcaggcgg cgcccgacgg tgactccgac 2461 agcgccgaaa aacagataaa gcgccaggga tatgacgacg ttcagattca tcgcccgtag 2521 gatctggatc tcattaataa tctgcgagat cagaaaagcg atgacgaaac cgacgaccaa 2581 tccgatggaa cttgccgcga tctccgtggc cgggactttt ttcagtctcg agtccacagt 2641 ttccattatt ttttccccgc gtttacggaa aaacccgaat aaaaaatcaa aaataaatgc 2701 gaaaaaagcg gtaccggtgc agatccagag gaccttctgt cccggggtca tcccccaggc 2761 gtctccgagg atctcgggcc tggcactgaa tgtggtgatt ccgtaaccga caagcgctcc 2821 gctcagacaa acgacgatgc ggaacacttt gtttagcatt gtgtctcctt tctttttcgt 2881 taagtttttt atctatatca aacgatgcag cctcgtcttg cggggaagct agacggcgct 2941 gtcgatcatg tccatggcgt ccttttccgc cacgccccgc accagcacga tctcgctggc 3001 caggatctgg cgggcattcg ccagcagttt cttctctccg gtggagaggc gttttgcgcg 3061 ttccacgcgc atcaggttgc ggatgacctc cgccactttc gcggggtctc cgctgcggag 3121 cttatccatg ttctcccggt atctgcggtt ccagttctcg tccatcggcg tggattcggc 3181 agcgagcacg tccagaacgc cggagacttc ctcctccgac acgatgggcc ggaggcctgc 3241 tgcgtccgag cctttgaccg ggaccatcac ctgcagattt ccatagggaa tgcgcaagat 3301 ataataggcc ctggtctcgc ccaggacctc tttttcctcg atattctgaa tggtgccggc 3361 cccgtgcatg gggtaaacga ccttatctcc tatggaaaac atgacaatcc tccaaacata 3421 ttatatatgc cggagattgt ttagtcaatc gcgggaagct caaaccagaa aatacttccc 3481 tctcccagcg tgctttccac gccgtatttc gcatcgtgcc gttccaggat ctccttcgtg 3541 atggacagac cgaggcctgt gccccccttg gagcggtgac cccgggagct ggccctctcg 3601 taccggttcc agatattttc gatatcctcc ggcgcgatgc cgatgccctt gtcgcgcacc 3661 tcgcagcgaa gcattttttt cttccgggag aaggcgaccg tcacttcctt gcggtctccg 3721 ctgtagcgca ccgcgttgga gatgaggttg gacagcacct gctgcatgcg gtgctcgtcc 3781 gcgttcacca gcacgggttc gtccagcgtt tccaacgaga tcgtaaagcc ctcctgctcc 3841 tcgagcaccc ggtaggtcgc caggatgctc tcggcgcatt tctgcaggtc cacgggttcc 3901 atcttcatgg tctccacgcc ggcctggatg cgcgacagcg taaggatgtc gtttacgagc 3961 gtattcaggc ggtcggactc ctcgatgatg acccccagat gttcgttccg cttttccgga 4021 ttgtcgccag agaggtcgcg gatcatctcc gcgtaagacc ggaccatggt gatgggcgtg 4081 cgcaggtcgt gcgacacgtt cgccatcagg tcgcgctgca gctgatccgt cttggacagc 4141 gcttccgccg tcgtgttgag cgtgccggcc agatcgttga tctcccggta gctgctgcct 4201 tcgaactcca cgtcgtaatg cccttccgcc agttcggcag cctgcttcgt gatgccggtg 4261 atgggccggg cgatgcggct ggagatgtag agcgccagga taccggctac caccagcgag 4321 atcgccgtga ccgtcagcag ctgctttgcg aggatgccga cggcgggacc catgggcgta 4381 aggggcgcga aggcatagaa ccgcacgttg ggacggtact ggctgtccac cttggcggca 4441 tatacctggg tcacgacctc tccggtctgg ttggagatct tgaacgtcac cggctcgccg 4501 ttgttggcca gaaggcgttc tctggccaga tccacgccgc tgcggccata gtaatagcgg 4561 cccgcagagc cctggtccgt ggaggagatg ttaaagcttt cgtcctccgc ctcgataaag 4621 aaatacatgt cgttggcgtt ggagatggtg ccgatctcct gcagatagct ctccagatcc 4681 agcgtttcgc tcacggaata ctgcaggctg agggagctga ccgcagtctg gatcttcttc 4741 tccatctcgc tctcgtaata ctgctcgaga aacacggtct ggaagaacca gagcatgccc 4801 atgaggatga gcgcgaaaat gataaaatac gcagtgagcc gaaagcgcac actgcgtgtt 4861 ctgtattgtt tcgggctttt taccgtacta gtcttcaaac ttatacccta tgcctctcac 4921 tgtcgcgatc ttgtcgcggt aatctcccag acggccccgc aggttcttga tgtgggtgtc 4981 gatggtgcgg tcatcgccga agaaatcgta gccccagata tcctgcagca gtttgtcgcg 5041 ggacagggcg atgttcttgt tctccatgag atagaccagc agctcgtact ctttgagggt 5101 cacatcgatg cgtttgccgt cgatcgttac ggtgcggctg ttcttgttga ccacgagacc 5161 gccggaaacc agctccgcag agggcgcctg gttctccgat gccttgcggc gcgc // LOCUS sequence028 5151 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence028 VERSION sequence028 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..5151 /mol_type="genomic DNA" /organism="" /note="sequence028" misc_feature <1..725 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010969422.1:homoserine dehydrogenase" /note="WP_010969422.1 homoserine dehydrogenase (Sinorhizobium meliloti) [pid:47.7%, q_cov:97.9%, s_cov:53.2%, Eval:6.4e-52, partial hit]" /note="MGA_181" /locus_tag="LOCUS_1400" CDS 738..1238 /product="SEC-C metal-binding domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966802.1" /transl_table=11 /codon_start=1 /translation="MTLFKEWNKLISGQTKATIDKFWEEYAGGEKKIYQDILANYPAKP AGKIGELAEKYGVRPVIFMGFLDGIQTSIANPMDLDTLDADSEIELDIQWETLLFNMFK ADADYLYGLEEWLSIVSEERYKEIYDDFRRSRTVHVEKKPGRNDPCPCGSGKKYKNCCG KNA" /locus_tag="LOCUS_1410" /note="WP_010966802.1 SEC-C metal-binding domain-containing protein (Clostridium) [pid:47.6%, q_cov:99.4%, s_cov:100.0%, Eval:9.2e-41]" /note="MGA_182" CDS 1243..1878 /product="endonuclease III" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010886934.1" /transl_table=11 /codon_start=1 /translation="MAKLTKAQIKQAIDALMAEYPDAGCALDHGSTFQLLVSVVLSAQT TDVSVNKVTPALFAKAPDAFAMAQLSEEEIAGFIRTIGMYRTKSANVKKLSQILAEQYG GEVPSDYDELVKLPGVGRKTANVVLAEGFGQQRIAVDTHVFRLANRIGFTAEKDVFATE DALMKAIPEDHWTKMHHALIWHGRRVCHARKPACEGCCLDGICKKNGL" /locus_tag="LOCUS_1420" /gene="nth" /note="WP_010886934.1 endonuclease III (Deinococcus radiodurans) [pid:51.9%, q_cov:97.6%, s_cov:91.6%, Eval:2.9e-55]" /note="MGA_183" CDS 1881..2351 /product="tRNA (uridine(34)/cytosine(34)/5-carboxymethylaminomethyluridine (34)-2'-O)-methyltransferase TrmL" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003429657.1" /transl_table=11 /codon_start=1 /translation="MALHIVLVEPEIPPNTGNISRTCAATGTWLHLVKPLGFNIDDRTL KRAGLDYWPFVKVEIHESLDAFLEEYQGHRMWLSTTKGKQLYTDVRYQDEDMLLFGKET AGLPRDFIAAHQEQAIRIPMSEDTRLRSFNLSNSAAIVLFEALRQLEFPGLA" /locus_tag="LOCUS_1430" /gene="trmL" /EC_number="2.1.1.207" /note="WP_003429657.1 tRNA (uridine(34)/cytosine(34)/5-carboxymethylaminomethyluridine (34)-2'-O)-methyltransferase TrmL (Clostridioides) [pid:53.5%, q_cov:99.4%, s_cov:99.4%, Eval:2.4e-45]" /note="MGA_184" CDS 2597..3037 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLIRYCVRYTKDHYKAEDTAQEALCLAWENLEQLEDPQRADRWLF SIAANLLRRRDPYSGEELPPEDDLPSCESAEEQLLKEEWIREVAALIQELPMLQRQAVY FCLVLERSPAQLAAVLNVSPHAVSARLYRGLQTLRKKWKALR" /locus_tag="LOCUS_1440" /note="WP_063172686.1 sigma-70 family RNA polymerase sigma factor (Mesorhizobium ciceri) [pid:31.0%, q_cov:95.2%, s_cov:46.6%, Eval:3.6e-10, partial hit]" /note="MGA_185" CDS 3080..4432 /product="RNA polymerase factor sigma-54" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011462176.1" /transl_table=11 /codon_start=1 /translation="MKQGYELKIEQSQKLTMTPALLQAINVLQLNTMQLDQYVQEQLLS NPMLERDESAPPEEPKAVDWAEYAKSVAYEPMQQDEDPADDTRETAGRSGMTLADFLGT QLQTSGLRSDILPVCLYVACCLDDSGYLRISLEEIAEQTGADVNTVRQALLHVQGMDPA GVGARNLTECLSLQLIRAGLDTPLAMVLVKEHLEDIAANRIGSLAKQLGVKPVEIQDTC DIIRTLDPKPGRRFSKDTEAQYIVPDVFIELRGGQLAVSVSESASPRLIISPYYRHLLE DPDADAQLKDFLEDRLNSAAWLIRSIQQRSQTILGVTRAIASMQEDFLKNRGGLVPMTL AQIAQMAGVHESTVSRCTSGKFVQTPRGVFELKDLFRGGYSAGSGEVSTESVKRQIRAY IEAEDGKHPLSDQTIAERLQEEKGVEISRRTVAKYREALGIPSSSGRKRFE" /locus_tag="LOCUS_1450" /gene="rpoN" /note="WP_011462176.1 RNA polymerase factor sigma-54 (Desulfitobacterium hafniense) [pid:43.4%, q_cov:99.8%, s_cov:100.0%, Eval:1.1e-89]" /note="MGA_186" ORIGIN 1 ccgcaggcaa gcatgtcgtg accgccaaca aagcagccct ggccgtgcac ctgcccgacc 61 tgaacaaggc agcggcgttc cacaagtgca tgctgcgcta cgaggcgtcc gtatgcggcg 121 cgatccccgt catcggctgc atctcccggg cgcttacggc caaccgcatc acggcggtga 181 agggcatcgt aaacggcacg acgaactata tcctcacccg tatggcggcg gaaggcgcat 241 cctatgagga tgtgctgaag gacgcccagg ctctgggctt tgcggaagcc gaccccacgg 301 gcgacgtgga aggctgcgac gcagccaata agctgagcgt gctgatagcg acggcgttcg 361 gcgtctacag agcgccggac agcttcgagc gcgtaggcat taccggcgtc accatggaag 421 acctggctgc ggctgaggcg gaaggcaagg tcattaagtt actggcgtgc gcggaggaaa 481 aagacggcgg catcgaagcg tacgtaaagc ccgtcgcggt ggagaaggac agcttcctgg 541 gccgctgcgg cagcgaattc aacgcggtgc agatcgactg caacatggcc ggccccatct 601 tcctgcaggg caagggcgca ggccccgaac ccacgggttc tgctgtcctc ggcgacatca 661 tcgagatcgc ccaggccatc gcagcaggca cggaacacga acaacccttt acagcattga 721 tctaggagga aatacttttg acacttttta aggaatggaa caaactgatc agcggtcaga 781 ccaaggcgac catcgacaag ttctgggaag aatatgccgg cggcgaaaaa aagatctatc 841 aggatatctt agcgaactat ccggccaagc ccgccggcaa gatcggcgaa ctggcggaga 901 agtacggcgt ccgccccgtt atctttatgg gcttcctgga cggcatccag acctccatcg 961 ccaaccccat ggatctggat accctggatg cggacagcga gatcgaactg gacatccagt 1021 gggagaccct gctgttcaac atgttcaagg ccgacgccga ctatctgtac ggtctggaag 1081 aatggctgtc catcgtaagc gaggagagat ataaggagat ctacgacgat ttccgcagat 1141 cccgcaccgt tcacgtggag aaaaagcccg gccgcaacga tccctgcccc tgcggcagcg 1201 gcaagaagta caagaactgc tgcggcaaga acgcataaga aaatggcaaa actgacgaaa 1261 gcacagataa aacaggccat cgacgcgctg atggccgaat atcccgacgc gggctgtgcg 1321 ctggatcacg gcagcacgtt tcagctgctg gtgagcgtcg tcctgtccgc ccagaccacg 1381 gatgtttccg tcaataaagt cactccggcg cttttcgcaa aagcgccgga tgcttttgct 1441 atggcgcagc tgtccgaaga ggagatcgcc ggattcatcc gcactatcgg catgtaccgg 1501 acaaaatccg ccaacgttaa gaagctgtca cagatcctgg cggagcagta cggcggggag 1561 gtgcccagcg actatgacga actggtaaag ctccccggcg tgggcagaaa gaccgcgaac 1621 gtcgtgctgg ccgaagggtt cggacagcag cgcatcgccg tggataccca cgtgttccgc 1681 ctggcgaacc gcatcggctt tacggcggag aaggacgtgt ttgcgacgga agatgcgctg 1741 atgaaggcta ttcccgaaga ccactggacg aagatgcacc acgcactcat ctggcacggc 1801 cgcagggtct gccatgccag aaagccggcc tgcgagggct gctgtctgga cggcatctgc 1861 aaaaagaacg ggttatagat atggcgctgc acatcgtttt ggtagaaccg gagatcccgc 1921 ccaacacagg caacatctcc cgcacctgcg ccgcgaccgg cacgtggctg cacctcgtaa 1981 aaccgctggg ctttaacatc gacgaccgca cgctaaagcg ggccgggctg gattactggc 2041 ccttcgttaa ggtggagatc cacgaaagcc tcgacgcctt tttagaggaa tatcagggtc 2101 accgcatgtg gctgtccacg acgaagggca aacagctgta taccgacgtc cgctaccagg 2161 acgaagatat gctgttgttc ggcaaggaga cggcaggcct tccccgggac tttatcgcag 2221 cgcatcagga gcaggcgatc cgcatcccca tgagcgaaga cacgcggctg cggtcgttca 2281 acctctccaa ttctgcggcc atcgtcctgt tcgaggcgct ccggcagctg gagttccccg 2341 ggctcgcgta ggatacgcag cgtatccttt ttgagaaaaa ctgtcgccat aacctttttc 2401 tgttcttcct gtttttacaa ttaaagtgaa aatcatattg tggaacagga ggtgtaaggc 2461 aatgttgtat ttttacttcc gtcttgtccg tttccgcagt tcttctttcc gggaaaggag 2521 gcagtagcag cccacctttg ctacgccgca ggagcgcaga tccttctacg aacggaaact 2581 gttcgtcctg cgaaaggtgc tgatccggta ttgcgtccgg tatacgaaag atcattacaa 2641 agcagaagat actgcccagg aggctctttg tctcgcctgg gagaacctgg aacagctgga 2701 ggatccgcag cgcgcggatc gctggctgtt ttctattgcg gcgaatctgc tccgccggcg 2761 ggatccctac agcggcgagg aactgccgcc ggaggacgat ctgccgtcct gtgagagcgc 2821 ggaagagcag cttctgaagg aagaatggat ccgggaagtc gccgcgctga tacaggagct 2881 ccccatgctg cagcgtcagg cagtctattt ctgcctcgtc ctcgaacgca gccccgccca 2941 gctggctgcc gttctcaacg tcagtcccca cgccgtatct gcccgcctgt accgggggct 3001 gcagacgctg cgcaaaaaat ggaaggcctt gcgctagagc gttcaaaagt ccgcgggatt 3061 gttatataat agaaatgcta tgaagcaagg ctacgagttg aaaatcgaac agagccagaa 3121 gcttacgatg acgcctgcgc tgctgcaggc gattaacgtg ctgcaactca acacgatgca 3181 gctggaccag tacgtgcagg agcagctgct gtccaatccc atgctggagc gggacgaaag 3241 cgcgccgccg gaagagccca aagccgtcga ctgggcggaa tacgccaaaa gcgtggcgta 3301 cgaacccatg cagcaggacg aagatcctgc ggacgacacc cgggaaacgg caggccgcag 3361 cgggatgacc ctggcagact ttctgggcac acagctgcag acttccggtc ttcgcagcga 3421 catcctgccc gtgtgtcttt acgtggcctg ctgcttagac gacagcggct atctgcggat 3481 aagcctggag gagatcgcgg aacagaccgg cgcggacgtg aataccgtgc gccaggcgct 3541 gctccacgtg cagggcatgg atcctgccgg cgtaggtgcc agaaacctca cggaatgcct 3601 gtctctgcag ctcatccgcg ccgggctcga taccccgctg gccatggtcc tggtaaagga 3661 acatctggaa gacatcgcag ccaaccggat cggcagtctc gcgaagcagc tgggcgtaaa 3721 accggtggag atccaggata cctgcgacat tatccgcacg ctggatccga aacccggccg 3781 gcgcttttcg aaagacaccg aagcgcagta tatcgtgccg gacgtgttta tcgaactgag 3841 aggcggtcaa ttggctgtct ccgtcagcga atctgcgtct ccccggctca tcataagccc 3901 gtattaccgg catctgctgg aagacccgga cgccgacgcg cagctgaagg attttctgga 3961 ggacagactg aattccgctg cctggctcat ccgcagcatc cagcagagga gccagaccat 4021 actcggggtc acccgggcca tcgcatcgat gcaggaggac ttcctgaaga accgcggcgg 4081 cctcgttccc atgaccctcg cacagatcgc ccagatggcc ggcgtgcacg aatccaccgt 4141 aagccgctgc accagcggca agttcgtgca gacgccaagg ggcgtgttcg aactgaagga 4201 tctgttccgg ggcggctaca gcgcagggag cggcgaggtg tccaccgaga gcgtaaaacg 4261 ccagatccgc gcgtacatcg aagcggaaga cggcaaacat cctctgagcg accagacgat 4321 cgcggagagg ctgcaggagg aaaaaggcgt agagatctcc cgcaggacgg tagcgaaata 4381 cagggaagcc ctcggcatcc cgtcgtcctc gggcagaaag cgctttgaat aaaaggagat 4441 ctatctatga aaaagactgt aagagacgtg gaactgaagg gaaagcgggt catctgccgc 4501 tgtgacttca acgtacccat gaaggaaggc gccatcacgg atgacacccg catccgggct 4561 gcgctgccca ccattcagta catgctggaa gaaggcgcat ccgttatcct gatgagccac 4621 ctcggccgtc ccaagggcaa gccgaatcac gattttacgc tggcaccggt cgcgcagcgc 4681 ctggaggaac tgctgggaag acccgtgcag ttcgcaccct ccgacaccgt cgtggacgac 4741 ggcgtgcggg agaaggctgc ggcgcttaga cctggcgacg tgatgcttct ggagaacgtc 4801 cgctacagag cggaagaaga gaagaacgac ccaagtttca gcaaggaact ggcaggtctt 4861 gcggacctgt tcgtaaacga tgcgttcggc acggcgcaca gagcgcattc ttccaccgca 4921 gggatcgcag acttcctgcc ggccgtaagc ggattcctca tcgagaagga gctgcagttc 4981 ctcggcgaag ccgtggacga tccgaagcgg cccttcgtcg ccatcctggg cgggtccaag 5041 gtgtccgaca agatcggcgt catcgagaac ctcatcgaga aggcggacac gatcctcatc 5101 ggcggcggta tggcctacac cttcatcaag gcggcaggct gcggcatcgg c // LOCUS sequence029 4862 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence029 VERSION sequence029 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4862 /mol_type="genomic DNA" /organism="" /note="sequence029" CDS complement(67..2130) /product="elongation factor G" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393940.1" /transl_table=11 /codon_start=1 /translation="MPRKFSLENTRNIGIMAHIDAGKTTTTERILFYTGKTHKMGETHE GAAVMDYMVQEQERGITITSAATTAQWKNTRINIIDTPGHVDFTVEVERSLRVLDGAVT VLCAKGGVEPQSETVWRQAEKYGVPRMIFVNKMDIMGADFYHVLDMVKNRLKANAVAVQ LPIGVESTFRGIIDLIKMKAEIYEDDLGTVIEEQDIPEDMMDLAEEYRQKMLESVAECD EDLMMKYLEGEELTAEEIKSTIRKMTIANKMVPVLCGSAYKNKGVQLMLDAVVDYMPSP LDIPPIKGIIPRLEKEAERPADDKGPFSALAFKIVADPYVGKLAFFRVYSGTLESGSYV YNSTKGKKERIGRILQMHANHREDIEQVYSGDIAAAVGLKDTTTGDTLCDEKHPIILES MEFPDPVIQIAIEPKTKAGQEKMGIALAKLAEEDPTFKTYTDPDTGQTIIAGMGELHLE IIVDRLLREFKVEANVGKPQVSYKETITKEAIVDNKYAKQSGGHGQYGHVKIRLYPRQP GEGYEFVNKIVGGAIPKEFIPKIDEGIREAMETGPLAGYQVVDVGVELFDGSYHEVDSS EMAFKIAASMAFREAAAKAAPILLEPIFKVEVTAPEEYMGDVIGDISSRRGRIEGTDIR NGAATVDAMVPLSQMFGYATDLRSKTQGRGTYVMQMDHFEKLPDNLLDKINK" /locus_tag="LOCUS_1460" /gene="fusA" /note="WP_011393940.1 elongation factor G (Moorella thermoacetica) [pid:71.1%, q_cov:99.7%, s_cov:99.0%, Eval:2.2e-295]" /note="MGA_188" tRNA 901..991 /product="tRNA-Met" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0040" /note="Aragorn_4" CDS complement(2182..2652) /product="30S ribosomal protein S7" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003421180.1" /transl_table=11 /codon_start=1 /translation="MPRRGNVPKREVLPDPVYGSVVVAKLINSIMLDGKKGVAQKIVYD AFETIKAKTGEEPLEVFNKAMNNIMPQVEVKARRIGGANYQVPIEVRPERRQTLGLRWL TKYTRARGERTMSDRLANELMDAANGLGGSVKKKDDTHKMAEANRAFAHYRF" /locus_tag="LOCUS_1470" /gene="rpsG" /note="WP_003421180.1 30S ribosomal protein S7 (Clostridioides difficile) [pid:77.6%, q_cov:100.0%, s_cov:100.0%, Eval:7.6e-68]" /note="MGA_189" CDS complement(2794..3213) /product="30S ribosomal protein S12" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860632.1" /transl_table=11 /codon_start=1 /translation="MPTINQLVRQGRVMSEKKSNSPALLKSMNSIKRVPTDTKAPQKRG VCTSVKTVTPKKPNSALRKVARVRLTNGLEVTAYIPGEGHNLQEHSVVLIRGGRVKDLP GVRYHIVRGTLDTAGVANRGQARSKYGAKRPKQKK" /locus_tag="LOCUS_1480" /gene="rpsL" /note="WP_011860632.1 30S ribosomal protein S12 (Clostridioides difficile) [pid:80.6%, q_cov:100.0%, s_cov:99.3%, Eval:3.6e-59]" /note="MGA_190" misc_feature complement(3335..>4862) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003429485.1:DNA-directed RNA polymerase subunit beta'" /note="WP_003429485.1 DNA-directed RNA polymerase subunit beta' (Clostridioides difficile) [pid:64.3%, q_cov:88.0%, s_cov:38.4%, Eval:5.4e-160, partial hit]" /note="MGA_191" /locus_tag="LOCUS_1490" ORIGIN 1 aatttttctt ttgccatttt actttctcct tttcacgtga tttggtttat aaaattgcaa 61 ttttggttac ttattgatct tgtccagcag gttgtcgggc agcttctcga agtgatccat 121 ctgcatgacg tacgtgcctc tgccctgggt cttggaacgc aggtcggtgg cgtagccgaa 181 catctgggag aggggtacca tggcatccac ggtggctgcg ccgttgcgga tgtcggtgcc 241 ttcgatcctt cctctgcggg aagagatgtc tccgatcacg tctcccatgt attcctcggg 301 agccgtaact tctaccttga agatgggttc cagcaggatc ggagcagcct ttgctgcggc 361 ttctctgaag gccatggaag cggcgatctt gaacgccatt tccgaggagt ccacttcgtg 421 gtaggaaccg tcaaacagct cgacacccac gtcgaccacc tgatagccgg ccaggggacc 481 cgtctccatc gcttcgcgaa taccttcgtc gatcttgggg atgaattcct tggggatggc 541 gccgccaacg atcttgttga cgaactcgta gccttctccc ggctgtctgg ggtagaggcg 601 gatcttgacg tgaccgtact ggccgtgtcc gccggactgc ttggcgtatt tgttgtcgac 661 gatggcttcc ttcgtgatgg tctctttgta ggaaacctgg ggcttgccca cgtttgcctc 721 gaccttgaac tcgcggagca gtctgtcgac aatgatctcc agatggagtt cgcccatgcc 781 cgcaatgatc gtctgaccgg tgtcggggtc ggtgtaggtc ttgaaggtgg gatcttcctc 841 ggcaagcttt gccagggcga tgcccatctt ttcctgaccg gccttcgtct tgggttcgat 901 ggcgatctgg ataacgggat cggggaattc catggattcc agaatgatgg ggtgcttttc 961 gtcgcacagg gtgtcgcctg tggtcgtatc cttcagaccg accgcggctg cgatatcgcc 1021 ggaatagacc tgttcgatat cttctctgtg gttggcgtgc atctgcagga tgcggccgat 1081 ccgttccttc ttccccttgg tggagttgta aacgtaggag ccgctctcca gcgtgccgga 1141 gtagacacgg aagaacgcca gcttgccgac ataggggtct gccacgatct tgaatgcaag 1201 tgcggagaac ggacccttgt cgtccgcagg acgctctgcc tctttctcca gtctggggat 1261 gatgcccttg atgggcggaa tatccagcgg agaaggcata tagtccacga cggcatccag 1321 catcagctga acacccttgt ttttataggc ggaaccgcac agaacgggga ccatcttgtt 1381 cgcgatggtc atcttgcgga tcgtcgactt gatctcttcg gcggtgagtt cttcaccttc 1441 cagatacttc atcatgagat cttcgtcgca ttccgcaacg gattccagca tcttctgccg 1501 gtattcctct gcgaggtcca tcatgtcttc ggggatgtcc tgctcttcga tgacagtgcc 1561 gagatcgtct tcgtagatct ccgccttcat cttgatgagg tcgataatac cccggaatgt 1621 gctctccacg ccgatgggga gctgcactgc caccgcattg gccttcagtc tgttcttgac 1681 catgtccagc acgtggtaga agtctgcgcc catgatatcc atcttgttga cgaagatcat 1741 tctgggaacg ccgtacttct ccgcctgccg ccagactgtt tcggactggg gctctacgcc 1801 gcctttggcg cagagaacgg tgacggcacc gtccagtaca cgcagagatc tctccacctc 1861 tacggtgaag tctacgtgac ccggtgtatc gataatattg atcctagtgt ttttccactg 1921 agcggtcgta gcagcagaag tgatggtgat gcctctttcc tgctcctgga ccatatagtc 1981 cattacggct gcaccctcgt gggtctcgcc cattttatgg gtcttaccgg tatagaacag 2041 aatacgctct gtagtcgtcg tcttaccggc gtcgatgtgc gccatgatgc cgatattacg 2101 agtattttcc agcgaaaact ttctaggcat gtcttcctcc tttcctgccc ggtacctgat 2161 ggctgtactg catggatcct attagaatct gtagtgagcg aacgctctgt tcgcttctgc 2221 catcttatgc gtatcgtctt tcttcttgac ggatccgccg agtccgttgg cggcatccat 2281 gagctcgttg gcgagtctgt cggacatcgt ccgttcgcct ctggctctcg tgtacttggt 2341 gagccatctc agacctaagg tctggcgtct ttccggtctg acttcgatag gaacctggta 2401 gttcgcacca ccgattcttc tggccttgac ttcaacctgg ggcatgatgt tgttcattgc 2461 cttgttgaag acttccaggg gttcttcgcc ggtctttgcc ttgatggtct caaaagcatc 2521 gtagacgatc ttctgtgcta cacccttctt gccgtcgagc ataatgctgt tgatgagctt 2581 agccacaaca acactgccgt atacaggatc ggggagcact tccctcttgg ggacgtttcc 2641 acgtcttggc acttcacttt cctccttgcg tatgttgcgc aaatcatcgg tactcgcagc 2701 gggtcacccg ccgcgcggtg ccattatcta tatgataagg gcactctagt ttacccgata 2761 tgaacaataa cttctgaatg gtttcggtaa gaattacttc ttctgcttgg gtctcttcgc 2821 accgtacttg gaacgggcct ggcctctgtt ggcaacgccg gcggtatcca gcgtacctct 2881 tacgatgtga taacgcacac cggggaggtc cttgactctg ccgcctctga tcagaacaac 2941 gctgtgttcc tgcagattgt ggccttcacc gggaatgtaa gcggtaactt ccagaccgtt 3001 ggtgaggcgt acacgggcga cctttctcag cgcagagttc ggcttcttcg gagttactgt 3061 cttaacggaa gtgcaaacgc ctctcttctg aggtgccttc gtatcggtcg gcactctctt 3121 gatgctgttc atgcttttca gcagagccgg agagttggac ttcttttcgg acattactcg 3181 tccctgtctt accagttggt taatggtagg cattcatatt ctcctttctt caagattttt 3241 atattgaccc gcccgcacgc tgcgcgtgcg ggcagaaatc aacagcacaa caggattagt 3301 gtaacacagt gcatcccttg atgtcaaagg ctttctaggc ttcttcctca ggaatttctt 3361 cctcgaaagc ttcctcttcc gccatggctt cttccgccgg gagatgagtc tcgtccgccg 3421 gatcgtccgc gtagagttcg tcgggcgttt cgtcctcggt atactcgctg cggatctcct 3481 tcgtattgaa ggattccatg tattccgtgt ttacaccgta atcgatgtcg atattcttgt 3541 aaggcttcat gccggtaccg gccgggatga gcttaccgat gatgacgttc tccttcaggc 3601 cgagcagtct gtcgcgcttg cccttgatgg cagcgtcggt caggactctg gtcgtctcct 3661 ggaaggaagc cgcggacagg aaggaattcg tagcaaggga ggccttcgtg ataccgagga 3721 gctctctctt gtactgggcg ggttctttgc cttcttccag cgcgttgttc tcgtcttcga 3781 tctcgaagag gttgtagagg gcgccgggca gcaggtgggt gtctcccgcg tcgtcgatgc 3841 ggtacttgga cagcatctgg gacacgatga cttcgatgtg cttatcgttg atgtctacac 3901 cttgctgctt gtatactctc tgcacttcct tgagcagata ctggtatacg ccttccacgc 3961 cgtttaagcg catgatgtcg tgcgggttga gcggaccctg ggtgatgcct tcgcctgcgt 4021 ggaccacgct gccttcggtc accttgagtc tcgcgccgta aggaatgatg tagactcttt 4081 cctcttcgcc gcggatgcgc acttcggtct tgttgtcggg acgcggttcg atggagacga 4141 cggtgccgtc cgcctcgcag atctccgcga tacccttcgg cttacgggct tcgaaaagtt 4201 cttcgactct cggaagaccc tgggtgatat cgttacccgc gacggatacg ccgccggtat 4261 ggaacgttct catggtcagc tgcgtaccgg gttcgccgat ggactgcgcg gcgatgatgc 4321 cgacggcttc gccgatgttc acgtgggaac cggtggccag gttgcggccg tagcaggcgg 4381 cgcagatgcc ggtcttgctc ttgcaggtca tgaccgaacg gatcttgacg gcttcgatgc 4441 cggcgtcctc gatggcctgg gcctgctttt cgttgatctc ttcaccgcct tcgacgatga 4501 cttcgccggt ggccgggtca acgatgtcct cgagcgccgt tctgcccacg atacgcaggc 4561 gcagggcctc gatgacttcc ttgccgtccg tgaaggctct gacttcgatg ccttcgtcgg 4621 tgccgcagtc gttctcgcgg acgatcacgt tgtgggatac gtcgacgaga cggcgggtca 4681 gataaccgga gtccgcggta cgcagagcgg tatctgccag accctttctg gcgccgttgg 4741 cggagatgaa gtattccatg accgtcagac cttcgcggaa gtttgcggtg ataggaattt 4801 cgatggtctt accggcagcg ttgcccatca gaccgcgcat gccgccgatc tgacggatct 4861 gg // LOCUS sequence030 4837 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence030 VERSION sequence030 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4837 /mol_type="genomic DNA" /organism="" /note="sequence030" misc_feature <1..921 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011986771.1:HAMP domain-containing sensor histidine kinase" /note="WP_011986771.1 HAMP domain-containing sensor histidine kinase (Clostridium botulinum) [pid:60.2%, q_cov:95.4%, s_cov:70.2%, Eval:1.3e-93, partial hit]" /note="MGA_192" /locus_tag="LOCUS_1500" CDS complement(982..1143) /product="rubredoxin" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966063.1" /transl_table=11 /codon_start=1 /translation="MDKYVCSVCGYEYDPAVGDPDNGIEPGTAFEDLPADWVCPLCSVG KDEFEKAE" /locus_tag="LOCUS_1510" /note="WP_010966063.1 rubredoxin (Clostridium) [pid:75.5%, q_cov:100.0%, s_cov:98.1%, Eval:6.5e-21]" /note="MGA_193" CDS complement(1175..1549) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGKFVIKETKTGFTFRLKAGNGEVIGTSEVYKAESSCKNGIASVA KNAPIAAIEDQTTEEFEKAKNPKFEVYTDKAGETRFRLKAANGEIILASEGYAAKKSCL NGIESVRKNAVDAEIVKEEA" /locus_tag="LOCUS_1520" /note="WP_002672132.1 YegP family protein (Treponema denticola) [pid:61.1%, q_cov:43.5%, s_cov:93.1%, Eval:5.0e-13, partial hit]" /note="MGA_194" CDS 1729..3570 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDGNTKKTLHIPSLCAFFLCLVLLDLVFRAAFLEGGFAESCSGTA LLFSLFWAAGLTGFVCLLPDRGRRIAMPLLVAFWSALCLVHSVIHHLTGSFFSVADLDY AEDGVKFFSKEYLIFSPGFMICALCVFLAVLCMSVCMEKSSYSRGRAILGAVLLAAGVT GGAVTHFQLMPEITTQMSWRVQSEDKTTDNYIYHDMSNANRAMELCGMYQYLWRSFVVS TLQSDARQYGKMYEELDAWFAEKQASPHRSNAYSGKLAGKNCFFILLESIDTWLLTEDY MPNLYAVRQQSVDFANHYSSLYITASTFNTEFIANTGQIPPSAGLDTSAYEENTFPMAL AKLFTEAGYTAKTFHSADPVIYNRGSIHKNLGYGPYYYHYNMGMDDYMLDTQLMRGFGY MTADQPFFDFILTFSGHGPYTEEMANISDPHLAVAKTAVARASIPIEARRSEEYLLAVA HAMETDAFVGELMQALEDSGLAEDTALVFFTDHYCKYMTDTDLVMKLKGVSDMDAICHT PFFIWSKDLPARSIPKVTSTMDIAPTIVNLFGLDADYAWYPGSDIFSADGGTAIFRGGS WYDGREWGGPTPETLQFLSLAGDVLRCDYFGRSVNPQ" /locus_tag="LOCUS_1530" /note="WP_011460023.1 LTA synthase family protein (Desulfitobacterium hafniense) [pid:23.9%, q_cov:51.9%, s_cov:51.3%, Eval:1.2e-18, partial hit]" /note="MGA_195" ORIGIN 1 gtcatcgttt tgctccggct catcctggat ctgctgcgga tccggaagca gcttaagcct 61 ctggacgaga tggcccgggc cgccatggac ctgagcaata tcgacgtatc gatcgatgac 121 cgcttccaaa agctcgagag cgccatcgac cgtctgagcc cggcggagga agatgcggcg 181 ctcgcgacgg gagacgcgga gctggaaggg ctggaaagcg ccgtcaacaa gctggtggag 241 cgcatgcgcg acgcctaccg gcagcaggcc cgcttcgtgt cggacgcctc ccacgagctg 301 cgcacaccga tcgcggtcat caagggctac gcggacatgc tggaccgctg gggcaaggag 361 gatgaggcta tcctggagga gtccatccaa gcgatcaaga cggagagtga cgccatgcag 421 catctggtgg aacagctgct gttcctggcc cggggcgatt ccggcagaac gccggtggag 481 cgggtggatt tcagcctgac ggatatgatg aaagaggcct gcagcgaatc cgccatgatc 541 gacgagacgc acacgtaccg tctgcaggcg gaggaaggcg taaacgccta cggcgatgct 601 tccctgctga agcagaccgt gcgcatcctg acggagaacg ccaagaagta ctctccggag 661 ggcagcgaga tcgtgctggg gactaaatat aaggacggca ggccctgctt ctgggtggaa 721 gaccggggca tcggcatgga cagcgacgcg cagacccaca tgttcgagcg cttttaccgg 781 gcggacgatt cccgggcgcg ccagaccggc ggatccggac tgggccttgc catcgcgaaa 841 tggatcgtgg accggcacgg cgggcgcttc gaggtcgtgt cgcgcaccgg tatcggcacg 901 cgcatctcgg tgatcctgta gaaaataaaa taacacaggg ggacaggtat ctgtccccct 961 gtgttgtttt tgtcttaatg cttattcagc cttttcgaat tcgtccttgc caacgctgca 1021 gagcgggcag acccaatctg cgggcagatc ttcgaaggcg gtgccgggtt cgataccgtt 1081 atcgggatcg cctactgcgg ggtcatactc ataaccgcag acgctgcata catacttgtc 1141 cattggtgat agtctccttt aacaatatgg tggattatgc ttcttccttg acgatctcgg 1201 cgtctactgc gttctttctg acgctctcga tgccgttcag gcagctcttc tttgctgcat 1261 agccttcgga agccagaatg atctcgccgt tggcagcctt caggcggaag cgggtctcgc 1321 cggccttgtc ggtgtacact tcgaacttgg ggttcttagc cttttcgaat tcttccgtgg 1381 tctggtcttc gatggcagcg atcggagcgt tcttggcaac gctggcaatg ccgttcttgc 1441 agctgctctc agccttgtaa acttcggaag tgccgatgac ttcgccgttg cctgccttca 1501 ggcggaacgt aaagccggtt ttggtctctt tgataacaaa tttgcccatg ggtgttgcct 1561 cctttttcga aaaagtaagt attgcgatat atcgacttca gtatagcatt ttattcacaa 1621 aaataaaaga tgtgcatttt atcccgtttc ggagcacaaa acgcgcaccg gtttatggta 1681 tactgtaaaa atcctcgcaa aataaagaaa gaaacggatc gttccgacat ggatggcaat 1741 accaagaaaa cccttcatat tccaagcctt tgcgcgtttt tcctgtgcct ggtcctcctg 1801 gacctcgttt ttcgtgccgc ttttctggaa ggcggctttg cggaaagctg ttccggcacg 1861 gcgctgctct tctcgctgtt ctgggctgcc gggctcacgg gcttcgtctg tctgctcccg 1921 gaccggggcc ggcgcatcgc catgcctttg cttgttgcct tctggagcgc gctctgcctt 1981 gtgcacagcg tcatccatca tctgacgggc agcttcttct ccgtcgcgga cctggattat 2041 gcggaggatg gcgtcaaatt cttcagcaag gagtatctga tcttctcccc cggctttatg 2101 atctgcgctt tatgcgtatt tcttgccgtt ttatgcatgt ctgtgtgtat ggaaaagagc 2161 agctacagcc gcggccgggc gatcctcggc gcggtcctgc tggctgccgg ggtcaccgga 2221 ggcgctgtga cccatttcca gctgatgccg gagatcacca cgcagatgtc ctggcgcgtg 2281 cagtcggagg ataagacgac ggacaactac atttaccacg acatgagcaa tgcgaaccgg 2341 gccatggagc tgtgcggtat gtaccagtat ctgtggcgca gtttcgtcgt gtcgacgctg 2401 cagtcggatg cccgccagta cggcaagatg tacgaggaac tggacgcctg gttcgcggaa 2461 aagcaggcat cgccccacag atccaacgcc tacagcggaa agctggccgg aaagaactgc 2521 ttcttcatcc tgctggaatc catcgatacc tggctgctca cggaagacta tatgccgaat 2581 ctgtatgcgg tgcggcagca gagcgtggac tttgcaaacc actattccag cctctacatt 2641 accgcttcca ccttcaatac cgaattcatc gccaacaccg gccagattcc gccctctgcg 2701 ggcctggaca cctccgccta cgaggagaac acgttcccca tggcgctggc caagctgttt 2761 acggaagcgg gctataccgc caagaccttc cacagcgcag atccggtcat ctacaaccgg 2821 ggcagcatcc acaagaacct cggctacggt ccctactatt accactacaa tatggggatg 2881 gacgactata tgctggatac ccagctgatg cggggcttcg gctatatgac cgcggaccag 2941 ccctttttcg actttattct tacgttctcg ggtcacgggc cctatacgga ggagatggcc 3001 aacatctccg atccccatct cgccgttgcg aagaccgcgg tagcccgggc cagcattccc 3061 atcgaagcca gacgttctga ggaatacctg ctggcggtgg ctcacgccat ggagaccgac 3121 gccttcgtcg gcgaactgat gcaggcgctg gaggacagcg gcctcgcgga ggatacggcg 3181 ctggtgttct ttacagacca ttactgcaag tacatgacgg atacggacct cgtgatgaag 3241 ctcaagggcg tgtccgacat ggacgcgatc tgtcatacgc ctttctttat ctggtcgaaa 3301 gacctgcctg cccgcagcat ccccaaggtg acctccacca tggacatcgc acccacgatc 3361 gtcaacctgt tcggtctgga cgcggactac gcctggtatc cgggcagcga tatcttctcc 3421 gcggacggcg gcactgccat cttccggggc ggctcctggt acgacggcag ggagtggggc 3481 ggacccaccc ccgagaccct gcagttcctc tctctcgcag gcgacgtgct gcgctgcgac 3541 tatttcggcc gctctgttaa tccccagtag tttatggtat aatatactgt cttattgggt 3601 ggagtttcgc ccaatgaaag gatggtatca tgaacgggaa atttcttcac aatctgatcc 3661 ggagctttac ccggatcgat atgatcgtaa tgatcgttct ggccctcatc atcctgtggc 3721 tgaacgtata cgcgggcatc gtcgcgtttc tgatcgtcgc cgctctcagc atctaccaca 3781 cgaagctgat ggggcaggcc tcggaagaat ccatcaagga gtacgaggaa tcggtcatcc 3841 gtcaacacat ggacgaagcg ggcatcaagg aagacggcac cgttacggat aaggcggcag 3901 ctgcggagat cgagcgcctg aagaaggcga acgaggacgc ccagagctgc atcgctctca 3961 tcaacatcga caactacgac gaactgctgg cgagctctcc cgtggaggag cagtcctcca 4021 tcggtgcgga gatcgacaag aagatccgcg cctggacgca gtatctggac gcagccgtca 4081 cccgggtgcg cagcaaccgg tactacgcgc agttcgagaa caaatatctc gccgaacaga 4141 agcgcagcga attccccatc atcaaccaga tgcacgagat cgagacccag gcggatttcc 4201 ccacctccgt ctccatcggc atcggaacgg gcagcggcag tttctcccgc atccaggccc 4261 tggcagagga agccatggat ctggcgctgg gcagaggcgg cgaccaggcg gtcatcaagc 4321 acgaggacgg ggacatcgaa tactacggcg gctcccttcc cagcgtggaa aagcgcaaca 4381 agggcaaggc ccgcatcatg gcccacgccc tgatgcagct ggtcaaaagt tccgaccggg 4441 tgttcatcat gggtcacgca aggcccgaca tggactgcat cggctccgcc atcggcatgt 4501 acaccttcgc ccgcagcgcc ggcaagccca cggacatcat cctggacaac gtgggccagg 4561 cgatcgatat catctacgag gcggcggtca agaccggccg gtacagcttt atcagcggcg 4621 aaaaggcgtc ccagctggcg acggacaata cgctgatcat cctcgtggat tcgcacatcc 4681 cggccatcgc ggaatatccg cccatcctgc agcaggtaaa ccggatcgca gtcatcgacc 4741 accacagaaa gtcgaaggac gcggtggaga accccacgct gatgcacatg gagacctacg 4801 cgtcttcggc cagcgaactc gtaacggaac tgctgca // LOCUS sequence031 4797 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence031 VERSION sequence031 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4797 /mol_type="genomic DNA" /organism="" /note="sequence031" CDS 3..362 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MYDTNIPCEPAGVFHGNMVVSMRPIPYELVSKAVQITAAMPRVHG APVHIGAPEAIGIRDLSRPDYGEAVTIKEGEVPVFWPCGVTPQNALMRSKPSFAITHAP GHMLISDVKNVNLKY" /locus_tag="LOCUS_1540" /note="WP_010886407.1 putative hydro-lyase (Bacillus) [pid:63.2%, q_cov:98.3%, s_cov:45.5%, Eval:8.8e-42, partial hit]" /note="MGA_197" CDS 365..1198 /product="DUF4392 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011011337.1" /transl_table=11 /codon_start=1 /translation="MNEKKTIEDIILTGSHRGMDELRLYLPEFYCEEAAKAILSWSRGP VLLATGFYVAGHAETDGPTGTVVLAKALQKLGFEPHILTDEACSHYFEPEGLDVIYMDV AEGNAFSEDLLKNLQPAGLISIERCGRNVKGDYANMHGESVRSHTARIDGLFELAYGSV PTIGVGDGGNEIGMGNLADVIEEKLNLVPCRVKTDHLVIASVSNWGAYGITAYLEKLTG EKVFPGLDEVEGYLSRTILLGSVDGVLRQNVCSVDGYPLAESERVYRLLQQAVTV" /locus_tag="LOCUS_1550" /note="WP_011011337.1 DUF4392 domain-containing protein (Pyrococcus furiosus) [pid:34.4%, q_cov:97.8%, s_cov:98.5%, Eval:1.2e-26]" /note="MGA_198" CDS complement(1188..1451) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKLLMKPIDAIVVFKGSGKPLPYKFRYTDTEGISREVYVKRILTA AEEKFAGIPVYVYDCQSDIGGAEKRYQLKYFIPECRWELFKL" /locus_tag="LOCUS_1560" /note="MGA_199" CDS complement(1570..2385) /product="MBL fold metallo-hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963856.1" /transl_table=11 /codon_start=1 /translation="MKLTILSENSTHTREPYLMGEPGFCCYIECSGKRLILDSGYHGIA LKNAAMLGIDLNGLDYIAISHGHDDHTHGLLPLLEAGLDVTHTKLVAHPKALKRKVVDG VESGFPWPEEEIRSRFDILEAKEPVELAENLWYLGQIPRTNNFENQKPVGFVVEDGTEE EDYLLDDTALAYRAKDGVFIITGCSHSGIVNICEYAKTVLGEERLLGVIGGFHLLQPGT QLDETIRYFEREKPEKLCPCHCISMRCKFRIAQQLPIEDVAVGFELEVE" /locus_tag="LOCUS_1570" /note="WP_010963856.1 MBL fold metallo-hydrolase (Clostridium) [pid:45.5%, q_cov:98.9%, s_cov:99.3%, Eval:7.4e-66]" /note="MGA_200" CDS 2475..3068 /product="Maf family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005816795.1" /transl_table=11 /codon_start=1 /translation="MDLKNTTVVLASGSPRRIDMLRADGIEPHIVKPDCEENIHIGLSP AQEVMALALRKNLRAVEMLKEQGDLPAEGVVLSADTMVVLDGVPMGKPRDEEDAFRILS LLRGKTHTVQSGACIRDLASGRLLLFSEGTDVTFMEYTDEDIRAYVATGEPMDKAGAYA IQGGFAPYVTHTNGPLDNVIGFPYASIKRILEAW" /locus_tag="LOCUS_1580" /note="WP_005816795.1 Maf family protein (Desulfitobacterium hafniense) [pid:43.2%, q_cov:96.4%, s_cov:88.7%, Eval:7.5e-31]" /note="MGA_201" CDS 3178..3873 /product="DNA repair protein RadC" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392073.1" /transl_table=11 /codon_start=1 /translation="MDAPLAVRELPAAERPREKILSQGVQTLSNTELLAVLIASGSAEN SAIGLAGKVLAMGEGSLASLSGFLPEEFMHIPGIGPAKACLLSAAVELGRRIATAPAAD RTVISGPADSAKLFMGEMRYLKQEVIQVALLNVKQELLMKERVAAGGLFSASAHSREIF SSAVRKGAFGVILAHNHPSGDPQPSDEDIAMTKQVEDAGKVLGIRLLDHIIIGDGRYFS FLDAGYLQK" /locus_tag="LOCUS_1590" /gene="radC" /note="WP_011392073.1 DNA repair protein RadC (Moorella thermoacetica) [pid:48.4%, q_cov:97.4%, s_cov:97.4%, Eval:2.3e-51]" /note="MGA_202" CDS 3964..4680 /product="septum site-determining protein MinD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964562.1" /transl_table=11 /codon_start=1 /translation="MGIVALITSGKGGAGKTTITVNLGATLAQKGARVVLVDFNMGLRN LDIYLGMEDTCLFDLGDVLTGVCKVEKALVHDDRFGRLYMLPCPQFKEINGVTPQHVAG LFAVLKKNFDYILVDMPLGIGSPLENVAQAADLGIVVVTPDYVSLRNADTVDRKLESCG LQKRCFLINQVDLELLRTGNVPGIEQIARGMSTPMAGIVPYDENIHAGNNMGNPVVLAS DSYIAKNFSSIALRVF" /locus_tag="LOCUS_1600" /gene="minD" /note="WP_010964562.1 septum site-determining protein MinD (Clostridium) [pid:40.5%, q_cov:99.6%, s_cov:90.1%, Eval:1.9e-48]" /note="MGA_203" ORIGIN 1 ccatgtacga cacgaacatc ccctgcgaac cggccggcgt tttccacggg aacatggtgg 61 tctccatgcg gcccatcccc tatgaactcg tgagcaaggc ggtgcagatc acggcagcga 121 tgccccgggt gcacggcgcg ccggtgcaca tcggagctcc ggaagcgatc ggcatccgcg 181 atctgtcccg cccggattac ggcgaagccg tcactatcaa ggagggtgag gtaccggtgt 241 tctggccctg cggcgtgacc ccgcagaacg ccctgatgcg gtcgaagcct tcctttgcca 301 ttacccatgc gccgggtcac atgctgatct cggacgtaaa gaacgttaac ctgaaatact 361 gaaaatgaac gaaaaaaaga ccatcgaaga cattatcctg acgggttccc accggggcat 421 ggacgaacta cgcctctatc tgccggaatt ctactgcgaa gaggcggcga aagccatcct 481 ttcctggagt cgcggtcccg tgctgctggc taccggtttt tatgtggctg ggcatgccga 541 gacggacgga cccaccggga cggtcgtcct ggcaaaggcg ctgcagaagc tgggatttga 601 gcctcatatc ctgacggatg aggcctgcag ccattacttc gaaccggaag ggctggacgt 661 gatctatatg gacgttgcgg aagggaacgc cttctcggag gacctgctga agaatctgca 721 gcctgccggc ctgatctcca tcgaacgctg cggacggaac gtgaaaggag actacgccaa 781 catgcatggc gagagcgtgc gcagtcacac ggcccggatc gacggactgt tcgagctggc 841 ctacggcagc gtgcccacca taggtgtggg ggacggcggc aacgagatcg gcatgggaaa 901 tctggcggat gtgatcgagg agaaactgaa tctcgtgccc tgccgggtaa aaacggatca 961 tctggtgatc gcttcggtct ccaactgggg cgcctacggc ataacggcgt atctggaaaa 1021 actgacgggg gagaaggtct ttcccggtct ggacgaggtg gagggatatc tgtcccggac 1081 gatcctgctg ggcagcgtag acggcgtact gcggcagaac gtttgcagcg tggacggcta 1141 tccgctggcg gagagcgaaa gggtatacag actgctgcag caggcggtta cagtttaaac 1201 aattcccagc ggcattccgg gatgaaatat ttgagttgat agcgcttttc cgcgcctccg 1261 atgtcgctct gacagtcgta cacgtagacg gggatgccgg cgaatttttc ttcggctgcc 1321 gtcaggatac gcttgacgta gacttcgcgg ctgatgcctt ccgtgtcggt gtagcggaat 1381 ttatagggca ggggtttgcc gctgccttta aagacgacga tggcgtcgat gggtttcatc 1441 agaagtttca tgggtgcttg tcctccggga tgtgtgcctt acaaggttat tataaagaac 1501 atatgttctt ttctcaagca caaaaagaga gtttacgcgg aactgtccgt ctaaactctc 1561 ttttgcgttc tattccactt ccagttcgaa cccgacggcc acgtcctcga tgggcagctg 1621 ctgcgcgatg cggaacttgc agcgcatgga gatgcaatga caaggacaca gtttttcggg 1681 cttttctctc tcgaaatagc gtatggtctc gtccagctgc gttccgggct gcagcaggtg 1741 gaagccgccg atgaccccca gcagccgctc ttcgcccagt acggtcttcg catattcgca 1801 gatgttgacg atgccgctgt gggagcatcc ggtgatgatg aagacgccgt ccttcgcccg 1861 gtaggcgagg gcggtgtcgt ccagcaggta gtcttcctcc tccgtaccgt cttcgacgac 1921 gaaccccacg ggtttctggt tttcaaagtt gttcgtccgg gggatctggc cgagatacca 1981 caggttttcc gccagctcca ccggctcctt cgcctccagg atgtcgaagc ggctgcggat 2041 ctcttcttcc ggccagggaa agccggattc tacgccgtct acgactttcc gcttcagcgc 2101 tttcgggtgc gcaacgagct ttgtatgggt cacgtcgagg cctgcctcca gcaggggcag 2161 cagtccgtgg gtgtggtcgt cgtgcccgtg ggagatcgcg atatagtcca ggccgtttaa 2221 gtcgatgccc agcatcgccg cgttcttcag tgcgatgcca tgatagcccg agtccaggat 2281 cagacgcttg ccgctgcatt cgatatagca gcagaagccc ggttctccca tcaggtaagg 2341 ttctctcgta tgggtgctgt tttcggaaag gatcgtcagt ttcatggggt gcctcctgta 2401 tcttttttat tatagcagac ggcgtttttg acagaaaggc ctccgtcgct tataatcccg 2461 gggtgaggtg ttttatggat ctgaagaata cgactgtcgt cctggcttcc ggctctcccc 2521 ggcgcatcga catgctgcgc gcggacggga tcgagccgca catcgtaaag ccggactgcg 2581 aagaaaatat ccatatcggg ctgtctcctg cccaggaagt gatggcgctg gcgctgcgca 2641 agaacctgcg tgccgtcgag atgctgaaag agcaggggga tctgcctgct gaaggcgtcg 2701 tgctgtccgc cgataccatg gtggtgctgg acggcgtccc catgggaaaa ccgcgggacg 2761 aagaagacgc gttccgcatt ttaagcctgc tgcggggcaa gacgcataca gtgcagagcg 2821 gcgcctgcat ccgggatctg gcaagcggac ggctgctgct gttctccgag ggaacggacg 2881 tgacctttat ggagtatacg gacgaagaca tccgggcgta tgtcgcaacc ggcgagccga 2941 tggacaaggc cggggcctat gcgatccagg ggggcttcgc gccctacgtg acccatacga 3001 acggtcctct ggacaacgtg atcggatttc cttacgcgtc gatcaagcgc attctggaag 3061 cgtggtaaaa tatctatata tttacaggta aattatagca attttgctgc gtttatgata 3121 aactattctc cgctcggacg cggagaattt tttatgaaac aaaacagaat caggagaatg 3181 gatgcgccgc tggcggtccg ggaactgcct gcagcagagc ggccgcggga gaagatcctg 3241 tcccagggcg tacagaccct ctcgaacacg gagctgctgg cggtgctcat cgcctccggt 3301 tccgcggaaa acagcgccat cggtctggcg ggcaaagtgc tggcgatggg agaaggcagt 3361 ctcgcttctc tgtcggggtt ccttccggag gaattcatgc acatcccggg gatcggtccc 3421 gcaaaggcct gtctgctctc ggctgccgtg gagctgggcc ggcggatcgc tactgcgccg 3481 gctgcggaca gaactgtcat cagcggaccg gcggattcgg cgaagctctt catgggcgag 3541 atgcggtatt tgaagcagga agtcatccag gtggcgctgc tgaacgtaaa gcaggagctg 3601 ctgatgaagg aacgcgttgc cgcgggcggc ctgttcagcg catctgccca ttcccgggag 3661 atcttctcca gcgcggtgcg caaaggggct ttcggggtta tcctcgccca caaccatccc 3721 agcggagacc cgcagccctc cgacgaagac atcgcgatga caaagcaggt cgaagacgcc 3781 ggaaaagtgc tgggaatacg gcttctggac cacattatca taggggacgg ccgctatttc 3841 agctttttgg acgcggggta tctgcaaaaa taattccccg gatttttccc gatttttatt 3901 ccaaaccccc cttgccgatg gtaaaattat cttgtacaat gacttgcatt tggaaggaca 3961 tgtatgggaa tcgtcgcttt gatcacctcc ggtaagggag gcgcaggaaa aaccaccata 4021 accgtaaact taggagcaac cctggcgcag aaaggcgcga gggtcgttct tgtggatttt 4081 aacatgggac tgcgcaacct ggatatctat ctgggcatgg aggatacctg cctgttcgac 4141 ctgggcgacg tgctgacagg cgtatgcaag gtagaaaagg cgctggtcca cgacgaccgg 4201 ttcggccggc tctacatgct gccctgtccc cagttcaagg agatcaacgg cgtcacgccc 4261 cagcatgtgg cagggctgtt cgccgtcctg aagaaaaatt tcgactatat cctcgtcgat 4321 atgcccctcg gcatcggaag ccctctggaa aacgtggcgc aggcggcgga tctgggcatc 4381 gtggtcgtta cgccggacta cgtgtcgctg cgcaacgcgg atacggtgga ccgcaagctg 4441 gagagctgcg ggctgcagaa gcgctgcttc ctcatcaacc aggtggatct cgaactgctg 4501 cgcactggaa acgtccccgg catcgagcag atcgcccggg gcatgagcac accgatggcc 4561 ggcatcgttc cctacgacga gaatatccac gccggcaaca acatgggcaa ccccgtggtg 4621 ctggcatcgg attcctatat cgcgaagaac ttcagcagca tcgcgctccg cgtcttctag 4681 aaaaataaac aacggggacg gttctttgaa ccgtccccgt tatagattct agaaaatgcg 4741 gagcgcgatg ctgctgaagt tcttcgcgat ataggaatcc gatgccagca ccacggg // LOCUS sequence032 4736 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence032 VERSION sequence032 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4736 /mol_type="genomic DNA" /organism="" /note="sequence032" CDS 648..1619 /product="dipeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003434938.1" /transl_table=11 /codon_start=1 /translation="MKPFQIIDLHCDTIVECVTNGADFRSGTGHISLDKLAAGGSLAQC FAIWIPTGKAAERHHTAGVGYYDYYKTAKAFFKKAMAENSDVVRQARTVAEIEQNKADG KLSAILTVEDSIFVEGKMERIDEMKEDGVRMASLIWNNENCMGYPNRRDFTEHMMGLKP FGYDAIAKMNEYGIVVDVSHLNEGGFWGVAKTSKKPFAASHSCARALCDHPRNLTDEQL KALGEAGGVVGVNFYDAFLHEEETEYTSIADIVKHLEYMKDKAGIEALAFGSDFDGISS KLEFGDFAGFPQIVAALEGKFTDDEIDKICHGNFLRVLKDNE" /locus_tag="LOCUS_1610" /note="WP_003434938.1 dipeptidase (Clostridioides difficile) [pid:37.7%, q_cov:98.1%, s_cov:99.0%, Eval:1.5e-58]" /note="MGA_206" CDS complement(1661..2992) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRILTVISGMLLAIAGAFTFAFYSNAFTGLAFILGLVMLISGLCI LGAYILSGKVGRLPDTVLVEGMVTTLFGFAVLNNEVMDAMVTLFFGTWMTLSGVTRISQ SFAVSRYRPKDWAKIMPLALAGTILGVIMLMPSLTNYMNPMFLVGAAFIVNGFSQLIYS MYMRKHELTDREIEAQERAEARKVAKAEERKQRNASRSTSWHEREEQRDEQRRQEKRRL AEQRAAKMQELQERRAARRPAAEATMQFTPEEVEEINRLADAPEETVEDELPVTEVQRP KTVVEPEEPAPEETPLEEALEKAKAPVWNRPENIPSLRAKKLEEEAAAAPAAPQAEEEV PDPLAKRAAVNVEKIEEGLESMEFEPVELPDVELESTGGEAEERQEIIEKLETEVKKDD PFKPFEALKLEDLFGEDYVPLREKDPKEATRFTQSLNLDWTKHQ" /locus_tag="LOCUS_1620" /note="MGA_207" CDS 3146..4015 /product="phosphoribosylaminoimidazolesuccinocarboxamide synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010942733.1" /transl_table=11 /codon_start=1 /translation="MTEYQPIKEGKVREIYDIGDYLILVATDRISCFDVILHNTVNKKG TVLTQMSKFWFDLTSDIVPNHMISTDVQDMPEFFRQPRFDGNSMMVKKLTMLPVECIVR GYITGSGWASYQKDGTVCGIKLPEGLKESEKLPEPIYTPSTKAEIGDHDENISFEQSID YLEKRFPGHGEEYATKLRDLTLAIYKKCAAYALERGIIIADTKFEFGLDEDGDVVVGDE MLTPDSSRFWPLEGYEAGKSQPSFDKQFARDWLKANEHDWTLPQEIVDKTIAKYLQAYE LLTGKPLE" /locus_tag="LOCUS_1630" /EC_number="6.3.2.6" /note="WP_010942733.1 phosphoribosylaminoimidazolesuccinocarboxamide synthase (Geobacter sulfurreducens) [pid:53.2%, q_cov:98.6%, s_cov:97.0%, Eval:4.7e-82]" /note="MGA_208" ORIGIN 1 aacttggaat ccttgcggcc ggtcacgata tagtcgtggg tgtcgacctc gacgcagggg 61 gtgacccgga tgaggatatc ggtcttcttg ccgagctttt cgcagatctg ctcgatgagc 121 gccagttcct gctcgccgtc gatgatgatg cgttctacgc cgtagtcgat ggcggcttcc 181 agttccttcg gcagtttgtt gttgccgttg aattccagct tcttcggatc gatgccggcc 241 ttcatggcgg tgtagagctc gccgccggag acgacgtcca tgctgatgcc ttcgttttcg 301 cacagcttat acatgcccat gcagcagaac gctttggcag cgtacgcgat cctgtttttc 361 ggatagggtt ttacgaaaca ttccttcagc tcgttgatgc ggctgacgat atccgtcttg 421 gacatgacgt acagcggcgt gccgaattcc ttcgccagtt ccacggtgtc gcagccgtcg 481 aaccacagat gacttccttt gatctcgctg accatattca tacgcattca ctccttttct 541 ctgcgaaaaa cgaaaggtta aactcaatac atttttatta tatgccttgc gccgcttctt 601 ctcaatcgct aaaatagaga cggtgtttgt accagaaagg cttaatcatg aaaccattcc 661 aaatcatcga tctgcattgc gacacgatcg tcgaatgcgt cacgaacgga gccgatttcc 721 gcagcgggac cggccatatc tctctcgata agctggcggc aggcggaagc ctcgcccagt 781 gctttgccat ctggatcccc acgggcaaag cggcggagcg ccaccacacc gcaggcgtag 841 ggtattacga ttattacaag actgccaagg cgttttttaa gaaagcgatg gcggagaaca 901 gcgacgtcgt gcgtcaggca agaacggtcg ctgagatcga acagaacaag gcggacggca 961 aactgtctgc gatcctcacg gtggaagatt ccattttcgt cgaaggcaag atggaacgca 1021 tcgacgagat gaaagaggac ggcgtgcgca tggccagcct catctggaac aacgagaact 1081 gcatgggcta tcccaaccgc agagatttta cggagcacat gatgggcctg aagcccttcg 1141 gatacgacgc gatcgcgaag atgaacgaat acggcatcgt cgtagacgtt tcccacttaa 1201 acgaaggcgg cttctggggc gttgccaaga ccagcaaaaa gccctttgcg gccagccatt 1261 cctgcgccag agcgctgtgt gaccatccca gaaacctgac ggacgaacag ctgaaggcgc 1321 tgggcgaagc cggcggcgtc gtaggtgtaa acttctacga tgcgttcctg cacgaggagg 1381 agacggaata cacgtccatc gcagacatcg taaagcacct ggaatacatg aaggataagg 1441 ctggcatcga agcgctggcc ttcgggtccg acttcgacgg catcagctcc aagctggagt 1501 tcggcgattt tgcgggcttc ccgcagatcg ttgccgcgct ggaaggtaag tttacggacg 1561 acgagatcga caagatctgc cacggaaact tcctgagagt gctgaaggat aacgaataaa 1621 aaggatacga aaaagccggc cgcacaggcc ggcttttgtt ttactgatgt ttcgtccaat 1681 ccagattgag ggattgggta aagcgggtgg cttccttggg atctttctcc cgcagcggca 1741 cgtaatcctc gccgaacagg tcttccagct ttagagcttc gaagggtttg aaggggtcgt 1801 ccttcttgac ttcggtctcc agcttttcga tgatctcctg ccgttcttcc gcctcgccgc 1861 cggtggactc cagttccacg tccggcagtt ccacgggctc gaactccatg ctctccagac 1921 cttcttcgat cttctcgacg ttaacggcgg cgcgctttgc cagcgggtcg ggcacttcct 1981 cctccgcctg cggcgctgcc ggggctgccg cagcttcctc ctccagtttc ttcgcacgga 2041 gggaggggat gttctccgga cggttccaga ccggcgcctt tgccttttcc agcgcttctt 2101 ccagaggcgt ttcctccggg gcgggctctt ccggctcgac gaccgtcttc ggacgctgca 2161 cttcggtaac gggaagttca tcttcgaccg tttcctcagg cgcatcggcc aggcggttga 2221 tctcttcgac ttcctccggc gtaaactgca tggtggcttc cgccgcgggg cggcgggccg 2281 cccgtctttc ctgcagctcc tgcatcttgg cggcgcgctg ttccgccagt ctgcgctttt 2341 cctgacggcg ctgctcgtct ctctgctctt ctctttcgtg ccagctcgtg ctgcggctgg 2401 cgttgcgctg tttgcgctcc tccgcctttg cgacctttct ggcttccgct ctctcctgtg 2461 cttcgatctc ccggtccgtc agctcatgct ttctcatgta catggagtag atgagctggg 2521 agaaaccgtt gacgatgaat gcggcgccca cgaggaacat ggggttcatg tagttcgtga 2581 gggacggcat cagcatgatg acgcccagga tggtgccggc cagcgccagc ggcatgatct 2641 tcgcccagtc tttcgggcgg tagcggctca cggcgaagct ctgggagata cgggtgaccc 2701 ctgacagggt catccaggtg ccgaagaaca gcgtgaccat ggcatccatg acctcgttgt 2761 tgagcacggc aaatccgaac agcgtcgtga ccatgccttc cacgaggacg gtgtcgggca 2821 atctgcccac tttcccggac aggatgtagg cgcccaggat gcacagtccc gagatgagca 2881 tgacgagacc caggatgaac gccaggcctg taaacgcgtt ggaatagaat gcaaatgtaa 2941 aggcacctgc tatggcgagc agcatgccgg atatgacggt caaaattctc atagatccag 3001 cctttctgaa aacctaatca ttatattaga atacggctga ttagtcaaat tttgcgtcgc 3061 cttgcagtcc aaagccttgc gcgctttccc gctttgtatt attctatttt tgttaacgtt 3121 gcattggcag gacaggaggg aactcatgac agaatatcaa cccatcaaag aaggcaaagt 3181 ccgcgagatc tacgacatcg gagactatct gatcctggtc gcgaccgacc gcatcagctg 3241 cttcgacgtg atccttcaca acaccgtaaa caagaagggc accgtgctta cccagatgtc 3301 gaagttctgg ttcgatctta ccagcgacat cgtgcctaac cacatgatct ccaccgatgt 3361 gcaggatatg cccgagttct tccgtcagcc ccgcttcgac ggcaacagca tgatggtcaa 3421 aaaactcacg atgctgcccg tggaatgcat cgtccgcggc tatattaccg gcagcggctg 3481 ggccagctat cagaaggatg gcacggtctg cggcatcaaa ctgcccgaag gcttaaagga 3541 atccgaaaag ctgcccgaac ccatctacac gccctccacg aaggcggaga tcggcgacca 3601 cgacgagaac atctccttcg agcagagcat cgactatctg gagaagcgct tcccgggtca 3661 cggggaagaa tacgcgacga agctcagaga ccttacgctg gcgatctaca agaagtgcgc 3721 ggcgtatgcg ctggagagag gcatcatcat cgcggatacg aagttcgagt tcggtctgga 3781 cgaagacggc gacgtcgtgg taggtgacga gatgcttacc ccggacagct cccgcttctg 3841 gcccttggaa ggctacgaag ccggcaagag ccagccgtcg ttcgacaagc agttcgcccg 3901 cgattggctg aaagccaacg aacacgactg gacactgccg caggagatcg tcgacaagac 3961 cattgccaag tacctgcagg cttacgaact gcttacgggc aagcctctgg aatagggctc 4021 caggaacaga atacgaaaag accgctcccc ctgtgttttt gtgcgaacaa atgatataat 4081 caatacggat ccgggcagcg gtctttctgt tgtctggatc ataacatacg gaaagtccca 4141 taaatgggtc aattcaagag aaaaggagtt agagatggca ggagtaatct taggaatcat 4201 cgttgttttg cttctcatca ttctgtgcat ccgctgcatc tgcatcgtgc cgcaggccag 4261 cgcatggatc gtggaagcgt taggtcagta taaggctacg tggggtgccg gccttcattt 4321 caaggtgccc atcatccacc gcgtcgtcaa gaaagtgtcc ttaaaggaac aggtcgcgga 4381 cttcgaaccg cagcccgtta tcacgaagga taacgtaacc atgatggtgg actccgtcgt 4441 attcttctac attttcgacg ccaagctgtt cgcctacggc gtggagagac cgatcgcggc 4501 gatcgagaat ctgtctgcta cgactcttcg taatatcatc ggctccatga ccctggacga 4561 gaccctcacg agccgcgacg acatcaacag ccgcatcacc gctatcctgg acaacgccac 4621 cgataagtgg ggcatcaagg tgagccgggt agaagtcaag aacatcgcgc cgcccagaag 4681 catccaggaa gccatggaaa agcagatgaa ggcagaacgc gaaaagagag aagcga // LOCUS sequence033 4723 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence033 VERSION sequence033 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4723 /mol_type="genomic DNA" /organism="" /note="sequence033" CDS complement(327..1349) /product="phenylalanine--tRNA ligase subunit alpha" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003436795.1" /transl_table=11 /codon_start=1 /translation="MKERLTQLMQEAEKKMGSISSLQEAEELRIKLLGKKGELTEMLKG MKALAPEERKSFGQAANEARAKIENTLNERMEYFRNAQKELALAAEKVDVTEPAVPCEL GSRHLLSITIDEITRCFRSMGFSVSEGPEVETVFNNFDALNAGPNHPARDMTDTFYITD DVLLRTQTSPVQVRTLLSQKPPIKVIAPGRCFRCDTPDATHSPMFHQVEGLVVDEGITM ADLKGVLDQFAKQMFGSSTRTKFRPHHFPFTEPSAEMDVSCFKCGGKGCKVCKGSGWIE ILGCGMVHPNVLKVGGIDTEKYTGFAFGMGVERVAMLKYEVDDIRLLYENDIRFVKQFK " /locus_tag="LOCUS_1640" /gene="pheS" /EC_number="6.1.1.20" /note="WP_003436795.1 phenylalanine--tRNA ligase subunit alpha (Clostridioides difficile) [pid:61.4%, q_cov:99.7%, s_cov:100.0%, Eval:3.2e-120]" /note="MGA_211" CDS complement(1368..2234) /product="RNA methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965655.1" /transl_table=11 /codon_start=1 /translation="MANLLRMQHAGRNNCIEIHSKDNKTVKLAASLAEKKHRDALGAYL IEGPNLVREALQQGVRIQFIFTGAGALNQQQEIQDILSLAEDSDSAVCVLSEDCFAKIA TSQTPQPIMAVAEKRTWQMRDVFSPGGNVLVLDRIQDPGNLGTLLRTAEATGFAGALIV KGGADPYGPKAVRAGAGCVFRFPLLLCESPAEALDILAKQRKQVWTADMEGTPCYDAEL AQNVAIVIGNEGNGADALFKENSGRVTVPMAGQAESLNAGIAAAILMYESLRQRAARSV RENTATL" /locus_tag="LOCUS_1650" /note="WP_010965655.1 RNA methyltransferase (Clostridium) [pid:34.7%, q_cov:89.6%, s_cov:97.7%, Eval:9.3e-38]" /note="MGA_212" CDS complement(2301..3404) /product="cell division protein FtsZ" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009890867.1" /transl_table=11 /codon_start=1 /translation="MSPMLQFEKPEETSANIKVIGVGGAGCNAVNRMIESNLKGVSFIA VNTDRQALNNNRAETKIQIGEKLTKGLGAGGNPEVGQKSAEESLENLEKIITGSDMVFI TAGMGGGTGTGAAPVIAKAAKSMGALTVGVVTKPFTFEGRKRKEHAELGIKFLKNYVDS LVVVPNDRLLQVSETNTSMLDAFRMADDVLKNGVEGISSLISEDGLINLDFADVKTVMS DRGIAHMGIGRASGEHRVEEAIKMAIDSPLLETSIKGAKAVLLNIMGGYDLGMLEVSGA SDAIAKEVAEDAFIIFGTSVKEDMQDEIRVTVIATGFEEENQGLGLEEPAAEAPAAPEA PKTEPEPAVPSANDFPIPSFLNKKFEL" /locus_tag="LOCUS_1660" /gene="ftsZ" /note="WP_009890867.1 cell division protein FtsZ (Clostridioides difficile) [pid:62.3%, q_cov:87.5%, s_cov:83.4%, Eval:8.3e-109]" /note="MGA_213" tRNA complement(3547..3623) /product="tRNA-Val" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0050" /note="Aragorn_5" CDS complement(3637..4143) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAGKKGQRTINIYAFFFSLVAFLFVLQLGTGLAGALMGFRYPDGL LGMTTLFGTISLVLVLTVIFLVASQAGFAIIRRAEADKKNYIIYHSLVIFVMAISAVYV GVAYKNAWFVLPNVLTIAATAYSLKNVNRSKYEVVRGTRAWRNEQARKERQELKRKMKS SKGSK" /locus_tag="LOCUS_1670" /note="MGA_214" ORIGIN 1 ggtccgggga ccttggcgcc gtccacggcc acgggcacga agaaatcctt catgccgggc 61 acgctgttgg gtgcgccggt gcagatctgg acaggttctc ccctgcccac gtcgatctgg 121 cagaccgtca gcttatccgc attgggatga ggttcgaccg agagtacctt gccgatgacg 181 acgccctcga tgtccttgtt ataatagtcg acggtctcca ggttggatcc gctcaggata 241 agacggtcgc agaattcctg cacgccgacg ttgatatctg tatattcttc taaccatttg 301 atcggtgcta acatgggaag cctcctttac ttgaactgct tgacaaagcg gatgtcgttc 361 tcgtacagca gacggatgtc gtccacttcg tacttgagca tggcgacgcg ttcgacgccc 421 atgccgaagg cgaatcccgt gtacttttcg gtatcgatgc cgccgacctt cagtacgttc 481 ggatgcacca tgccgcagcc taagatctcg atccagccgg agcctttgca gaccttgcag 541 cccttgccgc cgcacttgaa gcagcttacg tccatctccg cggagggttc ggtgaacggg 601 aagtgatggg gacggaactt cgttctggtg cttgacccga acatctgctt cgcaaactga 661 tccagcacgc ccttcagatc cgccatggtt atgccttcgt ccaccacgag accttccacc 721 tgatggaaca tcggggagtg ggtggcatcc ggcgtatcgc agcggaagca tcttccgggt 781 gcgatgacct tgatgggagg cttctgggat agcagcgtgc ggacctggac cggagaggtc 841 tgggtgcgca gcagcacgtc gtcggtaata tagaacgtat ccgtcatgtc tctggcggga 901 tggttcggcc ctgcgttaag cgcgtcaaag ttgttgaaca cggtctccac ttccggtcct 961 tcggacacgg agaagcccat gctgcggaag catctggtga tctcgtcgat cgtgatggac 1021 agcagatgtc tgcttcccag ttcgcaggga acggcgggtt cggtaacatc caccttttcc 1081 gcagcaagcg ccagctcttt ctgggcgttg cggaagtatt ccatgcgctc gttgagggtg 1141 ttctcgatct tcgctcttgc ttcgttggct gcctggccga aggattttct ctcctcggga 1201 gccagggcct tcatgccctt gagcatctcg gtgagttcgc ccttcttgcc cagcagttta 1261 atgcggagtt cttctgcttc ctgcagagaa gagatgcttc ccatcttctt ttctgcttcc 1321 tgcatcagtt gtgtgagtct ttctttcatg taaattagcc tccatcgcta aagtgttgct 1381 gtattttccc gtacgctccg cgccgctctc tggcgcaggg attcgtacat caggatcgcc 1441 gcggcgatgc ctgcgttcaa ggactcggcc tgccctgcca tgggcacggt gacccttcca 1501 ctgttttctt tgaataaggc gtctgcaccg ttcccctcgt ttccgatgac gatagccaca 1561 ttttgggcca gttctgcatc gtaacagggc gttccttcca tgtcggcggt ccagacttgt 1621 ttacgctgct ttgccaggat gtccagcgcc tcggcgggac tttcgcaaag cagcaacgga 1681 aatcggaaga cgcatccggc gccggcccgc acggctttcg gtccgtaggg atccgccccg 1741 cccttcacga tgagcgcgcc ggcaaagccc gtcgcttccg ccgtgcgcag cagcgtgccc 1801 aggttgccgg ggtcctggat gcggtcaagc accagcacgt tgccccctgg ggaaaaaacg 1861 tcgcgcatct gccacgtccg cttttccgcc accgccatga tgggctgcgg cgtctgcgac 1921 gtcgcgatct tcgcaaaaca atcttccgat aaaacgcata cggccgaatc gctgtcttct 1981 gccaggctga ggatgtcttg gatctcctgc tgctggttca gcgctccggc ccccgtaaag 2041 atgaactgta ttctgactcc ctgctgcagc gcctcgcgca cgaggttcgg accctcgatc 2101 aggtaggcgc ccagggcgtc cctgtgcttt ttctccgcca gggacgcggc gagttttacc 2161 gttttattgt ctttggaatg gatctctatg cagttgtttc tgcctgcatg ttgcattctc 2221 aataagttcg ccaaagggac ggtcctcccg tcgaggcgct tggcctgcgg gctgaccgtc 2281 cccgtgatat tcagtgggct ttagagttcg aacttcttat tcaggaacga agggatcggg 2341 aagtcgttgg cggagggaac tgcgggttcc ggttccgtct taggcgcttc cggtgcagca 2401 ggtgcttccg ctgccggttc ttccaggccc agaccctgat tctcttcctc gaaaccggtc 2461 gcaatgacgg ttacgcggat ctcgtcctgc atgtcttcct tgacggaagt accgaagatg 2521 atgaaagcgt cttccgcgac ttccttggcg atggcgtcgg atgcgccgga gacttccagc 2581 atacccagat catagccgcc catgatgttg agcagcactg ccttcgcgcc cttgatactg 2641 gtctccagca gcgggctgtc gatagccatc ttgatcgctt cttcgactct gtgctctccg 2701 ctggcgcggc cgatgcccat gtgggcgatg cctctgtcgc tcatgacggt cttgacgtcc 2761 gcgaagtcca gattgatgag tccgtcctcg gagatgaggc tggagatgcc ttctacaccg 2821 ttcttcagca cgtcgtccgc catgcggaac gcatccagca tgctggtgtt ggtctcagag 2881 acctgcagca gtctgtcgtt gggaacgacg acgagagagt cgacgtagtt cttcaggaac 2941 ttgatgccca gctccgcgtg ctcttttctc ttgcggcctt cgaaggtaaa gggctttgta 3001 acgacgccta cagtaagggc gcccatggat ttggcagcct tcgcgatgac cggtgcagca 3061 cccgttccgg tgccgccgcc catgcctgcg gtgatgaaga ccatatcgct tccggtgatg 3121 atcttctcca gattctcgag gctctcctct gcggacttct gtccgacttc gggattgccg 3181 cctgcgccca gacccttcgt cagcttttcg ccgatctgga tcttggtctc ggctctgttg 3241 ttattgagcg cctggcggtc ggtgttgact gcgatgaagg aaacgccctt cagattggat 3301 tcgatcatgc ggttgaccgc attgcagccg gcgccgccga cgccgatgac tttaatattg 3361 gccgatgttt cttccggctt ttcaaattgt aacattgggg acatgtttgg cctcctgaac 3421 aaaaacacag ttgtatacgc aataagttta gcacaatctg cggatgaatg caccacctga 3481 atacaacata ttgtgatttt tttatggaaa aaggaaaagg agacccaagc ggatctcctt 3541 acggtttggt gggctgtatt ggactcgaac caacggcctc ttgcatgtga cgcaagcgct 3601 ctaaccaact gagctaacag cccttacaaa gagcagctac ttactgcctt tgctgctctt 3661 catcttccgt ttcagttcct ggcgttcctt gcgtgcctgc tcgttgcgcc acgcgcgggt 3721 gccccttacg acctcgtact tcgaacggtt tacgttcttt aaactgtatg cggtcgccgc 3781 gatcgtgaga acgttcggta aaacgaacca ggcgttctta taggcaactc ctacatagac 3841 cgcactgatc gccatgacga agatgaccag cgaatgatag atgatatagt tcttcttatc 3901 cgcctcggct ctgcggatga tcgcaaagcc cgcctgggat gctaccagga agatgacggt 3961 gagcaccagc acgagagaga tcgtgccgaa cagtgtcgtc atacccagca gtccgtcggg 4021 ataacggaat cccatcaaag cgccggcgag accggtaccc agctgcagaa caaagagaaa 4081 tgcaaccaga gaaaagaaga aagcgtaaat attgatcgtg cgctgtcctt ttttgcctgc 4141 cattgaaagc tccttttgtc tctaattgag taccctatta ttataccgct tttcgcgaaa 4201 aaaacaaccc cattcccagg cagaaaaagc ggcgcccgca aaggcgccgc tgaagtccca 4261 aaagcgttgc aatatcaact gttgctgctg ggcagaactc tcgcgatggt gttcgcgaaa 4321 ttggagatgg gcatggtctg aagcacgacg ttgccggggc cagtcagcgt ggtgtggaac 4381 agtccttcac cgccgaacat tatgttcttg gcgcccttca ctctctggat gtcgatggag 4441 acggtgctgt ccaccatggc gacattgccg gtatccacga tgagccgctg accggcttcc 4501 agtctgtact ccacagcgct gccgtcgatc tcgacgaatg cgatgccacg gcccgaaagc 4561 ttctgcataa tgaatccctc tccgccgaag aaaccggtga gcgccttgtt ctggaagaac 4621 acggacagct gtacgccgtc agtcgccgcg aggaacgcgg atttctggca gatgatgggc 4681 ttgtccgggg tcacctcgat cgcacggatg gaaccgggga aac // LOCUS sequence034 4699 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence034 VERSION sequence034 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4699 /mol_type="genomic DNA" /organism="" /note="sequence034" CDS complement(176..1594) /product="NADP-dependent phosphogluconate dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002211888.1" /transl_table=11 /codon_start=1 /translation="MKERSDIAVIGLGVMGSGIARNLESKGFTVSVYNRSEEGLAAFFE QYGEGNFRRADSLEELCSQLEVPRKVLLMVKAGAAVDEVLAQLTPYLEPGDVVIDGGNS YYKDTQQRAQAMEDQGLLYVGCGISGGEEGALHGPSLMPGGSEAAKDLVMPLLLQICAR TDIGEACCSWMGSGGAGHFVKMIHNGIEYGEMQLLCETYDLMHRYLGMDTAMCGRTLAR WAKQTPGFLLEAAETVLQKQEEDGSLLVEHILDAAGQKGTGAWTVDTAMALGVPVPVIS EAVNARALSARKDLRTSLSEKYGKTVYDGKVMPAELRFEKLQMLQAALLQARILCYAQG FEVLQAASDVYGWNWNLGEISQVWRAGCIIRSSLLSDIKKAYVYDRNLPNLLEANLIHS MLSEGKNALKETCIAAADNGIAAPAFSAALQYFNGYTSLSLPANLLQGMRDLFGAHTYE RTDAARGEVFHTEW" /locus_tag="LOCUS_1680" /gene="gndA" /EC_number="1.1.1.44" /note="WP_002211888.1 NADP-dependent phosphogluconate dehydrogenase (Yersinia pseudotuberculosis complex) [pid:45.4%, q_cov:99.4%, s_cov:99.1%, Eval:2.2e-115]" /note="MGA_216" CDS complement(1591..2253) /product="membrane protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_017869617.1" /transl_table=11 /codon_start=1 /translation="MASEYFKRWCVCMAGLLLCGTGSYCTVQASAIGIGAWETFQTGLS LSTGILYGNCTVMVSFAIILIDLLLKGKIGIGTLCNAVIIGKTVDFWHLTFDFLPLAQT LPVGLLYLVCGQLLNAFGSYLYMKPALGCGPRDTLMVILAKRFPKVNIGIVRFCMELCV FFVGVLLGAPYGWGTLFAMGITSFIMQAVFKLCKFRARDVQHENLVDTYRRIRGKEA" /locus_tag="LOCUS_1690" /note="WP_017869617.1 membrane protein (Deinococcus wulumuqiensis) [pid:32.4%, q_cov:78.2%, s_cov:82.4%, Eval:7.8e-14]" /note="MGA_217" CDS complement(2261..2914) /product="ribulose-phosphate 3-epimerase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010943985.1" /transl_table=11 /codon_start=1 /translation="MAYLTPSILTADFADLKTQLKALEEGGADFVHLDVMDGSFVPNIT FGQPVVRSIAKATTLPLDVHLMIVRPELCLEEFALPQTEFITVHQEACLHLHRTVQQIK ALGKKAGVALNPATSLSVLDYILPDLDMVLLMSVNPGFGGQKFIEASWQKIRELDKLRK EKNPDLLIELDGGVNLNNAAALKEAGVDVFVAGNAVFSAEDMAERVREFQRILK" /locus_tag="LOCUS_1700" /gene="rpe" /EC_number="5.1.3.1" /note="WP_010943985.1 ribulose-phosphate 3-epimerase (Geobacter sulfurreducens) [pid:52.5%, q_cov:100.0%, s_cov:98.2%, Eval:1.4e-60]" /note="MGA_218" CDS complement(2925..3818) /product="ribosome small subunit-dependent GTPase A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965036.1" /transl_table=11 /codon_start=1 /translation="MAGSLQGTIVKGIAGFYYVLAGEGESQALYECKARGIFRLDGVTP LAGDRVTISLQEDGTGSIDEILPRVNVFDRPPVANVETMVLVAASKEPEPNFPLLDRFC VMAEQKNCRIAVCVNKADIGDPVVLQRFRNVYGPIYPVFIVSTVTGEGFEELRAFLKGT QAALAGPSGVGKSSIANVLLDFEASETGEISRKTLRGKNTTRHTELFDAGEFRLFDTPG FTSFELGEVEEAQLQHFFPEFAPYLGKCRFDNCRHLEEPGCAVAKAAEEKQISRRRYAS YRDMMKTLQQMEKEKY" /locus_tag="LOCUS_1710" /gene="rsgA" /note="WP_010965036.1 ribosome small subunit-dependent GTPase A (Clostridium acetobutylicum) [pid:41.3%, q_cov:96.0%, s_cov:97.6%, Eval:7.2e-57]" /note="MGA_219" misc_feature complement(3818..>4699) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011861606.1:PASTA domain-containing Ser/Thr kinase PrkC" /note="WP_011861606.1 PASTA domain-containing Ser/Thr kinase PrkC (Clostridioides difficile) [pid:43.7%, q_cov:42.3%, s_cov:18.8%, Eval:1.2e-19, partial hit]" /note="MGA_220" /locus_tag="LOCUS_1720" ORIGIN 1 aagtcattgc ttctccattc gttgaatgct ttttaaaaac tatgcatcta ctctagcatt 61 cggcatatag ggctgtcaac cccattttta aaattatttt tttaaatatg caggataaaa 121 tttgggctat acattatatg acaccagttt ttgcgggtgg cgttcaaaag cccgcttacc 181 attccgtatg gaaaacctct ccccttgccg cgtccgtccg ttcgtacgta tgcgccccga 241 acagatcgcg catgccctgc agcagatttg cgggaagaga cagcgacgtg tatccgttga 301 aatactgcag cgcagcggag aacgcaggcg cagcgatccc attgtccgcg gcagcgatgc 361 aggtctcttt cagagcattc tttccttccg acagcatgct gtggatgagg tttgcctcca 421 gcagattcgg cagatttcta tcgtatacgt aagctttttt tatgtcgctc aacagactgc 481 tgcggatgat gcacccggca cgccagacct gggagatctc gccgaggttc cagttccagc 541 catagacgtc cgatgcagcc tgcagcactt cgaagccctg cgcatagcac aggatgcggg 601 cctgcagcag cgccgcctgc agcatttgca gcttctcgaa gcgaagttct gcaggcatca 661 ccttgccgtc gtacacggtc tttccgtatt tttcggacag cgacgtgcga agatcctttc 721 tggcggacag cgctctcgcg ttcaccgcct cggagatgac gggcaccggc acgcccagcg 781 ccatcgcggt atccaccgtc caggcacctg tccccttctg gcctgccgca tccaggatat 841 gctccaccag aagcgatccg tcttcctcct gcttctgcag cacggtctcc gccgcctcca 901 gaaggaagcc cggcgtctgc ttcgcccagc gggcaagcgt ccggccgcac atggcggtat 961 ccatgcccag atagcggtgc atcaggtcgt acgtctcgca cagaagctgc atttccccgt 1021 attcgatgcc gttatggatc atcttgacga aatgtccggc gccgccgctt cccatccagc 1081 tgcagcaggc ttccccgatg tccgttctcg cgcagatctg aagcagaagc ggcatcacca 1141 gatcctttgc cgcctcgctg cctccgggca tcagggacgg accgtgcaga gcgccctctt 1201 caccgccgga aatgccgcag cccacgtaca gaagcccctg gtcttccatg gcctgtgccc 1261 tctgctgcgt atccttgtaa taggaattgc cgccgtcgat cacgacgtcg cccggttcca 1321 gatacggggt caactgcgca agcacctcgt ccaccgcagc ccccgccttt accatcagca 1381 ggacttttct gggaacttcc agctggctgc agagctcctc caggctgtcc gctctgcgga 1441 aattgccctc cccatactgt tcaaaaaacg cagcgagacc ctcctcgctg cggttgtata 1501 cgcttaccgt aaagcctttg ctctccaggt tgcgggcgat gccgctcccc attacaccaa 1561 ggcctatcac ggcgatatcc gatctctctt tcatgcctct ttccccctga tccgtctgta 1621 cgtatccacc agattctcgt gctgcacgtc cctcgcccgg aacttgcaga gtttaaagac 1681 cgcctgcatg ataaacgacg tgatgcccat cgcgaacaga gtgccccatc cataaggagc 1741 accaagcagc acgccgacaa agaaaacgca tagctccatg cagaaacgga cgatgccgat 1801 gttcaccttc gggaaacgct ttgccaggat caccatcagc gtatcccggg gaccgcagcc 1861 cagcgcaggc ttcatgtaga ggtaactgcc gaaagcgttc agcagctgac cgcacacaag 1921 atagagcagt ccgaccggaa gcgtctgtgc cagaggcaga aagtcgaacg tcagatgcca 1981 gaaatccacg gtcttgccga tgatgacggc gttgcacagc gtgccgatgc cgatcttgcc 2041 cttcagcagc aggtcgatga ggatgatcgc gaaactcacc atgacggtgc agtttccgta 2101 caggatgccc gtgcttaaag agagtccggt ctgaaacgtt tcccaggcgc cgatgccgat 2161 ggcggacgcc tgaacggtgc aatacgatcc ggtgccgcag agcagcagtc ctgccataca 2221 gacgcaccat ctcttgaaat actcggatgc catagatgtc ctactttaaa atgcgttgaa 2281 attcccgtac tctctccgcc atatcttccg cagagaacac ggcgttgcct gccacgaaca 2341 catccacgcc ggcttctttg agcgccgccg cgttgttcag gttcacgccg ccgtccagct 2401 cgataagcag atccggattc ttctctttgc gcagtttatc cagctcgcgg atcttctgcc 2461 agctcgcttc gataaacttc tggccgccga agccggggtt gaccgacatc agcagcacca 2521 tgtccagatc cggaaggatg taatccagca cggaaagaga agtggcggga tttaacgcga 2581 cgcctgcctt cttgcccagc gccttgatct gctgcaccgt gcggtgcaga tgcaggcagg 2641 cttcctggtg caccgtgatg aattccgtct ggggcagcgc gaactcctcc aggcagagct 2701 cagggcggac gatcatcaga tgtacgtcca acggcagcgt cgtcgccttc gcgatgctgc 2761 gcacgacagg ctgtccgaac gtgatattcg gaacgaaact gccgtccatc acatcgagat 2821 gcacgaaatc tgcgccgcct tcttccagcg ccttcagctg cgtcttcaga tccgcgaaat 2881 ctgccgtcag gatcgacggg gtcaaatagg ccatggcctc ctcctcagta tttttccttt 2941 tccatctgct gcagggtctt catcatgtcc cggtaggacg cgtagcgcct ccggctgatc 3001 tgtttttcct ccgccgcttt cgcgacggcg catccgggtt cttccagatg ccggcagttg 3061 tcgaaccggc attttcccag atagggcgca aattccggga agaaatgctg cagctgcgct 3121 tcttccactt cgcccagttc gaaactcgta aagcccggcg tgtcgaacag gcggaactct 3181 cccgcgtcga acagttcggt atgccgggtc gtattctttc cccgcagggt cttgcggctg 3241 atctctccgg tctcgctggc ctcaaaatcc agcagcacgt tggcgatgct ggatttgccc 3301 acaccggaag gacccgccag agccgcctgc gttcccttta aaaacgcgcg cagttcttcg 3361 aagccctcgc ccgtcaccgt gctcacgata aagacgggat agataggacc gtacacgttg 3421 cggaaccgct gcagtacgac ggggtcgccg atgtccgcct tattgacgca caccgcgatg 3481 cggcagttct tctgctccgc catcacgcaa aagcggtcga gcaaggggaa attcggctcc 3541 ggttctttcg aagccgccac gagcaccatg gtctccacgt tggcgaccgg cgggcggtcg 3601 aacacgttga cccggggaag gatctcgtcg atgctcccgg taccgtcctc ctgcagggag 3661 atggtcacac ggtcgccggc aagcggcgtg acgccgtcca gacggaagat cccccgcgcc 3721 ttgcactcgt agagcgcctg ggactcccct tctcccgcga gcacgtagta gaagcccgcg 3781 atgcctttta cgatcgtacc ttgcaaagat cctgccatta atggatctct ccggtatcga 3841 agtttacgtc gtactcatag acgagcgcgt tgtcgaagaa cacgagcacc ttgccgtccg 3901 ggccggatcc ttctgcactg aaggactcgc cgttgtcgct cttatggcgc gccgcctggc 3961 tgagcggcgt tctgggactg ttaacggaat cggataccgt caccgtcatg gtgaagtcct 4021 cgttgacggc ggggctgtaa tcgatccaga ccgccacggc gttcgtaacg ggtgcgggcg 4081 gagtctccgg ttccggttcg atgacgggtt cgggcgcttc cggctctttg gataccacca 4141 ggtcgatggt gtcgccttcc gcgatggcca tgcccggcgc cgggctctga gtgatgaccg 4201 tatcttcctt gcggttgatg tcttccacat aggagatctc gcccagttta aggtccagtt 4261 cttcgatctg cttcttcgct tcgtccaggc tcttgccctc cacgttgaat tctgcgcgtg 4321 cgacatcctt ctcggaacca agggagacga cgagcgtaac ctcctgaccg tcgggatacg 4381 tcgtgcctgc gaccgggctc tggctgatga ccgtgccctt gggaccggtc tcgctcactt 4441 cttccgaaac gacgccgagc ttgaatttat aggtttccag catggtgcgg gcgttggcca 4501 gagactttcc gaccacatcg gggacggagc cgtccacctt gcccttgctg atgttgactt 4561 cgatgctctg accggatttg atggaagcgc ctgcatccgg cgtctggctg aggatgattc 4621 cttcctccac gtcgttgctg ggcagttcca tgcccacctt gacatccagt ccgaactcct 4681 tgaggatctc ttccgcttc // LOCUS sequence035 4664 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence035 VERSION sequence035 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4664 /mol_type="genomic DNA" /organism="" /note="sequence035" CDS 1285..2820 /product="ribonuclease Y" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003428216.1" /transl_table=11 /codon_start=1 /translation="MLVTALIAIAFLAIGILVGYIIRKNKAEKTIGSAETMAKNLILDA ENRSEAIRKETLADARAEAHSIKQDAERDIRERREEVKKTERRLVQKEESLDRKIENIE QKEEGISKKQRALAEKEKELDGFIEKQIAELERISGCTAEEAKAQLLESIEKDVRRDAS IMIKDIETKAKEEADRKAKEIITGAIQRCAADHVAETTVSVVPLPNDEMKGRIIGREGR NIRAIETATGVDLIIDDTPEAVILSGFDPVRREIARVALEKLIVDGRIHPARIEEMVEK AEKEVNNIIKEEGESATFEMGIHNLHPELVKLLGRLKYRTSYGQNVLKHSLEVAHLAGL MAGELGMDVKLAQRAGLLHDIGKALDHEIQGTHVDIGIDVLRKYKESEAVIDAMAAHHG DYEPKSPEAVLVAAADALSAARPGARRETLDTYIKRLQKLEEIANTTPGVEKSFAIQAG REIRIIARPDEVSDDAMALLAREISKKIESELEYPGQIKVNVIRETRAIDYAK" /locus_tag="LOCUS_1730" /gene="rny" /note="WP_003428216.1 ribonuclease Y (Clostridioides difficile) [pid:64.3%, q_cov:97.7%, s_cov:97.3%, Eval:1.5e-186]" /note="MGA_222" CDS 2833..3990 /product="cysteine desulfurase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009895806.1" /transl_table=11 /codon_start=1 /translation="MFVYLDNSATTQVKPLVAEIMAKTMTEDFGNPSSLHRMGVNAEKI LKKARAQVAAALNASPEEIFFTSCGTESDATVLRGVWESRKKQGRRIITTAVEHPAILR NCEQLAREGADVIYLPVNRDCTFDMDAFRSALTPDTILVSVMHVNNEAGSIMPLAQIRS EIDRVNKGILFHTDAVQSFEKLDTDVHKLGVDMLSLSGHKIHACKGIGALYVKKGLHIQ PYLLGGGQESNFRSGTENLPAIAGLGEAVRLAEENKQARIAHIADVRNYLMHLLQDNIE DITVNSPEDGVCSVLNVSFLGCRGEVLLHTLEQDDIYVSTGSACSSHKKGSHVLTAMGL SDAQIEGAIRFSFCEDNTREQMEYVCEKLKTAVESQRRLRKAFKR" /locus_tag="LOCUS_1740" /note="WP_009895806.1 cysteine desulfurase family protein (Clostridioides difficile) [pid:47.3%, q_cov:100.0%, s_cov:99.7%, Eval:4.2e-98]" /note="MGA_223" ORIGIN 1 aagaagatcc gtttgccgcc tgcgtaaggg cgcaccgtac cgatcctctg cgggctcaac 61 accttgccct gcagcatcgc gaggcatttc tccgcgtcct gcggcgccac cgcagccagc 121 aggccgcctg aggtctgggg atcgaacagc gcgtcgcaca gggcggcgtt tacgccgttt 181 tcctccacct gaacgctgca gtaatcccgg ttgcggtaca tgccttccgg cagcaggccc 241 atggatgcaa attccagaga agagggcaga acgtccagtt ctgcggtctc caccagcgct 301 tccacatccg tatccttcac catctcgtac aggtggccca tcagaccgaa ccccgtcaca 361 tcggtgcagg cgtggacttc gcattgcacg aacacgtccc gcgcgttttt attgagctcc 421 gtcatgatgc ggatcatggt cttttcgtcg tcttctgaga gcataccggc ttttgcggct 481 gtcgtcagga tgccggtgcc gatcggcttc gtcaggatga gcacgtctcc gggtctcgcg 541 ccgcagttgc ggtagaactt ttccggatgg acgtagcccg ttacggaaag accgtatttc 601 ggctcttcgt cgaggatcgt gtgacccccg gcaaggatcg cgccggcttc gttcacttta 661 tcgtagccgc cccgcaggat ctcccgggtc acttccttgg gaaagtccct ggggatgccc 721 atgatgttca tgcaggtctt cggcgttcct cccatggcgt agacatcgga cagggcgttg 781 gctgccgcca cctggccgaa ggtgtagggg tcatccacga cgggcgggaa gaaatccacc 841 gtctgcacga gggccagctc gtcgtttact ctgtagacgc acgcgtcgtc gctcttatcg 901 aatcccacga gaaggtcggg atcgctcttc atggagatgc cgtccaaaac ttcagcgaga 961 actcccgctc cgagttttgc ccctcatcct gcgcagcctg caagggtcgt gagttttatc 1021 tcctttgcag tcattggcgg tcacctcctt tcgtgccttg aattctatcg gtttcgaaca 1081 aataaagtat atatcttttt tctctttttg tgcaagtgca accgattttt atgcacggaa 1141 gcataaacta tccctttaca tttatgcgca tattatagta aaatatattg gtatttttgt 1201 aatgctgatt tttgcctgcg cattgcgcag tttgtataaa accagacata tacaaacatc 1261 agaataacgc agaggaggga cagcatgctt gtaacagctc tcattgccat cgcctttctc 1321 gcgatcggaa tacttgtagg ttatatcatc cgcaagaata aggcagaaaa gaccatcggc 1381 agtgccgaga ccatggccaa gaaccttatc ctggatgcgg aaaaccgctc cgaagccatc 1441 cgcaaagaga ccctggccga tgccagagcg gaggctcatt ccataaagca agatgcggaa 1501 agagatattc gcgaacgcag agaagaggta aagaagacag aaagaagact cgtccagaag 1561 gaagaatccc tggacagaaa gatcgaaaac atcgaacaga aggaagaagg catctccaag 1621 aagcagagag ccctggccga gaaggaaaag gaactggacg gctttatcga aaagcagatc 1681 gccgagctgg agcgcatctc cggctgcacg gcggaagagg cgaaggccca gctgctggaa 1741 agcatcgaga aagacgtgcg cagagacgct tccatcatga tcaaggacat cgagaccaag 1801 gccaaggaag aagcggaccg caaggcgaag gagatcatca ccggcgccat ccagcgctgc 1861 gctgcagacc atgtggcgga gaccaccgtt tccgtggtgc ccctgcccaa cgacgagatg 1921 aagggccgca tcatcggccg cgagggccgc aacatccgcg ccatcgaaac ggcgaccggc 1981 gtggacctca tcatcgacga tacgcccgag gccgtcatcc tgtccggatt cgaccccgtc 2041 agaagagaga tcgccagagt cgctctggag aagctcatcg tggacggccg tatccatccc 2101 gcacgcatcg aggagatggt cgagaaggcc gaaaaggaag tcaacaacat catcaaggag 2161 gagggcgaat ccgccacctt cgagatgggt atccataacc tgcaccccga gctcgtaaag 2221 ctgctgggca ggctcaaata ccgcaccagt tacggccaga acgtgctgaa gcactctctg 2281 gaagtcgccc acctggcagg tctgatggcc ggcgaactgg gtatggacgt aaagctggcg 2341 cagagagccg gtctgctgca cgatatcgga aaggctttgg accatgagat ccagggcact 2401 cacgtggata tcggcatcga cgtcttaaga aaatataagg aatccgaggc ggtcatcgac 2461 gcgatggcag cccaccatgg agactacgag cccaagagtc cggaagcggt gctggtagcc 2521 gcggcagacg cgctgtccgc agcccgtccc ggcgccagaa gagagacgct ggacacttac 2581 atcaagcgcc tgcagaagct cgaagagatc gcgaacacca cccctggcgt ggagaaatcc 2641 ttcgccatcc aggcgggccg cgagatccgc atcatcgccc gtccggacga agtgtccgac 2701 gatgcgatgg ccctgctggc cagagagatc tccaagaaga tcgagagcga actggagtat 2761 ccgggtcaga tcaaggtaaa cgtcatccgc gaaacgagag cgatcgacta cgcgaagtaa 2821 cacaggagag gcatgttcgt atatttagac aacagcgcta ccacccaggt aaagccgctt 2881 gtcgcggaaa taatggcaaa gacaatgacg gaggattttg gaaatccttc gtctttgcat 2941 agaatgggtg tgaacgcaga gaaaatttta aagaaagcgc gtgcccaggt ggccgcagcc 3001 ctcaatgcgt ccccggagga gatcttcttt acgtcctgcg gcacggagag cgacgctacg 3061 gtgctccgcg gcgtctggga aagccgcaaa aagcagggca gacgcatcat cacgacagcg 3121 gtggagcatc ctgccatcct ccgcaactgc gagcagctgg cgagagaggg tgcagacgta 3181 atttatcttc cggtaaaccg cgactgcacg ttcgatatgg acgctttccg cagcgccctt 3241 acaccggaca ccatcctggt atccgtaatg cacgtcaaca acgaagccgg atccatcatg 3301 cccctggccc agatccgcag cgagatcgac cgggtgaaca agggcatcct gttccacacg 3361 gacgccgtgc agtccttcga gaagctggat acggacgtcc ataaactcgg cgtcgacatg 3421 ctgagtctgt cgggtcacaa gatccacgcc tgcaaaggca tcggcgccct gtacgtaaag 3481 aaaggtctgc atatccagcc ctatctgctg ggcggcggcc aggagagcaa tttccgttcc 3541 ggcaccgaga atctgcctgc catcgcaggc ctcggcgaag ccgtgcggct ggcggaagaa 3601 aacaagcagg cacgtatcgc ccatatcgcg gacgtgcgga attatctgat gcacctgctg 3661 caggacaata tcgaagacat tacggtgaac tcgccggagg acggcgtctg ttccgtcctg 3721 aacgtcagct ttttgggctg ccggggcgag gtgctgctgc acacgctgga gcaggacgac 3781 atctacgtat ctaccggttc cgcgtgctcg tcccacaaga aaggcagcca cgtgctgacg 3841 gctatgggcc tgtccgacgc gcagatcgaa ggtgctatcc gcttctcgtt ctgcgaggac 3901 aataccagag agcagatgga atatgtctgc gaaaagctga agaccgccgt cgaaagccag 3961 agaagactca gaaaggcgtt taagagataa tggagaatat ctatatcgtc cgctgcggtg 4021 agagcgcgct caagggaaag aacaagcctt atttcgagcg catgctggtg cagcggatca 4081 agaaaaatct gaaggatgaa ggcggcgtca ccgtcgaacg ggtggacggc ctcatctttg 4141 tgcgcacgcc ggaggagatc ccgcaggagg acgtcttaaa gcgggtcggc cgggtgttcg 4201 gcgtggactc catcagtccc gccgtggaag tgcccatcga agggctcgac gcggaaagcg 4261 cgctggacgc gatcggccgc gaagccgtgg cgttcatgat gaagcagatc gaatcgcgcg 4321 gcataaagac ctttaaggtc gacgcgaaac gggcggacaa gatgtttgcc atccagtctc 4381 cggacatcgg caagcgcatc ggcgcgcgcg tcctgaaggg ctgcaaggtc ttgaaagtgg 4441 acgtgcacga gccggactgc ttcctgtata tcaacgtgcg cagaaatttt gcgtatttgt 4501 acgacaaaaa gatcgcaggg tacggcggac tgcccctcgg caccaacggc aggggcatgg 4561 tgctgctgtc cggcggcatc gattctccgg tggcgacatt tatgatggct caccgcggca 4621 tgtacatgga cgctgtccat ttccattcct atccgtacac ctcc // LOCUS sequence036 4660 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence036 VERSION sequence036 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4660 /mol_type="genomic DNA" /organism="" /note="sequence036" CDS complement(91..1299) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNFSKAELKYLKLLAEEYGTVSAASAEIINLTAIQNLPKGTEHFL SDIHGEYESFNHILRNASGTIKLKIDETFTDMTPEERRSLATLIYYPEEKLEIIKEKLD GDYHDFYFETLTRLIKLLELVTFKYTRSYVRRRLDKEYAYIIEELLYGSNSVALGRGDH RKNIIESIIEVDAADDFIISICKLISKLSIFKLHILGDVYDRGPGGDVVLDTLKNYHSV DIQWGNHDILWMGAAAGNKACIANVIRICTRYDNLHTLEVGYGISLRPLVTFAMNTYGN DPCPNFKAVASTKDAMYDADLASLSKISKAIAIMQFKLEGQLIEKHPYYEMDALRLLDK VDYEKYTVTIDGKEYPMNNTFFPTIDPADPYKLSDEEEAVMDRLQRAFLESELPIGTHF SQQ" /locus_tag="LOCUS_1750" /note="WP_010964880.1 fructose-1,6-bisphosphatase (Clostridium) [pid:51.2%, q_cov:95.5%, s_cov:57.6%, Eval:9.4e-109, partial hit]" /note="MGA_225" CDS 1425..2666 /product="3-phosphoshikimate 1-carboxyvinyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011249218.1" /transl_table=11 /codon_start=1 /translation="MIRIYPSQFKGHIKAPASKAHAQRLLFASALTNTATLIKNVPECD DIDTTLQCLLDFGCTVEKHGETEIKIFPFVKTNPVPSAEFDFKQSGTTAHLAIPLAAAF GIRSDCRASGTLVKRPLISLSSRMALRGVKFSSFNLPLSMSGMLQPGEYVFPGDEGSQY ISGALMALPILRDDSIIRLSSPLVDGTFIDVTLDTMEAFGVHVDVDEEGFHIPGRQFYK SPGKTVVENDWGLGSMWACAGCLSRDEENPVIVDGLPARTVQMYRSFKNVMSLLRYDVK YLNVDASETPNLACLYAIIAASKGSGMDITGVPQLRFKETNRLKAVSECIRALGATAHA TDDGIHIEERDAFDYPEDVKLECKGDPWIFMSLALAAGCLPKPIVLDDEHCAEKVYRHF LRDYKALGGKYEIL" /locus_tag="LOCUS_1760" /gene="aroA" /EC_number="2.5.1.19" /note="WP_011249218.1 3-phosphoshikimate 1-carboxyvinyltransferase (Thermococcus kodakarensis) [pid:27.6%, q_cov:96.6%, s_cov:97.7%, Eval:1.0e-28]" /note="MGA_226" CDS 2834..3373 /product="bifunctional pyr operon transcriptional regulator/uracil phosphoribosyltransferase PyrR" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010887753.1" /transl_table=11 /codon_start=1 /translation="MEFKATLMSEEDMRRALKRMAHQIIEKNEGCGGLVLLGIKTRGLP LAKQLAAFIREIEGAEVPVGELDITHYRDDLSEIAKDPVLSEAPSDVEVDKKVVVLVDD VIYTGRTARAALDAVSALGRASRIQLAVLVDRGHRELPIRPDYVGKNVPTAKSEVVSVF MQETDGRTGVDLYENR" /locus_tag="LOCUS_1770" /gene="pyrR" /EC_number="2.4.2.9" /note="WP_010887753.1 bifunctional pyr operon transcriptional regulator/uracil phosphoribosyltransferase PyrR (Deinococcus radiodurans) [pid:60.3%, q_cov:97.2%, s_cov:95.1%, Eval:1.3e-54]" /note="MGA_227" ORIGIN 1 gagtccagct atgtccgatc gatggagagc cgttatgccg acatcagttc ttacccttgc 61 gaacaggctt tgcggggttg gctctattca ctattgctgg ctgaagtgtg tcccgatagg 121 tagttcgctc tccaggaagg ctcgctgcag acggtccatg accgcctctt cttcgtccga 181 cagcttgtag ggatcggctg gatcgatggt cgggaagaag gtgttgttca tcggatattc 241 cttgccgtcg atggtgacgg tgtacttttc gtaatccacc ttatccagca gacgcagagc 301 gtccatctca tagtacggat gcttttcgat cagttgtccc tcgagcttga actgcatgat 361 ggcgatcgcc ttcgagatct tggacagcga cgcgaggtcc gcatcgtaca tggcgtcctt 421 cgtggaggcc acggccttga agttcgggca gggatcgttg ccgtaggtgt tcatggcgaa 481 cgtgaccagc ggccgcagcg agatgccgta gccgacttcc agcgtatgca ggttgtcgta 541 ccgcgtgcag atacggatga cgttggcgat gcaggccttg ttgcccgctg ccgcacccat 601 ccagaggata tcgtggttgc cccactggat atccacgctg tggtagttct ttaacgtatc 661 cagcaccaca tccccgcccg gacctctgtc gtacacgtcg cccaggatgt ggagtttaaa 721 gatggaaagt ttcgagatga gcttgcagat gctgatgata aagtcgtccg cggcgtccac 781 ctcgatgatg gactcgatga tgttcttgcg gtggtcaccc cggcccaggg ccacgctgtt 841 tgacccatac agcagctcct cgatgatgta ggcgtattcc ttgtcgaggc ggcgcctcac 901 gtaggaacgg gtgtatttaa aggtgaccag ttccagcaat ttgatgagcc tggtgagggt 961 ctcgaagtaa aaatcgtgat aatcgccgtc cagtttctcc ttgatgatct ccagtttctc 1021 ttccggatag tagatcaaag tcgccagaga acggcgttct tccggcgtca tgtccgtaaa 1081 ggtctcgtcg atcttcagtt ttatggttcc ggaagcgttg cgcaggatgt gattgaaaga 1141 ttcgtattct ccgtggatat cggaaaggaa gtgctcggtg cctttcggca gattctggat 1201 ggcggtaagg ttgatgatct cggcagaagc ggcggaaacg gtgccgtatt cctctgccag 1261 aagctttaaa tacttcagct cagcctttga aaaattcata ttgtcctccg cagcccgtaa 1321 cgagggctat atacatagtt agtataccat accccgctgg ggcagttgca cctttttctg 1381 agtcgctttt tgtgctatac tatttcagtt gaaaggcaga aaacatgatc cgcatttatc 1441 cgtctcagtt caaagggcat atcaaagcac cggcctccaa agcgcacgcg cagaggcttt 1501 tgtttgcgtc tgcccttacg aacacggcga cgctcatcaa gaacgtgccg gaatgcgacg 1561 atatcgatac gacgctgcag tgcctgctgg atttcggctg cacggtggag aagcacggcg 1621 aaacggagat caagatcttc cccttcgtca agacgaaccc ggtgccgtcc gcggaattcg 1681 attttaagca gagcggcacg actgcccatc tggcgatccc tctggcggca gccttcggca 1741 tccgttccga ctgcagagcg agcggcacgc tggtcaagcg tcccctcatc tccctctcga 1801 gccgcatggc gctgcgggga gtcaagttca gcagttttaa tctgcccctc tccatgagcg 1861 gcatgctgca gcccggcgaa tacgtattcc ccggggacga aggatcgcag tacatctccg 1921 gcgccctgat ggcactgccc atcctgcggg acgacagcat catccgcctg tcttctcccc 1981 tcgtggacgg cacgttcatc gacgttacgc tggatacgat ggaagcgttc ggcgttcatg 2041 tcgacgtgga cgaagagggt ttccacatcc cgggaagaca gttctacaag agcccgggca 2101 agaccgtcgt agaaaacgac tggggcctcg gttccatgtg ggcctgcgcg ggatgcctct 2161 ccagagacga ggagaatccc gtcatcgtgg acgggctgcc tgcccggacg gtccagatgt 2221 accgcagctt taagaacgtc atgtcgctgc tgcgctacga cgtaaaatat ctcaacgtcg 2281 acgcgtcgga gactcccaat ctggcctgtc tgtacgccat catcgcggcg agcaaagggt 2341 ccggcatgga catcaccggc gtgccccagc tgcgctttaa ggagacgaac cggctgaagg 2401 cggtcagcga atgcatccgc gccctgggtg ccacagccca tgcgacggac gacggcatcc 2461 acatcgagga aagggatgcg ttcgactatc ccgaagacgt aaaactggag tgcaaaggtg 2521 acccctggat cttcatgtcg ctcgcgttag ccgccggatg ccttcccaag cccatcgtgc 2581 tggacgacga gcactgcgcc gaaaaagtct accgccactt cctgcgcgac tataaagcgc 2641 tgggcgggaa atacgagatt ctgtaattga caaccccctt tccagggggt tatatttatg 2701 tcagcaaaag tattctttaa gttggtacag agagaccgac aagatcaata tcgatgcacc 2761 tgtttttctg tgtgcgttaa gcgatctcgt cttgccggtc ggcaaggcat tttttatgcc 2821 ggaaagaagc gccatggaat ttaaagcgac cctcatgagc gaagaagata tgcgccgtgc 2881 cctcaaacgc atggcgcatc agatcatcga aaagaatgaa ggctgcggcg gcctggtgct 2941 tctcggcatc aagacccgcg gactgcctct cgcaaaacag cttgccgcct tcatccggga 3001 gatcgaaggc gccgaagtgc ctgtcggaga actcgacatc acccactacc gcgacgacct 3061 gagcgagatc gcgaaagatc ccgtgctcag cgaagcgcct tccgacgtgg aagtcgacaa 3121 gaaggtcgtg gtgctcgtgg acgacgtcat ctacaccgga cgcacggcaa gggctgccct 3181 ggacgcggtc tcagccctcg gcagagcatc ccgcatccag ctggccgtac tggtggacag 3241 gggtcaccgg gagctgccga tccgccccga ctacgtcggg aaaaatgtgc ctaccgccaa 3301 aagcgaagtc gtttccgtct ttatgcagga gacggacgga cgcacaggag tcgatctgta 3361 cgaaaatcgg taaaaggaga gcattatgaa caaccagaac ggcgctatct acaacgccag 3421 agaactggga ccgggcaaat accttgtcct gggtctgcag cacatgttcg ccatgttcgg 3481 cgcaacggtg ctcgtgcccc tcatcacagg gctgagcgtt acggcaaccc tgctgtttgc 3541 aggtcttgcc accttattct gccactttgt cacgaagggc aaggtccccg tattcctggg 3601 gtcatccttc gcctatctgg gcggctatgc agcggtcgtg accgcaggaa gcgctatcgg 3661 gctttcccag agagaagcgc tgccctacgc ctgcgtcggc gtcgcctgtg caggcctgct 3721 gtacctggtg cttgccggga tctgcaaagc atatggttcc aagaaagtca tgcggttctt 3781 cccgcctgtc gtcaccggcc ccatcatcat cgccatcggc ctcaacctgg cgccttctgc 3841 gatcaataac tgctctgcga actggcccat cgcgctggtc gccatcgccg tggtcatcgt 3901 ctgcaacatc tggggcaagg gcatgatcaa gatcatcccc atcctgctgg gcgtcatcgc 3961 ctcctatgcg gttgcggccg ttaccggcaa cgtggactgg accatggtaa aggaagccag 4021 catcatcggc atgccgttcg agatgcagga caccgtattc ggcctgttcg gcggaagcgt 4081 agacacgtcc ttcctgctct cctccatcat caccatcgtc cccatcgcgt tcgcgaccat 4141 gatggaacac gtcggcgata tctccgccat cggcggaacc gtcggccaga atttcatcga 4201 agatccgggt ctgcaccgca ccctgctggg tgacggcgtc ggtaccacca tcgcggcgct 4261 gttcggcgct ccggccaaca ccacctacgg cgaaaatacc ggcgttctgg cgctcaccaa 4321 ggtctacgat ccgttcgtta tccgtctggc agccgtctac gccatcgtgc tctccttctt 4381 cccgaagttt gcggcactca tccgggtcat gcccgctgcc accatcggcg gcgtttccct 4441 catcctgtac ggcatgatct ccgccatcgg catccgcaac gtcgtcgaga acaagacgaa 4501 cttccaggag agcagaaacg tcatcatcgc ggctctcatc ctgggcctgg ccgtcggcat 4561 ctcctacagc gaagccggcg ccatccacat cggaagcgta tctctctccg gcatcgcggt 4621 agcgtccatc gtcggcatcg tgctcaacgc catcctgccc // LOCUS sequence037 4634 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence037 VERSION sequence037 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4634 /mol_type="genomic DNA" /organism="" /note="sequence037" CDS 1275..3101 /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005814508.1" /transl_table=11 /codon_start=1 /translation="MAPGPGGHGPVHFMTDEEKQQVPKVTKGLLLRIASYLKPYKFQFA LVFITILLSAAIGLLPSIITGRIVDQALVGKNLQLLVKLLIAAFATMALSQIIGVLESY INAWISSRIIFDMKNQMYAHLQSMPHSFFTTEKQGDIITRMNSDIDGVSSVISGTLTSV VSNIATVVTTVIALFAMSPRLAIVGIAIVPLLVIPTKKVGVTRFKLLTEARAKADEMNQ IVDETLSVSGSLLVKLFTKEEVEYERFVRINEEVTRYNIKEQRSGQWFRVMMGMFTQVG PLLIYFAGGYLIIAKGDPKLTVGTITATVALINRLYRPVQSLLNIQVDFTRSLALFTRI FDYFDKTNNIKDPLLGTAPDLSNPSVEFQHVAFSYTPDKPILTDINFFVPGGQMYAIVG RSGSGKSTVVNLIPRLYDVNGGHVKVAGQDVRSIKLKMLRQAIGMVSQESYLFNGTIRE NLLYAKPDATQEEIEAACRIANIHDMIAGLEKGYDTEVGNRGLKLSGGEKQRISLARVV LKDPKILILDEATSALDSISENAIQDALDKVMEGRTSIVIAHRLSTILSADKILVVDGG VIAESGSHEELLAKGGIYKELYETQFSKVLKE" /locus_tag="LOCUS_1780" /note="WP_005814508.1 ABC transporter ATP-binding protein (Desulfitobacterium hafniense) [pid:54.1%, q_cov:97.9%, s_cov:97.1%, Eval:2.0e-180]" /note="MGA_230" CDS complement(3204..4196) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNDLSCAVVRDLLPSYIDKLTSEETNEAVERHLEGCEDCRKVLA AMQGEGGPAAEENKAEAKEIDYLKKVRTGTWKRVIAGILAAAFVFGAGAWIKLYRIGSY VDPSAVNINCISQEHGIAIDGSLKDKSLGVTHADLLLREDGTKMELGFRAAKKGGKDND FFYAVGAEGAAGEAYRNIQEIWLGDRIVWYQGTLIDEQTAAVWNARHAYVGDMPANAAL ADALGIREKLGPYTNELQTSEKPYSWTITLENEKNYHDASLSYQLGYATILLATIDNLD SVTFAYSQEGVSSLTITTEMVTEQLPVGVKDLASDPAELQYWMGQFGLL" /locus_tag="LOCUS_1790" /note="WP_005809618.1 zf-HC2 domain-containing protein (Desulfitobacterium) [pid:32.8%, q_cov:37.9%, s_cov:59.9%, Eval:4.5e-10, partial hit]" /note="MGA_231" ORIGIN 1 gccgatcagg tccatctcct tcatcttttc gtactggtcc ggattcatga tctggcagtg 61 gatgatgccg tctctgccct tgccgcagcc cggattgttc tttctggcct tttcgatggc 121 ttccatcacc atgtccatgc ccttgtcgcc gatggcgtgg atcgcgatct ggcagttgtg 181 tttataggcg ttgtccacca ggaaatccag ttcgtcctgg gtcagcatcg cgacgccgca 241 gttcttgccg tcgccgtcct tgtacgggtc acgcataagg gccgtccggg cgcccagcgc 301 gccgtcgatc agcaccttgt acggtcccag cgtatatttt tcggtgttct gccagccggt 361 gccgtagccg ttggcaaaga agtcggcctg ccattcccgc acgggcaggt tgcactgctc 421 gtagacgcgg atcttcatct tgccttcctg gatgagttcg tcgtaagcct gcatcacctt 481 cttgtagttg cccggcacgt ccttaaagtc gtcggagtgg atctccacga tgccgcactt 541 taaggccttc tcctgggaca ggaggatgag ttccttcacc ccttccagcg tctcctcggg 601 gatcgcgttg agcacgcagg cccgggcgtt ctcgcggaag atgcccagcg gccgtccggt 661 ctcgtcccgg tcgatgacgc cgccttccac gtcgtccgcg tgttcgctca tgcccatgat 721 gttgagggca gcggtgttgc agacgatcac gtggccgcag gtgcgggtga acgccagagg 781 cacggtcgtc gagatcttgt ccaggtcatc gcgggtgata aaccgcttct cgtcggagaa 841 attgtcctgg ttccagccgc ggccccgcac ccagcgtccc tcggggatgt cgtgggtcgc 901 caggaagttg cgggaatatt cgatgagccc cgcaatggac gtacactcgt tatggttcat 961 gtcgcggagg atgaggcctt cggacaggtt atgcatatgg gtctcgaaaa aggcggggag 1021 tatggtcttg cccttcatat cttcggcttc gacagcgccg acggatccca ggatctcttc 1081 gttgctgccg accgccgtaa aatggccgtc ctccactacg aacgcctgcg cgtgcatggc 1141 gtctttttcc attgtgatca cgttagcgtt gtaataaact ttcttcatgc tgcctcctag 1201 ccaagtggcg aaatccaaaa ataaatacta taattatttt atagttgcag ctcaggtaaa 1261 tcaaggagga acctatggca ccaggaccgg gcgggcacgg acccgttcat tttatgacag 1321 acgaggaaaa gcagcaggtg ccgaaagtca cgaagggctt gctcctgcgc atcgcctcct 1381 atctcaaacc ctataaattt caattcgctt tggtgttcat caccatcctg ctctcggcgg 1441 ccatcggcct gctgccctcg atcatcacgg gacgcatcgt agaccaggcg ctggtgggca 1501 agaatctcca actgctcgta aaattactga tcgcggcctt cgccaccatg gcgctgtcgc 1561 agatcatcgg cgtgctggag agctacatca acgcgtggat cagttcccgc atcatcttcg 1621 acatgaagaa ccagatgtac gcccatctgc agagcatgcc ccattcgttt ttcacgacgg 1681 aaaagcaggg cgacatcatc acgcgcatga attccgatat cgacggggtg agcagcgtca 1741 tctccggcac gctcacgtcg gtggtcagca atatcgcgac ggtcgtgacc acggtcatcg 1801 ccctgttcgc catgagccct cgcctcgcca tcgtcggcat cgcgatcgtg cctcttttgg 1861 tcatccccac gaaaaaagtg ggcgtcacgc gctttaagct gctgacggaa gcccgggcaa 1921 aagccgacga gatgaaccag atcgtggacg agacgctgtc ggtctccggc tcgctgctcg 1981 taaagctgtt tacgaaggaa gaggtggaat acgagcgctt tgtgcggatc aacgaggaag 2041 tgacccgcta caacatcaag gaacagcgct ccggccagtg gttccgggtg atgatgggca 2101 tgttcaccca ggtcgggcct ctgctgatct acttcgccgg cggctatctg atcatcgcaa 2161 aaggtgatcc gaaactgacg gtaggcacca ttacggcgac ggtagccctc atcaaccggc 2221 tgtaccgccc ggtgcagagc ctgctgaaca tccaggtgga ctttacccgc tctctggcgc 2281 tgtttacgag gatcttcgac tacttcgaca agaccaacaa catcaaggat ccgctgctgg 2341 gaacggcgcc ggatctgtcg aacccgtccg tggaattcca gcatgtggca ttttcctata 2401 ccccggacaa gcctatcctg acggatatca acttcttcgt accgggcgga cagatgtacg 2461 cgatcgtcgg gcgctcgggc agcggcaagt ccacggtggt gaacctcatc ccccggctgt 2521 acgacgtgaa cggaggccac gtgaaggtgg ccggacagga cgtgcgcagc ataaagctga 2581 agatgctgcg gcaggccatc ggcatggtct cgcaggaaag ctacctgttt aacgggacga 2641 tccgggaaaa cctgctctat gcaaagcccg acgccaccca ggaagagatc gaagccgcct 2701 gcaggatcgc caacatccac gacatgatcg caggcctcga aaagggctac gacaccgaag 2761 tcggcaaccg gggcctaaag ctttccggcg gagaaaaaca aaggatctct ctggcacgcg 2821 tggtgctgaa agatcccaag atcctgatat tggacgaggc gacgtccgct ttggactcca 2881 tctctgaaaa cgccatccag gatgccctgg acaaggtgat ggaaggccgc acgtccatcg 2941 tcatcgccca ccggctctcc acgatcctgt ctgcggacaa gatcctcgtg gtggacggcg 3001 gcgtgatcgc agagtccggc agccacgaag agctgctggc caagggcggc atctataaag 3061 aactctacga gactcagttc tcgaaagtct taaaggaata gtcaagtaat gaagaaatga 3121 ccggggacgg ttctttatcc cacgggccct gagcttgtcg aagggaccgg gacagagaat 3181 cgtccccctt ccttttctgt tctttagagc aggccgaact gccccatcca gtactgcagt 3241 tccgcaggat cggatgcaag atcctttacg ccgacaggaa gctgctctgt taccatttcc 3301 gttgtgatag taagactgct caccccttcc tgcgaatagg cgaacgttac gctgtccaga 3361 ttatcgatcg tggcaagcag gatggtcgca taacccaact gataactgag agaagcatcg 3421 tgataatttt tttcattctc cagagtgatc gtccagctgt agggcttctc cgacgtctga 3481 agttcattgg tatagggccc cagtttttcc cggatgccca gcgcatcggc caacgcagca 3541 ttggcaggca tgtcgcctac gtaggcatgc cgcgcattcc agactgccgc tgtctgttcg 3601 tcgatcagcg tcccctgata ccagacgatg cggtcgccca gccagatctc ctgaatgttc 3661 cgataagctt cgcccgcagc gccttccgcg cctaccgcgt aaaagaagtc gttatccttg 3721 ccgcccttct tcgctgcgcg gaaccccagt tccatctttg tgccgtcttc ccgcagcaaa 3781 agatctgcgt gggtcacgcc caagctttta tccttcaaac tgccgtcgat cgcgatgcca 3841 tgttcctggg agatgcaatt gatgttgacc gcactcggat cgacgtagct gccgatccgg 3901 tatagcttga tccaggcgcc tgcaccgaac acgaatgccg cggccagaat ccccgcgatg 3961 acccgcttcc acgtgccggt gcggaccttc ttcagatagt cgatctcctt cgcttcggcc 4021 ttgttctcct ccgcagcggg tcccccttcc ccctgcatgg cggccagaac tttgcggcag 4081 tcctcgcagc cttccaggtg ccgctcgacc gcctcgttcg tctcttcgct cgtcagttta 4141 tcgatgtagc tcggcagcag atctcttacc accgcgcagc tcagatcatt cttcatcgtc 4201 tcttaccttc cccttcaatt tctcttttcc tctgtaaaac gtcactctcg cccagttctc 4261 gctctgcccc aggacgtcgc cgatctcctt gaacgacagg cctccgagga gacgcagata 4321 cagcacctcg cgggcaggct ccgggctctc atggatcgcc gcgtacagga ttcttttgcg 4381 ctctgccgcc agcgtttccg cttcgggtga aggagcagtc ccgccgcccg gctcgacgcc 4441 gctttccgcc agttcgtcca gactgtcctg cagcggatgc ttgcgccggt acgccatcag 4501 ctggttcttc gcgatggcgc acagccaggt cgataccttg cagctgccgt cgaaacgccc 4561 gatgctgccg accgcctgcg cgaacgtctc ctgggtcagt tcctcggaca ggtcttcgtc 4621 gcccgtgagc gagc // LOCUS sequence038 4629 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence038 VERSION sequence038 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4629 /mol_type="genomic DNA" /organism="" /note="sequence038" CDS 584..1765 /product="aldo/keto reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011020474.1" /transl_table=11 /codon_start=1 /translation="MQYRKDKNGNELSILGFGCMRFTKKGGKIDIDKAEKEVLAAFDAG VNYYDTAYVYGDSEATMGEIFERNQMRDKIKIATKLPQYLCRSKETVEKYFREELSRLR TDHVDYYLMHHMTDLAMWEKLKEIGILDWIAEKKASGAIRNIGFSYHGNTDNFLKILND YDWAICQIQYNYFDEVAQAGRIGLQAAAAKGIPVVIMEPLRGGKLVNQLPKEALKIFKD SGKSWSPAEWGLRWLYDQPEVTVVLSGMNSLEMVQENCRVASETSAGSLTQTEFDTLEK VCQAIRAKDKVGCTGCRYCMPCPQNVDIPGAFRCYNTMYIESKHEGRFQYAQTAGLVKP PAYASQCIGCGKCEQHCPQNIPIREKLKEADRALRPLPYKIGIEVARKFMFRK" /locus_tag="LOCUS_1800" /note="WP_011020474.1 aldo/keto reductase (Methanosarcina acetivorans) [pid:45.6%, q_cov:100.0%, s_cov:99.5%, Eval:3.4e-95]" /note="MGA_234" CDS complement(1813..3447) /product="long-chain fatty acid--CoA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005086603.1" /transl_table=11 /codon_start=1 /translation="MAITDLLERNSKLYGNEIALVELNPEIQEEPRVTWREYELIQPTT GSPYRREITWSVFDEKANRVANLLLSRGIRKGQKVAILLMNCLEWLPIYFGVLKTGAVA VPLNFRYTADEIDYCLKLADADVLFFGPEFIGRVEDIFPKIKSQMILFFVGDNRPSYAE SYAEAVSNCSSSSPIVLVEDTDDAAIYYSSGTTGFPKAILLDHTALMQSARMEAIHHET THDDIFLCIPPLYHTGAKMHWFGSLYTGSRAVILKGNSPKAILDAVSLERATIVWLLVP WAQDILAAFDRGDIKPEHYQLSQWRLMHIGAQPVPPSLIRHWLEYFPHHKYDTNYGLSE STGPGCVHLGLENVRKVGAIGVPGFGWKCKIVDENDKEVEQGTVGELCVQGPGVMKCYY HNPDATAEVLKDGWLHTGDMAKQDEEGFYFLVDRKKDVIISGGENLYPVQIEDFLAAHP KIHDVAVIGLPDKRLGEIAAAIIQVKQGMECTEEEIDRFCLELPRYKRPRKIIFADVPR NPTGKIEKPKLRQIYGGTNLVEQQNKA" /locus_tag="LOCUS_1810" /note="WP_005086603.1 long-chain fatty acid--CoA ligase (Mycobacteriaceae) [pid:36.2%, q_cov:88.6%, s_cov:93.0%, Eval:6.8e-71]" /note="MGA_235" CDS 3634..3948 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKNTKEDRSTALYEAVLDLRDADEARRFFEDLCSPTELRSMERR FDVARMLLQNKVYTEILEKTGTSSATISRVRRNIIDNGAGGAMKDLILRNGPADKEGHN " /locus_tag="LOCUS_1820" /note="WP_011393534.1 YerC/YecD family TrpR-related protein (Moorella thermoacetica) [pid:51.4%, q_cov:71.2%, s_cov:73.7%, Eval:1.7e-13, partial hit]" /note="MGA_236" ORIGIN 1 ctggtagctg ccgcccatca ggacgatctt gtcgatcttc tcgacgatgg cgggctccat 61 gcggatggcc atgcccaggt tcgtcatggg gccggtggtg accatggtga tcggctcttc 121 gctcgccatc agggtctcca cgatgtattg caccgcgtgc ttctcctgca gtttcagggt 181 gatctccggg aacgccggac cgtccaggcc ggtctctccg tgaatatcag cggcggtcat 241 cttctcgcgc accatgggcc ctttacagcc catatacacg gggatgtcgc ctctgccgat 301 ccactgcagc accttaagcg cgttgcggct cgtcttttcg atggtctgat tgccggattc 361 cgtcgtaatg cccagcagct cgatcttggg gctgcccgcc gccagcataa tggcgaccgc 421 gtcgtcgtga cccgggtcac agtctaaaat gatcttggta atttcgctca tgggataaac 481 tccttttcgg ttctaacgct actatcttac catattttat gcactgtagg ggacggttct 541 gtggtatatt ggcatagata gaaaactgtt taggagagac atcatgcagt acagaaaaga 601 caaaaacgga aacgaactct cgatcctcgg cttcggctgc atgcgcttta cgaaaaaggg 661 cggaaagatc gacatcgaca aggcggagaa agaggttctg gcagcgttcg atgccggggt 721 caactattac gataccgcct acgtctacgg cgacagcgaa gcgaccatgg gcgagatctt 781 tgagcgcaat cagatgcggg ataagatcaa gatcgccacg aagctgcccc agtatctgtg 841 ccgcagcaag gagaccgtcg agaagtattt ccgggaggaa ctgtcgcgcc tccgcacgga 901 ccacgtggac tattacctga tgcaccacat gacagacctg gccatgtggg aaaagctgaa 961 ggagatcggc atcctggact ggatcgccga gaaaaaggcc tccggggcga tccgcaacat 1021 cgggttctcc taccacggca acacggacaa tttcctgaag atcttaaacg actacgactg 1081 ggctatctgc cagatccagt acaactattt cgacgaagtg gcgcaggcag gccgcatcgg 1141 actgcaggct gcagcggcga aggggatccc cgtggtcatc atggaaccgc tgcggggcgg 1201 aaaactggtg aatcagcttc caaaagaggc cttgaagatc tttaaggaca gcggcaaaag 1261 ctggagcccc gccgaatggg gcctgcgctg gctgtacgac cagccggaag tgacggtggt 1321 gctctccggc atgaattcgc tggagatggt gcaggagaac tgccgggtgg catccgaaac 1381 gtccgcgggc tcgctcaccc agacagaatt cgatacgctc gaaaaggtct gccaggcgat 1441 ccgggccaag gacaaggtcg gctgcaccgg ctgccgctac tgcatgccct gcccgcagaa 1501 cgtggacatt cccggtgcgt tccgctgcta caacaccatg tacatcgagt cgaaacacga 1561 aggacgcttc cagtatgccc agaccgcagg actggtaaag cctcctgcct acgcatccca 1621 gtgcatcggc tgcggcaagt gcgagcagca ttgtccgcag aacattccga tccgcgagaa 1681 actaaaggaa gccgaccggg cgctccggcc gctgccctat aagatcggga tcgaagtagc 1741 gcgaaaattc atgttccgca aataggaacg caataaaaaa gcaggaagcc gaaacttcct 1801 gctttttcgt gcctatgcct tattctgctg ttcgaccaga ttggtgccgc cgtagatctg 1861 acggagcttg ggcttttcga tcttgcccgt cggatttctc ggaacatccg caaagatgat 1921 cttccgggga cgcttgtacc ggggcagctc caggcagaag cggtcgatct cctcttccgt 1981 gcactccatg ccctgcttta cctggatgat agccgctgcg atctcgccca gacgcttgtc 2041 gggcaggccg atgaccgcca catcgtggat cttcgggtgc gccgccagga agtcctcgat 2101 ctgcacggga tacaggtttt caccaccgga gatgatgacg tccttcttgc ggtcaaccag 2161 gaaatagaag ccctcttcgt cctgcttcgc catgtcgccc gtgtgcagcc aaccgtcctt 2221 gaggacctcc gccgtcgcgt ccgggttgtg ataatagcac ttcatgacgc cggggccctg 2281 cacgcacagt tcgcccacgg tgccctgctc cacttctttg tcgttttcat ccacgatctt 2341 gcacttccag ccgaagcccg gcacgccgat ggcgccaacc ttgcggacgt tctccagtcc 2401 caggtgcacg cagcccggac ccgtggattc ggacagaccg tagttcgtat cgtatttatg 2461 atgggggaaa tactccagcc aatggcggat gagcgaaggc ggcacaggct gcgcgccgat 2521 gtgcatcagg cgccactggg agagctgata atgctccggt ttgatgtcgc cgcggtcgaa 2581 tgccgctaga atgtcctggg cccagggcac cagcagccag acgatggtcg cccgttccag 2641 ggacaccgca tccaggattg ccttggggct gttgcccttc aggataacag cacgagagcc 2701 ggtgtagagt gacccgaacc agtgcatctt cgccccggta tggtacagcg gcggaatgca 2761 cagaaagata tcgtcgtggg tggtctcgtg atggatcgcc tccatgcggg cggactgcat 2821 cagcgccgtg tggtcgagca ggatggcctt cgggaagccc gtcgtgccgg aggaatagta 2881 gatggctgcg tcgtccgtat cttcgaccag aacgatcggc gaggaggacg agcagttgga 2941 caccgcttcc gcatagcttt ccgcatagga cggacggttg tcgccgacga agaacaggat 3001 catctgggac ttgatcttcg ggaagatgtc ctccacacgg ccgatgaatt cgggaccaaa 3061 gaacagcacg tccgcatccg ccagctttaa gcagtaatcg atctcgtcgg ccgtatagcg 3121 gaagttgagc ggcacagcca cggcgccggt cttgaggacg ccgaagtaga tcggcagcca 3181 ctccaggcag ttcatcagca ggatcgcgac tttctgaccc ttgcggatac ctctcgagag 3241 cagcaggttt gccacccggt ttgccttttc gtcgaacacg ctccaggtga tctccctgcg 3301 gtagggagaa ccggtcgtgg gttgtatcag ttcatattca cgccaggtga cccggggttc 3361 ttcctggatc tccggattga gctccaccag tgcgatctcg tttccgtaca gtttgctgtt 3421 gcgttccagc aggtctgtga tggccataga aaagtctcct tttataagtc aaattgataa 3481 cacaaaaact ttaatacttt tatccgttaa agtcaagcat gaaaaaatct cgttctttta 3541 tgtgttaaag tcctttactt tcacaggtta aagggttaaa atagcttgta tattccctcg 3601 acccgacaga tcaagagaag gaaggttgaa aaaatggcga aaaacaccaa agaagaccgg 3661 agcaccgccc tttatgaagc ggtcctggac ttaagagatg cggatgaagc cagacgattt 3721 tttgaggatc tctgttcccc cacggaactg cgcagcatgg agcggcgttt cgacgttgcc 3781 cggatgctgc tgcagaacaa ggtgtacacg gagatcctgg agaagaccgg caccagcagc 3841 gcgaccatca gccgcgtgcg ccgcaacatc atcgacaacg gagccggagg cgccatgaag 3901 gatctcatcc tgcgcaacgg cccggcagat aaggaaggac acaattaaaa tgaaacagtt 3961 aatgcttggc aatgcagccg ctgcccgggg cctctgggaa gccggcgtgt gcgtggtgtc 4021 ttcataccca ggcacgccca gcaccgagat caccgaggaa gcggcgaagt acgatgagat 4081 ctacgccgaa tgggcgccca acgaaaaggt cgccatggag accgcgttcg gcgcatccct 4141 ggcaggcaag cgcagtttct gcggcatgaa gcacgtcggc ctcaacgtag cggcagatcc 4201 cctgttcacc tgcagctata ccggggtcaa cgccggcatg gtgatcgccg tcgccgacga 4261 cgccgggatg cacagctccc agaacgagca ggattcccgc cactatgcgc gctccgcgaa 4321 gatccctatg ctggagcctg cggattctgc agaagccctg gcctttgcga agaaagccta 4381 cgagctgtcc gaacagttcg acacgcccgt cttcttaaag atgtgcaccc gcatcgccca 4441 ctcccagtcc atcgtggaga ccggcgagcg cgtggaggct cccgcaaagc cctatcagaa 4501 aaacatcgcg aagtacgtca tgaccccggc caacgccatc aagcgccacc ccatcgtgga 4561 ggagcgcacg aaaaagctgg cggaattcgc ggagacctcg gacctcaacc gcatcgaaga 4621 cggcgcgga // LOCUS sequence039 4592 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence039 VERSION sequence039 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4592 /mol_type="genomic DNA" /organism="" /note="sequence039" misc_feature <1..3444 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003427073.1:pyruvate:ferredoxin (flavodoxin) oxidoreductase" /note="WP_003427073.1 pyruvate:ferredoxin (flavodoxin) oxidoreductase (Clostridioides difficile) [pid:64.5%, q_cov:99.6%, s_cov:97.5%, Eval:0.0e+00]" /note="MGA_238" /locus_tag="LOCUS_1830" CDS 3893..4183 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTLEWFKNPDHVVYVEKEKFVDNFAKETGIPNLRKEIDEFEERPT AEGKIVKGTRRTSLRPLVPNLMFGGDMDMGDNVWIYLGEYYPAYCIYEDQD" /locus_tag="LOCUS_1840" /note="MGA_239" ORIGIN 1 attttcccca tcactccgtc ctccccgatg gctgagatcg tggacgacat ggcagcgcat 61 ggagaaaaga acctgttcgg ccaggaagtc cgcgtagtcg agatgcagtc cgaaggcggc 121 gcatccggca ccgttcacgg ctccctcgca gccggcgctc tcaccaccac ctataccgca 181 tcccagggcc tgctcctcat gatccccaac atgtacaaga tcgcaggcga actcctgccc 241 ggcgtattcc acgttacggc aagaaccctg gctgctcacg cactgtgcat cttcggcgat 301 cactccgacg tcatggcctg ccgccagacc ggtttcgccc tgctgtgctc ctcctccgtt 361 caggaagtca tggacctggc agcgatcgca cacctgtccg ccatcgaagg cagagtacct 421 ttcctgcact tcttcgacgg tttcagaacc tctcacgaaa ttcagaagat cgaagttgtc 481 gattacgacg tctatcgcaa gctgatcgac atggatgctg ttcaggcctt cagagacaga 541 gcgctcaacc ccgaacatcc ctgcatccgc ggcaccgctc agaacccgga tatcttcttc 601 caggccagag aagctgccaa taagtactac gaagcactgc ccgacatcgt tgccgattac 661 atgaagaagc tcggcaagga gatcggcaga aagtatcagc ccttcgacta tgtcggcgct 721 cccgatgccg aaaacgtcat cgtcgccatg ggctccgtct gcgaagcgat cgaagagacc 781 ctgccgcatc tgctggctaa gggcgaaaag gtcggtctca tcaaggtcag actgtacaga 841 ccctggtctc cgaagtacct caagaaggtc atgccgaaga ccgtcaagag aatcgccgtt 901 ctcgaccgga ccaaggaacc cggcgctatg ggcgatcctc tctacatgga cctcaagacc 961 atgtactaca ccgaagagaa cgcacccgag atctacggcg gccgctatgg cttaggctcc 1021 aaggacacca cgccgggaca gatcgttgcg gtctacaata acctgaaggc taagaagccc 1081 aagaacaact tcaccatcgg catcgaagac gacgtctacg gcacttccct caagcccgtc 1141 aagatcgcta ccgaacccga aggcacctac cgctgcaagt tctggggtct gggttccgac 1201 ggtaccgtcg gcgccaacaa gcaggccatc aagatcatcg gcgacaacac cgatatgtat 1261 gcacagggct acttctccta cgactccaag aagtccggcg gcattactgt ttcccacctg 1321 agattcggta agaaccccat caagtccacc tacctcatca ccgaagcaga cttcgtcgct 1381 tgccacaacg aatcctacgt tcacgcatac gatgttctgg ccggtctgaa gaagggcggc 1441 actttcctgc tcaactgcac ctgggacgat gcggctctcg aagagcatct gcccgctgcc 1501 atgaagcagt acatcgccaa gaacaagatc aagttctaca ccatcgatgc gaccgacctg 1561 ggcgtcaaga tcggcctcgg caaccgcatc aacatgatca tgcagtccgc gttcttcgcg 1621 ctcaccaagg tcatccccgt ggaagatgct gaaaagtatc tgaagaagtc catcgagaag 1681 acctacggca agaagggcga aaacgtagtc aagatgaact gggctgccgt ggatgccggc 1741 ctcaccggat tccacgaagt caaggtaccc gctgcctgga aggatgccgt tgacgctccc 1801 gccaaggcca agaaggtccc cgaattcatc gaaaacgtac tcgtacccat gaaccgtcag 1861 gaaggcgaca agctgcccgt ttccaccttc gtggacatcg cagacggcac cttccccagc 1921 ggcaccgctg cttacgagaa gcgcggcgta gccgtcaagg tacccatgtg gcatcctgaa 1981 aactgcatcc agtgcaacca gtgctccttc gtctgcccgc acgcaacgat ccgtccgatc 2041 ctgctcaccg aggaagagaa ggcaaaggct cccgcaagct tcgcgaccat ccccgcgatg 2101 ggcaaggaag cggccggcat ggcttacaga atgcaggtat ccccgctcga ctgcctcggc 2161 tgcggcaact gcgccgacat ctgcccgggc aagaagggcg caaaggctct caccatggaa 2221 agctttgctt ctcaggaagc ggaagctgcc aactgggagt tcggtatgga gatcggcgaa 2281 aagcccgtta tggacaaggg ttccgtcaag ggttcccagt tcgcattccc gtacttcgag 2341 ttctccggcg cctgcgcagg ctgcggcgag actccgtaca tcaaggtcgt tacccagctg 2401 ttcggtgacc gcatgatgat cgctaacgcg accggctgct cctccatctg gggcgcatcc 2461 gcaccttcca tgccttacac caccgacaag aacggcagag gtccgtcctg ggcgaactcc 2521 ctgttcgaag acaacgctga attcggtctc ggtatggcta ccgctgttcg ccagaacaga 2581 gaaaaggtaa aggatatcgt ctgcgaactc gcagagacca ccaagagcgc agagatcaag 2641 gaagctgcaa aggcttgggt cgaaggcatg gacgaaggtt ccacctccag agaacagtcc 2701 gaagccctga tggctgcggt caataaggcg aagctgtccg gcagagctgc cgaactcaag 2761 gcagaactca aggcgaagga agacttcctc gtcaagaaga gcgtctggtg cctgggcggc 2821 gacggctggt cctacgacat cggttacggc ggactggacc acgttctcgc ttccggcgaa 2881 gacatcaacg tgctcgtctt cgataccgaa gtttactcca acaccggcgg tcagtcctcc 2941 aaggcgactc cggctgctgc gatcgcaaag ttcgctgcaa gcggcaagaa gaccaagaag 3001 aaggatctgg gcatgatggc agccagctac ggctacgtct acgttgcaca ggtcgccatg 3061 ggcgccgaca agaaccagtt cctgaaggcg atcaaggaag ccgaaagcta ccatggtccg 3121 tccctcatca tctgctacgc tccctgcatc aaccacggcc tcaagaaggg catgggcaag 3181 actcaggaga acgagaagct ggcagtcgaa tgcggttatt ggcagctgta ccggttcaac 3241 cccgagctca aggcaaaggg cgagaacccc ttcgttctgg attccaagga tccgaccggt 3301 tccttccgcg acttcatcat ggatcaggtc cgctatgcgt ccctggccaa ggaattcccg 3361 gacaaggcag aagctctgta cgaaaaggca gagaacgacg ccaaggaaag actggaaggc 3421 tacaaggtca gagccggcaa ataatcggtt gacccgaata taaaggcata acagaactcc 3481 cggagcggca tgctccggga gtttttttgt tctctacatc ttgcgtattt ccggctgagg 3541 tgatacactt tatctacaag ttgatagatt ctatgttccg cagcaatgcg gcgaagaggg 3601 aaaccggttc aagtccggtg cggtcccgcc gctgtaagcg aagagcgacg gcaaaagcca 3661 ttgggaaacc gagaaggcgc cgaagcgacg atgcgcaagc caggagacct gcatagaaag 3721 aaaaagcacc cgacgcggaa atcggaagag ctttacaagc gcagtaaata cgggctgtgg 3781 aattttttcc acagcctttt cgtttgcttt ccatccgcag gggtttcagc caaggatcca 3841 gacttgtctg aaacccctgc tccttcataa atagagcaaa aaggaggatc ttatgacact 3901 ggaatggttt aaaaatcccg atcacgtggt atatgtcgaa aaggaaaagt tcgtggacaa 3961 cttcgcgaag gagaccggca ttcccaatct ccgcaaggag atcgacgaat ttgaggaacg 4021 tccgaccgca gaaggcaaga tcgtaaaagg cacgcgccgc acatcgctgc gcccgctggt 4081 ccccaacctg atgttcggcg gcgacatgga tatgggcgac aatgtctgga tctatctcgg 4141 cgagtattat cccgcctact gcatctacga agatcaggac tgacgcgtca acaacacgaa 4201 aaaacggagc ttcggctccg ttttttgttt ctctattctt ctctgagcag cgccagccct 4261 ctggccagct tggaacggtc ttccggcacc aggtgatatt tctcctggag gcggtcaccc 4321 agggactgga tatccttcgg atcgcctgcg tacagttcga tctccagttc catgatgggg 4381 atctccccct tgtcggtgat gatgctgccc gtgtcgatgg ccagctccat gatgctgccg 4441 ccgtaggtga gccggcagcg gctgcgcagg tagcgcatct ccagcaggtt gatgagaggg 4501 tcatccccga tgagatccag cagcactttg ccgtcctcgc tctccttaaa cagttctttg 4561 ggagaactga tgaagtgttc catggaggcg gg // LOCUS sequence040 4555 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence040 VERSION sequence040 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4555 /mol_type="genomic DNA" /organism="" /note="sequence040" CDS complement(908..2374) /product="TrkH family potassium uptake protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012870209.1" /transl_table=11 /codon_start=1 /translation="MILNQKLIAKVLSAVASVVGAAMLLPAAVSAVYKEWDVFRAFLLC ALPVLAAGLIVMRITPSQRSEDLRMRDGFFIVGVSWLVMSLVGAIPFMLTGAIPNFADA YFETASGFTTTGSTILSEIEHLPKGILFWRSFTHWLGGMGVLVLTIAILPKLGIGGQKI MRAETTGPTMDKISFTVNDTARTLYMIYLVFTVLETVLLCLGGMSLFDSLVHTFGTVGT GGYSSYNASIGAFHSGYFEWVIGIFMMLCGVNFSLYSNVYRRTPGKIFRDPEFRVYLGI MGGATLFITCMLMAHRYYNGLADTLRTAFFQVSSIMTTTGYGTVDFDLWPLPCRFVLFL LMLIGGCAGSTGGGMKVIRIILTLKLVKRGIFRKLHPNAVSPIKVGDTIMSAETMSGVA GFVMLYLFTTLISTLVLCLEKVSLVTALSSVVACLSNIGPGFEAVGATQNFGFYSAPAK MLLSLLMIAGRLELFTVILLFTPAFWNKKK" /locus_tag="LOCUS_1850" /note="WP_012870209.1 TrkH family potassium uptake protein (Thermanaerovibrio acidaminovorans) [pid:47.6%, q_cov:86.1%, s_cov:87.0%, Eval:6.0e-116]" /note="MGA_242" CDS complement(2381..3766) /product="Trk system potassium transporter TrkA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459869.1" /transl_table=11 /codon_start=1 /translation="MGGLVPPSHFKGKSMKVAIVGAGKLGLAITEALLGGGNEITLIDK DESLIQKVSGRYDILTVAANAKRVDIMKELKIWTYDLLIAATDQDDRNIVICSFAKELG CPQTIARVRSPEHVEQLDFIMKTQRIDHIVNPDLACAQEIYKYLTEKYTLKDGQFLADG VTILEFKIDKIPALVDIQVRDLPGVLQNILIAAVSRNGKIIVPNGNTKLLAGDTLYVIG QEKQIKDISEKVHEKKVYTDLSRVMIAGGGKTGYFLAKKLSEFGAAVKIIEVDRERCEW LSAKLNGVLVLHGDATDTNLLRDENMDDMDAFVAATGFDEENLLLSLTAKQHNIEEVVA KVSRKNYASLTETLGVSMIINPVDMCAANILRFIQRDGTVIFSQLIQGQAEFIEVWAER GMPLTEKTLLDLDIPEGVIIAAIHRGDDVIIPSGRTKVQVGDRVIILSLLSSVPRLEGL LKH" /locus_tag="LOCUS_1860" /gene="trkA" /note="WP_011459869.1 Trk system potassium transporter TrkA (Desulfitobacterium hafniense) [pid:33.4%, q_cov:97.0%, s_cov:98.9%, Eval:1.2e-65]" /note="MGA_243" CDS complement(3771..4430) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MARQKESLEMYLTEEQIEYIKSLPEEERQQATEDLLGIKRFANGA VDLTTVPGKKGDFFRKKQRIFNPERVRDEEGLFEKVYSDDNYFEATCPFCGTTAEHQGK RYHYSKKTKMLIGRDAALMAVVAILVMLRVLNVILALVAITLITMDLANHARRKMFYTV TCRKCGAHFPLDQDEYDKLVEDLKAQAEAEAAEAEQEDEPEEEEAEETAETEVTEE" /locus_tag="LOCUS_1870" /note="MGA_244" ORIGIN 1 gcttctccgg ccgttgcata cgttctcgta acgtacagat ccgctgcgat cagcagtatg 61 gcgcctgccg cgatccccag gtaggccttc agctccgtat tgcgtcgtat ggtgtcttta 121 tcgcgcttga tgatcgcaaa atagacggcg aagctgacgc aggagatgag catgaacagc 181 gccatgacgc cttccgcgaa gggcgtggta aggtgaagca gcccctgagt cctgtgattc 241 atgccgccgg aagcggaggt cccgaagctc agcaggatgg aatcgaagga agaaaggccg 301 ctcagcttta gcaggaccgc ctgcagcagg gtcatgccga tgtagatcgc atagatcgcc 361 cgggacgtgt tcttgcggtt gaaaaagatg ttgtcggtgt tgacgccggt gctctcgctc 421 ttgatgagag agccctggtt ctcaaaggtc gcaggcagca gcgtctgcat taagaccagg 481 atgccgatgc cgccgatcca ctgggcaaaa gagcgccaca gcaggaaggc ccggggcaga 541 tcgccgatct ttaagaagac cgtggcgccc gtcgtcgtaa aggccgacac ggattcaaag 601 aacgccgaga agggggaatg cagcagcccc gcgataaggt aaggcagggc tccgatgatg 661 gatacgcaga tccacgacag cgacgtgagc agcaggctgt ccttgagggt gatccagttg 721 ccggcgtcct tataagtgag agaaaggctg gcgccgatgg cgagggcgaa ggccgcgggc 781 acgaggaacg ccaggatcgc gtcggtctga ttcgtatagg cagcgtaaag caggggcacg 841 atgagggcgg ccccggtaaa ggtcagcagg tgacccaatg tcttcgcgat gcttctcaga 901 tggatgatca tttcttctta ttccagaacg cgggggtaaa cagcaggata acggtaaaca 961 gctccagtct gccggcgatc atcagcaggg agagcagcat tttcgccggc gcggagtaga 1021 agccgaaatt ctgcgtggcg ccgacggctt cgaaacccgg tcctatgttg gacaggcagg 1081 cgacgacgct gctgagcgcc gttacgaggc tgactttttc cagacacagc accagggtgg 1141 agatcagcgt ggtgaacagg tacagcatga cgaagcccgc gacgcccgac atggtctccg 1201 cggacatgat ggtgtcgccc accttgatcg gggataccgc gttgggatgc agcttgcgga 1261 agatgccgcg ctttacgagc ttgagcgtaa ggatgatgcg aatgaccttc atgccgccgc 1321 cggtggagcc tgcgcagccg ccgatgagca tcagcaggaa cagcacgaag cggcagggga 1381 gcggccagag gtcgaagtcc acggtgccgt agccggtggt cgtcatgatg gagctcacct 1441 ggaagaacgc ggtccgcagc gtatccgcca ggccgttata gtaccggtgg gccatcagca 1501 tgcaggtgat gaacagcgtg gcgccgccca tgatgcccag gtagacgcga aattccggat 1561 cgcggaagat cttaccgggc gttctgcggt agacgttgct gtacagactg aagtttacgc 1621 cgcacagcat catgaagatg ccgatgaccc attcaaagta gccgctgtgg aaggctccga 1681 tgctggcgtt ataactggag tagccgccgg tgccgacggt gccgaacgtg tgcaccaggg 1741 aatcgaacag gctcatgccg cccaggcaga gcagaacggt ctccagcacc gtaaacacca 1801 ggtagatcat gtacagcgta cgggcggtat cgttgacggt aaagctgatc ttgtccatgg 1861 tcggaccggt ggtctcggcc cgcatgatct tctgcccgcc gatgcccagc ttcggcagga 1921 tggcgatggt gagcaccagc acgcccatgc cgcccagcca gtgggtgaaa gagcgccaga 1981 acaggatgcc tttgggcaga tgctcgatct cggacaggat ggtggatccc gtggtcgtaa 2041 agccggatgc tgtctcgaaa taggcgtccg cgaagttggg gatcgcaccg gtgagcataa 2101 agggaatggc gccgaccagc gacatcacca accagctgac gcccacgata aagaaaccat 2161 cgcgcatccg caggtcttcg gagcgttggc tcggcgtgat gcgcataacg ataagccctg 2221 ccgcaagcac cggcagagcg cagagcagaa acgcccggaa gacgtcccat tccttataaa 2281 cggcagacac cgcagcgggc aggagcatgg cggctcccac gaccgaggcc acggcgctga 2341 gtacttttgc gataagcttt tggtttaaga tcatggtgtc ttaatgcttc agcagtcctt 2401 ccagtctggg gacggaagag aggagcgaca ggatgatgac ccggtctccc acctgcacct 2461 tcgtgcggcc gctggggatg atgacgtcgt cgccccggtg gatcgccgcg atgatgacgc 2521 cctcgggaat gtccagatcc agcagcgtct tttccgtgag gggcatgccg cgctccgccc 2581 agacttcgat gaattccgcc tgaccctgga tgagctggga gaagatgacg gtgccgtctc 2641 tctggataaa gcgcaggatg ttggctgcgc acatgtctac ggggttgatg atcatggaga 2701 cgcccagggt ctccgtgagg gaggcgtagt tcttgcggct cacctttgcc acgacttcct 2761 cgatgttgtg ctgcttcgcc gtgagggaca gcagcaggtt ctcctcgtcg aagccggtcg 2821 ctgcgacgaa ggcgtccatg tcgtccatgt tttcgtcgcg cagcaggttc gtgtccgtag 2881 cgtcgccgtg gagcacgagc acgccgttga gcttggcgga cagccattcg cagcgttctc 2941 tgtccacttc gatgatcttg acggcagcgc cgaactccga gagcttcttt gccaggaaat 3001 aaccggtctt accgccccct gcgatcatga cgcgcgacag gtccgtgtag accttctttt 3061 cgtgcacctt ctcgctgata tccttgatct gcttttcttg accgatgacg tacagcgtgt 3121 cgccggccag cagtttcgtg ttgccgttgg gcacgatgat cttgccgttc cgggaaacgg 3181 cggcgatcag gatgttctgc agtacgccgg gcagatctct cacctggatg tcgacgaggg 3241 cggggatctt atcgatctta aactccagga tcgttacgcc gtccgcgagg aactggccgt 3301 ccttgagcgt atatttttcc gtaagatact tgtagatctc ctgggcgcag gcgaggtccg 3361 ggttgacgat gtgatcgatc cgctgggtct tcatgatgaa gtccagctgt tccacgtgtt 3421 ccggcgaacg cacccgcgcg atggtctgcg ggcatcccag ctccttcgca aagctgcaga 3481 tgacgatgtt gcggtcgtcc tgatccgtcg ctgcgatcag caggtcgtac gtccagatct 3541 tgagctcttt catgatatcc acccgcttgg cgtttgccgc cacggtgagg atatcgtacc 3601 gtccgctgac tttctggata aggctttcgt ccttgtcgat gagagtgatc tcgttgccgc 3661 cgccgagcag ggcttccgta atggcgagcc ccagtttgcc ggctcctacg atggctactt 3721 tcatgctttt ccccttaaaa tgcgagggcg gcacaaggcc gcccatatct ttactcttcg 3781 gtaacttctg tttctgcggt ttcttccgct tcctcttctt caggttcgtc ttcctgttcc 3841 gcttccgcag cttccgcttc ggcctgcgcc ttcagatctt cgacgagctt gtcgtattcg 3901 tcctggtcga gagggaagtg cgcaccgcac tttctgcagg tgacggtata gaacatcttc 3961 cggcgggcgt ggttcgcaag gtccatggtg atgagcgtga tcgctaccag cgccaggatg 4021 acgttgagca cccgcagcat gaccaggatg gcgacgaccg ccatcagagc ggcgtctctt 4081 ccgataagca tctttgtctt cttggagtag tgataccgct tgccctggtg ctctgccgtc 4141 gtgccgcaga agggacaggt cgcttcgaag tagttgtcgt cgctgtagac tttctcgaac 4201 agaccttctt cgtctcttac gcgttccggg ttgaagatgc gctgcttttt gcggaagaag 4261 tcgcctttct tgcccgggac cgtcgtcagg tccacggcgc cgttggcgaa acgcttgatg 4321 cccagcaggt cttccgtcgc ctgctggcgt tcctcttcgg gaagggattt gatatattcg 4381 atctgctctt ctgtgagata catctccaga gattcttttt gtcttgccat ctttgtcctc 4441 ctgaacaata ttccagaata ttatacatta taccataaaa gaaaggcgtt gtatcccttt 4501 ctgcggatag tttcctatgg tataatacat tattaacgtt tagaaagagg tagac // LOCUS sequence041 4493 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence041 VERSION sequence041 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4493 /mol_type="genomic DNA" /organism="" /note="sequence041" CDS 479..1564 /product="DNA-processing protein DprA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010943186.1" /transl_table=11 /codon_start=1 /translation="MKNLIYDVWLSTLPGVTSARKLELMRRFGSPAGVFQAPEAELKEM FSKNNILSTSEGGLHRLLQKDLRRAEWCLKQAKKTGAAVVSIRCASYPPQLKTIKDPPI VLFALGDVSLLQTRCIAVVGTRRASPYGKWAAAEIAKRVALAGVTVVSGMAEGIDSAAH TGCLKAGGKTIAVFGTGVDVCFPKSNLRLYEEIRENGLLLSEYTFGESGYAFNFPERNR IISGLSESCIVAEGAVKSGSLITAGLAAEQGRNVFALPGNINQPGSAGTNLLISEGVPP INSMEHLLQTLGLASLDVQQRTDLSDQEKRLMTHIASCGSSSKQFILDSCGLPFAESSP LLTCLELKGLVRMEGAQVYVL" /locus_tag="LOCUS_1880" /gene="dprA" /note="WP_010943186.1 DNA-processing protein DprA (Geobacter sulfurreducens) [pid:40.6%, q_cov:94.7%, s_cov:95.2%, Eval:4.2e-57]" /note="MGA_246" CDS 1651..3735 /product="type I DNA topoisomerase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965091.1" /transl_table=11 /codon_start=1 /translation="MATSKYLVIVESPSKARTIGKFLGSRYNVVASAGHLRDLPKSTLG VDIENDFEPKYINVRGKADLIKTIKKDAKEASKVFLATDPDREGEAISWHLCSLLGIDP AKAYRVVFPEITKSAVLEGIKNSRPIDMNLVNAQQGRRVMDRIAGYEISPVLWNKIGKG LSAGRVQSAALKIICDREREIEDFVPQEYWNIAADLTKEGLTPAQQKKNTFTAALAEYK GKKVKLTSKEETDKVLTDLNKGSYSVKTLEPYETVKRPFAPYTTSTMQQDASIKLHFTP SKTMMLAQQLYQGVSVKGHGTTGLITYMRTDSVRISDEADRACKSFIRNTYGAGYVGNN HYTNKSSNTQDAHEAIRPSYMDLDPETVKDSLQNDQYKLYKLIWSRFVASRMKPAVYSG NAAEIANGDYILKAKGSALTFDGYLKVYSDNSKEKDKMLPPLAVGEPLKLVKLDGEQKF TQPPARFTEASLIKEMEENGIGRPSTYATIVNTLTEKRYVAKEKNALSPTDLGNKITYV IMEPYFKELVDVGFTADMEKQLDKVEEGDVRWQSVVGDYYNNYLKDELAKARAEVEKVV TAPEFIGENCPECSKPLVKKSGKFGSFIACSGYPDCRYTRNIIVGTGVACPKCGKEIIQ KRSRKGKTFYGCSGYPDCDQVFWYRPVDKKCPKCGSLLVERGRKLVCSKEDCHYSENKQ " /locus_tag="LOCUS_1890" /gene="topA" /EC_number="5.6.2.1" /note="WP_010965091.1 type I DNA topoisomerase (Clostridium) [pid:51.9%, q_cov:98.8%, s_cov:98.4%, Eval:2.6e-211]" /note="MGA_247" CDS 3756..4295 /product="ATP-dependent protease subunit HslV" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_172636479.1" /transl_table=11 /codon_start=1 /translation="MMQFHATTIVLVKRSADDICIGGDGQVTMGEHAIMKNNAKKVRKI YKNSVITGFAGSVSDAFSLTEKFEKKLEEHGGNLKRAAVALAQTWRSDGGARNLEAMML AADKESVLLISGTGEVIEPDENYVAIGSGGNYAYAAAHALYDHTDMDAESIVRESLKIA SDICVYTNNHISVEKL" /locus_tag="LOCUS_1900" /gene="hslV" /EC_number="3.4.25.2" /note="WP_172636479.1 ATP-dependent protease subunit HslV (Desulfitobacterium) [pid:56.4%, q_cov:100.0%, s_cov:100.0%, Eval:3.7e-52]" /note="MGA_248" ORIGIN 1 gaaagcgacc gcaaacgcta tctgaacaag gtctccgggc ctcttttaga ccgcatcgac 61 atgcatgtgg cggtagagcg gacgacatac cgggagatga gcggtccggg acctgcgatc 121 gctgcgccgc cggacgaagc agccgtatct tccgccatgc tgcggcaggg cgtgatgcag 181 gctgtcgaga tgcagcgcca gcgctatgag ggcttgggga tcgccaataa cgccaggctt 241 tcgccccggg aaacagagcg gttctgccgt ctggacagtt cgtgcagcgc gttgatggag 301 gcggcatttt cccgctattc gctgtccgca aggtcgtacc accgcatcct gcgtacggcg 361 cgcaccatcg ccgatatcga tggatgcggg gagatccggg aagatcactt gctggaggcg 421 ctgagctatc gcatgccgga gcgttttttc gaatcgtaaa caaggggagg gggatagtat 481 gaaaaatctg atctacgacg tatggctgag tacgctgccc ggcgtgactt ctgccagaaa 541 actggaattg atgcgccgtt ttggcagtcc tgccggtgtt tttcaggcgc cggaagcgga 601 attgaaagag atgttttcaa aaaacaatat tctgtctact tcggaaggcg gccttcacag 661 actgctgcag aaggatctgc ggagggcgga gtggtgcttg aaacaggcca aaaagaccgg 721 cgccgccgtc gtctccatac gctgcgccag ctacccgccg cagctgaaga cgatcaaaga 781 ccctcccatc gttttgtttg ccctggggga tgtctccttg ctgcagaccc gctgcatcgc 841 ggtggtcggc acccgtagag cgtctcccta cggcaaatgg gcagcggcgg agatcgcaaa 901 acgagttgcc cttgccgggg tcaccgtcgt atcgggcatg gcggaaggca tcgattcggc 961 ggctcacacc ggttgtctga aggccggcgg caagaccatc gccgtattcg gcacgggggt 1021 ggacgtgtgc tttccaaagt ccaatctgcg gctgtacgaa gagatccggg aaaatgggct 1081 gttgctctcc gaatacacct tcggcgaaag cggatacgcc ttcaatttcc cggagcgcaa 1141 ccgcatcatc tccggactgt ccgaaagctg catcgtggcg gaaggcgccg tcaaaagcgg 1201 gtcgctgatc acggcgggcc ttgcggcaga gcagggaaga aatgtgtttg cgctgcccgg 1261 aaacatcaac cagccgggaa gcgccggtac caatctgctg atctccgaag gcgtgccgcc 1321 tatcaactcc atggagcatc tgctgcagac gctgggactc gcctccctcg atgtgcagca 1381 gcgcaccgat ctgagcgatc aggaaaagcg gctgatgacg catatcgcct cgtgcggcag 1441 cagttcgaaa cagttcatcc tggacagctg cggactgccg tttgcggaaa gttcacccct 1501 ccttacctgc ctggaactca agggactcgt gcgcatggag ggggcgcagg tctatgtctt 1561 ataatgtagg aagtttgtct gggggcttta caattgctac atcataatta taataaataa 1621 ttgtatttcc aatgcagaga aaggagcact atggctactt ccaaatattt agtgatcgta 1681 gagtccccgt ccaaggccag gaccatcggt aaattcctgg gcagccgcta taacgtggta 1741 gcgagcgcgg gccatctccg cgatcttccc aagagcacgc tgggcgtgga tatcgaaaac 1801 gatttcgagc ccaaatacat caacgtccgg ggcaaggcgg acctcatcaa gaccatcaag 1861 aaagacgcga aggaagcttc gaaagtcttt cttgcgacag accccgaccg ggagggcgaa 1921 gccatctcct ggcacctgtg cagtcttctg ggcatcgatc ctgccaaggc ttaccgggtc 1981 gtctttcccg agatcacaaa gagcgcggtg ctggagggca tcaaaaacag ccgtcccatc 2041 gacatgaacc tggtgaacgc ccagcagggc cgccgggtga tggaccgcat cgcaggctac 2101 gagatcagtc ccgtgctgtg gaacaagatc ggcaagggcc tttccgcagg cagagtgcag 2161 tccgcggccc tgaagatcat ctgcgacaga gagcgcgaga tcgaggattt cgttccccag 2221 gaatactgga acatcgcagc ggacctcacg aaagagggcc tgacccccgc acagcagaag 2281 aaaaacacct ttacggccgc gctggcggaa tataaaggca aaaaggtgaa gcttaccagc 2341 aaagaagaga ccgacaaggt cctgacggat ctgaacaaag gctcttacag cgtaaagacg 2401 ctggaaccct acgagacggt caagcgtccc ttcgctccct atacgacgag caccatgcag 2461 caggatgctt ccatcaagct gcactttacg ccctccaaga ccatgatgct cgcacagcag 2521 ctgtaccagg gtgtctctgt aaagggtcac gggacgaccg gtcttatcac ctacatgaga 2581 acggactccg tccgtatctc cgatgaggca gacagggcct gcaagagctt tatccgcaac 2641 acctacggcg caggctacgt cggaaacaat cattatacca ataaatcgtc caatacgcag 2701 gacgcccacg aagccatccg gccttcctac atggatctgg atccggagac ggtcaaggac 2761 tccctgcaga acgatcagta taagctgtac aagctcatct ggtcgcgctt cgtggcgagc 2821 cggatgaagc ctgccgttta cagcggtaac gcggcggaga tcgccaacgg agactatatt 2881 ctgaaggcga agggttctgc gcttacgttc gacggctacc tgaaggtcta cagcgacaat 2941 tccaaggaaa aggacaagat gctgccgccg ctggcggtgg gtgaaccgct caaactcgtc 3001 aaactggacg gggaacagaa gtttacgcag ccgcctgccc ggttcacgga agccagtctc 3061 atcaaggaga tggaggaaaa cggcatcggc cgtccgagca cttacgccac catcgtcaac 3121 acgctgacgg aaaagcgcta tgtagcgaag gaaaagaacg cgctgtcccc gacggatctc 3181 ggaaataaga tcacctacgt catcatggag ccgtatttca aggaactcgt ggatgtgggc 3241 tttacggcgg acatggaaaa gcagctggat aaggtggaag agggcgacgt gcgctggcag 3301 tctgtcgtcg gcgactacta caacaactac ctgaaggacg aactggcaaa agccagggcg 3361 gaggtagaaa aagtcgtaac ggcaccggaa ttcatcggag agaactgccc cgagtgcagc 3421 aagcctctgg taaagaagag cggtaagttc ggctccttta tcgcctgcag tggctatccc 3481 gactgccgct acacgaggaa catcattgta ggcaccggtg tcgcctgccc gaagtgcggc 3541 aaggagatca tccagaagcg cagccgcaaa ggcaagacgt tctatggatg cagcggctat 3601 cccgactgcg accaggtctt ctggtacaga cccgtggaca agaaatgccc gaagtgcgga 3661 tcgctgctgg tggaaagagg ccgcaagctg gtctgcagca aggaagactg ccactattcc 3721 gaaaacaagc agtaagaggg gtcaagagag aaaaaatgat gcaatttcat gcaacgacga 3781 tcgttttggt aaaaagaagc gcggacgaca tctgcatcgg cggcgatggc caggtgacca 3841 tgggcgagca cgccatcatg aagaacaacg cgaagaaggt tcgcaagatc tataaaaatt 3901 ccgtcatcac cgggttcgcc ggatccgtct ccgacgcctt ctccctcacg gagaagttcg 3961 aaaagaaact ggaagaacac ggcggcaatc tgaagcgagc tgcggtcgcg ctagctcaga 4021 cctggcgcag cgacggcggc gccaggaacc tggaagccat gatgctggcg gcggacaagg 4081 agagcgttct gctcatctcc ggcaccggcg aagtcatcga accggacgag aattatgtgg 4141 ccattggctc cggcggcaac tatgcctatg ctgcggctca cgccctgtac gaccatacgg 4201 atatggatgc ggagagcatc gtgcgcgaat ccctgaagat cgcgtccgac atctgcgtct 4261 acacgaacaa ccacatctcc gtagaaaagc tgtaaggagg ctgacccatg gcaaagacat 4321 ttaccgatta cacgccgaaa gagatcgtgg cggaactgga taaatacatc atcggccagg 4381 ataaggccaa gcgctctgtc gccgttgccc tgcgcaaccg ctacagaaga aaccagctgt 4441 ccgaggagat gagagaggag atctccccga agaacatcct gatgatgggt ccc // LOCUS sequence042 4471 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence042 VERSION sequence042 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4471 /mol_type="genomic DNA" /organism="" /note="sequence042" CDS complement(261..2537) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSSENKDNRERLSKEELDRAMQERREKRAKARAKKDKRSGKSGTS AKTSASHTHAAKSAKPDLKGLLPKKETPKKDKKKTRTAAAKASAAKSASAKGFRPFACL LLGPIFALFEILLTVLTGSGFLHVGVFHAFGIGLVLGAVCSLFAEKISFILEAVVLEIF TIAFLVEYFIYNSYRVFMSKTDIATGAGDVVTGFGGVVVGLILRGIPIILLFHVPLALM IWRRKDLGFRKPMNFRPAGVQALAGVVLLILGALFAGIGGREGNFSSDVQTKGLIYATG KDLRGGYELDMEAALDAPDVLSAAHGTGSSSGPSFFGLNKLNVDLDALIASSSGNIKAA HQYVQQQKPSPKNEYTGLFAGKNLIFITAEAFSEELISEELTPALYRMATKGINFNDYY QPAWGGSTSTGEYSNMMGIVPMDGVNSIQDTIGKDNSINIFHKLRSLGYFSECYHNGLY DYYGRNRTHTGLGFDNFIAKGNGMEDYLLDVWPDSDLEMMKYTMTRYMDHQPFSVYYMS ISGHTNYAWSANAMSKKNRDAVAELPYSEQVKGYFACNLELEYALEYVIQTLEEAGIAN DTVIVLGTDHYPYGLEKSAAWGTDKDYLQELYGYAYQTPKERDHSRLLIWSGCLEESDP IQIDFPTYSLDIQPTLCNLFGVDYDSRLFVGQDVFSEEEPLVLWTNGSFLTDKGYYYGG KWTDADPAQPASQDYINAMRSKVQGKLSYSKLVLSTDYFRSFNAGVIPSAPKTEDAAPA PETGE" /locus_tag="LOCUS_1910" /note="WP_002293776.1 LTA synthase family protein (Enterococcus) [pid:24.8%, q_cov:48.0%, s_cov:52.4%, Eval:2.5e-21, partial hit]" /note="MGA_251" misc_feature complement(2521..>4471) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000791061.1:LTA synthase family protein" /note="WP_000791061.1 LTA synthase family protein (Bacillus cereus group) [pid:24.9%, q_cov:57.3%, s_cov:58.5%, Eval:2.4e-25, partial hit]" /note="MGA_252" /locus_tag="LOCUS_1920" ORIGIN 1 aggatggacg cgccgccgaa caggcctatt tcgcgccgga attcggtctc ttcagaagca 61 agctcggcct cgtgcatttg gagattcttg ttttcatcca taatgtagcc tttctcttct 121 aaaaagatta taaaagaaat attacgtgat attcataata taacacgatt tataacggag 181 tacaacactt taagccgtaa aaaaggcccc ggttcagcgc cggggcctta atttgttaat 241 atttagatgt ctgaagaaat ttattcacct gtttccgggg ccggtgcggc atcctccgtt 301 ttcggcgcgc ttgggatgac cccggcattg aaggatctaa agtaatccgt actcaggaca 361 agtttcgaat aactgagctt accctgcact ttcgagcgca tggcgttgat ataatcctgg 421 ctggcgggct gggccggatc cgcatccgtc cacttgccgc cgtaataata gcccttatcc 481 gtcaggaacg atccgttggt ccagagcacc aggggctcct cttccgagaa gacgtcctga 541 ccgacgaaca gacgggaatc gtaatccacg ccgaacagat tgcacagcgt gggctggatg 601 tccaggctgt aggtggggaa atcgatctgg atggggtcac tctcctccag gcacccgctc 661 cagatgagca gccgggagtg gtctctctcc ttcggcgtct gataggcgta gccgtacagc 721 tcctgcaggt agtccttatc cgtgccccag gctgcactct tttcgagacc gtagggatag 781 tggtccgtgc cgagcacgat gacggtatcg ttcgcgatgc ccgcctcctc cagggtctga 841 ataacgtatt ccagggcgta ttccagctcc aggttgcagg cgaaatagcc cttcacctgc 901 tcggaatacg gcagctctgc caccgcgtcg cggttcttct tggacatggc gttggcggac 961 caggcatagt tcgtgtggcc gctgatggac atgtaataga cggagaacgg ctggtgatcc 1021 atgtaccgag tcatggtata tttcatcatc tccaggtccg aatccggcca gacatccagc 1081 agatagtcct ccatgccgtt gcccttggca atgaagttgt cgaagcccag gcccgtatgg 1141 gtccggttgc ggccgtagta gtcgtacagg ccgttgtgat agcattcgct gaagtagccg 1201 aggctgcgca gcttgtggaa gatgttgatg gagttatctt ttccgatggt gtcctggatg 1261 gagttgaccc cgtccatggg cacgatgccc atcatgttgg aatattcgcc ggtggacgtg 1321 ctgccgcccc aggccggctg gtaataatcg ttgaagttga tgcccttcgt cgccatgcgg 1381 tagagcgcgg gcgtcagctc ttcgctgata agctcctcag agaacgcctc cgccgtgata 1441 aaaatgaggt tctttccggc gaacagccct gtatattcgt tcttcggtga gggtttctgc 1501 tgctgcacgt actggtgcgc cgccttgatg ttacccgaag aggatgcgat gagcgcgtcc 1561 agatccacat tcagcttgtt gaggccgaag aaagacgggc cggaggaaga cccggtgccg 1621 tgagccgcgg acaggacgtc cggcgcatcg agcgccgctt ccatatccag ctcgtagccg 1681 ccccgcaggt cttttccggt ggcgtagatg agtcccttcg tctgcacgtc ggagctgaag 1741 ttgccttccc tgccgccgat ccctgcaaac agagcgccca ggatgagcag tacgacgccg 1801 gccagcgcct gcacgcctgc cggccggaag ttcatcggct tgcggaaccc cagatctttg 1861 cgccgccaga tcatgagcgc cagcggcacg tggaacagca ggatgatggg gatgccccgc 1921 aggatgagcc cgacgaccac accgccgaag cccgtcacca cgtcccctgc tcccgtcgcg 1981 atgtccgtct tgctcatgaa cacgcggtag ctgttataaa tgaaatattc taccaggaaa 2041 gcgatcgtaa agatctcgag gacgaccgcc tccaggataa aggagatctt ctcggcgaac 2101 aggctgcaga ccgcgccaag cacgaggccg atgccgaaag cgtggaacac gcccacgtgc 2161 aggaaacccg aaccggtgag caccgtaagc aggatctcga acagcgcgaa gataggcccc 2221 agaagcaggc aggcaaaggg ccggaagccc ttggcagaag cggacttggc agcggaagct 2281 ttggccgcag cagtccgggt cttcttctta tcctttttcg gcgtttcttt tttcggcagg 2341 aggcccttca gatccggttt tgcagacttc gcggcatggg tatgggacgc agaagtctta 2401 gcggatgttc cggacttgcc ggaccgctta tccttctttg ccctcgcctt ggctcgcttt 2461 tcgcgccgct cctgcatcgc tctgtccagt tcttccttgc tgagccgttc cctgttgtct 2521 ttattctccg aagacatagc tgaaataatc cttttcgatg acgttcttgc aataattcag 2581 tttatcacga acgatatcct ttacggaatc gatgtaatcc gcatccgccg tctgaccttc 2641 cgcaggcgta aaccgtccgg tgccggcgtc gtaaaagccc ttttccgtct tccagctgta 2701 gctgttccac atcacgagcc cttcgtccgt ggacagcacg tcccggcccg gatacaggcg 2761 ggaatcgtac tcgacgccca tcaggttgag gatcgtcggc acgatgtcga tgctgctgat 2821 cggctgggtc acggtaatgg ggtccatatc ccggaacgcg ccgctgtaga atatcagcag 2881 gttgtggtcg cgtttcgcct catcggtggc cggatatccg tacagttccg acacgtaatc 2941 cctgtcgttg gcccagatca tgctgttctg cagggcgtag ggatagtggt ccgaggtgag 3001 gacgatgagc gtatcgtcca gccggcccgc ctcctccaga cggtccacga cgatcttgac 3061 ggcatcttcc agttcgagct gcgccgccac gtaggacttg atcttcgtgc tggcgtccag 3121 gccctccacg aggtccttat gcttgatggc ctgctcctgg tgcgtaaagt tataaatgct 3181 gtgaccgctg taggtcatgt aatacacgta gaacttttcg tcgtcgatcc agtcgtctac 3241 ggtgcagttc atcatctccg tgtcgctggg aggccacatg tccgtcaggt agtcctccat 3301 gccggtaccg ttggaaataa aggactcaaa gcccagccag gggtgggtca gataccggtt 3361 gtagtagtca taatccccat tatggtaagc tgtcgccgta taccccagag gcatcaggtg 3421 ataaccgacg cagctggcat tgttgtggcc gatgatctgc tgcatggagt tggcatggtt 3481 gaccggcaca atgcccgtaa gcgtcgcgaa ttcaccggac gtggtgctgc cgccccagaa 3541 cggctggtaa tagtcttcga acgtaatgcc ttccgttgcc attttataca gcgtcggcgt 3601 cagttcctcg ctcaccgcct ctgccgcaaa gctctccgcg cagatgacga tgagattctt 3661 gccctcgaac aggcctgtgt attcgttctt gaccgtagcc ttctgggaag ccacgtagct 3721 gtggaccgca ctgatggcgg ggtcggtctc ggcagccgcc agcgcgttaa aatcgatgtc 3781 gcgcttgttg agtccgtgga acgcgggcgc gccgttggaa ctgctgcccc gggtcacgag 3841 cccctccggc tttttaggct tctccggctt tccgaacgcg ccgtacacca cgtcgcgctg 3901 cgtggacgtg atgagcccga aattgcggat gccgtcgttg aacacatact cgtaggaata 3961 cttcggtgcg gcgaaggtgt ccagctgggt gctgcccgcc gccatgctct ggcagacgac 4021 gccggccagg gccagataga cgagggtcca gcggtccttg cgggtaaagt cccagacttt 4081 atatagcgcg agaaggacga acacggggac gtgatacagc gcgatgatgc ccactccttc 4141 ccggatgagc cgggcaaggt cttcgccgaa ttcatccata accccgccgg cgccctggaa 4201 gatagtcagg ggatccataa atgtctggta ggaattgttg acgaagaact gcacgcagaa 4261 ataaaacgcg ccgatctccg ccaggatgag ggctgccgca aaacctgcct tccggttttt 4321 gaaggcgaat gccacgcagt tgcacagcat gccgcaggca aatccggcca aaaacgcgct 4381 ggcaggatgg tagccggaag ccaggccgca gtccgatgcc agccgccatt ccagatacat 4441 gaaggccagc ggcagagcca gcatgctgag a // LOCUS sequence043 4429 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence043 VERSION sequence043 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4429 /mol_type="genomic DNA" /organism="" /note="sequence043" misc_feature <1..769 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012048076.1:histidine--tRNA ligase" /note="WP_012048076.1 histidine--tRNA ligase (Clostridium botulinum) [pid:51.6%, q_cov:98.0%, s_cov:59.3%, Eval:7.6e-70, partial hit]" /note="MGA_253" /locus_tag="LOCUS_1930" CDS 779..2560 /product="aspartate--tRNA ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004454140.1" /transl_table=11 /codon_start=1 /translation="MDKLLKRSCYCGEVRENCIGQEITVNGWVAKKRNLGSLIFADIRD RSGIVQVVFGDGTPADVLEKANGLRSEYTVGIKGVVRERESKNADLETGAVEILANELS IYAEAETPPIYIKDDDNVSGDLRLKYRYLDLRKPLMQKTLAFRSKMYNVIRNFYYENGF IEVETPVLAKPTPEGARDYLVPSRVNPGKFYALPQSPQQFKQLLMVGGTDRYIQIAKCY RDEDLRADRQPEFTQIDLEMSFVDQEDILEVQERFLQRLFKEMLDVDIQLPLPRMTWDE AMNRYGSDKPDLRVGFELVDIADTVKDCSFGVFTDAIKDGGRVMGINMNGCSPKFSRKD IDKMTESIKTFGAKGLVWIRKEEGEIKSSVGKFFSQEELEKICERFGAKAGDLILIVSG KKEVVWASLGFLRRDLASKLGMLDPHEYKLLWVVDFPMFEWSDEENRYMAMHHPFTSPK KEDIHYLESGELDKIYADAYDIVINGYEAGGGSIRIHDSKLQKKIFEVLQLTEEDIRIK FGFFIDAFKYGAPPHGGLAFGLDRLCMLLLGTDDIRQVIAFPKNQNAQCVMSEAPTIVT DQQLEELSIAVKLPEGK" /locus_tag="LOCUS_1940" /gene="aspS" /EC_number="6.1.1.12" /note="WP_004454140.1 aspartate--tRNA ligase (Clostridioides difficile) [pid:56.5%, q_cov:99.7%, s_cov:99.3%, Eval:1.2e-198]" /note="MGA_254" CDS 2561..3685 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGKRIGVLGGSFDPLHYGHLILAEQIRQEAELDKVILVPAYVNPF KEEVPPADGHHRLEMLRLAAGDHPFFGISDIELKREGPSYTYDTLAALKEKDYPDDELF FIMGTDSFYQLEHWHKAEELIENFGFLIGMRKGYDEEELKATISRLQQKYPLRAEYIRI PELEISSTDIKQRIRAGKSVRFLLPDACISYIREHELYLDLVGKVREYARTHEKTSRFA HTCGVVKMAKQLAKQYGADPEKAEIAAWFHDVRRPAGNLEHGPAAADLLQKLYGVTDED ILNAIRFHTTGRPGMSLLEKVIKIADQLEEGRDYPGVEHMRSFTKLPVDQCVYKLMTHT RDYVHSIGGTFDPLSDEAIEWLKQQIEQGGNHGQ" /locus_tag="LOCUS_1950" /note="WP_028841927.1 nicotinate-nucleotide adenylyltransferase (Thermodesulfovibrio) [pid:43.9%, q_cov:52.9%, s_cov:99.0%, Eval:3.4e-41, partial hit]" /note="MGA_255" CDS 3675..4031 /product="ribosome silencing factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003416416.1" /transl_table=11 /codon_start=1 /translation="MDNKELALLAAKLLDSKKARDISIIDIAEKSGFADYFVIATAGSA RQISALCDEVEDGLAKEDILVNHKEGKGETGWVLLDYGDVIVNVFSAEQRDHYQIEKVW IDCPQVEFEPAAEQ" /locus_tag="LOCUS_1960" /gene="rsfS" /note="WP_003416416.1 ribosome silencing factor (Clostridioides) [pid:45.6%, q_cov:87.3%, s_cov:88.8%, Eval:1.3e-21]" /note="MGA_256" ORIGIN 1 catcaacagc atcggctgcc cgaactgccg cggcgaatac cgcaaggctc tgcaggactt 61 cctgcggccc cactacgacg agctgtccga gaccagcaag ggccgcttcg agaagaaccc 121 catgcgcatc ctggattcca aagatccgga cgacaagaag ttctccgaag gcgcaccccg 181 catgatcgac tatctctgcg acgaatgcaa agcggcgttc gaggatctga agaacgatct 241 ggacgcgctg ggaatcccct acgaggtgga tccgaacatc gtaagaggtt tggattacta 301 cacgaagacc gcgttcgagt tcatctccga agacctgggt gctcagtcca cggtgtgcgg 361 cggcggacgc tacgaccatc tggtggaaga ggtcggcgga ccctatacgc cggctgtcgg 421 cttcggcatg gggctggaga gactgctcct catcctggaa gccaagggca tcgagatccc 481 caagcccgcc ggctgcgacg tgtttatcgc gacgctgggc gaaagaccga agaccttcgg 541 cctcaaactc gccaaagacc tgcgcgccaa gggctacagc gtcctgacgg atgtgatggg 601 acggggcctg aaagcccagc tgaaatacgc agaccgcagc gatgcgcggt atacggtcgt 661 tatcggggac gacgaactgg agaaaggcgt cgtgaccctc agagatatgg ataattccac 721 gcagaaagag atcgccatcg acaagatcga agaagaaata cacaggtagg tgctgaaaat 781 ggacaaatta ctgaagagaa gctgctactg cggcgaagtg agagaaaact gcattggaca 841 agagatcacc gtgaacggct gggtcgccaa gaagagaaac ctgggcagcc tgatcttcgc 901 ggatatccgc gacagaagcg gcatcgtgca ggtcgtgttc ggcgacggca cgcccgcgga 961 tgtgctggaa aaggccaacg gcctgcgcag cgaatacacc gtcggcatca agggcgtcgt 1021 acgggaaaga gagagcaaga acgcggacct ggagaccggc gctgtggaga tcctggccaa 1081 tgaactgagc atctacgccg aagccgagac tccgcccatc tacatcaagg acgatgacaa 1141 cgtatccggc gatctgcggc tcaagtaccg ctatctggac ctcagaaagc ccctcatgca 1201 gaagacgctt gccttccgca gcaagatgta caacgtcatc cgcaacttct attacgagaa 1261 cggatttatc gaagtggaga cccccgtgct ggccaagccc acgccggaag gagccagaga 1321 ctatctggtg cccagccgcg taaacccggg caagttctat gcgctgcccc agtctcccca 1381 gcagtttaag cagctgctga tggtgggcgg cacggaccgc tacatccaga tcgccaagtg 1441 ctaccgcgat gaggacttaa gagcggaccg ccagccggaa tttacccaga tcgacctgga 1501 gatgtccttt gtggaccagg aagatatcct ggaggtccag gaacgcttcc tgcagcggct 1561 gttcaaggag atgctggacg tggacatcca gctgccgctg ccccgcatga cctgggacga 1621 agccatgaac cgctacggct ccgataagcc ggatctgcgc gtgggcttcg aactcgtgga 1681 tatcgcagac accgtaaagg actgcagttt cggcgtgttc accgacgcca tcaaggacgg 1741 cggccgcgtg atgggcatca acatgaacgg ctgctccccc aagttctccc gcaaggacat 1801 cgacaagatg accgaatcca tcaagacctt cggcgcgaag ggcctggtct ggatccgcaa 1861 ggaagaaggg gagatcaagt cctccgtggg caagttcttc agccaggaag aactggagaa 1921 gatctgcgaa cgcttcggcg ccaaggccgg cgacctcatc ctgatcgtct ccggcaagaa 1981 ggaagtcgtc tgggcttccc tgggcttctt aagacgcgat ctggccagca agcttggcat 2041 gctggatccc cacgaataca agcttctgtg ggtcgtggac ttcccgatgt tcgaatggtc 2101 tgacgaggag aaccgctaca tggccatgca ccatccgttc acctctccga agaaggaaga 2161 catccactat ctggagagcg gcgagctgga taagatctat gcagacgcct acgatatcgt 2221 catcaacggc tacgaagccg gcggcggctc catccgtatc cacgacagca aactgcagaa 2281 gaagatcttc gaggtactac agcttacgga agaagacatc cgcatcaagt tcggcttctt 2341 catcgatgcg ttcaagtacg gtgcgcctcc ccacggcggc ctggcatttg gtctggacag 2401 actgtgcatg ctgctgctgg gtaccgacga tatccgtcag gtgatcgcgt tcccgaagaa 2461 ccagaacgca cagtgcgtca tgagcgaagc gcctacgatc gtaacagatc agcagctgga 2521 agaactctcc atcgcagtaa aactgccgga aggaaaataa atgggtaaaa ggataggggt 2581 gcttggcgga agctttgacc ccctgcatta cggacacctc atcctggcgg agcagatccg 2641 tcaggaggcg gaactggata aggtcatcct ggtaccggcg tacgtcaatc cctttaagga 2701 ggaagtgccg cccgcggacg gccatcaccg gctggagatg ctgcggctcg ccgcaggcga 2761 ccatccgttc ttcggcatca gcgacatcga actgaagcgg gaaggcccgt cctacacgta 2821 cgatacgctg gcagccctta aggagaagga ctacccggac gacgagctgt tcttcatcat 2881 gggcacggat tcgttctatc agctcgaaca ctggcacaaa gccgaggaac tcatcgagaa 2941 tttcggattt ctcatcggca tgcgcaaggg ctacgacgag gaggaactga aggcgaccat 3001 ctcgcggctg cagcagaagt atccgctgcg ggcggagtac atccgcatcc cggagctgga 3061 gatcagctcc acggatatca agcagcgcat ccgggccggc aaatccgtgc gcttcctgct 3121 gccggacgcc tgcatctcgt atatccgcga acacgagctc tatctggatc tcgtgggcaa 3181 ggtgagggaa tacgcccgca cccacgaaaa gaccagccgt ttcgcgcata cctgcggcgt 3241 cgtcaagatg gcaaagcagc tggcgaagca gtacggcgca gatccggaaa aagcagagat 3301 cgcagcctgg ttccacgacg tgcgccggcc tgccggcaat ctggagcacg gccctgcggc 3361 ggcagatctg ctgcagaaac tgtatggggt caccgacgag gatatcctga acgccatccg 3421 cttccatacc accggccgcc ccggcatgag cctgctggaa aaggtcatca agatcgcgga 3481 ccagctggaa gaaggaaggg attatccggg tgtggagcac atgcgatcct ttacgaagct 3541 tccggtggac cagtgtgttt ataaactgat gacccacacc agagattacg tacacagcat 3601 cggaggcacg ttcgatccgc tgtccgatga agccatagag tggctgaaac aacaaataga 3661 acaaggagga aatcatggac aataaggaac ttgccctgct ggcagcgaag ctgctggaca 3721 gcaagaaagc cagagacatc agcatcatcg atattgcgga aaagtccggt tttgccgatt 3781 acttcgtgat cgcgaccgcc ggctccgccc gtcagatctc cgccctgtgc gacgaagtag 3841 aagacggcct ggccaaggag gatatcctgg tcaaccacaa ggaaggtaag ggagagaccg 3901 gatgggtgct cctggactac ggcgacgtca tcgtcaacgt gttttccgcg gaacagagag 3961 atcattacca gatcgaaaag gtctggatcg actgcccgca ggtggaattc gagcctgcgg 4021 ctgaacaata gattaagaaa cggtacagaa aggcagatca atggaacgtc agtataattt 4081 caaaaagatc gaacccagat ggcagaagat ctgggcagaa aaggacgcat ttcacgtaac 4141 ggaagaccca aacaaggaga aattctattg tctggagatg ttcccttatc cttccggcaa 4201 actgcacatg ggtcacgtga gaaactattc catcggcgac gtgctggcca gatacctgca 4261 catgaacggc aagaatgtgc tgcatcccat cggattcgac tccttcggtc tgcccgcgga 4321 aaacgccgcc atcaagaacc agacccatcc cgccgtatgg accagctcca acatcgcgga 4381 gatggagaac cagctccgcc ggctgggctt ctcctacgat tgggacaga // LOCUS sequence044 4375 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence044 VERSION sequence044 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4375 /mol_type="genomic DNA" /organism="" /note="sequence044" misc_feature <1..555 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012868810.1:sirohydrochlorin cobaltochelatase" /note="WP_012868810.1 sirohydrochlorin cobaltochelatase (Thermanaerovibrio acidaminovorans) [pid:40.5%, q_cov:98.9%, s_cov:62.3%, Eval:2.0e-35, partial hit]" /note="MGA_258" /locus_tag="LOCUS_1970" CDS 652..1569 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MERKVWKALCLLLAALLITGSFAACTKAQEPAEPAETQEPAAEET QGSDQIADASEQIAHEDVVDDSWVPVPASALNDGTYEITVDSSSSMFNIVACTLTVADG AMTADMTMGGTGYRYIYLGTPEEAVAAAETDYLLPEVDAEGLHHYIVPVEALDAGVDCA AFSDNKEKWYDRVLVFRSSTLPMSAYVPDFLTTVSSLGLADGTYTCEVSLSGGSGKASV QSPANITIRGGAMTAEIVWSSDKYDFMVVNGAQYNPITTEGGSTFLIPISAFNFNVPVQ ADTIAMSTPHLIDYTLYFDASTIQ" /locus_tag="LOCUS_1980" /note="MGA_259" CDS 1636..2598 /product="adenosylcobinamide-phosphate synthase CbiB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861967.1" /transl_table=11 /codon_start=1 /translation="MILIRYNAIAMIAGLILDLLIGDPQGWPHPVIWIGKWISFCDKKI RTKAAGDSAKLRRGSVWMTASTVLLSMAVTAAVLRAAAFGGTYVLLAAMTIISWTCLAS KSLAKEANDVQKALEQSLEAGRKQVGRIVGRDTASLSSEEIVAATVETVAENTTDGIVS PLIYLFLGGPVLAMGFKAASTLDSMEGYLDEKYRDIGWSGAKLDDLLNYVPARISGHLM CLAAFLTGTDGKNAYRIMKRDHANHLSPNCAWTESAAAGALHVQLGGSHEYFGKVIEKP TIGDKDRGIEPGDIRKTNRLMYGTTFLAAGLLFLIGLAL" /locus_tag="LOCUS_1990" /gene="cbiB" /note="WP_011861967.1 adenosylcobinamide-phosphate synthase CbiB (Clostridioides difficile) [pid:45.4%, q_cov:90.6%, s_cov:89.5%, Eval:2.1e-65]" /note="MGA_260" CDS 2604..3668 /product="cobalt-precorrin-5B (C(1))-methyltransferase CbiD" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011461551.1" /transl_table=11 /codon_start=1 /translation="MKKLREGFTTGSCAAAAALACCLWQRDGACPEVVELEVPGGKVYR PQIVPHEDGSCGIIKDSGDDPDITKGMEVISRVDVSQEDGPIVFRGGDGIGTITQKGLK IPVGEPAINPVPREMIEAAVRSVFGSKGATVTVSIPGGTEIAKKTFNPRLGIEGGLSVL GTTGILRPMSLEALRDSLYVELKMRAEQGHKHLAFTFGNQGESALHALGCQIPVVQVSN EIGFMLDSARELGIEYLLVSGHPGKMAKIAAGVMQTHSQTADGRREAIITHLALMGAPK TLCEQVYGCVTTDSAAEFIHAAGFDGVWDRIAIAAKEYMTFRVREEIEIETMVTDYEAN VMGKSAERPKGLET" /locus_tag="LOCUS_2000" /gene="cbiD" /EC_number="2.1.1.195" /note="WP_011461551.1 cobalt-precorrin-5B (C(1))-methyltransferase CbiD (Desulfitobacterium hafniense) [pid:41.0%, q_cov:91.5%, s_cov:85.3%, Eval:1.5e-62]" /note="MGA_261" ORIGIN 1 cagccgaccc acctgatggc aggtctggaa tacaacgata tcgttgcttc cgcagcgaac 61 tacgcagacg cgttcgaatc catcacgatc ggcaagaacc tgctggattc cgacgcagac 121 ttcgagcatg ttgctcaggt cgtccatgaa gagacccagc agtacgatga cggcgagacc 181 gccatcatct tcatgggtca cggcaccgaa gccgaatcca acgcagtcta tgccaagatg 241 cagaccgtgt tcgacaagct cggctatgcc aactactaca tcggcaccgt agaagcgact 301 ccgtccctgg acgatgttct cgctgctgcc aaggccggcg gttataagaa agtcgttctc 361 gagcccctga tgatcgtctg cggcgaccac gccaacaacg acatggcagg cgacgaggaa 421 gactcctgga agagcacctt cgaagcggaa ggcttcgagg tcgaatgcaa catggtcggt 481 ctcggccagc tgcccgcgat ccaggaactg atcgtagacc actgcaaggc caccatgacc 541 gaagcaggtt tctaatctcg aataccgaaa caaatcggaa acggtccgga aaaaccttcc 601 gggccgtttc tggcaattga acagatcgca gtaagactga aggaaaaaag aatggaaaga 661 aaagtttgga aagcgttgtg cctcctgctg gcagcgctcc tcattacagg cagctttgcg 721 gcatgcacaa aggcacagga gccggcagaa cctgctgaaa cacaggaacc ggcggcagaa 781 gagacacagg gttcggatca gatcgcagac gcatcggaac agatcgcgca cgaggatgtc 841 gtcgatgaca gctgggtgcc cgtaccggca tctgctctca acgacggcac gtatgagatc 901 accgtggaca gcagttcttc gatgttcaac atcgttgcgt gcacgcttac cgttgcggat 961 ggtgccatga cggccgacat gacgatgggc ggcacagggt accgttacat ctatctggga 1021 accccggaag aagccgttgc agcggcagaa acggattatc ttctgcccga agtggatgcc 1081 gaagggctgc accactatat cgttcccgtg gaagcgctgg atgcaggcgt agactgcgcc 1141 gctttttcag ataacaagga gaagtggtac gacagagtgc tcgtgttccg cagcagcact 1201 ctcccgatga gcgcctacgt accggatttc ctgacgacgg tttccagcct gggactggca 1261 gatggtacct atacctgcga agtttccttg tccggcggca gcggcaaggc cagcgtccag 1321 tctcctgcga acatcacgat ccgcggcggc gcgatgaccg ctgagatcgt ctggagcagc 1381 gacaaatacg attttatggt cgttaacgga gcgcagtaca acccgatcac gaccgaaggc 1441 ggatccacgt tcctgatccc catcagcgcc ttcaatttta acgtgcctgt ccaggcggat 1501 acgatcgcga tgagcacgcc ccatctgatc gattatacgc tgtattttga cgcatccacg 1561 atccagtaaa aaacagtctg ccgggccggg ccaagtgcct gtcccggctt tctcctattc 1621 cgtaaagaag catttatgat ccttatccgt tacaacgcca tagccatgat cgcaggtctt 1681 atcctggatc ttctgatcgg agatccccaa ggatggccgc atcccgttat ctggatcgga 1741 aaatggatca gtttctgcga taaaaagatt cggacaaagg cggcggggga cagcgcgaaa 1801 ctgcgccggg gttcggtctg gatgaccgca agcaccgtgc ttttgtccat ggccgtgaca 1861 gcagcagtgc tgcgcgcagc agcctttggc ggcacgtatg tgctcctcgc cgcgatgacg 1921 atcatctcct ggacctgtct ggcctccaaa agcctggcaa aagaggctaa cgacgtgcag 1981 aaagcgctgg agcagagcct ggaagcggga agaaagcagg tcggccgcat cgtaggcaga 2041 gatacggcgt cgctgtcctc cgaagagatc gtggcggcca cggtggagac cgtggcggag 2101 aacacgacgg acggcatcgt atctcccctg atctatctgt ttctgggagg tccggtcctc 2161 gccatgggct ttaaagcggc cagcacgttg gattcgatgg aaggatacct ggatgaaaag 2221 taccgggata tcggctggtc cggcgcaaaa ctggacgatc tgctgaatta tgtgcccgcc 2281 cgtatctccg gacatctgat gtgcctggca gcgtttctga ccggaacgga tgggaaaaat 2341 gcctaccgga tcatgaagag ggaccacgcc aaccacctga gcccgaactg cgcctggacg 2401 gagagcgcgg cagcaggagc cttgcacgta cagttgggcg gcagccatga atacttcggc 2461 aaggtgatcg aaaaaccgac gataggcgat aaagaccgcg ggatcgaacc cggcgatatc 2521 cggaaaacga accgcttgat gtacggaacc acgttcctgg ccgcaggact tctgttcctg 2581 atcggcttag cgttataaca cacatgaaga aactcagaga agggtttacg accggaagct 2641 gcgcggcggc tgcggcgctg gcctgctgtc tgtggcagcg ggacggagcc tgccccgaag 2701 tggtggagct ggaagtgccc ggtggaaaag tatatagacc ccagatcgtt ccccacgaag 2761 acggaagctg cggcatcatc aaggacagcg gcgacgatcc ggacatcacg aagggcatgg 2821 aagtcatcag cagggtggat gtatcgcagg aagacggtcc catcgttttc cgcggcggag 2881 acggcatcgg caccatcacc cagaaaggac tcaagatccc ggtaggggaa cctgccatca 2941 atcccgttcc ccgggagatg atcgaagcgg ctgtgcggag cgtgttcggg tcaaaaggcg 3001 ccaccgtgac ggtctccatc cccggcggaa cagagatcgc gaaaaagacc ttcaatccgc 3061 gcctcggcat cgaaggcgga ctgtccgtgc tcggcaccac aggtattctg cggcccatga 3121 gcctggaagc gctccgcgat tctctgtacg tagaactgaa gatgcgtgcg gagcagggcc 3181 acaagcatct ggcgttcacc ttcggcaacc agggcgaatc ggcgctccat gcgctgggct 3241 gtcagatccc cgtcgtgcag gtgagcaacg agatcggctt tatgctggat tctgccagag 3301 aactggggat cgagtatctg ctggtgagcg gtcacccggg caagatggca aagatcgccg 3361 ccggcgtgat gcagacccac agccagacgg cggacggcag aagagaggcc atcatcaccc 3421 atctggcgct gatgggggct ccgaaaactt tgtgcgaaca ggtctacggc tgcgtgacga 3481 cggattctgc cgcggaattc atccacgcgg cagggttcga cggcgtctgg gaccgcattg 3541 cgatcgccgc aaaagagtat atgacgttcc gcgttcgcga agagatcgag atcgaaacga 3601 tggtgacgga ctacgaagcc aacgtgatgg gaaaatccgc agaacgtccg aaggggttgg 3661 aaacatgaat caggtaacac acggcggcaa cgtctggcag ggggctgacc cttccgaatg 3721 gctggactac tccgctaaca taaggccggg cggcgcaccg gaatgggtaa aagaagcgct 3781 gcagaaggcc atggacaaca tatcctatta tccggctaca gatatgcacc gggcgagaaa 3841 aggcctcgcg gactatctgg aactgccgga aacctacgtg cagccggctt ccggcggtgc 3901 ttccgccatc gaactggcaa cgcgctgcgg catgaaccag gtgctgctgt gcgcgccgtg 3961 tttcggcgaa tataaaggcg cagctttgaa gatgggactt cccgtagaga ctgtcgtgtt 4021 gctgcaagaa gaccgcagca tcgcgtctcc cgccaaagcc gtaaaagata cgctgcagga 4081 acggactctc atctggctct gcagccccat gaatcctacg ggtcacacct ttacgcggca 4141 ggagattctg gacctgctgg atctggcgag agaacggcgt tgccgcgtag cgctggacga 4201 ggcgtttatc gacttctgtc ccggtgcgag caaccgcgat ttggtaaaga cctggccgga 4261 gctcatcgtg accggctcca tgacgaagat cctcggcatt cccggcgtgc ggttgggtta 4321 cctctgcagc caggatgcgc tgcagctcgg cagcaaatgc cttccctggg agctc // LOCUS sequence045 4374 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence045 VERSION sequence045 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4374 /mol_type="genomic DNA" /organism="" /note="sequence045" misc_feature <1..810 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003232049.1:L-serine ammonia-lyase, iron-sulfur-dependent, subunit alpha" /note="WP_003232049.1 L-serine ammonia-lyase, iron-sulfur-dependent, subunit alpha (Bacillus) [pid:33.5%, q_cov:91.4%, s_cov:83.0%, Eval:1.8e-32]" /note="MGA_263" /locus_tag="LOCUS_2010" CDS 797..1816 /product="23S rRNA (adenine(2503)-C(2))-methyltransferase RlmN" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003431147.1" /transl_table=11 /codon_start=1 /translation="MQNIKAFTREERAKALKELGLPAFREKQIFAWICRGAKSWDECTD LSKDLRRQLAERFSWDNAAAELVQTSSDGTRKFLLRMPDGERVEAVFMAYEYGNSLCIS TQVGCNMGCSFCASTIGGRIRSLESWEMLEEVVVCVRESGEPINHIVLMGMGEPFDNYE AVAGFLRTVHDPQGLGLSYRNITLSTCGLVPGIRRFGEDFPQVNLAISLHASNQQAREK LMPVAKAYPLPELMRACRDHAEKTGRRVTFEFALIEGQNDTPQTAKELADLLRGMLCHV NLIPLNPVTETGMTGSSRKAAAHFRDMLESMGIPATVRRQLGADIDAACGQLRKKVTS" /locus_tag="LOCUS_2020" /gene="rlmN" /EC_number="2.1.1.192" /note="WP_003431147.1 23S rRNA (adenine(2503)-C(2))-methyltransferase RlmN (Clostridioides difficile) [pid:45.8%, q_cov:98.2%, s_cov:97.4%, Eval:2.9e-84]" /note="MGA_264" CDS 1921..2349 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048265.1" /transl_table=11 /codon_start=1 /translation="MVKLLVGHKGSGKTKAMVDMANASLDSVNGSVVFINKNHRLMYDL KYRIRVVCMEDFEHITNIDEYIGFIYGIISQDHDIELIFIDSILKHADVKLEDLEEFLG RLAAISEIYGPDFVVSISADVDELGSYVNKYEIINPAQ" /locus_tag="LOCUS_2030" /note="WP_012048265.1 hypothetical protein (Clostridium botulinum) [pid:31.1%, q_cov:95.1%, s_cov:98.5%, Eval:5.2e-16]" /note="MGA_265" CDS 2349..2954 /product="CoA pyrophosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011949003.1" /transl_table=11 /codon_start=1 /translation="MDLDTIKKKLQGRESGLLEIRKHSCVLIPFVERDGRLCLLFELRS AGISQPGEVCFPGGRMEKGETPVQTAVREIGEELGIRPEDILYTHEYDTLIHIANMAVH TVIGEIRPEALDSIRPEEAEVSEWFTIPVDWLMENEPYVYEYDIVQDVKDFPYDMVESP DKYNWRKGKCTVPIWHYEGHCLWGMTARIVVQLLKFLA" /locus_tag="LOCUS_2040" /note="WP_011949003.1 CoA pyrophosphatase (Clostridium botulinum) [pid:34.0%, q_cov:98.5%, s_cov:95.2%, Eval:1.0e-27]" /note="MGA_266" CDS 3038..4201 /product="BMP family ABC transporter substrate-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459550.1" /transl_table=11 /codon_start=1 /translation="MKKLLALLLALAMVFSMAACTSSNEPAPAEPSEGEGGEGETAAAY SVAMITDYGDITDESFNQATYEACKAFSDANGLQFNYYKPAGDSTAEREAMIDAAIADG YNVVVCPGFAFAEALASASVTYPDVKFIALDVSEFDLTSAGLTEIPDNLFSAVYQEELC GFMAGYAAVALGYTHLGYLGGMAVPSVVRFGNGYIQGADLAAKELGIDGVTIEYVYGNQ FFGDADITSYMDTWYQTSGVEVVFACGGGIWTSAAEAAAKVGGKVIGVDVDQSKTIDAY GEGMTVTSAMKGLKATVNTLLTELVLNDNWSAYGGQVMTLGLVSGTDVEANYTQIPFDT TQWSDSFTQDDYVALVGRMFSGEITVDGSQDEFVPSTITLNRYDNIK" /locus_tag="LOCUS_2050" /note="WP_011459550.1 BMP family ABC transporter substrate-binding protein (Desulfitobacterium hafniense) [pid:38.7%, q_cov:79.8%, s_cov:76.9%, Eval:5.0e-51]" /note="MGA_267" ORIGIN 1 atctccggct ggacggagca gcaggtcatc tcccaggcgg aaaacctgtg ggacgtcatc 61 ctggcatcgg agaagaacgg atataaagaa ggcaacgatc tgcgccaact gcttggaccg 121 aaggcgcccc aggtaaaagc attctatgaa agcagtccgc agaagatctc cggcggcatc 181 gtcgacaagg cggcgccgat gtccctgtct atcatggaat gggcgggcag ttccggcacc 241 atcgtctgca ttccgacggg aggtgcctcg ggcatcgtgc ccggggtcat ccagggcctg 301 tgcgaagaca aaggacttgg cagggaagaa gccgtaaaag gccttctggc tgccggcatg 361 gcgggcgtct tcatggccga gaccgactac ttcggaggct ggggatgcca ggcggagatc 421 ggctgcggcg tcggtatggc ggcggccgct ctcgtcagca tgatggacgg cacgcccaaa 481 cagtgtctgg acgccgccag catgggcatc cagagtctga tcggcctggt gtgcgactcc 541 gtgtgcggac agtcccaggt gccgtgctat ctgcgcaata tgactggaac tgctacggcg 601 gtcacctgcg ccaacgcggc gctggcgggg ctggatgcgc tcatccccct ggacgagatg 661 gtgacggcca tgatgaacgt gggaagggct tcccggtcca tcaaactcaa ttccatgggc 721 gccaacggca caccgacggg cgtgcgcctc gaagccgaag aacaggagag acagcagagg 781 gctgtcgacg aaaaacttgc aaaacattaa agcctttaca agagaagaac gggcgaaagc 841 cttaaaagaa ctggggcttc ccgcgttccg ggaaaagcag atcttcgcct ggatctgccg 901 gggtgcaaag agctgggacg agtgcacgga tctgtccaaa gatctgcgcc gccagctggc 961 ggaacggttt tcctgggata acgctgccgc ggaactcgtg cagacgtcct ccgacggcac 1021 ccggaaattc ctgctccgca tgccggacgg cgagcgcgtg gaagcggtgt tcatggccta 1081 cgaatacggc aactccctgt gcatctccac ccaggtcggc tgcaacatgg gctgcagctt 1141 ctgcgcttcc accatcggcg gccgcatccg cagcctcgaa agctgggaga tgctggagga 1201 agtcgtggtc tgcgtgcggg agagcggcga acccatcaac catatcgtcc tgatgggcat 1261 gggcgaaccc ttcgataatt atgaggcggt cgcggggttc ctccggacgg tgcacgatcc 1321 ccaggggctg ggactcagct accgcaacat cacgctttcc acctgcggtc tcgtgccggg 1381 catccggcgg ttcggggaag attttcccca ggtgaacctg gccatctcgc tgcacgcgtc 1441 caaccagcag gcgagggaaa agctgatgcc ggtggcgaaa gcctatccgc tgccggaact 1501 gatgcgcgcc tgccgcgatc acgcggaaaa gaccggacgg cgcgtcacgt tcgaattcgc 1561 tctgatcgaa gggcagaacg acacgccgca gacggcgaag gaactggcgg atctgctgcg 1621 gggcatgctg tgccacgtca acctcattcc gctcaatccc gttacggaga caggcatgac 1681 cggcagcagc agaaaagcgg ctgcgcattt ccgcgacatg ctggaatcca tgggcattcc 1741 ggcgacggtg cggcggcagc tcggcgcaga tatcgacgct gcctgcggtc agctcaggaa 1801 aaaagttact tcttgaaaat tacatacaaa agtttgtctt tcgcggcttg cccaaaagtc 1861 cggggcaagc tataatgaaa gaacagatat accttagaga gagaaagtgg ggcgattcca 1921 atggtaaaat tactggtagg gcacaagggc agcggcaaga ccaaagcgat ggtcgatatg 1981 gccaatgcca gcctggacag cgtaaacgga agcgttgttt ttataaataa gaaccaccgg 2041 ctgatgtacg atctcaaata tcgtattcgt gttgtctgca tggaggactt cgaacatatc 2101 acgaatatcg acgagtacat cggttttatt tatggcatca tttcccagga tcatgatatc 2161 gagctcatct ttatcgacag catcctgaag catgcggacg taaaactgga agacctggaa 2221 gaattcctgg gcagactggc cgccatctcc gagatctacg gtccggattt cgtggtcagc 2281 atctccgccg acgtagacga gctcggctct tacgtaaaca aatacgagat catcaatccg 2341 gcccagtaat ggatctcgat acgatcaaga aaaaactgca gggccgcgaa agcggtctgc 2401 ttgagatcag aaagcacagc tgcgtcctga ttccctttgt ggaacgggac ggaaggctgt 2461 gccttctttt tgaactgcga agcgccggca tctcccagcc cggcgaagtg tgcttccccg 2521 gcggacgcat ggaaaaaggg gagaccccgg tgcagaccgc ggtgcgcgag atcggcgaag 2581 agctgggcat ccgtccggag gatatcctct acacgcacga atacgacacg ctcatccata 2641 tcgcgaacat ggcggtccac accgtcatcg gagagatccg ccccgaagcg ctggacagca 2701 tccgccccga agaagcggag gtctccgaat ggtttacgat ccccgtggac tggctgatgg 2761 agaacgaacc gtacgtctat gagtacgata tcgtgcagga tgtaaaggat tttccctacg 2821 atatggtgga gtctcccgac aaatataact ggcggaaggg aaagtgcacg gtgcccatct 2881 ggcattacga gggtcactgc ctctggggga tgaccgcaag aattgtcgtt cagctactaa 2941 aattccttgc ctaatgcagg ggactattgt ataattctac tgttattgac gcggcagaat 3001 tttagagtgc cgcggtcaga ataaggagga aaatcaaatg aagaagttac tcgcgctgct 3061 cctcgcgctg gctatggtat tctccatggc tgcatgcacc agcagcaacg aacccgctcc 3121 tgctgaaccc agcgagggcg aaggcggcga aggcgagacc gcagctgcct actctgtcgc 3181 gatgatcacc gactacggcg acatcaccga cgaaagcttc aaccaggcta cttacgaagc 3241 ctgcaaagct ttctccgacg cgaacggcct gcagttcaac tactacaagc ccgctggcga 3301 cagcaccgca gaaagagaag ctatgatcga tgcagcgatc gctgacggct acaacgtagt 3361 cgtttgcccg ggattcgctt tcgcagaagc actggcaagc gcttccgtca cctatcccga 3421 cgttaagttc atcgctctgg acgtttccga gttcgacctg acttccgcag gcctgaccga 3481 gatccccgac aacctgttct ctgctgttta ccaggaagaa ctgtgcggct tcatggccgg 3541 ttatgcagct gtagctctcg gctacaccca cctgggttac ctgggcggca tggctgttcc 3601 ctccgtcgtt cgcttcggca acggctacat ccagggtgca gacctcgcag ctaaggaact 3661 gggcatcgat ggcgttacga tcgaatacgt ctatggcaac cagttcttcg gcgatgcaga 3721 catcacttcc tacatggata cttggtatca gacctctggc gtagaagtcg tcttcgcttg 3781 cggcggcggc atctggacct ccgcagctga ggcagctgcc aaggtcggcg gcaaggtcat 3841 cggcgtagac gtagaccagt ccaagaccat cgacgcttac ggtgaaggca tgaccgtcac 3901 ctccgctatg aagggtctga aggctaccgt caacacgctg ctcaccgaac tcgtactgaa 3961 cgacaactgg tccgcttatg gcggccaggt catgactctg ggtctcgttt ccggcaccga 4021 cgtcgaagcg aactacaccc agatcccgtt cgacaccacg cagtggtccg acagcttcac 4081 tcaggatgac tacgttgctc tcgttggcag aatgttctcc ggcgaaatca ccgtagacgg 4141 ttcccaggac gaattcgttc cttccaccat caccctgaac agatacgaca acatcaagta 4201 ataactggat aaaatcgcat caaaaatcaa aaggacgacc tttaaggccg tcctttttta 4261 tgttatcatt ttagtatcta tgtgaataca ggaggttgaa gccatggatg caccttatgc 4321 aatcgaaatg ctcaacatca cgaaacgatt tccgggcatc attgcaaatg ataa // LOCUS sequence046 4370 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence046 VERSION sequence046 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4370 /mol_type="genomic DNA" /organism="" /note="sequence046" CDS 740..1420 /product="cell division ATP-binding protein FtsE" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357393.1" /transl_table=11 /codon_start=1 /translation="MIIFDNITKRYGSKVALENATIHIDKGDFVFLVGPSGAGKSTFIK LILKEIEPDEGKLIVAGRDITHLSNREIPQLRRSLGVVFQDFRLLPNKTVFENVAFAME VLHHKPRVIKRQVPQVLDLMGIGEAADKFPDELSGGEQQRVAIARAIINNPKVLIADEP TGNLDKDTAWEIMQLLNQVNLRGTTVVMVTHAFDIVERMGKREVEIESGHIIRDTKGGI AADV" /locus_tag="LOCUS_2060" /gene="ftsE" /note="WP_003357393.1 cell division ATP-binding protein FtsE (Clostridium) [pid:58.7%, q_cov:98.2%, s_cov:97.8%, Eval:4.3e-71]" /note="MGA_270" CDS 1413..2306 /product="permease-like cell division protein FtsX" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003357632.1" /transl_table=11 /codon_start=1 /translation="MFKGLGYSLKQAVVQIFRNKGMTVASLFAITAMLLILGLFFFLTV NVNFITEEIKDQFDTIEVFLQDDQTEAQAEVIRNSLSQLQGVANVEYISKAQAMEEFKT RWGDNAYLLDGLASNPLPNSLRVTLENLEDGELVAEVSRSMSGVEDVRYYQTEVNKILR ISEGIQKGALVVIAFLIIVSVVVVSNTVKLTVMARQEEIRIMKYVGATNWFIRGPLLLE GMFIGLIAALIALGCTWAIYARLIAAIGQQAVILLSTSLVETNFMMINLTWIYIALGIS IGAFGSILSMRRFLQA" /locus_tag="LOCUS_2070" /gene="ftsX" /note="WP_003357632.1 permease-like cell division protein FtsX (Clostridium) [pid:34.5%, q_cov:98.0%, s_cov:97.6%, Eval:1.1e-41]" /note="MGA_271" CDS 2340..3521 /product="M23 family metallopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_018305385.1" /transl_table=11 /codon_start=1 /translation="MRREKLTKGKIRAKVALWSIVVAMAAAVFVTPFAAGAQTIEDYQN QLNQKNNQKEQVQNQLNQEKKNLEEVQAELNALDQKIYQSQKELNGLEADLNKTKEEIA VALEELEQLQKDIEKQNDDLNARLRSMYKNGDVGMLSVLFGSSSMSDFMTNMDMVERIY NADAELLAGLEDQYDVVEEQKNKLQALKDQLIVQQEAVAAKKASLEADRQEVDARRKEV EADVNTLSAQYDAVKKEADAISETIKVLQSANTQYIGGAMCWPSQASTRITSPFGWRYL SLLGGRNYHTGVDIGAAGGTNILAANSGTVIKAGWNNSYGYMVMVDHGGGIVTLYAHSS KLLVKTGDVVARGQAIALIGSTGMSTGNHLHFEVRVNGKYQNPLNYITPSVRN" /locus_tag="LOCUS_2080" /note="WP_018305385.1 M23 family metallopeptidase (Desulfitobacterium hafniense) [pid:33.9%, q_cov:95.9%, s_cov:98.9%, Eval:5.3e-56]" /note="MGA_272" ORIGIN 1 gacgggcagc ggcgtgaccc tcacagccct cgcccttgcc tgcgcgcttt cggaggagtg 61 ctccgtatgt tttgcggagg cggggaagcc ctacgtgttc gacgcctgcg gcatggcgaa 121 ggcctttctt ctgagcggct ttacggatta ttatcagctg ttcgcggacg gcaaaccgtt 181 tccaggaccc tccaacctct ggcgcggcgt ccattgggca gtccggccgg gttcgctccc 241 gcccctgcag ccggaactga acaccgcgga cgacatcctg cgctttgcgg aaaagctgcc 301 gggcagcgtc accgtactgg actgctccgg cctggaagac ctgctgctcg aaggcgtgct 361 ggcaggggcg gacaaagtct atctcgtcgt cgatccgctg cccggaaaac tgcttccggc 421 gtcgccccgc ctgcagcgtt tgcgctatgc gtttcctgcg gcggtgcccg tggtcaaccg 481 gatgaatccc ggcgtgcata aaagagaact cgacgcctac ctggggacat cttcctacct 541 ggccctgccg gacataggcg cggagacggt ctaccgtgcg gaatacgcct gcgcgctgcc 601 ctgggatatg cccgaaggca gaaaactgct cgcttcactg aaaaaacatg aataaaatga 661 cggcgcaatt tggccttcaa tagaatatat ggtataatta gatgttaaat tgtacctaaa 721 accacaagag gccagattag tgatcatatt cgataacatt accaagcggt acggatcgaa 781 ggtggccctg gaaaacgcta cgatacacat agacaaaggg gacttcgtgt ttctcgtagg 841 gccttccggc gcaggaaaat ccaccttcat taaactgatc ctgaaagaaa tagagccgga 901 cgaaggcaag ctgatcgttg cgggccggga cattacccat ctctccaacc gggagatccc 961 ccagctgaga agatcgctgg gcgtcgtgtt ccaggacttc cgcctgctgc ccaacaagac 1021 ggtattcgaa aacgtcgcct tcgccatgga ggtgctccat cataaacccc gcgtcatcaa 1081 acggcaggtg ccccaggtgc tggatctgat gggcatcggc gaagcggcgg ataaattccc 1141 ggacgagctg tccggcggcg agcagcagag agttgccatc gccagagcca tcatcaacaa 1201 tccgaaggtg ctcatcgcgg acgagcccac cggcaacctg gacaaagaca ccgcatggga 1261 gatcatgcag ctgctcaacc aggtcaacct gcggggcacc acggtggtca tggtcaccca 1321 cgcgttcgac atcgtggaaa ggatgggcaa gcgcgaggtg gagatcgaga gcggacatat 1381 catccgcgat accaaaggag ggatagctgc cgatgtttaa aggtttaggt tattccctca 1441 agcaggccgt cgtccagatc ttccgcaaca agggcatgac ggtcgcatcg ctgttcgcga 1501 tcacggccat gctgctcatt ctgggcctgt tcttcttcct gacggtcaac gtcaacttca 1561 tcacggagga gatcaaggac cagttcgata cgatcgaagt gttcctgcag gacgatcaga 1621 cggaagccca ggcggaagtc atccgcaaca gcctgtccca gctgcagggc gtggcaaacg 1681 tagaatacat ctcaaaagcc caggccatgg aggagttcaa gacccgttgg ggcgataacg 1741 cctacctgct ggacggcctg gcatccaatc cgctgcccaa ttctctgcgg gtcaccctgg 1801 agaatctgga ggacggcgaa ctggtggcgg aggtcagccg gtccatgtcc ggcgtcgaag 1861 acgtccgcta ctatcagacg gaagtcaaca agatcctgcg gatctcggag ggcatccaga 1921 agggcgctct cgtggtcatc gctttcctga tcatcgtctc cgtggtcgtc gtgtctaata 1981 cggtaaagct caccgttatg gcgcgtcagg aggagatccg catcatgaaa tacgtgggcg 2041 cgacgaactg gtttatccgg ggaccgctgc tgctggaagg tatgttcatt ggccttatcg 2101 cggcgctcat cgcgctgggc tgcacctggg cgatctatgc gcggctcata gcggccatcg 2161 gccagcaggc ggtcattctg ctgtccacca gtctcgtgga gacgaacttc atgatgatca 2221 acctcacatg gatctacatc gcgctgggca tcagcatcgg cgcgttcggc agcatcctgt 2281 ccatgagacg gttcctgcag gcatagtaaa gacacaaggg gaaaaaacag gggaattcca 2341 tgagaagaga gaaactgacg aaaggaaaga tacgggcgaa ggtcgctttg tggagcatcg 2401 tagtcgcgat ggctgccgct gttttcgtga ccccgttcgc agcgggggcg cagacgatcg 2461 aggactacca gaaccagctc aaccagaaga acaaccagaa agagcaggtg cagaaccagc 2521 tcaaccagga gaaaaagaac ctggaagagg tgcaggcgga gctgaacgcc ctggatcaga 2581 agatctatca gtcccagaag gaactcaacg gactggaagc ggatctcaac aaaacgaagg 2641 aagagatcgc agtcgctctg gaggaactgg agcagctgca gaaggatatc gaaaagcaga 2701 acgacgacct gaacgcgcgg ctgcgcagca tgtacaagaa cggcgacgtg ggtatgctct 2761 ccgttctgtt tggcagcagc tccatgtcgg atttcatgac gaacatggat atggtggagc 2821 gcatctacaa tgcagatgcg gaactgctgg cgggtctcga agaccagtac gatgtagtcg 2881 aggagcagaa gaacaaactg caggctctca aggaccagct catcgtgcag caggaagccg 2941 tcgcagcgaa gaaggcttct ctcgaagcgg accgtcagga agtcgacgcc cgcagaaaag 3001 aagtggaagc agacgtcaac acgctgtctg cgcagtacga tgccgtcaag aaagaagccg 3061 acgccatcag cgagaccatc aaggtgctgc agagcgccaa cacgcagtac atcggcggcg 3121 ccatgtgctg gccctcccag gcgagcacgc gcatcacgtc tcccttcggc tggcgttatc 3181 tgtcgctgct gggcggccgc aactaccaca ccggcgtgga catcggtgcg gcgggtggca 3241 caaacattct ggctgccaac tccggtacgg tcatcaaagc cggttggaac aactcctacg 3301 gctacatggt gatggtcgac cacggcggcg gcatcgtcac gctgtacgcg cactccagca 3361 agctgctggt aaagacgggc gacgtggtgg caagaggcca ggcgatcgcg ctcatcggct 3421 ccaccggcat gtccaccggc aatcacctgc attttgaggt acgggtcaac ggcaaatacc 3481 agaacccgct gaattacatt acgccatctg tacgcaatta atgagtacct ggatatacga 3541 acagacaaat acgacaccgg catggggacc cgaaggggtc cctgcttcgg ttatgggcat 3601 tttgcagcgc aggggcatcc gtacggcgga agaggctgag gatttcctcg cgccggcgcc 3661 gaaacggacc tacgatccgg aacttctgcc ggatctgcct gcggcggcgg acaaactgct 3721 gcaggcagcg gcggacggac tgtccatctg gatctacgga gactacgacg cggacggcgt 3781 aacggctacg gcgctgctct acaccgtgtt gcagaaactg acggaccggg tgaactttta 3841 cgttccttcg cggttcaccg acgggtacgg ccttaacaag gacgccgtgc ggcgcatcgc 3901 ggagaagggc gcgcagctgc tcgttaccgt ggactgcggc agcacgaacc gcgaggaagt 3961 ggcctacgcg aaagaactgg gcctggatgt gatcgttacg gatcaccacg aactggaggc 4021 gggtgcgatg ccggactgcc tgttggtgaa cgcccacagg gaggacagtc gctatccgtt 4081 cccggggctg tcgggctgcg gcgtcgcctt taagcttgcc caagccatcc agaggaggct 4141 gactgcagca ggcgatgaca ggtttacccg gcaggacatc acggatctgc tggatctggt 4201 agcgatctcc accgtggcgg acgtggtgcc tctgctggat gaaaaccgca gcctcgtcaa 4261 gtacggtctg cgggtcatca attcgagaaa gcgcagaggt ctgcgcatcc tgctcgacat 4321 ggtagggctc gaacgcaaag aggtggatgc ggacgacatc gggtttatcc // LOCUS sequence047 4236 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence047 VERSION sequence047 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4236 /mol_type="genomic DNA" /organism="" /note="sequence047" CDS complement(1929..2291) /product="ornithine aminomutase subunit alpha" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003434665.1" /transl_table=11 /codon_start=1 /translation="MKRADDFEERRKHIANLSDEELYNRFWELTAQVVDPLLELGYKNT TPSVERSVLLRMGISSLDTQKIVNGCMDHGLMGKGAGHCVYKLSKIENITIPEAGTKLA NGEGWDVVAAAFRGGK" /locus_tag="LOCUS_2090" /note="WP_003434665.1 ornithine aminomutase subunit alpha (Clostridioides difficile) [pid:62.7%, q_cov:98.3%, s_cov:95.2%, Eval:4.5e-38]" /note="MGA_275" CDS complement(2322..3734) /product="2-amino-4-oxopentanoate thiolase subunit OrtB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_032507361.1" /transl_table=11 /codon_start=1 /translation="MALAKDYASVMGRNNEIMKEAMGLDYDKFESGKMRFDYEGLMAST GYTLEEIEKVQSATGVGNTPILELRNLTALARKYAKPGYGATILAKDEAANPSGSFKAR RAACAVATAKKMGYKGVMAATSGNYGAAVASQAAMQGLKCIIVQECFDSHGVGQPEIIE KARKCEAYGAEVVQLTVGPELFYTFLSILEDTGYFNASLYSPYGIAGVETLGYEIAMQC REKYGKDPAVVVCTSAGGGMMTGTARGLIKAGATNTKCIAASIDLTGLHMASDTAFNKK SCTTGHTGFGVPYAVDPDHSDVPRSAARPLRYMERYVTVKQGDVMYITEALANLEGIER GPAGNTALAAAFSLAQELPADEYIIISETEYTGAGKHVQPQLAFARENGIEIKFGDPNA EDKPGVNIVLPKDPSYIKTVDMDLDHMRKSFIKKACKKYGTFDIDEDDIAFLAEEVNAT PEWVKGVVEDLK" /locus_tag="LOCUS_2100" /gene="ortB" /EC_number="2.3.1.263" /note="WP_032507361.1 2-amino-4-oxopentanoate thiolase subunit OrtB (Clostridioides difficile) [pid:69.3%, q_cov:98.5%, s_cov:97.7%, Eval:1.8e-181]" /note="MGA_276" CDS complement(3734..4033) /product="2-amino-4-oxopentanoate thiolase subunit OrtA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860811.1" /transl_table=11 /codon_start=1 /translation="MAKKGDWVRIHRVVLPAEGRNPNLPADTAKVPLEMWVKGTLCADA EIGDEVEVETATNRIEHGTLVEVNPYYTHSYGKFVPELIQIDRQLREILFGGEE" /locus_tag="LOCUS_2110" /gene="ortA" /EC_number="2.3.1.263" /note="WP_011860811.1 2-amino-4-oxopentanoate thiolase subunit OrtA (Clostridioides difficile) [pid:59.4%, q_cov:97.0%, s_cov:94.1%, Eval:4.6e-27]" /note="MGA_277" ORIGIN 1 ggacgtgccg aggtagatgc attcgatgcc ccacttctcg atgccgccgt gcttgatgtt 61 catgatctcg cgcataccga cggagtgttc gtcttcgccc acggtgccgc agatggcctt 121 catgtgcttg acttcctcga attcgtgata cagttccgcg tcggacatgt agtgaggttc 181 ttccgggatc tcgatctcgt tgatgtcgat atcgaaggcc agcttgccct tcagctcgat 241 gcgggtgcct tccgcttcct gcagcacttc gcgggagatg acttccggat cgatcagacc 301 cagcttcttg ccgatctcta cagcgacagc ttcggaaacg cgcttgttgg tcgggatgca 361 catggtcatc atgacgacgc cgtcgccgca ccattccatt tcgggcttga tggtgtggcc 421 gtctctgtac ttcgcgacct tttcgagacg tctgtctacg cagtcggtct cgtccagctc 481 gtcgatgtag acgatcttgg agcggtcttc gaacgtgcag ccgccgatga gggcggaggg 541 gttcttcggg tcgccgccgt actgctcgac gttgttgtag ccgtagtgag ccgtaacagg 601 agccatgtag tccggatctc tctcgaagat cttgccgacg cctacgccgc cttcgatctt 661 acgggcgata ccgtcgccgt ttctttcggg gtacttggcg gagtcaacga agaaaccttc 721 ctggactgcc ttgaagtagc cgccgacttc cacgatctct tccatgaaca gcagagctct 781 ttccttcagg tcgcgtacgg tcttgcgcag cgggccgttg ggatcgttgt tcagctggac 841 catctgcatc aggccgtcga gaccgatcag cgtctgcttc gcggtgtcgg tagcttcgat 901 gttgtagatg tgccagggaa cgtttctgcc ttcgtccggc gtgatggtgg actgaatgtc 961 cgcgctcgtg agcttggaga tgaacatgtt cattacgtgg gtaacggtcg cttctctcgc 1021 ggaggagtcg atgtacttcg tgttcatctg ggctctcatc ttatatctgc cgcacatctc 1081 tctcagggcg actgcgtacg gcaggtccat gtacatgcac ggagccggcg ttgcgctggg 1141 aggtacggtg gacagggaga tgttttcggg cttctcgccg accttttcgg agaacagcga 1201 gttgatggag tgctgaacga tcagctcggg catgaccttc caggcgtctc ttgcggtcgc 1261 gttcgcgttg tgcgcgccgt cgatctgcag catgtcggcc caggccatga tcttcttgga 1321 ttcgcaggcg tctacgaagg atcttaccat gttgacgtct ctgtacagaa cgttgtactg 1381 gggatcctgg tgcgcgccgt tgatgccttc ttcggcgaac atgaccgcga tgtcggggcc 1441 tgcgacgccg gagatgtaag agtgatagtt gatgggtctg ccgacttcat cctcgatcag 1501 gtccagggcc tttctctggg ctctgacctg ctttctggtg acggggatgc cgccgatacc 1561 ctgcggggta ccttccatca ggccgtcgat gtgggactgg cccatgtggc ggatgaccat 1621 cagatggtcc gcgccgtgcc atgcggccat tctcatacgg cggacgtcgt cctcgaatct 1681 gccggacgcg atctccgtcg tgatggtggg catgggctgg ggatccagac cgtcgaaata 1741 ttttgccggg ggaaggggca cgccctgctt caggggttcg gagatatcgt gatactcgaa 1801 cggtcccatg ttcttgtttt tcgcaggctt tctccaggtc cagcctcttc ttctgggttc 1861 gtacttgtcg aggtccttca gcagttcaac cacgtcaagc ttttcattgg gctttaaagg 1921 ttccatgctt atttacctcc tctgaacgct gcagctacga cgtcccagcc ttcgccgttg 1981 gcgagcttgg tgcctgcttc gggaatggtg atgttctcga tcttggacag cttatacacg 2041 cagtggcccg cgcccttgcc catcagaccg tgatccatgc agccgttgac gatcttctgc 2101 gtgtccaggg aagagatccc catgcgcagc agaacggaac gctccacgga aggtgtggtg 2161 ttcttgtagc ccagttccag aagaggatcc acgacctgcg cggtcagctc ccagaatctg 2221 ttatacagct cttcgtcgga aagattcgcg atatgctttc ttctttcctc gaaatcgtct 2281 gctcttttca tcctttttct ccttcaatct atgcctataa cttacttcag atcttcgact 2341 acgcccttga cccattccgg agtcgcattg acttcttcgg ccaggaacgc gatatcgtct 2401 tcatcgatgt cgaaggtgcc gtacttcttg caggccttct tgatgaagga ctttctcatg 2461 tgatccagat ccatgtccac agtcttgatg tagctgggat ccttgggcag aacgatgttg 2521 acgcccggct tgtcttcggc gttcggatcg ccgaacttga tctcgatgcc gttctctctt 2581 gcgaacgcga gctggggctg gacgtgcttg ccggcgccgg tgtactcggt ctcggagatg 2641 atgatgtatt cgtctgcggg cagttcctga gccagggaga acgcggctgc cagagcggtg 2701 ttgccggcgg ggcctctctc gatgccttcc aggttcgcca gagcttcggt gatgtacatg 2761 acgtcgccct gcttgacggt gacgtatctc tccatgtagc gcagaggtct tgcggcgctt 2821 ctgggtacgt cggagtgatc cgggtcaacg gcatagggaa cgccgaaacc ggtgtggccg 2881 gtggtgcagc tcttcttgtt gaaggccgta tcggatgcca tatgcagacc ggtgaggtcg 2941 atggatgccg cgatgcactt ggtgttggta gcgcctgcct tgatgaggcc tctggcggta 3001 ccggtcatca tgccgccgcc tgcggacgtg cagactacga ctgcgggatc cttgccgtac 3061 ttctctctgc actgcatggc gatctcgtaa ccgagggtct cgacgccggc aatgccgtag 3121 ggggagtaca gggacgcgtt gaagtatccg gtgtcttcca ggatggacag gaaggtgtag 3181 aacagttcgg gaccgacggt cagctgaacg acttcagcgc cgtaggcttc gcactttctg 3241 gccttctcga tgatctcggg ctggcctacg ccgtgggagt cgaagcattc ctgcacgatg 3301 atgcacttca gaccctgcat agcggcctgg gatgcgacgg ctgcgccgta gttgccggaa 3361 gtggcggcca taacgccctt gtagcccatc ttcttggcgg tagcgactgc gcaggcagct 3421 cttctggcct tgaaggaacc ggaggggttg gcggcctcat cctttgccag gatggtggcg 3481 ccgtaaccgg gcttggcgta ctttctcgcc agcgcggtga ggtttctgag ctccaggatc 3541 ggggtgttgc cgacgcctgt cgcggactgg accttctcga tctcctcgag cgtgtagccg 3601 gtggaggcca tcagtccttc gtagtcgaag cgcatcttgc cggattcgaa cttgtcgtaa 3661 tccagaccca tggcttcctt catgatctca ttgtttcttc ccattacgga agcgtagtct 3721 ttagccagtg ccattattct tcacctccga acaggatctc tctcagctgg cggtcgatct 3781 ggatgagttc cggaacgaac ttgccgtagc tgtgcgtgta ataggggttg acttccacga 3841 gggtgccgtg ttcgatgcgg ttggtggcgg tttcgacttc tacttcgtca ccgatctccg 3901 cgtctgcgca cagcgtgccc ttgacccaca tctcgagggg taccttggcg gtatctgcgg 3961 gcagattcgg gtttctgcct tctgcgggca gcaccactct gtggatgcgc acccaatcac 4021 ctttctttgc cattttattc tccttcatat tgggagcggt caccggaaaa ggtgaccgct 4081 tccaaaccat agtgctttcg ctttaaacta ctttacgatc ttcttctctt ctctgatgag 4141 gttgcggaag tcgcccatga tagctctggg aatgggcagg tcgatcatgg tcttcagacc 4201 tgcttctgcg ttgatgacca tggggatcat gttgac // LOCUS sequence048 4176 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence048 VERSION sequence048 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4176 /mol_type="genomic DNA" /organism="" /note="sequence048" CDS complement(224..1189) /product="ABC transporter substrate-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003732701.1" /transl_table=11 /codon_start=1 /translation="MNKKRIVSLLLALAMIFALAGCTSSEPAQPAEPSEPEASGSVITV TDMMGREITLDEPATRVVALSAADCEVLYAVGAGDALVGRGEYCDYPAEVLEVPSVQSG YDTNIEQIIALEPQVLLMSSMAQTEEQVAQLEEAGIKVVVSDAQDIEGVYTAVEMIGKL MGKEKEAEQVIIGMQVAFADLTNSTAGRGKTVYFEVSPLEYGLWTAGKGTFMNEIAEML GMKNIFDDVEGWAEISEEQVIERNPDYIVTITMYFGEGPTPVEEIMGRTGWENVTAVKN GAILNLVDNELSRPTPRLKDGAILLNNFVVEHERELAPAA" /locus_tag="LOCUS_2120" /note="WP_003732701.1 ABC transporter substrate-binding protein (Listeria monocytogenes) [pid:37.8%, q_cov:84.7%, s_cov:89.0%, Eval:2.3e-35]" /note="MGA_280" misc_feature complement(1442..>4176) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_013230386.1:chitobiase/beta-hexosaminidase C-terminal domain-containing protein" /note="WP_013230386.1 chitobiase/beta-hexosaminidase C-terminal domain-containing protein (Amycolatopsis mediterranei) [pid:31.2%, q_cov:16.6%, s_cov:22.1%, Eval:9.2e-10, partial hit]" /note="MGA_281" /locus_tag="LOCUS_2130" ORIGIN 1 cagatgacgc ggggcagccg ggatgccagg atgatggagg cggaagacgt ggacggcgcc 61 gcattgccct tcagggcgcc ggcaacgaga gagaccgttt cggaaaacgg aacgctcacg 121 ctgccgacag agacgcacag cacaaataca gccagcatca cgcaggcaaa cgccaggtaa 181 gccagcaggg aaaaagattc agttttccgt ccgctgcgcc ccattacgcg gcaggcgcga 241 gctctctctc gtgctccacg acgaagttgt tcagcaggat ggcgccgtcc ttcagacgcg 301 gcgtcggacg ggacagttcg ttatcgacca ggttgaggat ggcgccgttt ttcacggcgg 361 tcacattctc ccagcccgtg cggcccatga tctcttccac gggagtcggg ccctcgccaa 421 agtacatcgt gatggtgacg atatagtccg ggttgcgctc gatcacctgt tcttcagaga 481 tctccgccca gccttccacg tcgtcgaaga tgttcttcat gcccagcatc tcggcgatct 541 cgttcataaa ggtgcctttg ccggcggtcc agaggccgta ttccagcggg gagacctcga 601 aatagacggt cttgccccgg ccggcggtgc tgttggtaag gtccgcaaat gccacctgca 661 tgccgatgat cacctgctcc gcctcttttt ccttgcccat cagcttgccg atcatctcaa 721 cggcggtata gacgccctcg atgtcctgag cgtcggagac cacaactttg atgccggctt 781 cctccagctg cgcaacctgc tcttcggtct gcgccatgct gctcatcagc agcacctggg 841 gctccagagc gatgatctgc tcgatgttcg tgtcgtagcc ggactgcacg gagggcactt 901 ccagcacttc tgcgggataa tcgcagtatt cccctcttcc gaccagggcg tctccggcgc 961 cgacggcgta cagaacttcg cagtccgccg cagacagcgc gacgacgcgg gtggcgggtt 1021 cgtccagggt gatctcccgg cccatcatgt cggtgacggt gataacgctg ccggaggctt 1081 ccggttcgga aggttcggcg ggctgcgccg gttcggaaga cgtgcagccg gcaagagcga 1141 agatcatcgc cagcgcgagc agcagggaaa cgattctttt cttgttcata tcggttcagt 1201 cctttctttt atctcacagc cttcgaggct gttttgcgca ttacgtttta ttataccata 1261 atgggcaagg ggagatagta tttagaaaaa cttctaaata gaaagcgagc agcacatcga 1321 agacgaggta ttcgacgata tcgcagcatt cattcaaaac aacaaataaa caacgagaag 1381 gaggcgtccg gatggacgtc tccttcgttt atgggcatta tccgctgctt ctgtctgtat 1441 tctattccgc ttcgaaagcg atgtacagga acgtgatgat ctgacccctc aggcaggtca 1501 tatccgggct gaatgccgtt tcgctcgtcc ctgctgtaat gccgttctca taggcgcagg 1561 cgacagcttc cgcgaaatag tcgccttcgt ttacatcatc gaagggctcg ctgcctgcag 1621 cgggtctgcc tgccatatta tacaggaacg tgaccgcctg cgccctggtg acgggctgct 1681 ccgatccgaa tctgtctgcg ctgacgcctg cggtgattcc ctgctcataa gcccatagga 1741 cagccttata gaaataatct ccttccgtca cgtccgtaaa cggattttcc gttccttccg 1801 gctcaggaga gccggaggcg atccacagga aggtgacgat ctgcgcccgg gtcgcagatt 1861 ccatcgggct gaaggtcttc ggggacgttc ctcctgtgat gtcgtttttc agcgcccact 1921 ccacagcttt gcggaaatac gcatcagcag gaacatccgt gaacgggaaa tcatccggag 1981 aagactgctt ttcgatcttt tcgaatacgg cttcgatctc gaccgctgac gaaggcatcg 2041 taaaactgta cttatcgccg gtcttgctga cctcgatctc attgccgtac ttgtccctga 2101 tcgtcagccg gctcacttca taaccttcgt ccggcgtaca ggagaccgtg acggtatccc 2161 ctgccgatgc atgtttcggg aaagcagaaa tctctccgtt ttcactcgtc tgcggtttta 2221 ctgtgtgggt ctttctctcg cgcggcgcgc tttcctgcgg ttcttctgct ttggtatata 2281 cagcttctgc gataccactg tccttgaaac cgtcgaggat cgcaatagcc ttcagcgtca 2341 ccgtttcttc gatcgtaatg acactgccgg gcatataaat gccgctgtcc tttgtcggat 2401 ccgagccatc caatgtatag cggatcgccg cgcctgtggt cgcgcaggag atcgtaacat 2461 ccagtttatc gcggaaagtc tgcgagcctt cgctcagaac cggcaaagcg actgtttcaa 2521 ctgtttcgcc tgctttcacg atcgtgagcg tgccgatgga cagtcccttc gcagccgtat 2581 aattgccgcc ttccgctacg tcgaagctca cctcgtattc gccagcctcc gtatgtcctg 2641 ccggatcata ctgcacgctt actgcaccca tgcccgttct ggcgcttacc ggcgcctgta 2701 cttcgatggg ctgacccgta taatcccggg aacccggcgg ggtgatcgta aagtcagcct 2761 ccgttgggac agctttctgc agggaccaga cagcagttgc cgtaccggta taaacacctg 2821 ttccgctgat ctcgagcatg gtgtctccga cgtctgtcgc cgtgccgccg ctgctgatct 2881 cataatcgac gaacgcagca ccatccaacg tcaccagatc gatgacgacg ctttgctccg 2941 ttccgttata aacattctga gttcccagtg tgatgaccgc gccggaaata tccttcggcg 3001 gagcgccgtt taccttgacc gcgatagttt cttctctgcc gttatgattc gtactgtccg 3061 cgatcgtcac ggtgaccgtg acagtaccgc cgtatgctcc agcggtgaat atgcctgtcg 3121 tttcattcac actgcagtcc aaagcgttgc catcgatggc ataggtcaca gttccctgcg 3181 caccgctgac attgccggac aggtctaccg acgcgccagc ctcgacggag gcggtaccgt 3241 tgaccaccgc aggatcttcg atcttgttga tcgtgagctg tccaaagacg atatcggaag 3301 cagctttata gttctggctt tccgccacgt caaaggaaac ggcgtacctg ccggcatcgg 3361 tgtgaccttc cggcgtatag cgaagggtca ctgcgccgat cccggaatgc ttcgcaacag 3421 gagcggtcac atctaccgga tcgccggtat aattcgcaga acctggcgac acagttataa 3481 aatcgcttct caccggaata gctttctgca acgaccagac aatgcttttc gtccccgtgc 3541 agaaaccggt tcctgcgatc gtcagcgtag tcgcttcaac atccgtcgca gtctcgcctg 3601 caatgatctc gtattccacg attggcacgc cgttcagcgt gaccgaatcg atgacgacgc 3661 tctgcgctgt cccgtcatag accttctgcg tacccaaatt gatgaccgca gcggagagat 3721 ccttcagacc cgtatccctg agcagcggac ggtcggcatt catggcccag acgtctgtga 3781 agtcccattg aacaaagctg ctttccgcca tgaactcctg caggctcagg gcttccgcaa 3841 catcgggagg atcctgatcc atcgacaaaa aagtgggtga ataaggtcga ccgatgcccc 3901 aatcatccgc ctgcgaattc gggaagactg tcccttccag atagtagcaa tgctccaccc 3961 cgacggagga agtaacggca cctggcagag agcccactac gccgccggtc agatactgcg 4021 atccgctctt gatcttcccg ttgtaatgat agcaattccg gacagcgccg ttgctcatta 4081 ggccgaaggc tgcaattccg gcaacaccgc ctacagcctc tgtgctgctg ctcacgtcgc 4141 cttcgtgcag acagttctgc ataagagccg aaacga // LOCUS sequence049 4075 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence049 VERSION sequence049 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4075 /mol_type="genomic DNA" /organism="" /note="sequence049" CDS complement(745..3225) /product="ribonucleoside triphosphate reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002678883.1" /transl_table=11 /codon_start=1 /translation="MYHVVKRDGKVAEFNIRKISDAITKAFEAQGRQYHPSTIDMLALR VTSEFEPLIQDDQIQVEQIQDCVEKVLSEAGYADVAKAYILYRKQREKIRNVNSALLYY KDIVDNYLKINDWRVKENSTVTYSVGGLILSNSGAITANYWLSEVYDQEIAEAHRSAAI HIHDLSMLTGYCAGWSLKQLIQEGLGGIPGKITSAPAAHLSTLCNQMVNFLGIMQNEWA GAQAFSSFDTYLAPFVRVDNLSQKEVKQCIQSFIYGVNTPSRWGTQAPFTNVTIDWTVP NDLKNLPAIVGGKEMNFTYGDCQKEMDMVNKAFIEIMIEGDANGRGFQYPIPTYSITKD FSWEETENNKLLFEMTAKYGTPYFSNYINSDMEPSDVRSMCCRLRLDLRELRKKSGGFF GSGESTGSVGVVTINLPRIAYLAENEEDFYARLDHLMDIAARSLKTKRTVISRLLDNGL YPYTKRYLGTFNNHFSTIGLIGMNEVGLNAKWLRADMTSPKTQKFAVDVLNHMRERLSD YQEQYGDLYNLEATPAESTTYRFAKHDKERYPDIITANENGTPYYTNSSHLPVGYTEDV FSALDIQDDLQTLYTSGTVFHAFLGEKLPDWKAAASLVRKIAENYKLPYYTMSPTYSVC KDHGYLSGEHFTCPICGQKTEVYSRITGYYRPVQNWNDGKTQEFKDRKTYVISRSHLTH TGPLARPMYMEEAAPAVEEPALKAVEPVSEAPAPAPAEPVTPAESAVHPAQMENILFTT PTCPNCKMAAALLDKAGIPYTKLFAEKNPDLVEKYGIKQAPTLVISADSADFLKFRGVS DIRGYLGELAKKNA" /locus_tag="LOCUS_2140" /EC_number="1.17.4.2" /note="WP_002678883.1 ribonucleoside triphosphate reductase (Treponema denticola) [pid:59.5%, q_cov:79.1%, s_cov:92.2%, Eval:7.2e-232]" /note="MGA_283" ORIGIN 1 atccgcctcg atgccggtgg cgttgtcgat ggccgtaacc gcgcagatct tgccgccctc 61 ggtcttgatg ccggtgatct tcatgtccac gtgcttctcc acgttgtcgt gggcgaacag 121 cacgtcctgc agccgggatt cgccggtaaa gtacggcaga tcctgcagca tgattacctt 181 ctcgcacttg cccgccagca ggatcgcctc ctgcagcgcg gaattgccgc cgcctgccat 241 gcagacggtc ttgcctttat agaagtcgcc gtcgcagacc gcgcagaacg agatgccctc 301 gcccaccagg tcctcttcgc cttccagtcc cagcatgcgg tgcttgaccc ccagagccag 361 gatgacggac cgtccctcga aatccccgcc gtactcggtg tggactttcc aggcgggagc 421 gccgtccgct tcgaagggct cgatgccggt cacccgctcc agctccagtt ccgcgccctg 481 ggccatcacc tggtccatga atttatccgc aaattcgttg ccggacaggc tggcaaagcc 541 ggggatgttt tccaccttcg gggatgaggt gatctgcccg ccgatggtgc ctttttcgat 601 gacaagggcc gatttgccgt tgcgctgcgc gtaaagggcc gcggtaagtc ccgcgggccc 661 tgcgccgacg ataatcacat cgtacatatt ctctgtttct cccgatcgtc taactgcgat 721 cgactcgtta tctatgcgtt ttcgttatgc gttcttctta gccagttctc ccaggtagcc 781 ccggatgtcg gacacgccgc ggaacttcag gaagtctgcg gaatccgcgc tgatgaccag 841 ggtcggagcc tgtttgatgc cgtatttctc taccagatcc gggttcttct ccgcgaacag 901 cttggtgtag gggatgccgg ccttatccag cagagccgct gccatcttgc agttcgggca 961 ggtgggcgtg gtgaacagga tgttctccat ctgtgcggga tggaccgcgg attctgccgg 1021 ggtcacaggc tcggccggag ccggagccgg tgcttcgctc accggttcca ccgccttcag 1081 agcgggttct tccactgcag gcgcagcctc ttccatatac atcggtcttg cgagaggacc 1141 ggtgtgggtc aggtgagagc ggctgatgac gtaggtcttt ctatccttaa actcctgggt 1201 cttgccatcg ttccagttct ggaccgggcg gtagtatccg gtgatgcggc tgtagacttc 1261 ggtcttctgg ccgcagatcg ggcaggtgaa gtgttcgccg gacagataac cgtggtcttt 1321 gcagacggag taggtcgggc tcatggtgta atacggcagc ttgtaattct ctgcgatctt 1381 ccggacgagg cttgccgcgg ctttccagtc gggcagcttt tcgccgagga acgcgtggaa 1441 cacggtgccg gaggtgtaca gggtctgcag atcgtcctgg atatccagcg cggagaagac 1501 gtcctcggtg taacctacgg gcaggtggga ggagttggtg tagtaaggcg tgccgttctc 1561 gttggccgtg atgatatccg gatatctttc cttatcgtgc ttcgcgaagc ggtaggtggt 1621 ggattctgcc ggggtcgctt ccaggttgta caggtcgccg tactgctcct ggtagtcgga 1681 caggcgctct ctcatgtggt tgagcacatc cacggcgaac ttctgggtct tgggcgaggt 1741 catgtcggcc cgcagccact tggcgttgag gcccacttcg ttcatgccga tgaggccgat 1801 ggtggagaag tggttgttga aggtgcccag ataccgcttg gtgtagggat acaggccgtt 1861 gtccagcagg cggctgatga cggtccgctt ggtcttcagg gatctggcgg cgatgtccat 1921 caggtggtcc agccgcgcgt agaagtcctc ttcgttctcc gccaggtagg cgatgcgggg 1981 caggttgatg gtaacgacgc ccacggaacc ggtggattcg ccgcttccga agaagccgcc 2041 ggacttttta cgcagttcgc gcaggtccag acgcagtctg cagcacatgg agcgcacgtc 2101 ggagggctcc atgtcggagt tgatgtagtt ggagaagtac ggggtgccgt acttggcggt 2161 catctcgaac agcagcttgt tgttctcggt ctcttcccag ctgaaatcct tggtgatgga 2221 ataggtcggg atggggtact ggaagccgcg gccgttggcg tcgccttcga tcatgatctc 2281 gatgaaggcc ttgttgacca tgtccatttc cttctggcag tcgccgtagg tgaagttcat 2341 ctccttgccg cctacgatcg cggggagatt cttcaaatcg ttgggcacgg tccagtcgat 2401 ggtaacgttg gtgaagggtg cctgagtgcc ccatctggac ggggtgttga cgccgtagat 2461 aaagctctgg atgcactgct tgacttcctt ctgggacagg ttatccactc tgacgaaggg 2521 agccaggtag gtgtcgaagg agctgaacgc ctgggcgccg gcccattcgt tctgcatgat 2581 gcccaggaag ttgaccatct ggttgcacag cgtggagagg tgggcagcgg gggctgaggt 2641 gatcttcccc gggatgccgc cgagaccttc ctggatgagc tgctttaagg accagcctgc 2701 gcagtagccc gtcagcatgg acaggtcgtg gatgtggatc gcagcggagc ggtgcgcttc 2761 cgcgatctcc tggtcgtaga cttcggacag ccagtaattt gccgtaatgg cgccggaatt 2821 ggacaggatg agaccgccga cggaatacgt aacggtggag ttttccttta cgcgccagtc 2881 gttgatcttc agatagttat cgacgatgtc cttgtagtag agcagtgcgg aattgacgtt 2941 gcggatcttc tctctctgct ttctgtacag gatgtaggcc ttggcgacgt ccgcatagcc 3001 ggcttcggac agcacctttt cgacgcagtc ctggatctgt tccacctgga tctgatcgtc 3061 ctggatgagg ggctcaaact cagatgtgac ccgcagagcc agcatgtcga tggtgctggg 3121 atgatactgt cttccctgcg cttcgaatgc tttcgtgatg gcgtcgctga tcttgcggat 3181 gttgaattca gcgacttttc cgtccctttt tacgacatga tacataactt tcacctcatt 3241 tatattaaag atacacggtt ggtttaaaca ccgaaaaaac gggagtattc ccgtcgatat 3301 ataatgtacc ctatcggggc ttcgatgtca atatatagtg gtatgctcga accgtgcata 3361 ctaaatatcg ggcattccgc agaatgcccg attttcaagt ctttcgccgt atttcgcttt 3421 tttgcaaggg gtttttgatc gatttttttt tatgattctg ccgcaaaaag atgttgaacg 3481 gctgttcaag atccttcctc agtgctggac atctgttgga cagaatgcga tataataaaa 3541 gcatatatag gatcaaatcg aacctcaaaa ttttttaccc atgcagtttg taaacgccgg 3601 tgcggatgga tgcgatcacg ccgccgtcga tcagaagatc ggtgccggtg atgaatttcg 3661 cgtgctcccc caacaggaac gcgccggctt ccgcgatctc gtcatcgcct cgatgctgta 3721 tgtctccggc gggatctgtc cgtatccgtg ggagaaggcc atgcagccca tgcccacttc 3781 ggatacttca atatcccgca gcagtctctt cttcaatgga tccacctccg tacgttctta 3841 tccgatcagt ccgttcgcct tcagccagcg ctcgacgctg gacttggaat tcgccgcctg 3901 gctgccggtg atgggcaggc cttttttcag atctgcgttc gggcaggtct tctggatctc 3961 ccgttcgctg ccgcccatgc cgctgccttc gttggtgcac aggggcagga tcgtcttgcc 4021 ggagaaatcg aagtgctcca ggaacgtata gacggccatc ggcatcgtgc cccag // LOCUS sequence050 4067 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence050 VERSION sequence050 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4067 /mol_type="genomic DNA" /organism="" /note="sequence050" CDS complement(194..2479) /product="cation:proton antiporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005786012.1" /transl_table=11 /codon_start=1 /translation="MHLPALITDLAVILLTAGVVTVIFKKINQPLILGYILSGFLIGPY LPYFFTAQDTASIETWSEIGIIVLMFCLGLEFSFKKLMSVGAGAVITATTVVAGMLSVG YLTGLALGWGHMDAIFLGGMLSMSSTTIIIKAFSELGVEKEDFAQLVFGILVVEDIAGI FMMIILSTISVSKNISGGDLALQLFQLVLYLIIWLVLGIYFLPSIMRKATKLMTDETLL IVSLGICFGMVLLADKLGFSSALGAFLAGSLLAGTIHAERVEHITSGIKDLFGTVFFIS VGMMIDPAMIVRYKLPILIISLVVVFGQSICSTVGVLLSGHGLKFAVHCGTSLAQIGEF AFIIASLGESLGVIANYIYPIIVSVSVLTTLTTPYCIKGADKVYHLLQRVLPGKLVARI DREETAESVAKEGSEWMTYLKRYIRITAVYGILMLACTVVGHYLLLPLLLRLPISSRMA RILCLILVYLAMAMFIRPFMDTHSFAYTKLWVEGGMTRAGLTVLTGIRILLLVLIAFIP LRRVAGASGLFLLPLVAGGLLLLSRSGWLASLYLNAEARFMANFNERNLEENDALSISD MLDERLHVSHFTVFPGYHISGKSLKELGWGKRYDVNIIKLVRGSEHLNMPDGDAVLQDG DDIYVIGEADNIATLYNRLGGWEQPAQQTLREYMESEETETSDLYSFPILVDKNSGLAG KTIRDCGLRRDYDCMILGLQRSRLPIPTPDVHTVIAAGDSIWVLGTQAMADKLIDAQIV SRKTAKAH" /locus_tag="LOCUS_2150" /note="WP_005786012.1 cation:proton antiporter (Bacteroides fragilis) [pid:38.5%, q_cov:98.0%, s_cov:98.5%, Eval:4.9e-150]" /note="MGA_286" CDS complement(2581..3084) /product="DUF1836 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002357951.1" /transl_table=11 /codon_start=1 /translation="MDHRQADSFHIPRWEELPAVDLYMEQVITLIHSNLGAFFEQVGIQ PITKNMINNYVKAKIVQAPVNKRYPRISVAMIIVVYILKSCYETEDVGKLIRMGVDLEA GVPLTYNRFCDAIENAVKAVFSGEVHIKEEQIPGRERKYLMENFALSFASKYYVQMNFL NNEE" /locus_tag="LOCUS_2160" /note="WP_002357951.1 DUF1836 domain-containing protein (Enterococcus) [pid:34.8%, q_cov:92.2%, s_cov:82.5%, Eval:1.5e-17]" /note="MGA_287" ORIGIN 1 atcgtcggcg gatacaccga cggcacctat cgtccggaga atctcgtgac ccgcgcagaa 61 gcatctgtct tcgttcacaa catcctcaac gcgatcgcag aataaaacac aaggggacag 121 gtacattgtg ccgtcccaat ggaaaaggac cggccttgcg ccggtccttt tatcgtacct 181 gtttattatg ccgttaatgc gcttttgccg tcttgcggct tacgatctgc gcatcgatca 241 gtttgtctgc cattgcctgc gtacccagga cccaaatgga atcgcccgct gcgatcacgg 301 tgtgcacgtc cggtgtaggg atgggcaggc ggctgcgctg caggcctaag atcatgcagt 361 cgtagtccct gcggaggccg cagtcccgga tggtctttcc tgccagtccg gagttcttgt 421 ctacgaggat ggggaaggag tagaggtccg aagtctctgt ctcttccgat tccatgtatt 481 cccgcagggt ctgctgtgca ggctgttccc agcctccgag acggttgtag agcgttgcga 541 tattatcggc ctccccgatc acatagatgt cgtcgccatc ctgcaatacg gcgtcgccgt 601 ccggcatgtt cagatgttcg ctgccgcgga ccagcttgat gatattgacg tcgtaacgtt 661 ttccccagcc gagttctttc agggacttcc ccgaaatgtg atatcccgga aagaccgtaa 721 aatggctcac gtggaggcgc tcatccagca tgtcggatat gcttagggca tcgttttctt 781 ccaggttcct ttcgttgaaa ttggccataa agcgcgcttc cgcattcaga tagagactgg 841 ccagccagcc ggaacgggag aggagaagca gtccgccggc tacgagcggc agcaggaaca 901 gccccgatgc cccggctact ctgcgcagcg ggataaaggc gatcagcacc agcagcagaa 961 tgcggatgcc ggtgagcacc gtgaggcctg cccgggtcat gccgccttcc acccataact 1021 ttgtgtaggc gaaggaatgg gtgtccataa agggacggat aaacatggcc atggccagat 1081 agacgaggat caggcagagg atgcgcgcca ttctggacga gatcggcaga cgcaggagca 1141 ggggaaggag cagataatgg ccgacgacgg tgcaggccag catcaggatg ccgtagaccg 1201 ccgtaatgcg aatataccgt tttagatagg tcatccactc gctgccttcc tttgctacgc 1261 tttccgccgt ctcttcccgg tcgatgcggg cgaccagttt gccgggcaga acgcgctgca 1321 gcaggtggta gaccttgtcc gcccctttga tgcagtaggg cgtcgtaagg gtcgtgagga 1381 cggagacgga tacgatgatg ggatagatat agttggcgat gacccccaga gattctccca 1441 aagatgcgat gatgaaggcg aattcaccga tctgcgccaa agacgtgccg cagtggacgg 1501 cgaatttcag cccgtgaccc gagagcagca cgccgacggt agagcagatc gactgcccga 1561 aaacgaccac cagactgatg atgaggatgg gaagcttata ccggacgatc atggccgggt 1621 cgatcatcat tcccacggag ataaagaaga ccgtgccgaa caggtccttg atgccggagg 1681 tgatgtgctc cacccgttcc gcatggatcg tgcccgcaag aagagatcct gcgaggaatg 1741 cgccgagagc ggaggaaaaa cccagtttgt ccgccagcag caccatgccg aagcagatgc 1801 ctaaagagac gatcagcagc gtctcgtccg tcatgagttt cgtggccttc cgcatgatgg 1861 aaggaagaaa atagatcccc aggaccagcc agatgatgag atagagcacc aactggaaca 1921 gctgcagcgc cagatcgccg ccggagatgt tcttcgagac ggaaatggtg gacaggatga 1981 tcatcataaa aatgcccgcg atatcctcta cgacgaggat gccgaacacc aattgcgcaa 2041 agtcttcctt ttccaccccc aattcggaaa aggctttgat gatgatggtc gtggagctca 2101 tggaaagcat gccgcccagg aaaatggcat ccatgtggcc ccatccaagg gcaagccccg 2161 taagatatcc aacgctcagc atgcccgcca ccaccgtcgt cgccgtgatg acagccccgg 2221 ccccgacgct catcagcttc ttaaagctga attccagacc caggcagaac atcaggacga 2281 tgatgccgat ctcgctccag gtctcgatgg aagccgtatc ctgcgccgta aagaagtagg 2341 gaaggtaggg accgatcaga aaacccgaca ggatgtagcc caggatgagg ggctggttga 2401 tctttttaaa gatgaccgtg acgacgcctg ccgtgagcag gatgaccgcc aggtctgtaa 2461 tgagtgcggg taagtgcatg attttctcct atcaacaaat ctctaacact tttattatat 2521 caaaaaaaga accccgcata gggacaatcg cggccctatg cggggaaaaa gacattcttt 2581 ctactcttcg ttgttgagaa agttcatctg cacgtaatac ttgctggcga aggagagggc 2641 gaagttctcc atcaggtatt tgcgctcccg gccggggatc tgctcctcct tgatgtggac 2701 ttctccggaa aacacggcct ttaccgcgtt ttcgatggcg tcacagaagc ggttgtaggt 2761 gagcggcacg cccgcctcca gatccacgcc catgcggatg agcttgccca cgtcctcggt 2821 ctcgtagcag cttttcagga tgtaaactac gatgatcatg gcgacggaga tccggggata 2881 gcgcttgttg accggcgcct ggacgatctt cgccttgacg tagttgttga tcatgttctt 2941 cgtgatgggc tggatgccca cctgttcgaa gaacgccccc agattggaat ggataagggt 3001 gatgacctgc tccatgtaga ggtctacggc ggggagctct tcccagcggg ggatatgaaa 3061 actgtctgcc tgtctgtggt ccatgacgtt cctcctaaga gataattcag tatagcatga 3121 agatagtttt gagtaaaggt tgacatggcg aaaaatacaa agtaatatag tattcgatac 3181 tatattgata tttatagtac aatgccgata ttataggttc atcaaaaaat aaaaggagca 3241 actcaatgat ctatacccag aaaggcctgg attgggcgct gaacttcatc gattccatca 3301 acgcggatcc gagcaaatac gttatctaca aacagagccg tcccattgca aatctgaagc 3361 atatgatggt gactaccaca gatctgtatc ccaacaatac ggcttttatg atgaaattcc 3421 ccggaacgaa ggaatatgaa tccatctcct tcacgagagt gctggaagag atgaatgccc 3481 tgggaaccgc tctgatcgcc aaaggcctga agggtaagcg catcgccgtc tgcggtgaaa 3541 actgctatta ttggtgcctg tcctatctgg cagcggtctg cggcgtgggc gtcgtcgttc 3601 ctttggataa ggaactgccc gacggcgatc tgaagggcct cgccaccgca gcggaagtcg 3661 cttgcgtctt tacgacgaag aagcatcagc ccatgttcga ggagatgctg aagaatcacg 3721 aaggcagcat ggaatatgtc gtcggcatgt acacgaagcc ggaagaagct ggcgatgtcc 3781 tctctctgga agcgctcatc gaagagggcc ggaaactgat cgccgcaggc gagacttcct 3841 atatcaacgc ccagatcgac gaagaagcca tgggcatcct gctgtacacc tccggcacca 3901 cgggcctttc caagggcgtt atgctctccc ataagaacat ctgcgctgac ctgatgagcg 3961 cccccaacct gctggaagtt ttgccgatgg accggttctt caacgtgctg ccgctgcacc 4021 acacctacgc ctgcacctgc gacttcctgg tgcccatgta caagggc // LOCUS sequence051 4062 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence051 VERSION sequence051 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4062 /mol_type="genomic DNA" /organism="" /note="sequence051" misc_feature complement(369..>4062) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012048356.1:DNA-directed RNA polymerase subunit beta'" /note="WP_012048356.1 DNA-directed RNA polymerase subunit beta' (Clostridium botulinum) [pid:66.5%, q_cov:95.9%, s_cov:98.0%, Eval:0.0e+00]" /note="MGA_290" /locus_tag="LOCUS_2170" ORIGIN 1 accgggaatg taagcggtaa cttccagacc gttggtgagg cgaacacggg cgacctttct 61 cagtgcagag ttcggcttct tcggagttac tgtcttaacg gaagtgcaaa cgcctctctt 121 ctggggtgcc ttcgtatcgg taggcactct cttgatgctg ttcatgctct tcagcagcgc 181 gggagagtta gacttctttt cggacatcgt ccggccctgt cttaccagtt ggttaatggt 241 aggcattcaa tttctccttt ctttcagatt ttttatattg acccgcccgc acgcgggcgt 301 gcgggcagag atcaacagca caacagagat agtgtaccat agcgtaagcc ttgatgtcaa 361 aggcttttct agagttcttc ctcagggatc tcctcttcgg catccatctc ttcttcgggc 421 aggatctcct cgtcgatcgc ggggtcatcc attgcctcgt cgtcgaagaa accgcgggat 481 tcttcttccg cgtattcctc tttgacttcc ttcgtgttga aggattccat gtattcggta 541 tttacgccgt agtcgatctc gatgttcttg tactgcttca tacccgtacc ggcggggatg 601 agcttaccga tgatgacgtt ctccttcagg cccagcagtc tgtcgcgctt gcccttgatg 661 gcagcgtcgg tgaggactct ggtggtttcc tggaaggatg cggcggacag gaaggagttc 721 gtcgccagag acgccttggt gataccgagg agctctctct tgtaaacggc aggttcctgt 781 ccttcttcca gcgcattgtt ctcgtcttcg atctcgaaga ggttgtacag cgcgccgggc 841 agcaggtggg tgtcgcccgc gtcgtcgatg cggtacttgg acagcatctg ggacacgatg 901 acttcgatgt gcttatcgtt gatgtctaca ccctgctgct tgtacactct ctgaacttcc 961 ttcaggaggt actggtaaac gccttcaaca ccgttgaggc gcatgatgtc gtgcgggttg 1021 agcgggccct gggtgatgcc ttcgccggcg tggaccacgc tgccttcggc taccttcagg 1081 cgggcgccgt aaggaatgat ataggttctt tcctcttcgc cccgtacgcg gacctcggtc 1141 ttgttatcgg gccgcggctc gatggagacg acggtgccgt cctgttcgca gatctccgcg 1201 atacccttcg gcttacgggc ttcgaaaagt tcttcgactc tcggaagacc ctgggtgatg 1261 tcgtttcctg cgacggatac gccgccggtg tggaacgttc tcatggtcag ctgcgtaccg 1321 ggttcgccga tggactgggc tgcgatgata ccgaccgctt cgccgatatt cacgtgggag 1381 cccgtcgcca ggttgcggcc gtagcaggct gcgcagatgc cggtcttgct cttgcaggtc 1441 atgaccgaac ggatcttgac ggcttcgatg ccggcgtctt cgatggcctg tgcctgcgct 1501 tcggtgatct cgtcgccgcc ttcgacgatg agttcgcccg tcttgggatc tgcgatatct 1561 tccaacgccg ttctgcctac gatacgcagg cgcagcgctt cgatgacttc cttgccgtcg 1621 gtgaaggctc tgacttcgat gccttcgtcg gtgccgcagt cgttctcacg gacgatgacg 1681 ttgtgggaaa cgtctacgag acgtctggtg aggtaaccgg agtctgcggt acgcagagcg 1741 gtatcggcca gaccctttct ggcgccgttg gcggagatga agtattccat gaccgtcaga 1801 ccttcgcgga agttcgcggt gataggaatt tcgatggtct taccggcagc gttgcccatc 1861 agaccgcgca tgccgccgat ctgacggatc tggttcttgg aaccacgggc gccggagtct 1921 gccatgatga acaggttgtt gtccgcctgc agggaatcca tcagggcgtc tgccacgtcg 1981 tcggtggcct tgtgccagat ctggatgacg ttctcgtagc gctcgttgtt gctcatgagg 2041 ccgcgtctgt agaacgcttc gtacttgtcg accttggcct gggccgcgtc gatgatctcc 2101 tgcttgttct cgggcatgac catgtcgccg atggagatgg tgatggcagc cttcgtggaa 2161 tatttaaagc cggtgctctt gatgtggtcg agcatcttgg ccgtttcggt gttgccgtga 2221 gcccggaagc acttgtcgat gatccgggtg aggtccttct tgcggcagag gaagccgatc 2281 tccagggagt acggatcctt gctgcggtcg atgaacccca gatcctgggg gatctgctcg 2341 ttgaagataa agcgtccgac ggtggattcc accaggcggc cttccttatc ttcgggtccg 2401 aggtacatgc gcaccttgat cttcgcgtgg atcgcgatgg cgccggtctg gtaggccatg 2461 agcatttcgg catagtcggt aaagaccttg ccgtcgccct tttcggggac tctctcgtag 2521 ccgtccgccc ggttcttttc ctcgtccttg aactcgtcga tgcgctcaac gatcttgccg 2581 tcctcatccg tcttggcgca tacgccgggg tgagtcaggt aataggagcc gaggatcatg 2641 tcctgggtcg gcgtcgtgat gggggagccg tccttgggtg ccaggatgtt gttgacggac 2701 atcatcagga atctggcttc ggcctgtgcc tctacggaga gaggtacgtg gaccgccatc 2761 tggtcgccgt cgaagtctgc gttgtaagcg gtgcagacca gcggatgcag cttgatggcc 2821 ttgccttcga ccaggaccgg ttcgaaggcc tggatgccca gtctgtgcag cgtcggggcg 2881 cggttgagga ggacgggatg atcctggatg acgtcatcca gcacgtccca gacttccggg 2941 cgcacctttt cgaccattct cttggcgctc ttgatgttgt gtgcgaggcc gcggatgacc 3001 agttccttca tgatgaaggg cttgaagagc tccagcgcca tcttcttggg aagaccgcac 3061 tgatagaact tcaggtccgg acctacgacg attacggaac ggccggaata gtcgacgcgc 3121 ttgcccagca ggttctgacg gaaacgtccc tgcttacctt tcagcatgtc ggacagagac 3181 ttaagaggtc tgctgccggg gcccgttacg gggcggcctc tgcggccgtt gtcgatcaga 3241 gcgtctaccg cttcctgcag cattctcttc tcgttgcgga cgatgatgtc gggagcgctc 3301 agctccagca gtctcttaag acggttgttt ctgttgatga cccttctgta caggtcgttt 3361 aagtcggagg tggcgaatct gccgccgtcc agctgcacca tcggacggat gtcgggcggg 3421 atgacgggaa cgacttccag gatcatccac tcggggcggt tgccggaggc tctgagcgcc 3481 tcgatgactt ccagtcttct gacgatgcgg actctcttct ggctctgcgc gtccttcagc 3541 ttttcgcgga ggtccgcagc cagttcgtcc aggtcgatgg cttccagcag ctggcgcacg 3601 gattccgcgc ccatgcccgc cttgaagcgg tcaccgaact cttctctctt ctctctgtat 3661 tcctgctccg tcaggatgtc catgtaggcc atgtccgtgt cgccgggatc ggtgaccacg 3721 taggatgcga aatacaggat cttttccaga cttctcgggg acatgtccag aaccaggccg 3781 atgcggctgg ggatgccctt gaagtaccag atatgggaga ccggcgtggc cagttcgatg 3841 tggcccatcc gttctcttct tacttttgcc tttgtgactt ctacgccgca gcgatcgcag 3901 acgatgccct tgtagcggat gcgcttatac tttccgcagt ggcattccca gtccttcgtc 3961 ggtccgaata tcctctcgca gaacaggccg tcgcgctcgg gcttcagcgt tctgtagttg 4021 atggtttcgg gcttcgtgac ttcaccgtgg gaccagcttc tg // LOCUS sequence052 4052 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence052 VERSION sequence052 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4052 /mol_type="genomic DNA" /organism="" /note="sequence052" CDS complement(258..980) /product="tRNA1(Val) (adenine(37)-N6)-methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_087456344.1" /transl_table=11 /codon_start=1 /translation="MAIREDDTGFGGLVLLQDTETFSYGVDAVLLADYCKALPGESVLD LGSGNGAVALIVLGKYGVASVTGIEVQERMTRLARETAARNGLEDRLHFLQGDVLDIEA LVPAGTFDAVTCNPPYAEAGRGPVSGKEAAYIARHETTASLQDFVRAGAYALKPGGRFV LVHRPSRLPDIFASMRSCGLEPKRMQLVVPKPGAAPNIVLVTATKGGGKELTVEPDLCI RSENGSYSEELQKIYNRI" /locus_tag="LOCUS_2180" /note="WP_087456344.1 tRNA1(Val) (adenine(37)-N6)-methyltransferase (Tumebacillus avium) [pid:41.9%, q_cov:97.5%, s_cov:93.3%, Eval:4.0e-46]" /note="MGA_292" CDS complement(982..1947) /product="stage 0 sporulation family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003404857.1" /transl_table=11 /codon_start=1 /translation="MVKVAGVRFKAAGKVYFFDPADLELFAGDNVIVETARGVEYGTLS ADLMEVEEEEIVAPLKPILRKADENDAKRHEENLKKKDRALQLCQEKIDKHGLEMKLVD VEYTFDNSKVIFYFTADGRVDFRELVKDLAGVFKMRIELRQIGVRDETKMMGGIGSCGR ELCCHAWLPDFEPVSIKMAKVQNLSLNPIKISGICGRLMCCLQYENETYCHLKKGMPDV GERITTRDGKAVVTDVNILENKIKTRLILEEKTEDKPEKLSTEYYIYGKEEIQRAPNKR GQDKNFPKKAKKKGGFGTDADIAAMSEEELKQQAELLELE" /locus_tag="LOCUS_2190" /note="WP_003404857.1 stage 0 sporulation family protein (Clostridium) [pid:59.4%, q_cov:79.8%, s_cov:84.2%, Eval:1.5e-87]" /note="MGA_293" CDS complement(1964..2815) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAQQLRSLLNSGRLVHAFLFVGTKEERLQTGRALARAILCVQPVQ GDACGDCPSCRKFDHGNHEDFLYLDLETAPGSAKTQIGVDAVEHLQEQLKLKPFGKRHV VLIEEAHLLNTAAQNKLLKTLEEPAGDSVLILLAEKKDALLPTVVSRCSTYYLEDGGFE PDAEILTAVRNFFVLFAEKSLFYRKRDCVKSILEDKNDPRGKALSFLQTLESVLRDALL CPYGAQISPLCADWPAFEELCAKVDKQASERAISAVEQAIRSIRAGYNTGYTIKKLCLD LT" /locus_tag="LOCUS_2200" /note="WP_011391576.1 DNA polymerase III subunit gamma/tau (Moorella thermoacetica) [pid:39.5%, q_cov:54.8%, s_cov:25.5%, Eval:2.0e-24, partial hit]" /note="MGA_294" CDS complement(2820..3455) /product="dTMP kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000677237.1" /transl_table=11 /codon_start=1 /translation="MKGIFITFEGPDGSGKTTQIRLLEQHCKEKGYDVVLTREPGGTPI SEAIRSLLLDPSHKEMDGVTEALLYAASRAQHVAEKIKPALAKGCIVLCDRFMDSSIAY QGYARGLGDDVRVINEFAVQGTQPDITFFMDLSAAAGKARVAAARDMDRLEQEDLSFHN AVYEGYLQLKEIYSQRYVCIDASRSIEQIAEEIRERFDNYVLCRNEQE" /locus_tag="LOCUS_2210" /gene="tmk" /EC_number="2.7.4.9" /note="WP_000677237.1 dTMP kinase (Bacillus) [pid:49.5%, q_cov:97.2%, s_cov:100.0%, Eval:7.4e-51]" /note="MGA_295" CDS complement(3471..3683) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSYTIARYALWILLCIPVIVLGFGLCGDLMNSILQESREKKAKKD AKAASDQQRRSFEEEYRKSRDSGVL" /locus_tag="LOCUS_2220" /note="MGA_296" rRNA complement(3773..3878) /product="5S ribosomal RNA" /inference="COORDINATES:profile:Barrnap:0.8" /locus_tag="LOCUS_r0010" /note="Barrnap_1" ORIGIN 1 caacaagcat cagctggtcg gagcgcacgt catctccacg gacctgcgcg cgggcgcagc 61 gctggtgctg gcaggcctgg ttgcaaaggg aaagaccgag gtctcagaga tctatcatat 121 cgaaagaggc tacgagaaat tccatgacaa actgacggcg ctgggcgcta agatcgagcg 181 cgtggaagat taaaaccgaa aaaaaaggga cggctcttcg tcccatcaac gaaaaaagga 241 cgggatcccg tcctttttta tatcctgtta tagatcttct ggagctcttc gctgtaggaa 301 ccgttctccg aacggatgca gagatccggt tcgacggtca gctcttttcc accgcccttg 361 gtggcggtca ccagcacgat gttgggcgca gcccccggtt tcggcacgac cagctgcatc 421 cgtttaggct ccagtccgca gctgcgcatc gatgcgaaga tatccggaag ccgcgacgga 481 cggtgcacca ggacgaatct gccgcccggc ttcagcgcat aggcgccggc ccttacgaaa 541 tcctgcagcg acgctgtcgt ttcgtgccgg gcgatatacg ccgcttcctt cccggagaca 601 ggtcctctgc cggcttccgc gtaaggcggg ttgcaggtga ccgcatcgaa cgtccctgcg 661 ggaacgagag cctcgatgtc gagtacgtct ccctgcagaa aatgcagcct gtcttccaga 721 ccgttacgcg ctgcggtctc ccgcgccagg cgggtcatcc gttcctgcac ctcaatgccg 781 gtaacggaag caacgccgta tttgcccaat acgatgagtg caacggcgcc gttgccgctg 841 cctagatcca gcacggactc tccgggcaat gccttgcagt aatcggccag cagcaccgcg 901 tcgacgccgt aggaaaacgt ctccgtatcc tgcagcagaa cgagtccgcc gaatcctgtg 961 tcgtcctcgc ggatcgccat attactccag ttccagcagt tccgcctgct gtttcaactc 1021 ttcttcggac atggcggcga tatcggcgtc cgtgccgaat ccacccttct ttttcgcctt 1081 tttcgggaag ttcttgtcct ggccgcgctt gttcggcgcc cgctggatct cctccttgcc 1141 gtagatgtaa tactcggtgg agagtttttc cggcttatcc tccgtcttct cttccaggat 1201 gagtctcgtc ttgatcttgt tctccaggat gttgacgtcg gtcaccacgg ctttgccgtc 1261 ccgggtcgtg atgcgctcac ctacgtccgg catgcccttc ttcaggtggc aatacgtctc 1321 gttttcgtac tgcaggcagc acatcaggcg tccgcagatg ccggagatct tgatgggatt 1381 gagggagaga ttctgcacct tcgccatctt gatggagacc ggctcgaaat ccggcagcca 1441 ggcgtggcag cacagttctc tgccgcagga accgatgccg cccatcatct tggtctcgtc 1501 ccgcacgccg atctggcgca gttcgatacg catcttgaat acgcctgcca ggtccttgac 1561 cagttcgcgg aagtctacgc ggccgtccgc tgtaaaatag aaaatgacct tggagttgtc 1621 gaacgtgtat tccacgtcca ccagtttcat ctccagaccg tgcttgtcga tcttctcctg 1681 gcagagctgc agcgctctgt cttttttctt cagattttcc tcgtggcgct tcgcatcgtt 1741 ctcgtccgcc ttgcgcagga tcggctttaa cggtgcgacg atctcctctt cctccacttc 1801 catgagatcg gcggaaagcg ttccgtattc gacgccccgg gctgtctcca cgatgacgtt 1861 gtctccggca aacagttcca gatctgccgg gtcaaaaaaa tataccttac cggcggcttt 1921 gaatcgcacg cccgcaactt ttaccattgt ttcctccaaa atattatgtc aagtcaagac 1981 aaagtttctt gatcgtataa cctgtattat agccggcccg tatcgagcga atcgcctgct 2041 ccacagcgga aatcgcgcgt tctgaggcct gtttgtccac tttggcacat aattcctcaa 2101 aagcaggcca atcggcgcac agtggcgaga tctgggcccc gtaggggcat aacagcgcat 2161 ctctcaacac cgattccagc gtctgcagaa agctgagcgc cttcccccgg ggatcgtttt 2221 tgtcttccag gatagacttt acacaatccc gcttacggta aaacagcgac ttttctgcaa 2281 acaacacaaa gaaattccgt acggccgtca ggatctccgc atccggttcg aatccgccgt 2341 cttccagata gtacgtgctg caccgggaca cgacagtcgg aagcagcgcg tccttctttt 2401 ccgccagcag gatgagcacc gaatcgcccg caggctcttc cagcgtcttc agcagtttgt 2461 tctgcgccgc cgtgttcaaa agatgcgctt cttcgatgag cacgacgtgc cgcttaccga 2521 aaggcttcag cttcagctgt tcctgcagat gctcgacggc atccacgccg atctgcgtct 2581 tcgcgctgcc gggcgcggtc tccagatcca gatacagaaa gtcctcgtgg tttccgtgat 2641 cgaacttccg gcaggacgga cagtctccgc aggcgtctcc ctgcacaggc tgcacacaga 2701 ggatggcacg ggccagcgct cttccggtct ggagccgctc ctctttcgtt ccgacgaaca 2761 gaaacgcgtg gaccagccgg ccgctgttca gaagagaacg cagctgctgc gccacggcgc 2821 tattcttgtt cgtttctgca aaggacatag ttgtcgaacc gttcccggat ctcttctgcg 2881 atctgctcga tgctccggga tgcatcgatg cagacgtaac gctgggaata gatctctttc 2941 agctgcagat agccttcgta gaccgcattg tggaacgaca ggtcttcctg ctccagccgg 3001 tccatatctc tggctgccgc aactcttgct ttgcccgctg cagcggacag gtccatgaag 3061 aacgtgatat ccggctgggt gccctgcacg gcaaattcgt tgatgacccg cacatcgtcg 3121 cccagaccgc gggcgtaccc ctgataggcg atggaagaat ccatgaaccg gtcgcacagc 3181 acgatgcagc cctttgccag ggccggtttg atcttttccg ccacatgctg ggcacgggag 3241 gcggcgtaga gcagcgcctc ggtgacccca tccatctcct tatgagacgg gtcgagcagc 3301 agactccgga tcgcttccga gataggcgtt ccgccgggtt ctctcgtaag gacgacatcg 3361 tagccctttt ccttgcaatg ctgttccaac aggcggatct gcgtcgtctt accgctgccg 3421 tccggccctt cgaacgtaat aaaaataccc ttcaaaagat cgtttcctca ctataaaaca 3481 ccgctgtctc tggacttgcg gtattcttct tcaaaacttc tgcgctgctg gtcgcttgcc 3541 gctttcgcgt cttttttcgc tttcttttct cggctctcct gcaggatgct gttcataaga 3601 tcgccgcaca aaccgaagcc cagcacgatg actgggatgc agagcaggat ccataatgca 3661 tatctggcta tggtatagga cataagccct ccttaactaa ataagtatac cataaatagg 3721 gaaaaaggaa aagataacga aaaaagcacc tttgcaggtg ccttttcgaa ccggctgcgt 3781 cctactttcc caggcagctt cccaccaagt atcatcggct ctgaagggct taactactgt 3841 gttcgggatg ggaacaggtg taaccccaac gatattgcaa ccagattttt tgtgaagata 3901 tcgatgtacc ttcaaaacta aacaatgctt gtaaaaacca ttggtcaagt gctcgaccta 3961 ttagtatcgg tcagctcaac atgtcgccat gcttacacct ccgacctatc aacgtggtag 4021 tctcccacgg gtcttagcct tgcggcagga ga // LOCUS sequence053 4040 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence053 VERSION sequence053 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4040 /mol_type="genomic DNA" /organism="" /note="sequence053" CDS complement(394..1605) /product="molybdopterin molybdotransferase MoeA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000442200.1" /transl_table=11 /codon_start=1 /translation="MISVEEALRIIAQTAPLEGTEELDVYDCVGRIAAEDLVSPIDQPP FPRSPLDGFAFHSEDVKGAGWERPARLKQVGYVPAGCGTEFAVGPGECVRIMTGGRIPA DCDAVVGIEDAAYEAACGFDGDDAVQIYKAVGHFQNYVFAGDDFAKGTVLCKVGQKIDA ATADCLAAAGFAALRARRRPRVAILATGSEIAAPGSPLQAGKIYDSNSVYLKNRLKQLG FEADTSFCPDDPALLATELQKQIGSYDLVLTTGGVSVGDADYLPIILAELGAAVRFAGV RLKPGSPIMLAGKDGSQILCLSGNPYAAAATFELFARPLLAKLSGDPSLEPQETEGVLA EAFPKGSPVPRYLRAKLENGILTVPSGHSSGQLLTMAGCNCLAELPACGGATPAGTKLK VYRI" /locus_tag="LOCUS_2230" /note="WP_000442200.1 molybdopterin molybdotransferase MoeA (Bacillus cereus) [pid:37.1%, q_cov:95.5%, s_cov:89.0%, Eval:1.1e-56]" /note="MGA_298" CDS complement(1611..2636) /product="molybdopterin-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435117.1" /transl_table=11 /codon_start=1 /translation="MKLIRTEDAVGTVLCHDMTQIIPGVTKDARFRKGHIVTEEDIPVL LSMGKENLYVFEKPEGWLHEDEAAERLLALCFGPNMTRSGTKEGKIEVKADCDGLFLVD RDRLRLVNGQDQLMIATRMGNVAVKKDDKLAGMRVIPLVIEAEKLDKAAELVGPQPLLR VVPFTVKTCAVIVTGSEVAKGLIEDKFGPVVEKKLAAFGVETIYRTKCVDDTDTILKAI AEARAAGADLILCTGGMSVDPDDKTPGAIMQSGARIVTYGGAALPGAMLCLGYFEDGVP ILGLPGCVMYHKATIFDIVLPRVLAGVEISKADIAELGYGGLCLGCKECRFPDCSFGKG W" /locus_tag="LOCUS_2240" /note="WP_003435117.1 molybdopterin-binding protein (Clostridioides difficile) [pid:54.9%, q_cov:99.4%, s_cov:99.7%, Eval:4.1e-99]" /note="MGA_299" CDS complement(2895..3680) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEPNYIGLSETIRKTVDRFFSALFPRFFGDEPSSISEEGLEEKSR IEMDLAVQELTKALLYVLPQEQAMHCVKQTMARIDQIRRMLQTDIQAAYEGDPAAISPD EVILCYPAFRAIVVYRIAHCLYILKVPIIPRMMTELAHSWTGIDIHPGATIGPSFFIDH GTGVVIGETCTIGSRVKLYQHVTLGAKSFKVADDGSLVKGIKRHPDIGNDVVIYAGATV LGGDTKVGDGCVIGGSVWLTHSIPPGTVLTTKYETQLHV" /locus_tag="LOCUS_2250" /note="WP_011120272.1 serine acetyltransferase (Rhodopirellula baltica) [pid:63.5%, q_cov:68.2%, s_cov:54.9%, Eval:1.5e-60, partial hit]" /note="MGA_300" ORIGIN 1 cacatgtcgt agatggtaag gagcgcagcg gaaacgccgg tgagcgcctc catctccacg 61 ccggtcttgc cttccgtttt tacggtgcag accgcccgga tcgctgtttt ttcctccagg 121 atctcgagat ccacggaagc ctttgtgatg ggaagcggat ggcacagtgg aatgatgtcc 181 gaagtctttt tgcaggccat gatgcccgcg atgcgggcgg ctgccaggac atcgcccttg 241 ggcagcgcat cgtcctgcag cagccggagg atctcagcgc ctacatagat cgtgccttcc 301 gctttcgctt ccctcgccgt gaccgctttc ccggacacgt ccaccatgat ggcttctccg 361 ctttcgttga tgtgcgtcag tttttccata tcttcagatc ctataaactt tgagttttgt 421 tccggcaggg gtagcaccgc cacaagccgg taattcagcc agacagttgc agccggccat 481 ggtcagaagc tgaccgctgg agtgaccgga aggcacggtc aggatgccgt tttccagttt 541 cgcccgcaga taccggggca ccgggcttcc cttcgggaaa gcttccgcca gaacaccttc 601 tgtctcctgc ggttccagcg aaggatcgcc ggataacttc gccagcagag gccgggcaaa 661 cagttcgaag gtcgccgcag ctgcataggg gttgccggac agacagagga tctgcgagcc 721 gtcctttcct gccagcatga taggtgaacc gggcttcagc cggacaccgg cgaaccgcac 781 cgcagcgccc agttccgcca ggataatcgg caaatagtcc gcatcgccca ccgacacgcc 841 gccggtggtc aggacgagat cgtaagaacc gatctgtttt tgcagttccg tcgcaagaag 901 cgccgggtcg tccgggcaga aagaggtatc cgcttcaaaa cccagctgct ttaagcggtt 961 tttcagatag acggagttcg agtcgtagat cttgccggct tgcagggggc tgcctggggc 1021 agcgatctcg ctgccggtgg ccagaatggc cacccgcggc cgccggcggg cgcgcagcgc 1081 cgcgaagccg gcggccgcca ggcagtctgc cgtcgccgcg tcgatcttct gcccaacctt 1141 gcagagcaca gttcccttcg cgaaatcatc gcctgcaaag acgtaattct ggaagtgtcc 1201 cactgcttta tagatctgta cagcatcgtc cccatcaaag ccacatgccg cttcatacgc 1261 tgcatcttcg attccgacca cggcgtcgca atccgcaggg atcctcccgc ccgtcatgat 1321 gcgcacgcac tcgccgggtc ccacagcgaa ctcggttccg cagccggcag gtacataccc 1381 cacctgcttt agccgggcag gtctttccca gcccgcccct ttcacgtctt cgctgtgaaa 1441 tgcaaagcca tctagcggag aacggggaaa cggcggctga tcgatgggcg aaaccaaatc 1501 ttccgccgcg atccggccga cacaatcgta cacgtccagc tcttccgtgc cttctaaagg 1561 tgctgtctgc gcgatgatgc gcagcgcttc ttctacagag atcatccctt ctaccagcct 1621 ttcccgaagc tgcagtccgg gaaacggcat tccttacatc ccaggcaaag cccgccgtaa 1681 cccagttccg cgatatccgc cttcgagatc tccacgcctg ccagcacgcg gggcagcacg 1741 atatcgaaga tcgtagcctt gtgatacatc acgcagcccg gcagtcccag aatgggcacg 1801 ccgtcttcga aatagccaag gcacagcatg gcgccgggca gcgccgcgcc gccgtaggtg 1861 acgatcctcg caccgctctg catgatagcc cccggcgttt tgtcgtccgg atctacgctc 1921 atgccgccgg tgcaaaggat cagatcggcg cctgccgctc ttgcttctgc gatcgccttc 1981 aggatcgtat ccgtatcgtc tacgcatttc gtgcggtaga tcgtctccac cccgaaagcc 2041 gccagtttct tttccacgac ggggccgaat ttgtcttcga tcaaaccctt cgctacttcg 2101 ctgccggtca cgatcacggc gcaggtcttt accgtaaaag gcacgacccg cagcagcggc 2161 tggggaccca ccagctccgc cgctttatcc agcttttccg cttcgatcac cagggggatc 2221 acccgcatac cggccagttt gtcgtctttt ttgaccgcca cgtttcccat gcgggtcgcg 2281 atcatcagtt ggtcctggcc gttcaccagg cggaggcggt ctctatccac cagaaacagg 2341 ccatcgcagt ccgccttcac ctcgatcttg ccctctttcg tccctgagcg ggtcatgttc 2401 ggtccgaaac acagcgccag cagccgctcc gccgcttcgt cctcgtgcag ccacccctcc 2461 ggcttttcga acacgtaaag attctccttg cccatggaca gcagcaccgg aatgtcctct 2521 tccgttacga tatgcccttt gcggaaccgc gcgtccttgg tgaccccggg aatgatctgg 2581 gtcatgtcgt ggcacaggac agtgccgact gcgtcttctg ttctgatgag tttcatgctg 2641 tttctcctat acaaaatgcc ctgcctccgt aaaggaagca gggcgatcat accaaaaccg 2701 gcggcccgaa agccgcttgc tgctgcatcc ttttcaatga ggaaggccct gcggtttccc 2761 gccaggaccc tggaggggaa agtcccctcg gcctgccgtc cttagcgttc tgccttaggc 2821 gcagcaggct cggaagccgt tgttctgtta ccgttcattt tacacggatg cagaagggtt 2881 ttcaacaccc ctcgtcaaac atgcagctgg gtctcatatt ttgttgtcag aacggtcccg 2941 ggcgggatgg aatgagtcag ccagacgctg ccgccgatga cacagccgtc tcccaccttc 3001 gtatcgccgc ccagtacggt ggcaccggcg tagatcacca cgtcgtttcc gatgtccgga 3061 tggcgcttga tgcccttcac cagactgccg tcgtccgcga ctttaaagct cttcgcccct 3121 aaagtcacat gctgatacag cttgacccgg ctgccgatgg tgcaggtctc accgatgacg 3181 acgccagtgc cgtgatcgat gaaaaacgac gggcctatcg tcgccccggg atggatgtcg 3241 atgccggtcc agctgtgggc cagctccgtc atcatccggg gaatgatggg caccttcagg 3301 atgtacaggc agtgtgcgat gcgatagacg acgatcgccc ggaaggcggg atagcacaga 3361 atgacttcat ccgggctgat cgcagcagga tccccttcgt aagccgcctg gatatccgtc 3421 tgcagcatcc tccggatctg gtcgatgcga gccatggtct gttttacgca gtgcatcgcc 3481 tgttcctggg gcagcacgta cagaagcgct ttcgtcagct cctggacggc caggtccatc 3541 tcgatgcggg acttttcctc cagaccttcc tcactgatgg aagacggttc gtctccgaaa 3601 aagcggggaa acagggcgga gaaaaagcgg tcaacggtct tccggatcgt ctccgaaaga 3661 ccgatataat ttggttccat atgaatatcc tcagattacg ttaaaaatac ccttccgtgg 3721 acagatagcg gtctccggta tcgggcagga tgaccacgat gttcttgccg gcgttctccg 3781 gacgctttgc cagctgtatc gcagcagcga ccgcagcgcc ggcagagatg cccaccagga 3841 cgccctcgtt tctgccgatg gctgcacccg cggcataggc gtcctcgttc gagattgcga 3901 tgacctcatc cagcacgctc aggtccagcg tatccggtgc gaatccggca ccgatgccct 3961 ggatcttatg gggacctgct ttgccttcgg agatgaaggg agatgcggca ggttccacgc 4021 ctacgacctt tactgccggg // LOCUS sequence054 4032 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence054 VERSION sequence054 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..4032 /mol_type="genomic DNA" /organism="" /note="sequence054" CDS complement(353..1141) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MMTVSEMKERKKTLHYTNEKIAELSGVPLGTVQKIFGGATTYPRY DTMQALEKALGGSGSTFTVQKTPAVYGSSTKEDLPRQGEYTVDDYRALPDHPRYELIDG VLIEMESPSTKHQSLLGELAYHFNLFIRSRKGTCRVFFAPFDVQLDCDEKTMVQPDLII ICDRDKLKDWGLWGAPDFALEVLSPSSKKKDMIIKYRKYKAAGVKEYWLVDPENEIVLT YYFGEDGTEKTGIYGFDNKIPVEIYHGELEIDFAEIVPYL" /locus_tag="LOCUS_2260" /note="WP_005814895.1 Uma2 family endonuclease (Desulfitobacterium hafniense) [pid:37.3%, q_cov:64.5%, s_cov:91.6%, Eval:1.8e-29, partial hit]" /note="MGA_303" CDS 1297..2073 /product="TSUP family transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002681078.1" /transl_table=11 /codon_start=1 /translation="MFLGLITYPKLIFVCVAVFLAGFVDSIAGGGGVISLPAYMLTGLD PVAAFACNKTTACFGATLAAGRYIKNKTVNWTAAVPSVIMAILGAWLASLLVLRLDPTV FQKIILFVLPFVAVFLFFKRDFGSVDASADIPRNKVIIVSALIGLTLGFYDGLVGPGTG TFAILAFTSLLKFDLKTAGGTARVFNWASGFGSMVSFLFAGKVIWGIALITAVCSLAGN YIGSGLAIKKNPAFIRVMLTVVCGLLLVKLGYDVLF" /locus_tag="LOCUS_2270" /note="WP_002681078.1 TSUP family transporter (Treponema denticola) [pid:46.2%, q_cov:97.3%, s_cov:95.8%, Eval:2.0e-62]" /note="MGA_304" CDS complement(2055..2567) /product="flavin-based extracellular electron transfer system protein EetB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003723627.1" /transl_table=11 /codon_start=1 /translation="MRSLTSGPARAAACGVLTALALIFSYIEFLVPLPIAIPGIKLGLA NIVVLVCLYLLGEKYAFFINCTRIALAALLFGSLFSALYALAGGIISFAAMALLKKTGI FSVCGVSMAGGVFHNLAQLTVAAFLVETAQVYYYFPVLLLSGMATGIGIGVLATLILRS LGQNKTS" /locus_tag="LOCUS_2280" /gene="eetB" /note="WP_003723627.1 flavin-based extracellular electron transfer system protein EetB (Listeria) [pid:37.3%, q_cov:91.2%, s_cov:87.8%, Eval:9.9e-25]" /note="MGA_305" CDS complement(2551..2895) /product="NusG domain II-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002294810.1" /transl_table=11 /codon_start=1 /translation="MLAIALLLLGLGSFLLLQNLQKAGDTVTVTVDGAVYGTYPLAEDR TEQIVTPLGSNTLRIEGGRVWISEADCPNHDCVEKGAIAKQGQIILCLPHKLSVTITEQ EGGGPDAVSY" /locus_tag="LOCUS_2290" /note="WP_002294810.1 NusG domain II-containing protein (Enterococcus) [pid:36.2%, q_cov:88.6%, s_cov:76.1%, Eval:9.4e-12]" /note="MGA_306" CDS 2926..3990 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIHRPLKMITALLLLTAVIVAQCGCTAQTAPEQPATQTSFGEDWL LNTYCYIQTYEAGQESLIRQAFSVARDFENRLSRTIETSDIGRFNASESGCTVDVDTAL LLQDCRDAWERSDHMLDVTMGAVTQLWDFSAEDPKVPDAAAIAEALTHVGAWDKIWIEP IDGGPAGVWQILKDDAGIALDLGAVAKGYIADKTADFLRQHGVARAVINFGGNVVFVGS KEDGSPWACGIEDPAEGGSEELIQDRALIGLVTCSEGSVVTSGTYERCFTQDGVLYHHV LDPHTGYPVETDLLSATIIGPSSQVCDTLSTSCLLLGSKKGMELIGSFEDYEAVFILED GSIVKTDGADFKEQ" /locus_tag="LOCUS_2300" /note="WP_005817208.1 FAD:protein FMN transferase (Desulfitobacterium) [pid:33.3%, q_cov:81.6%, s_cov:72.9%, Eval:1.2e-43, partial hit]" /note="MGA_307" ORIGIN 1 aacctgggcg acaaagccgc cgataccgct gagatcgcaa agctcaagat gaagatcagc 61 tccgccgaga gcgacatcaa gggcgtttat accgagatgg gcaagaagct cttcgaagag 121 catcccgaat atctggagaa gttcttcacc gaagaaaagg gcaagatcga agaactcacc 181 gccaacatcg cggcgctgaa ggagcgcatc gaagccgtta agaacactgt cggcaaggtc 241 gaagatgccg cagccgagaa agtggaagaa gtcgaagaaa agatcgaaga atccctgtaa 301 agttttcaaa cacacgaacg cccgggcagc agcccgggcg ttttgctgta tcttagagat 361 agggcacgat ctccgcgaaa tcgatctcca gttctccgtg atagatctct acgggtattt 421 tgttatcaaa tccgtagatg cccgtcttct cggttccgtc ttcaccaaag taataagtga 481 ggacgatctc gttctccggg tcgacaagcc agtattcttt tactcctgcg gccttgtatt 541 tccggtattt tattatcata tcctttttct tgctggaagg agacagaact tccagtgcga 601 aatctggtgc accccagagt ccccagtcct ttagcttatc tcgatcgcag atgatgatca 661 gatctggttg gaccatggtt ttctcatcac agtccaactg tacgtcgaag ggggcaaaga 721 agacgcggca agtgcccttc ctgctgcgta taaacaggtt aaaatgatat gccaattcac 781 caagcagact ctgatgcttt gtgctcggcg attccatttc gatcagcacc ccatcgatga 841 gctcgtagcg ggggtggtcg gggagagccc ggtaatcgtc caccgtatat tcgccctgcc 901 ggggaagatc ctccttcgta gaacttccgt aaacggcagg ggtcttctgt acggtaaacg 961 tgctgccgga gccacccagc gctttctcca gcgcctgcat ggtatcgtag cggggatacg 1021 tcgtcgctcc tccgaagatc ttctgtacag tacccaaagg cacgccggac aattccgcga 1081 tcttctcgtt cgtgtagtgc agcgttttct tgcgctcttt catttcgctt acggtcatca 1141 tgggcatcgc ctccatttta tatataataa ccgattttgt tccgtataac aaccgtaaat 1201 ggcttttaaa cggtcttctt ttggaaagtt tcttcgcagc ctgttttatg ataaaataag 1261 cgggtaccgt atcccatcgt tgtttcagca aaactcatgt tcctcggcct catcacctat 1321 ccaaaactca tcttcgtctg cgtcgccgta tttctggcgg gttttgtgga ctccatcgcc 1381 ggcggcggag gcgtcatcag cctgcccgcc tacatgctca ccgggctcga cccggtggcg 1441 gctttcgcct gcaataagac gacggcctgc ttcggcgcca cgctggcggc ggggcggtat 1501 atcaagaata aaacggtcaa ctggacggct gcggtcccct cggtcatcat ggccattctg 1561 ggcgcctggc tggcttccct tctggtgctg cggctcgatc cgacggtctt ccagaagatc 1621 atcctgttcg tgctgccttt cgtggctgtt tttctgtttt ttaagcggga tttcggcagc 1681 gtggatgcga gtgcggatat tccaagaaat aaagtgatca tcgtgtcggc gctcatcggg 1741 ctcaccctgg gcttctacga cggcctggtc ggccccggca ccggcacgtt tgccatcctt 1801 gcctttacgt ccctgttaaa gttcgacctg aagacggcag gcggcacggc cagagtcttc 1861 aactgggcca gcggcttcgg ctccatggtg agcttcctgt tcgcaggcaa ggtcatctgg 1921 ggcatcgcgc tcatcacggc ggtctgttcc ctcgccggca actacatcgg ttccggcctc 1981 gccataaaga aaaacccggc gtttatccgg gtgatgctta cggtggtatg cgggctgctt 2041 ctcgtaaaac tgggctacga cgttttattc tgacccagcg aacgcaggat gagcgtcgcc 2101 agcacgccga tgccgatgcc ggtcgccatg ccggagagga gaaggacggg gaagtaatag 2161 tagacctggg ccgtctccac caggaaagcg gcgacggtga gctgcgccag gttgtggaac 2221 acgcctcctg ccatggagac gccgcagacg gaaaagatgc cggtcttttt cagcagcgcc 2281 atcgcggcaa aggagataat gccgcctgcc agcgcgtaca gcgcggaaaa caggctgccg 2341 aacagcagcg ccgccagcgc gatgcgggtg cagttgatga aaaaggcgta cttttcgccc 2401 agcagataca ggcagaccag cacgacgatg ttcgccagac ccagcttgat ccccgggatc 2461 gcgatgggca gcggaacgag aaattcgata taggaaaaga tgagggcgag ggccgttaac 2521 acgccgcagg cagcggctct ggccggtccg ctagtaagag accgcatccg gaccgcctcc 2581 ttcctgttct gtgatggtca cagacaattt atgcggcagg cacaggatga tctgcccctg 2641 ctttgcgatc gctccctttt ccacgcagtc gtggttcgga cagtccgctt cggagatcca 2701 tactcgcccg ccttcgatgc gcagcgtatt gctgccgagg ggcgtaacga tctgctccgt 2761 gcggtcctcc gccaggggat aggtgccgta gacggcccca tccacggtga ccgtcacagt 2821 atccccggct ttttgaaggt tctgcagcag cagaaaactg cccaacccca gcaggagaag 2881 ggcgatcgcc aacacgatat ccgctttttt gaaaaaggaa gttttatgat ccatagacct 2941 ttgaaaatga tcacagcact gctgcttctt acggcagtaa ttgtagcaca gtgcggctgt 3001 acagcgcaaa cggcgccgga gcagccggcg acgcagacca gcttcggcga ggactggctg 3061 ctgaatacgt actgctacat ccagacctac gaggccgggc aggagagtct catccgtcag 3121 gcgttttccg tggccagaga tttcgagaac cggctttccc gcaccataga gaccagcgat 3181 atcggacggt ttaatgcatc ggagagcggc tgcaccgtgg atgtggatac ggcgcttctg 3241 ctgcaggact gccgggatgc ctgggaacgc tcggatcaca tgctggacgt gaccatgggc 3301 gccgtgacgc agctgtggga tttctctgca gaagacccga aagtgcccga tgcggcggcg 3361 atcgcggagg cgcttaccca tgtcggggcg tgggataaga tctggatcga acccatcgat 3421 ggaggtcctg ccggcgtgtg gcagatcctc aaggatgacg ccggcatcgc cctggatctg 3481 ggcgccgttg caaaggggta catcgcagac aagacggcgg acttcctgcg tcagcacggc 3541 gtggcgcgcg ccgtcatcaa tttcggcggc aacgtggtgt tcgtcgggtc aaaagaggac 3601 ggcagtccct gggcctgcgg catcgaagat ccggcggaag gcggcagcga agagctcatc 3661 caggacagag ccctgatcgg tcttgtcacc tgcagcgaag gatccgtcgt tacctccggc 3721 acctacgagc gctgctttac gcaggacggc gtgctgtacc atcatgtgtt ggacccccac 3781 accggatacc cggtcgaaac ggatcttttg tctgccacca tcatcggacc atcctcccag 3841 gtctgcgaca ccttatccac cagctgtctg cttttgggca gcaaaaaggg catggaactg 3901 atcggatcgt tcgaggatta cgaagccgta tttattctgg aggacggcag catcgtcaag 3961 acggacggtg cagattttaa agaacaataa aaagggacga ggggtggtgc ccaaagaggc 4021 tcatcgagcg at // LOCUS sequence055 3987 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence055 VERSION sequence055 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3987 /mol_type="genomic DNA" /organism="" /note="sequence055" CDS complement(688..1404) /product="TIGR03936 family radical SAM-associated protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011460898.1" /transl_table=11 /codon_start=1 /translation="MPNNKELHRYLFGFYKKGNMRFISHLDLQRLFKRCIKRAGIVPAY SNGFNPHEKINIVHPLSLGFETEQDYFELDTEQPYEESRLVEGMNLALPEGIRFTFCRE IPYSSRNSSSITEMSLYEAFLPSSQNLNTEGFIIQDEVKILKKDKKTKKMVEKDVKDWI GRLELLEETEEGSRLSLLLRSAPNETLNPASLLESLCAFSGSPFDREALRVTRKDLFAR KDGQLVSLSCYYTQED" /locus_tag="LOCUS_2310" /note="WP_011460898.1 TIGR03936 family radical SAM-associated protein (Desulfitobacterium hafniense) [pid:27.2%, q_cov:92.9%, s_cov:94.9%, Eval:6.0e-18]" /note="MGA_309" CDS complement(1394..3253) /product="TIGR03960 family B12-binding radical SAM protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003419074.1" /transl_table=11 /codon_start=1 /translation="MSNVQKQLDKLLLKVEKPARYIGGELHSIVREPLPGTVRFAFCFP DLYEIGMSYMGLNILYHLLNKTDHTYCERCFTPARDMMAAMKAADMPLFTLETKTPLKE MDFVGFTLQYELSYSNILAMLDLAGIPALSKDRTEADPIIICGGPCAFNAEPVADFMDV ILVGDGEELLPEVCRIRGEFRRAGKTKQEFLAEIAKLQGVYIPSFYEEIRDEKGTFRGY RKLREEAPDRVLKAIVHDIDTVDFPKELIVPLIEVVHDRSVAELFRGCTRGCRFCQAGM VYRPVRERSEEKVLDIAKTQLENSGQGELSLLSLSTSDYTHFEPLVTDLMEYCKQHQVS LSLPSLRMDNFSFKVLDEIQGVRKTGLTFAAEAGTQRLRNVINKNITEEHIFTALRQAF DLGWTSVKLYFMMGLPTETYEDLDGIVDLAKRIMDLAKEHNGGKVGRYSVSVSVSNFVP KPDTPFMWVRQNTPEEFEQKHYYLKDRLKKIKGVNFRYHGSYASMLEAVFARGGRELST VLLRAYELGAAFDAWTEGFRQDAWEQALAENSIGADYFALNDIDPDAPMPWEIVDCGIT KEFFQREWKKAQEAVTTPDCRLGCNGCGVNAHTECRWGGIYAE" /locus_tag="LOCUS_2320" /note="WP_003419074.1 TIGR03960 family B12-binding radical SAM protein (Clostridioides difficile) [pid:49.1%, q_cov:97.1%, s_cov:98.0%, Eval:7.2e-173]" /note="MGA_310" misc_feature complement(3246..>3987) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_009888921.1:GTPase ObgE" /note="WP_009888921.1 GTPase ObgE (Clostridioides difficile) [pid:48.6%, q_cov:99.2%, s_cov:57.6%, Eval:2.5e-62, partial hit]" /note="MGA_311" /locus_tag="LOCUS_2330" ORIGIN 1 acgccgaaac tgcagcccag gatggtggtg agggcttttt ccgtggcgcc gctggtgatg 61 agcagggtca tgatgatgac gtagatacag gtgatcgccg tcatgaagta gacgttgtag 121 cccgccagga tcgacggaac gtacaccatg aagaccgcaa ggcaggtgaa cgccagggag 181 accagggtgt tgagaccctt caggtgaccg aagaacaaca gcgccgcgca gaacagcagg 241 ccgaagcgga tcatggcatc cagacggtaa tagccgccgt atacccagtc cgcgtcccct 301 tccttcgtgc cgtaattata gaggatgacc ttatcgccga cttccagcgt ctcgtctgcc 361 tgcacggtgt agttgtctga cgtatgggcc gccagtacct cctggccttt gaattcgccc 421 gtcaggatgc gggctttgaa ataggtcagg tcgttctggt attctacgtc ctccgaaagc 481 tcgtagttgt cggagacggt cttttcgatg ctggtgattc tcgccttttc cgcataggca 541 tcctcggcgt agaggatcgt caggtccttc gtgacgatct tgtttccgcc caaaataaaa 601 ataagggaaa cgactaccgt tgcgatccac accaccaggt tgcggaattt cggtgtcgtt 661 ttatatttct ttttaaactc agccatacta gtcttcctgt gtatagtaac aggacaagga 721 aacgagctgt ccgtcttttc ttgcgaacag atccttgcgg gtcacgcgca gcgcctccct 781 gtcgaagggt gaaccgctga acgcgcagag ggattccaga agcgatgcgg gattgagcgt 841 ctcgttgggt gcgctccgca gcagcaggga gagcctgctc ccctcttccg tctcctccag 901 aagttccaac cggccgatcc agtcctttac gtccttctcg accatcttct tcgttttctt 961 gtctttcttt aagatcttta cctcgtcctg tattataaaa ccttccgtgt taagattctg 1021 tgaagaaggc aaaaacgcct cgtagaggct catttccgtg atggaggatg aattcctcga 1081 cgaataggga atctcgcggc aaaacgtaaa tctgatgcct tccggaaggg ccagattcat 1141 gccctctacc agacggctct cttcgtaagg ctgttctgtg tccagttcga agtaatcctg 1201 ctccgtttcg aagcccaggg acagcggatg gacgatgttg atcttctcgt gggggttgaa 1261 cccgttggag tatgccggaa cgatacccgc cctcttgatg cagcgcttga agagccgctg 1321 caggtccagg tgggagatga accgcatatt ccccttttta taaaacccga aaaggtatct 1381 gtgcagttcc ttgttattcg gcatagattc ctccccagcg gcactcggtg tgagcgttga 1441 ccccgcagcc gttgcatccc agccggcagt ccggtgtggt gacggcttcc tgtgccttct 1501 tccattctct ctggaagaat tccttcgtga tgccgcagtc cacgatctcc cagggcatgg 1561 gagcgtccgg gtcgatgtcg ttcagcgcga aatagtccgc accgatgctg ttctccgcca 1621 gcgcctgttc ccaggcgtcc tgccggaatc cttccgtcca ggcgtcgaag gcggcgccca 1681 gctcgtaagc ccgcagcagc actgtggaca gttcccggcc gcctctggcg aacaccgcct 1741 ccagcatgct ggcgtagctg ccgtggtagc ggaaattgac ccctttgatc ttctttaagc 1801 ggtccttcag ataatagtgc ttctgttcga attcttccgg cgtgttctgc cgcacccaca 1861 tgaatggtgt atccggcttg ggcacgaaat tggagacgga tacggatacg ctgtagcgtc 1921 cgactttgcc tccgttgtgt tcctttgcca ggtccatgat gcgcttcgcc agatccacga 1981 tgccgtccag gtcttcgtag gtctccgtgg gaagtcccat catgaaatag agtttgacgg 2041 aagtccagcc caggtcgaat gcctgccgca gcgcggtaaa gatgtgctct tccgtaatgt 2101 tcttgttgat gacgttgcgc agccgctggg tccctgcttc cgctgcaaag gtcaggcctg 2161 tcttgcgcac gccctggatc tcatccagca ctttaaagct gaagttgtcc atgcgaagcg 2221 acggcagcga aaggcttacc tgatgctgct tgcagtattc catcagatcc gttaccagcg 2281 gttcgaaatg cgtgtagtcc gacgtggaga gagacaggag cgacagttcg ccctggccgc 2341 tgttctccag ctgggtcttg gcgatgtcca gcaccttttc ctcgctgcgt tcccgcacgg 2401 gccggtagac catgcccgcc tggcagaacc ggcagcctct cgtgcagccc cggaacagct 2461 ccgccacaga cctgtcgtgc accacttcga tgaggggcac gatgagctcc ttggggaaat 2521 ctacggtgtc gatgtcgtgg acgatggctt tcagcacccg gtccggtgcc tcttcccgca 2581 gtttgcggta tccccggaag gtcccctttt cgtcccggat ctcctcgtag aacgacggga 2641 tatagacgcc ctgcagtttg gcgatctccg cgagaaactc ctgcttcgtc ttccccgccc 2701 ggcggaattc tccccggatg cggcagactt cgggcagcag ttcttcgccg tctcccacca 2761 ggatgacgtc cataaagtcc gccaccggct ctgcgttaaa ggcgcaggga ccgccgcaga 2821 tgatgatggg gtcagcctcg gtgcggtctt tggaaagcgc cgggatgccc gccaggtcca 2881 gcattgccag gatgttggaa tagctgagct cgtactggag cgtgaacccc acaaaatcca 2941 tttcctttag cggcgtcttc gtctccagcg taaacagggg catatccgcc gccttcatgg 3001 cagccatcat gtcccttgcc ggcgtaaagc agcgctcgca ataggtatga tccgttttgt 3061 tcagcagatg gtacaggatg ttgagcccca tataggacat gccgatctcg tacagatccg 3121 gaaagcagaa cgcaaaacgc acggtaccgg ggagaggctc ccgcacgatg ctgtgcagct 3181 ctcctccgat ataccgtgcc ggtttttcca cttttaaaag aagtttgtct aactgtttct 3241 gaacgttact catcgtaata ttcgaaatcg taatcgatga cggtgatggt gtccccttct 3301 tccagaccca tctgcagcat ctcctcgatg gcgccgctct cttcgatgta gcggtagaga 3361 tagcgcagag atcctgcgtc gttgaaattc gtggagttga agatcttctc cagctgcttg 3421 cccgttacca ggaagccgcc cttcttgcgc tccacgtaga cgtttctgta gtccgggtcg 3481 tcctcgggtt tcgtatcctg gaagaagacg gtctcttcct gttcttccgc ttcggtctcc 3541 agcagcagct tataagcggc ccgcagcagc tcgtccacgc cctcgtggat gggtgcgctg 3601 cagggataga cgctgtagcc cttgctttcc gcataggctt tgaatttctc gtagacctcg 3661 tcatcggcca tgtcgatctt gttggcgcag acgatctggg gcttcttcgc cagcttttcg 3721 ctgtagccag ccagttctgc gttgatcttg tccagatctt ccttcgggtc tctgccctcg 3781 cttccggaaa cgtccaccac gtggatgagg atgcgggtgc gttcgatgtg cttcaggaag 3841 tccaggccga ggccggcgcc ttcggaggca ccttcgatga gccccggaat atccgccatg 3901 acgaagctgg agtcgtacat ggatacgacg cccaggttcg gcgtgatggt cgtgaagtgg 3961 taattcgcga tcttggggtt ggcgctg // LOCUS sequence056 3924 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence056 VERSION sequence056 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3924 /mol_type="genomic DNA" /organism="" /note="sequence056" CDS 161..703 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTDQQTNKTAEEVKEEEVLEQEEPVGTAENGEPEEAPEAAPQEPG EDWQDKYTRLYAEFQNFRRRTDKEKSDIYAFANEKFAMGLLEVVDNFERAMEHGSESDP KFSEGMQLILKQLQGVLEKNNVEEIEALGKPFDPNYHNAVMTEAAEAESGTVTKVLQKG YMLNKKVIRPSMVAVAQ" /locus_tag="LOCUS_2340" /note="WP_005816478.1 nucleotide exchange factor GrpE (Desulfitobacterium) [pid:48.6%, q_cov:75.0%, s_cov:64.8%, Eval:4.0e-30, partial hit]" /note="MGA_313" CDS 719..2605 /product="molecular chaperone DnaK" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964594.1" /transl_table=11 /codon_start=1 /translation="MSKVIGIDLGTTNSCVAVLEGGEPTVIANAEGNRTTPSVVGFTKG GERLVGETAKRQAITNPDRTISSIKRHMGSSYTVSIDGKEYTPQDISAMILAKLKADAE SYLGEKVTEAVITVPAYFSDSQKQATKDAGKIAGLDVKRIINEPTAAALAYGLDKENEH HKILVYDLGGGTFDVSILELGDGVFEVLSTNGDTKLGGDDFDNVLMNYMADQFAKENGV DLRNDKMALQRLKEAAEKAKKELSSSQTTNVNLPFITVNQDGPLHLNMDITRAKFDQLT EHLVQRTIEPMKKAMADAGVTMADLAKVILVGGSTRIPAVQEAVKRITGKEPFKGINPD ECVAIGASIQAGVLTGEVKDVLLLDVTPLSLSIETLGGVATKLIERNTTIPTKKSQIFS TAADNQSAVDIHVMQGERQMAADNITLGRFQLTGIPAAPRGVPQIEVTFDIDANGIVNV SAKDLGTGQQQSITITSSNKLSEEEIKQKVKEAEEYAEADKKKKEDTEARNQAETLVYE TEKNLKTLEGKLSEAEVKEITDAKDELQKALNAGTTEEVKAKTEALTNKFHIMSTKLYE QAAAQQQAQQGGAGPQGGFNPGAGFGGAAGGAAPADDGVQDADFEVVDDDNK" /locus_tag="LOCUS_2350" /gene="dnaK" /note="WP_010964594.1 molecular chaperone DnaK (Clostridium) [pid:66.1%, q_cov:99.5%, s_cov:99.8%, Eval:1.7e-230]" /note="MGA_314" CDS 2665..3816 /product="molecular chaperone DnaJ" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004454751.1" /transl_table=11 /codon_start=1 /translation="MADKRDYYEVLGLEKGATEDQIKSAFRKMAMKYHPDRNPGDKSAE EKFKEINEAYSVLSDPDKKEKYDRFGFAGVDPNSAYSGGGGFGGFDASGFGGFEDIFNM FGGGFGGFGSSRQTRNGPRRGADIQKRMNITFNEAVFGCKKEIRLTKDCTCDACGGTGA KKGTGKKTCPHCGGTGQVRTVQNTPLGQFQSVRTCDHCGGTGQIIEDPCPACGGTGKVR KTITLNVTIPAGSYTDYVLTLQGQGQPGTNGGPAGDLYIVLNVGDHKLFTRKGDDLWLK VPVTFSQAALGDTVTIPGLSEKLALKIPAGTQPGDVLRMKGKGVPNVRSKRPGDLYAEI VLEVPTKLSAEQKELIKKFGETKTTTGYAKRKSFMDNLKDLFS" /locus_tag="LOCUS_2360" /gene="dnaJ" /EC_number="1.8.4.-" /note="WP_004454751.1 molecular chaperone DnaJ (Clostridioides difficile) [pid:49.7%, q_cov:99.7%, s_cov:99.2%, Eval:5.2e-109]" /note="MGA_315" ORIGIN 1 gattaccggg tcaacggcga attggtcggc cgtctcgggg tcatcggccc cacccgtatg 61 aaatacggca aagtcacttc ggtgatcaaa tatatcagcg acaacatctc ccagacgttc 121 gagctgaaag aaaataacga tgtaaaggac gatagcaaca atgacggatc agcagacgaa 181 caagacagct gaagaagtaa aagaagaaga ggttctggaa caggaagagc cggtcgggac 241 cgcggaaaac ggtgagccgg aagaggctcc ggaagcggct ccgcaggaac cgggagagga 301 ctggcaggac aaatacacca gactctatgc ggaattccag aatttccgcc ggcgcacgga 361 caaggagaag agcgacatct atgccttcgc gaacgaaaag ttcgccatgg gcctcctgga 421 ggtcgtggac aacttcgagc gcgccatgga gcacggatcg gaatccgatc ccaagttctc 481 ggaaggcatg cagctcatcc taaagcagct gcagggcgtt ctggaaaaga acaacgtaga 541 ggagatcgag gcgctgggaa aacccttcga tcccaattat cacaacgcag taatgaccga 601 agcagcggaa gccgagagcg gcaccgttac gaaggtctta caaaaaggat atatgttaaa 661 taagaaagtg atacggccca gcatggtcgc cgtagcacaa taggaggtat agaaaacaat 721 gagcaaagtt atcggtatcg atttaggaac cactaacagc tgcgtggcag tactggaagg 781 cggcgagcct accgttatcg ccaacgcgga aggcaacaga accacaccgt ccgtggtcgg 841 cttcaccaag ggcggcgaga gactcgtggg cgagaccgcc aagagacagg cgatcaccaa 901 ccccgaccgt accatctcct ccatcaagag acacatggga agcagctaca ccgtctccat 961 cgacggaaaa gaatatacgc cgcaggatat ctccgcgatg atcctggcaa agctgaaggc 1021 ggacgccgaa agctatctgg gcgaaaaggt gacggaagcg gtcatcaccg ttcccgctta 1081 cttctccgac agccagaagc aggcaacgaa ggacgccggc aagatcgcag gtctggacgt 1141 aaagcgtatc atcaacgaac cgaccgcagc ggctctggcc tacggcctcg acaaggaaaa 1201 cgaacatcat aagatcctgg tctacgacct gggcggcggc accttcgatg tctccatcct 1261 ggaactgggc gacggcgtgt tcgaagtact gtccaccaac ggcgacacca agctgggcgg 1321 cgatgacttc gataacgttc tgatgaacta catggcagat cagttcgcca aggaaaacgg 1381 cgtcgatctg agaaacgaca agatggctct gcagagactg aaggaagctg cagaaaaggc 1441 caagaaggaa ctgagctcca gccagaccac caacgtcaac ctgccgttca tcacagtcaa 1501 ccaggacggt ccgctccacc tgaatatgga catcaccaga gcgaagttcg atcagctgac 1561 cgaacacctg gtacagcgca ccatcgagcc gatgaagaag gccatggcag acgcaggcgt 1621 tacgatggca gacctggcca aggtcatcct ggtgggcggt tccaccagaa tccccgcagt 1681 ccaggaagcc gttaagagga tcaccggcaa ggaacccttc aagggcatca acccggacga 1741 atgcgtcgcc atcggcgcca gcatccaggc gggcgtactc accggcgagg tcaaggacgt 1801 gctgctgctg gatgtcaccc cgctgagcct ttccatcgag actctgggcg gcgtagccac 1861 caaactgatc gagagaaaca ccaccatccc caccaagaag agccagatct tctccacggc 1921 tgcggataac cagagcgcag tggacatcca cgtaatgcag ggcgaacgcc agatggcagc 1981 cgacaacatc acgctgggca gattccagct gacgggcatt cccgcagcac cccgcggtgt 2041 acctcagatc gaagttacgt tcgatatcga cgccaacggc atcgtgaacg tatccgctaa 2101 ggatctggga accggccagc agcagagcat tacgatcact tcctccaaca agctctccga 2161 agaggagatc aagcagaagg taaaggaagc cgaggaatac gccgaggccg ataagaagaa 2221 gaaggaagac accgaggcca gaaaccaggc agagaccctg gtctacgaga ccgagaagaa 2281 cctgaagacc ctggaaggca agctgtccga agcggaagtc aaggagatca ccgatgcgaa 2341 ggacgaactg cagaaggcgc tcaacgccgg caccacggaa gaggtcaagg ccaagaccga 2401 agccctcacc aacaagttcc acatcatgag caccaagctg tatgagcagg ctgccgcaca 2461 gcagcaggcg cagcagggcg gcgcaggtcc ccagggcgga ttcaacccgg gcgcaggatt 2521 tggcggcgca gccggcggag cagctcctgc tgacgacggc gtccaggatg cggacttcga 2581 agtcgtggac gacgacaaca aataattctg aaaaagggta acgcggaggc gggcgtatag 2641 tccgcctttg cggtgattta taacatggca gacaaaagag attattacga ggtcttagga 2701 ctggaaaagg gcgctacgga agatcagatc aaatcggcct tccgcaagat ggccatgaag 2761 tatcatccgg acagaaaccc tggcgacaag agtgcggagg agaagttcaa ggagatcaac 2821 gaggcctatt ccgttctgtc tgaccccgac aaaaaagaaa aatacgaccg cttcggcttc 2881 gccggcgtag atcccaattc cgcctacagc ggcggaggcg gcttcggcgg cttcgatgcg 2941 tccggcttcg gcgggtttga ggacatcttc aacatgttcg gcggtggttt cggcggcttc 3001 ggcagcagcc ggcagacgcg gaacggtccg cggcgcggtg cggatatcca aaagcgcatg 3061 aacatcacgt tcaacgaagc ggtgttcggc tgcaagaagg aaatccggct gacgaaggac 3121 tgcacctgcg atgcctgcgg cggcaccggc gcgaagaagg gcaccggcaa gaagacctgt 3181 ccgcactgcg gcggcaccgg ccaggtccgc accgtacaga acacgcctct gggccagttc 3241 cagagcgtcc gtacctgcga tcactgcggc ggcaccggtc agatcatcga agatccgtgc 3301 ccggcctgcg gcggtaccgg caaggttcgc aagaccatta cgctcaacgt tacgatcccg 3361 gcaggatcct acacggatta cgtgttgacg ctgcagggtc agggccagcc cggcaccaac 3421 ggcggtccgg caggtgacct gtacatcgtg ctcaatgtgg gcgaccacaa gctgtttacc 3481 cgcaagggcg acgatctgtg gctcaaagtg cccgtcacct tcagccaggc agctctgggc 3541 gataccgtta cgatccccgg actttccgag aagcttgcgc ttaagattcc ggcaggcacg 3601 cagcccggcg acgtgctccg catgaagggc aaaggcgtgc ccaacgtgcg cagcaagcgg 3661 cccggcgacc tgtatgccga gatcgtgctg gaggtcccga ccaaactgtc cgcagagcag 3721 aaagaactca tcaagaagtt cggcgagacg aagaccacca cgggctacgc gaagagaaag 3781 tcctttatgg ataacctgaa ggatctgttt agttaaaaat acggcaaaag attgggtgcc 3841 ggtctgtccg gcaccctttt tgtgttatac tttaaggact gacgaaaacg aggtgtatcc 3901 tatggaaaac agagtaacac taca // LOCUS sequence057 3913 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence057 VERSION sequence057 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3913 /mol_type="genomic DNA" /organism="" /note="sequence057" CDS complement(338..577) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MCKIPVIDLSATGQNIARLRIAAGLSVKDLQDIFGFANPQAIYKW QNGLCLPTLDNLVILAAALGVSLDEIVVYWAACA" /locus_tag="LOCUS_2370" /note="WP_011476650.1 helix-turn-helix transcriptional regulator (Ligilactobacillus salivarius) [pid:47.8%, q_cov:84.8%, s_cov:74.4%, Eval:1.2e-11, partial hit]" /note="MGA_316" CDS complement(629..1828) /product="RNA-splicing ligase RtcB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459687.1" /transl_table=11 /codon_start=1 /translation="MFEIKGKVNTAICYATVVEDEAIEQIRRMCDFDFTEDSRVRIMPD VHAGKGCTIGTTMTVHGKAVPNVVGVDIGCGMYTVKLAEKDIDLAKVDEACHTIPSGQN VWPGRIEAFDFTQLRCYRELKEMSWLKRSLGTLGGGNHFIEVEEGADGTKYLVIHSGSR NLGKQVAEFYQALATDLNRGKEEYLKARKAIIETYKAQGRKQEIQQALKDLQWTKRDAT IPDDLCYVYGEYFDDYLHDVDICQKFAVRNRELMAEVILERAGLTKVDAFHTIHNYIDV DEMILRKGAIAAHEGELVLIPINMRDGSILARGKGNPEWNYSAPHGAGRIMSRSKAKES LDMEAYKASMAGIYTTSVNEATLDEAPMAYKSIDDILGVVTESVDVIEILKPIFNFKAS " /locus_tag="LOCUS_2380" /note="WP_011459687.1 RNA-splicing ligase RtcB (Desulfitobacterium hafniense) [pid:48.5%, q_cov:100.0%, s_cov:99.8%, Eval:5.3e-104]" /note="MGA_317" CDS complement(2186..2980) /product="N-acyl homoserine lactonase AiiB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010974862.1" /transl_table=11 /codon_start=1 /translation="MKIYILDNGYLLMDKNILLKDAVLANADEPDKKCELVHCPIMMVL IRHEKGNILFDLGCHPEAGKKGYWPDRVWKAERYFHEPEQELEAQLALCGVTPAEIDTV VLSHLHEDHTGNARLFPHAALYAPKKEYLDAMWSVHTNPDTGYVKAEVTAPYREIHLID RDFELLPGIGIVNLPGHTNGLLGMVLHTEKDGVLIFPQDAVFCEESYGPPARLPGGFED SVACLASIEKVRRLQAQYGATVFFGHDPDNFPKYRHAPAYYE" /locus_tag="LOCUS_2390" /gene="aiiB" /EC_number="3.1.1.81" /note="WP_010974862.1 N-acyl homoserine lactonase AiiB (Agrobacterium) [pid:30.4%, q_cov:99.6%, s_cov:98.9%, Eval:6.0e-33]" /note="MGA_318" ORIGIN 1 agagatgtat ctaaaaccgc tattaaaggg gcaaaaacga tacatttttc gctttgtatt 61 gtggatttcg gacttcagag aacgagaaaa gagcgttttg ggcagaagag attacataat 121 ctctcaatta tcgtaaacca atggggcaag caatcgggct atcttctcaa aaatgtatct 181 attttcgcat tttttgatcc atttagatac atttgcagaa tccacgattt ttgcaccggt 241 ctgtccttca tttcttttgc agatttcctt cctccctcat gttagattgc agacaatggg 301 tggttctccg aaaggcggac agtgctggtc ctcgtcccta cgcgcaggcc gcccaatata 361 caacgatctc atccaagctt acacccagcg cagcagccag aattaccagg ttgtccaggg 421 tcggcaggca aagaccgttc tgccacttgt agatcgcctg cgggttcgca aagccgaaga 481 tatcctgcag atcctttacc gacaggcctg ccgcgatcct cagcctcgcg atgttctgcc 541 cggtcgcaga cagatcgatg accggtatct tacacatttc atttacgctc cgtttccggc 601 agaggctaag ccggaaacgc gcgccggctt agcttgcctt aaagttaaag ataggcttta 661 aaatttcgat cacatccacg gattctgtga ccacgcccag aatatcgtcg atggacttgt 721 acgccatcgg ggcctcgtcc agggtcgcct cgttcacgga agtcgtgtag atgcctgcca 781 tggatgcctt gtaagcctcc atgtccagcg actccttcgc cttgcttctg gacatgatcc 841 gcccggcacc gtgcggcgct gagtagttcc actccggatt gcccttgccg cgcgccagga 901 tggagccgtc ccgcatgttg atcgggatca gcaccagctc tccctcgtgt gccgcgatgg 961 cgccttttct aaggatcatc tcgtccacgt cgatgtagtt gtggatcgtg tggaaggcgt 1021 ccacctttgt gaggcccgct ctctccagga tgacctctgc catcagctcc ctgtttcgaa 1081 cagcgaactt ctggcagatg tccacgtcgt gcaggtagtc gtcgaagtac tcgccgtaga 1141 cgtagcagag gtcgtcgggg atcgtggcgt cgcgcttggt ccactgcagg tctttcagcg 1201 cctgctggat ctcctgcttt ctgccctgcg ccttgtaggt ctcgatgatt gccttccggg 1261 ccttgaggta ctcctccttg ccccggttca ggtccgtcgc aagcgcctgg tagaactccg 1321 cgacctgctt gccgagattt ctggaccctg agtggatcac cagatacttg gtgccgtccg 1381 cgccttcctc cacctcgatg aagtggttgc cgccgcccag cgtgcctaag gaccgcttga 1441 gccagctcat ctccttcagc tcccggtagc agcgcagctg cgtaaagtcg aaggcttcga 1501 tccggccggg ccagacgttc tggccagacg ggatagtgtg acaggcttca tcgaccttcg 1561 ccagatcgat gtccttttcc gccagtttga ccgtgtacat gccgcagccg atatccacgc 1621 cgaccacgtt ggggacggcc tttccgtgga ccgtcatcgt ggtgccgatc gtgcagccct 1681 tgccagcgtg cacgtccggc atgatccgca ctctgctgtc ctccgtaaaa tcgaaatcgc 1741 acatccgtcg gatctgctcg atcgcctcat cctctacgac ggtcgcatag cagatggctg 1801 tattcacttt tcctttgatc tcaaacattt tctcttccct accaaaaagg ccgcctgtcc 1861 tttctttgac aagcggcctg accaacacat tgtttacgct aactgtgacc cgatatcacc 1921 gatcgccttc cgctgtcttt ttgtggcacg ataatccaac tttgcgtttt cttttccgca 1981 aagggggcga atgccatatt caaatgtttg cagcattgaa gttctcatcg tttatccttt 2041 tatggacctt ttggcctttt ccgttagcac tatatcacat ggccggtccc ctttcaataa 2101 acctgtaggt taaattattg ttacagcttt agtgaaaaat cgcagaaacc catatcctgc 2161 tctgacagga catttccatc cgcgcctact cataatacgc cggcgcatgc cggtacttcg 2221 ggaagttgtc cgggtcatgc ccgaaaaaga ccgttgcgcc atactgcgcc tgcagcctgc 2281 gcaccttctc gatcgacgcc aggcaggcca cactgtcctc aaagccgccc ggcagcctcg 2341 ccggcggccc gtacgattcc tcgcaaaaca cagcatcctg agggaagatc agaacgccgt 2401 ccttttccgt gtgcagcacc atgcccagca gcccgttcgt atggcccggt agatttacga 2461 tcccgatccc cggcaggagt tcgaaatccc ggtcgatcag gtgaatttcc cggtagggag 2521 cggtcacctc ggcctttacg taaccggtat ccggatttgt atgaacgctc cacatcgcat 2581 ccagatactc tttcttgggc gcatagagtg ccgcatgcgg aaacagccgc gcgttgcccg 2641 tgtggtcttc gtgcagatgc gacagaacga cggtgtcgat ctccgccggg gtcaccccgc 2701 acagcgccag ctgcgcttcc agttcctgct ccggctcatg gaaataccgt tccgccttcc 2761 acacccggtc gggccaatag cccttctttc ctgcctctgg atggcagccc agatcgaaca 2821 ggatattccc cttctcgtgg cggatgagca ccatcatgat cgggcagtgg acaagctcgc 2881 actttttgtc cggctcatcc gcgttggcca gcacggcgtc cttcagcagg atgttcttgt 2941 ccatcagcag ataaccgttg tctaaaatgt agatcttcat actatgcacc tccgccaccc 3001 ctagtatagc agacaacggg ctggaccaca gacttctttc aggtgaactg tcaacgcaca 3061 aatcgtgcgt tataacggtt gacatccgcg cccgcccgcg ttattcttaa tgtataaaca 3121 cagcaaaccc ttagaattgt aagcgttata cactttggag gacgcatcat ggcaattaca 3181 gaacgtgtag aaaagatccg tcagaattac gtcaatacga agccccacat ctcctacgag 3241 cgcgcctggg cctggaccaa gtccttccag cgcaccgagg gacaggctca catcatccgt 3301 accgcgcagg cctttaagga cacctgcgaa gagctgtccg tcaacatctg ggaaggcgaa 3361 ctggtcgtcg gcaccagcgg cgagttccgc aagtgcgcca tcctgacgcc ggagttcggc 3421 tggctgtgga tcaacgagga gatggatacg ttccccgaaa gaggacagga tccctacgac 3481 gtgaccccgg agcaggcgaa attcatccgc gaaaacatct tcccctactg gaagggaaag 3541 tccgtggaag aagccttcct ggcccgcatc tccgaagata cgaagaagat cggcgtggac 3601 accggcttcc tggacaccga ctccaagtgg aggaacggta tcggcgagat ctccgcagac 3661 tacatcgacg tgctactgcc caagggctac ggcggcatta aggccgaagc cctggactac 3721 atggccaaat tgaacgaagc catccccgaa gacaagaaga agatcgattt ctataaatct 3781 atggtgttca tcgccgacgg catgatcgca ctgggccgcc gctacagcgc aaaggccgcc 3841 gaaatggcga aggccgaggc tgacccgaag agaaaggccg aactggaaga gatcgcggac 3901 atctgcgccc gca // LOCUS sequence058 3906 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence058 VERSION sequence058 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3906 /mol_type="genomic DNA" /organism="" /note="sequence058" misc_feature <1..882 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_048061266.1:phosphoglycerate dehydrogenase" /note="WP_048061266.1 phosphoglycerate dehydrogenase (Methanothermobacter thermautotrophicus) [pid:37.7%, q_cov:88.7%, s_cov:44.6%, Eval:1.5e-38, partial hit]" /note="MGA_320" /locus_tag="LOCUS_2400" CDS 892..2352 /product="FGGY-family carbohydrate kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005168723.1" /transl_table=11 /codon_start=1 /translation="MQYFLVMDAGTTSIKAGLISIDGTFADIQNEPAQVLMPFSGASEM DMNDVWEVAKKVILKLKANNEALWPEVIAVGLSAQGDGLWAIDDKGRPVRNAMLWNDTR TVLDYESLNPTLLAKNTTAMFPGANIAELTWLKKNEPENYAKIAWIFHCKDWINFKLTG QIGTDASDASTSLMNIYTKQYDEEILDWLGLPEMKGKFAPISTSDEIIGTIYPDAAEEL GLRVGTPVIAGCLDVLAIATGCGLMKGGQRGSIVGTTLANYVVMDEETARGCVATNGSI LCHTKKDTYIRLMAATAGASAMDWMRRTILDGEDFAKTDEELAKIPIGADGVMSTPYIN GERAPFKLSSASAGFYGIRAHHTKYHLAKASFESIAMAMADCYANLPKGDAELYLAGGA AKSQYICQMLCDCMGAVTYRFEEKELGLMGIYRLILDALKISQSVTANTDKFEPNMENH EKYMALYKEYCVLKDSMMPFWRSRAAEE" /locus_tag="LOCUS_2410" /note="WP_005168723.1 FGGY-family carbohydrate kinase (Yersinia enterocolitica) [pid:34.0%, q_cov:99.2%, s_cov:96.4%, Eval:1.8e-75]" /note="MGA_321" ORIGIN 1 attacgagct acgatcccgt tacgaaagac gtgatcgacg ctgcgccgaa ctgcgggctc 61 atcgtctgca cgcgggccac gcccgtcaac gtggataccg cctacgccag ggaaaagggc 121 atcaaggtga gctacgccgt ggagcgcaat tccgacacga cggcggaata caccctggga 181 ctcatgctgg cggtcacccg cggcataggg ttcgcctacc gcgatctgtg cgaaggcaag 241 ttcgccgcgg acgacatcgg cagccatggc agcgaatccg cgaagcgcga cgttacctgg 301 tccacggggg agaccagccc ctacacgtat tacaaaggct atcagctgaa gggtcacagc 361 gtcggtatcc tgggctgcgg cagcatcggc atgcgcgtcg cgaagctctg cgacgccttc 421 agcatgaaag tctacggctg cagccgctct cttacgaaag agaacgcgcc tgcctacatg 481 gaagtctgcg aaagcctgtt ggacatggcg ccgaaggtgg atatcctgac ggtccatctg 541 aaggacacgc cgcagacgga gaatatcgta aacgcggacg ttttccgcgc catgaaaaaa 601 acggcttatc tcatcaacga ttccagaggt tccgtcgtgg acgaggatgc tctgatcgag 661 gcgctgcgca atggcgagat cgccggcgcc gccatagatg tgttccgcga ggaacccatc 721 tccagatccc acccgtattt tgaaatgcgc gaccgggtgc tggtgacccc gcacatcggc 781 ggagccacct gggacgccat ttccaatcac accagggaat tcgtcaccga tgtgatgcat 841 tatatcaacg gcgaagagtt ggaatatgag tatcgaaagt aggaggtgca catgcagtat 901 tttctggtaa tggatgcagg aaccacaagc atcaaggccg gtctgatctc gatcgatggt 961 acatttgcgg atattcagaa cgagcctgcc caggtcctga tgcccttctc cggcgcgtcg 1021 gaaatggata tgaacgacgt gtgggaagtg gcgaagaagg tcatcctcaa actgaaggcg 1081 aacaacgaag cgctttggcc ggaggtcatc gcagtcggtc tctctgccca gggcgacggt 1141 ctgtgggcga tcgacgacaa gggcagacct gtccgcaacg ccatgctctg gaacgatacc 1201 agaacggtcc tagattatga atccttaaat ccgacgcttc ttgcgaagaa tacgacagcc 1261 atgttccccg gcgccaacat cgcggagctt acttggctca agaaaaacga accggagaac 1321 tacgcgaaga tcgcctggat cttccactgc aaggactgga tcaactttaa gctcaccggc 1381 cagatcggca cggacgcttc cgacgcttcg acctcgctga tgaacatcta cacgaaacag 1441 tacgacgaag agatcctgga ttggctgggt ctgccggaga tgaagggcaa gttcgctccc 1501 atctccacct ccgacgagat catcggaacg atctatccgg atgcggcaga agagctgggt 1561 cttcgtgtcg gcacccctgt catcgcgggc tgcctggacg tgctggccat cgctacaggc 1621 tgcggcctga tgaagggcgg ccagagaggt tccatcgtcg gcacgacgct ggcgaactac 1681 gtcgtcatgg atgaagagac cgcgagaggc tgcgttgcca cgaacggctc catcctgtgc 1741 cacacgaaga aggataccta catccgtctg atggctgcca ccgcaggtgc ctccgccatg 1801 gactggatga gacggacgat cctggacggc gaggatttcg cgaagaccga cgaagaactg 1861 gcgaagatcc ccatcggcgc cgacggcgtc atgagcacgc cctatatcaa cggcgagcgc 1921 gcgcccttca agctgagttc cgcttccgcg ggcttctacg gcatccgggc gcatcacacg 1981 aagtatcatc tcgcgaaggc cagcttcgag agcatcgcca tggccatggc ggactgctat 2041 gccaacctgc ccaagggcga cgcggaactg tatctggcgg gcggcgcggc taagagccag 2101 tacatttgcc agatgctctg cgactgcatg ggtgcggtca cataccgctt cgaggagaag 2161 gaactgggcc tgatgggcat ctaccggctc atcctggacg ccctcaagat ctcccagtcc 2221 gttacggcaa acaccgacaa gttcgagccg aacatggaaa accatgagaa gtatatggca 2281 ctgtacaaag aatactgcgt cctgaaggac agcatgatgc cgttctggag atccagagca 2341 gcggaagaat aaggaggaaa gacgatgtca ttgctcatca gaaacgccaa tatcgcgacc 2401 atggacagcg agcagcccag agcgcaggct gccgtggtca cgggtaagta tttcgcctac 2461 gtaggcaccg aagagggcgc gaaggagtat atcgcagccc ataacgacgg cgtctgcgag 2521 gaagtggact gcggcggcca gctgctgctg cccgggttca acgactccca catgcacttc 2581 ctgcactacg taaagacccg catccacgtg gatctcgtgg gatgcacgtc cttaaaagaa 2641 gtgctggacc gcatgaagga ggcctataag accttcgaca agagcgacgg tctgtggttc 2701 gtaggcgaag gctggaacca ggattacttt acggacgaga agcggttcct cacgaaggac 2761 gacctggata ccatcacgac ggactggccc atcatgatcc agcgcacctg cggacacgtg 2821 ggcgtgctca actccaaggg tatcgagatg ttcgacatga gccagggaga aggcctgaag 2881 tacaaggaat acgcggaagt cggccccgac ggcaagctca acggcgtcat caaggagaac 2941 ctgttcgact acatgaagac cacgctgccc gcgccgtccc tggaaaagct gatggacctg 3001 atggagaagc accagtacga tctgttcgag aagggtctta cgtccgtcca gtccgacgag 3061 ggcaactaca cgccggcagg ccggtaccac gatctgcaga agctgatgag agagcgggcg 3121 gagaagggca ccttcaagct ccgtctggct tcccagatgc tgtacttcaa cgcggagaag 3181 ctgaagtggg cgttctccga aggctacgac acgtccttcg gcaacgacac cgtcaagatc 3241 tcctgcacga agctgctgtc cgacggctcc ctgggcgcca gaacggctct catgagaaag 3301 ccctacgcgg acgatgcttc caccaccggc ctggccctgt ggacccaaga aggcctcaac 3361 gagatggtgg agatctccca gcggcagaac gtgcctgtgg cggtccacgc catcggcgac 3421 ggcgctgtcg aaatggtgat caacgccgtg gaagccgccc agaagaagta tccccacgtg 3481 catcccagac acaccgtggt gcacagccag gtgaccgaca gagcgctgct gcagcgcatg 3541 aaggatctgg gtatctccgt catggttcag cccatcttca tcgactacga catgcacgtc 3601 atctacgaca gagtgggcaa agaactggcg gagagctcct acgtgtggaa gtggtacaag 3661 gatatgggca tccacatgag cttcggcacc gactgcccgg tggaatcctt cgaaccggtg 3721 cagggtatct actgcgcagt cacaagactg gcgaagaacg gcgacggacc gtacctgccg 3781 gagcaggcgc tgtccgtgga ggacgccatc tacgcctata cggcggagtc cgcctggaat 3841 acgggcgatg aaaacatcaa gggtaaggta aaggcaggca tgcttgcaga ctttattacc 3901 atggac // LOCUS sequence059 3902 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence059 VERSION sequence059 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3902 /mol_type="genomic DNA" /organism="" /note="sequence059" CDS 107..1525 /product="serpin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_007054058.1" /transl_table=11 /codon_start=1 /translation="MIMKKVLSAGLAVLLAFGACSCATVDAEDTDPTGSGTGPKEKPAV TETSSYALAEPVLPEMAPYPDEMSFAGEDGLFDSDGFDAAWTAWNEGVQARRDAAQSYP GKLDAYLKKTTETFLTPKEAGKNAVCSPVNIWLALAMVAETADGQTRTELLDLLGVSSI EDCRKLANKLWTANYIDDGAATSKLAASLWMNQDVPFKEQTVQTLADDYFASTFRGGMT DPAYSAAFKSWLNDNTGGLLQDAVENLPDFDPQTIMALATTVYFSGKWSDQFQDANTYT ETFHGAVSDKDADFMHRSSTGQYFYSEHFAAVSLPFEDAGSMWLLLPDEGVTPADLLKS GEAMDFVLSGGAKGAESTFLKIDMAVPKFDVEADMDLAEKLTALGAGSMFTNKADFSNL TDMDGVFIGSATHDARVKVDEEGCEAAAFTAMMYEGTALPPEERVEFKLDRPFLFALMG IDGLPLFYGVVNQL" /locus_tag="LOCUS_2420" /note="WP_007054058.1 serpin family protein (Bifidobacterium longum) [pid:28.5%, q_cov:82.0%, s_cov:87.8%, Eval:1.5e-34]" /note="MGA_323" CDS complement(1614..2141) /product="nitroreductase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459068.1" /transl_table=11 /codon_start=1 /translation="MEFNKLIETRRSVRAYAEAASKEDIEAILTLAQQAPSWKNGQPSR CYAVVTPEKVMEVQETCLPDFNARSSAGASLIVTTFVRNLSGFGPEGPANKAGNYWGAY DLGLHDAYLVLAASDLGFDTLIMGIRDAEALKKSLGIPEEEEVMAVIAVGKRAKEPGSR PRKDIAEVAKFF" /locus_tag="LOCUS_2430" /note="WP_011459068.1 nitroreductase family protein (Desulfitobacterium) [pid:27.9%, q_cov:97.7%, s_cov:93.8%, Eval:2.7e-12]" /note="MGA_324" CDS 2279..2989 /product="adenosylcobinamide-GDP ribazoletransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964693.1" /transl_table=11 /codon_start=1 /translation="MLGFFTRIPVPQIEYTEERYVKGIPLLPFVGAVSGGLLWCVFQLS RWLPMPVVALLIFLAYLLITGGIHMDGLGDSCDALFSARDPERMLEIMKDSRSGSFGVL GLIAASAAYLILLSYAPWQAVLLFPVVGKVTPALSSNWAPYIRAKGMAELFCQNATKGV LAFDALLCIAAGFALGIPVGIAAVIALFACVALVLRVKHILGGITGDILGLACEVSQLI FLFVCVVFSARGLL" /locus_tag="LOCUS_2440" /gene="cobS" /EC_number="2.7.8.26" /note="WP_010964693.1 adenosylcobinamide-GDP ribazoletransferase (Clostridium) [pid:35.4%, q_cov:99.2%, s_cov:96.4%, Eval:7.9e-31]" /note="MGA_325" ORIGIN 1 cacgtgtact tttccgtctg cggcattccg atgcagataa aataggaaga tccgcgcgac 61 gcagcgcggt ctttttctgt ctatcagggt gaaaggggat tttactatga tcatgaaaaa 121 agtgttgagc gcaggcctgg ccgttctgct ggctttcggt gcctgcagtt gtgccacggt 181 ggacgcagaa gataccgatc cgaccggcag cggcacaggc ccaaaggaaa agccggcagt 241 tacagagacc agctcctatg ctttagcaga gccggtgctg ccggaaatgg caccttatcc 301 ggatgagatg tcctttgccg gagaggacgg cctgttcgat tccgatgggt tcgacgccgc 361 ctggaccgcc tggaacgaag gggtgcaggc gagaagagac gcggcccaga gctatccggg 421 caagctggat gcctacttaa agaagacgac ggaaaccttc ctgacgccga aggaagcggg 481 gaagaatgcg gtctgctcgc cggtcaacat ctggctggcg ctggcgatgg tcgctgagac 541 cgcggatggg cagacccgta cggaactgct ggatctgctg ggcgtttcct ccatcgagga 601 ctgccggaaa ctggcgaaca agctctggac ggccaactat atcgacgacg gcgcagccac 661 cagcaaactg gcggcttctc tgtggatgaa ccaggatgta ccgttcaaag agcagacagt 721 ccagactctg gcggacgatt attttgcctc cacgttccgg ggcggcatga cggatccggc 781 gtattcggcg gccttcaaga gctggctgaa cgacaacacc ggcggcctgc tgcaggacgc 841 ggtggaaaac ctgccggatt tcgatccgca gaccatcatg gccctggcca cgaccgtcta 901 cttctccggc aagtggagcg accagttcca ggatgcgaac acctatacgg agaccttcca 961 cggggctgtt tcggacaagg atgcggactt tatgcaccgt tcgagcaccg ggcagtattt 1021 ctacagcgag cattttgctg cggtcagcct gccctttgaa gatgcaggca gcatgtggct 1081 gctgctgccg gacgaaggcg tgacccccgc agacctgctg aagagcggcg aagccatgga 1141 tttcgtgctc tccggcggcg caaagggggc ggaaagcacg ttcctgaaga tcgatatggc 1201 ggtgcctaaa ttcgacgtgg aagcggacat ggatctggcg gaaaaactga cggcactggg 1261 cgccggcagc atgttcacga acaaggcgga cttctccaac ctgacggaca tggacggcgt 1321 ctttatcggc agcgccaccc acgatgcccg ggtcaaagtg gacgaggaag gctgcgaagc 1381 ggcggccttt accgcgatga tgtacgaggg aactgcactg cccccggaag agcgggtgga 1441 attcaagctg gataggccct tcctgtttgc cctgatgggc atcgacggcc tgccgctgtt 1501 ctacggcgta gtcaatcagt tataaagacg aaaaaacggg gacggttctt tgtctcacta 1561 aagcagtgct gcactgctga gacaaagaac cgtctccgtt ttgcattttc ggattagaag 1621 aactttgcga cttcggcaat gtccttgcgg ggtctgctgc cgggttcctt ggcgcgcttg 1681 ccgacggcga tgacggccat cacttcttcc tcttctggga taccgaggct ctttttgagc 1741 gcttcggcat cgcggatgcc catgatgagg gtgtcgaagc ccaggtcgga tgcggccagc 1801 accagatagg cgtcgtggag tcccagatcg taggcgcccc agtagttacc ggccttgttg 1861 gcagggcctt ccggtccgaa gccggacaga tttcttacga aggtcgtcac gatgagggat 1921 gcgccggcgg agctgcgggc gttaaagtcg ggcaggcacg tctcctgcac ttccattacc 1981 ttttccgggg tcacgactgc atagcatctg gacggctggc cgttcttcca ggacggcgcc 2041 tgctgcgcca gggtgaggat cgcttcgata tcttctttgg atgccgcttc cgcgtaagcg 2101 cgtacgctgc ggcgggtctc gatcagtttg ttgaattcca ttctgtctct ccttgtctgc 2161 tttggatagg ttctacctgt tcattatctg ccctttgctc ccaaaatgca aatgcaaaag 2221 aagcccgtgc attgtataat aaatgcatag agatattatg ttccgatcct tccttttaat 2281 gctgggattc ttcacgcgga tcccggtgcc gcaaatcgaa tatacggaag agcgctatgt 2341 aaaaggcatt ccgctgctgc ccttcgtcgg cgccgtgagc ggaggcctgc tttggtgcgt 2401 tttccaactt tcccgctggc tgcccatgcc ggtcgtggcg ctgctgatct tcctcgccta 2461 tctgttgatc accggcggca tccacatgga cggcctgggc gactcctgcg acgccctgtt 2521 ctccgcccgc gatcccgagc ggatgctgga gatcatgaag gattcccgca gcgggagttt 2581 cggcgttctg gggctcatcg cggcgtcggc ggcctacctc atcctgctga gttacgcgcc 2641 ctggcaggcg gtgctgctgt ttccggtggt cggcaaggtg accccggcac tctcctccaa 2701 ctgggcacct tacatccggg cgaagggcat ggcggagctg ttctgccaaa acgccacaaa 2761 aggcgtgctg gccttcgacg cgctgctgtg catcgctgcc ggttttgccc tggggatccc 2821 cgtcggcatc gccgcggtca tcgcgctgtt tgcctgcgtg gcgctcgttc tgcgggtcaa 2881 acatatctta ggcggcatta ccggagacat cctgggcctc gcctgcgaag tctcccaact 2941 gatattcctg ttcgtttgcg tcgtgttttc tgcaaggggg ttgctatgaa aaagaaatct 3001 gtattggtcg ttcttttgat cctggcgctt gccttaggcc tcgcgctcac cggctgttcg 3061 agcggagacg ataccatcga tcccggcgat ctgcagcccg gctccgaaac ggaggaaccg 3121 gcggaaggcg aagcgggcga agaaggagaa ggggaacagg aggcggaact gcctcccgcc 3181 gttgacccgg ccaaacccaa accggtctat tactacaatc cgctgtccgg cgaacggacg 3241 atgtcggaca ttacgaagct gcggccctac gccgttatgc tgaacaacaa gcgcgaggcg 3301 ctgccccagc tgggcgtgag ccaggcggac atcatctatg aagtctgcgc ggagggcggc 3361 atcacccgta tggaagccct gtttgcgacc atggaaggcg tgggcaccct gggcagcatc 3421 cgttccatcc ggccctacta catcgagctg gcgctgggct acgacgccat catcatccac 3481 gcgggcggca gcgaagaggc ttattacgat ctgagcgcct ggaagaccac ccacttcgac 3541 ggcgtgcggg gcggctggga tgccagcatc ttctggcgcg atcagtggcg gatggcgaac 3601 cgcggctacg agcactccct gctcaccagc ggcgagaaca ttctgaagtt cgtggcggac 3661 tccaactacc ggctggaaca caacgaaggt tatcaggcgc cgatcaagtt caacaacgag 3721 aacgcagcga agttcggcgt ggatgccaac tccgtcacgg tgcgcttctc caactacaag 3781 acagacgtct ttacgtatga ccccgagagc ggcctgtaca tgatcgaggg ccacggacag 3841 gaatacatcg acggcaacac cgaagagcag gtgggcgtta cgaacgtgct cgtgctgaac 3901 ac // LOCUS sequence060 3824 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence060 VERSION sequence060 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3824 /mol_type="genomic DNA" /organism="" /note="sequence060" CDS complement(179..583) /product="GrdX family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012869887.1" /transl_table=11 /codon_start=1 /translation="MAAKAEIISNNPDIEALVPKTFSFTGMAGSPAKAVLTAARDRIHL GAKLLAHPMAGRLRPNETPYMTVVLAPPAPSTGAGTDLDRPSLEIIEYCLAEEEKYINM RKKYDEPLLPDLRFISCELFTGILQELGIR" /locus_tag="LOCUS_2450" /note="WP_012869887.1 GrdX family protein (Thermanaerovibrio acidaminovorans) [pid:31.7%, q_cov:94.0%, s_cov:95.1%, Eval:4.2e-12]" /note="MGA_328" CDS complement(750..2273) /product="FMN-binding glutamate synthase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012546886.1" /transl_table=11 /codon_start=1 /translation="MSFVRNNDSAFSDTKTRGQKLTPCSGMCSFCTEDCIGTCEIGLSA VLGKAMVYPTNTGSNQIASEKDNPIDYSIFNINGRCFGALGAPENGEYPSIYHVKTERT IGKRNPIKIALPFTLPALIKLNWKDYFAAAAMAGTICVIGEGSPSKDPDLKTENGKIVR FEKLKEMLGAFNRYYRGYGQIVLQCNVEDDAMGLPEYAIRECGAEGIEFKFGQSAKGTQ PANRIGSLEAAIAKKRDGFIVYPDPEDPAVAEAAKRGAAPGFWSYARHPLWTEETLAKR IEALRAMGLKNVYFKTAGFDPADLEKLLRIASDLEVDMITFDGAGGGSGYSPNKMMNEF GLPAACIESAIVPMCDKLKAEGKYIPSIVITGGFATEDQAYKALALGAPYVTAVGLCRA TMAAAMVGKKVGDLLKEGTVPAHLQKFGKTADELFLELGEVRSLYGEEADSMSLGAVGA YSYLRKMTFGVQHFATLNRKFDLALADRSDLIPLTQDARMLLKGTWFEW" /locus_tag="LOCUS_2460" /note="WP_012546886.1 FMN-binding glutamate synthase family protein (Thermodesulfovibrio yellowstonii) [pid:37.9%, q_cov:96.6%, s_cov:94.1%, Eval:3.0e-94]" /note="MGA_329" CDS 2416..2922 /product="prolyl-tRNA synthetase associated domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003428667.1" /transl_table=11 /codon_start=1 /translation="MNKQEIYDFLKQQHIDFEITEHPAVWNMEDVAQLEMPHPEADAKN LFVREDKTRNYYLITVKGDKRVDLKALRKEEGLRQLKFASAGELAEVLGLYAGAVTPLG LLNDESRTVTLIIDSYFLQTPALIGAHPNDNTATVWLKTEDLLWFLRSHGNEVLVRDLP YVPEE" /locus_tag="LOCUS_2470" /note="WP_003428667.1 prolyl-tRNA synthetase associated domain-containing protein (Clostridioides difficile) [pid:40.6%, q_cov:92.3%, s_cov:94.5%, Eval:4.2e-28]" /note="MGA_330" CDS 3035..3262 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPLEEADTVLFGIPFDGGASYRAGAAQAPDMLRANTLQSTPCTER LEWFDTFNVVDAGNFPLTMEDREEVFADIQ" /locus_tag="LOCUS_2480" /note="MGA_331" ORIGIN 1 ccaggatcag ctcgcgcatc tcatcgggat ctgcgatgag cgtatcccct tcgatgcgcg 61 cgggactgcc gaactcgatg ttccgtatgg cgatctttct gagttccagt tccatgcata 121 cctccttttc tcgttagtct tgctatgatt gcttatagaa agttgaaaga tcaacgttct 181 atcgtatgcc gagctcctgc aggatgcccg taaacagttc gcagctgatg aaccgcagat 241 cgggaagaag cggctcatcg tattttttgc gcatatttat gtatttttcc tcctccgcca 301 ggcagtattc gatgatctcc aggctgggac gatcgagatc ggtccctgcg cctgtcgaag 361 gggccggagg ggcaagcacc accgtcatgt agggcgtctc gttcgggcgc aggcggcccg 421 ccatggggtg agccaggagc tttgcgccga gatggatgcg gtcgcgcgcg gcggtaagta 481 ccgccttggc cggtgaccct gccatccccg taaacgaaaa ggttttcggc accagcgctt 541 cgatgtccgg attgttggaa atgatttctg cttttgcggc catttgccga agcgcctccc 601 ctctcagttt gattataata tacgaataaa tctgccgcca ctattacttt tttatataac 661 tgcaaatctt ccgataaaca atgcaagcaa tccaataaaa aagccggccc gaaggccggc 721 tgatgcagcg ggacaggtcc cttgtgtcgt taccattcaa accaggtgcc ctttaagagc 781 atgcgggcat cctgcgtaag cggaatgagg tcgctgcggt ccgccagggc gagatcgaac 841 ttgcggttga gcgtcgcaaa gtgctgtaca ccgaaggtca tcttgcgcag ataggaatat 901 gcacccacag cgcctaggga catgctgtcc gcttcttcgc cgtacaggct gcggacttcg 961 cccagctcca ggaacagctc gtccgccgtt ttgccgaact tctgcagatg agcgggaaca 1021 gtgccttcct tcagcaggtc gcccaccttc ttgcccacca tcgccgctgc catggtggcg 1081 cggcacagac cgacagccgt cacgtaggga gcgcccagtg ccagcgcctt ataggcctgg 1141 tcttccgtag cgaatccgcc ggtgatgacg atggacggga tatatttccc ttccgccttc 1201 agcttgtcgc acataggaac gatggcgctt tcgatgcagg cagcaggcag gccgaactca 1261 ttcatcatct tgttcgggct gtagccggat ccgccgccgg cgccgtcgaa ggtgatcata 1321 tccacttcca gatcggacgc gatgcgcagc agtttctcca gatcggcggg gtcaaaccct 1381 gcggtcttga aatagacatt cttcagtccc atggcccgca gcgcttcgat gcgcttggcc 1441 agcgtctcct ccgtccacag cggatggcgc gcataggacc agaaccccgg tgctgcaccg 1501 cgcttagcgg cttccgcgac agccggatcc tccgggtcgg gatagacgat aaaaccgtcg 1561 cgtttcttgg cgatggcggc ctccagagaa ccgatgcggt ttgcgggctg cgtgcctttc 1621 gcgctctgac cgaacttgaa ctcgatgccc tcggcgccgc actcccggat cgcatattcc 1681 ggcagcccca tggcgtcgtc ttccacgttg cactgcagca cgatctgtcc atagccccgg 1741 taatagcggt tgaatgcgcc taacatctcc ttcagttttt caaagcggac gatctttccg 1801 ttctccgtct tcagatccgg gtccttgctg ggagatccct cgccgatgac gcagatggtg 1861 ccggccatgg cggctgccgc aaaatagtcc ttccaattca gtttgatgag cgccggcagc 1921 gtaaagggga gcgcgatctt gattggattg cgtttgccga tggtgcgttc cgtcttaacg 1981 tgatagatcg acggatactc gccgttttcc ggtgcgccta gcgccccgaa gcagcggccg 2041 ttgatgttga agatcgagta gtcgatggga ttatcttttt cgctggcgat ctgattgctt 2101 cccgtattgg tgggatagac catcgccttg cccaaaacag cggagagacc gatctcgcag 2161 gtcccgatgc agtcttccgt gcagaaggag cacatgcccg agcagggcgt cagcttctgg 2221 ccgcgtgtct tggtatcgct gaaagcggaa tcgttgttgc ggacgaatga catgtatgac 2281 acctcttttc tatccgttcc gtgttaaaat ctgctattat aaaagtacca caaaaagacc 2341 aacccgtaaa tcagtaggat aaatgaactg tcggggacgg ttttttactg ttcatttttt 2401 atctgcagca gcatcatgaa taaacaggaa atttacgatt ttttaaaaca gcagcatata 2461 gacttcgaaa tcacggaaca ccccgccgtc tggaacatgg aggatgtggc gcagctggaa 2521 atgccccacc cggaggcgga cgccaagaat ctgttcgtgc gggaggacaa gaccaggaat 2581 tactatctga tcaccgtaaa gggcgacaag cgggtggatc tgaaggcgct gcggaaagaa 2641 gaaggcctgc ggcagctgaa atttgcgtct gccggggaat tggcggaggt gctcgggctc 2701 tacgccgggg ccgtcacgcc cctggggctg ctcaacgacg aaagccgcac cgtgaccctc 2761 atcatcgact cgtatttcct gcagacgccg gctctcatcg gcgcccaccc caacgacaat 2821 accgccaccg tctggctgaa gacggaggac ctgctctggt ttctgcgttc ccacggaaac 2881 gaagtgctgg tccgggatct cccttacgta ccggaggaat aagccggcac agtctttcgc 2941 acatcgtttt gaacagaaaa ggagatctcc catggtcaca aaagataaat agtccctcga 3001 tcccaacgcc tggtgcggac tcaaccgtcc ggacatgcct ctggaagagg cggacaccgt 3061 actgttcggc attcccttcg acggcggcgc cagctaccgc gcgggggcag cccaggcgcc 3121 ggacatgctg cgggctaaca cgctgcagtc cacgccctgc acggagcgcc tggaatggtt 3181 cgataccttt aacgtcgtgg acgccggcaa ttttccgctt acgatggaag accgggaaga 3241 ggtgttcgcg gacattcagt aattcgtctg cggtctcgta aaggcaggta gaaaaatcac 3301 catgataggc ggcgatcaca gcgttacgat ccccgtggaa cgcggcatcg acgatgccct 3361 ggacgaaccc ttcggcatca tccacatcga tgcccatatg gacctgtgcg acgcgctgga 3421 aggcgataaa ctgtcccacg gcaacacgga gcgccgggcg ctggagctga agaacataca 3481 gggtttcgag aacctctact ttatcggtat ccgctccatc gaacccgacg aattcgagct 3541 gtataaaaac aatcccatcc aggtgaagac cgctttcgac tgctatgcgg agggcatcga 3601 atccgtcgcg aaggactgca tcgaaaagat gagccgctac agcaaagtct acctcacctt 3661 cgatatcgat gcgcttgacc cggcttacgc cgcaggcacc ggcacgccgc agttcggagg 3721 gctcacctcc cgcatggcca tcaccctgct gaatatgcta ttcgacgcgc ttcccatcat 3781 cggtttcgat gtagtggaga tcgcaccgcc cctcgacccc tccc // LOCUS sequence061 3819 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence061 VERSION sequence061 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3819 /mol_type="genomic DNA" /organism="" /note="sequence061" CDS complement(82..786) /product="gamma-glutamyl-gamma-aminobutyrate hydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393651.1" /transl_table=11 /codon_start=1 /translation="MNKKPLIGITTSYDREHKEMNIRTTYTEAVMHGGGIPVLLPVTME PERIRELFDSVDGILLCGGPDIHPNIYGEQIKYYCGHVNHERDVFELELARLAIENDKP LMGICRGSQVLNVACGGTLYQDINLQGATDFKHADNSESHSPVAHPVDLLPGKLLQQVL GIDELEITSWHHQAVKKPGKGIEVCAMCPDGIIEGVYMPEKKCIFGLEGHPELLPDNPG YKLFDYFVDNCR" /locus_tag="LOCUS_2490" /note="WP_011393651.1 gamma-glutamyl-gamma-aminobutyrate hydrolase family protein (Moorella thermoacetica) [pid:42.2%, q_cov:97.4%, s_cov:97.4%, Eval:2.3e-43]" /note="MGA_333" CDS complement(817..2184) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MERNILEYVKETRELLATSEILGAQTARAAALQEKLEDQSITVSV IGQFKRGKSCLVNALLGEDILPTGIVPITSAATKIRYGKPSCSVRFFNGVVKPVSEAEL SHYINEQENPGNLLGVDCVDMTAESDFLKDGLTFVDTPGIGSYHKNNTDAAYAFIKESD AVIFMLSVDSPINEIEIDILRNTKEYAAKFFFAVNKIDTIGDADREAYINYCRNLLCTL MGVDDVVLFPISAKEGTGLEDLKTALNRDLRAKVREILEESARLKLKDIISQALSQIEL YWKVLLMPPAQLRGSLADLKTMLADAGEETAKTVHELEADRDIIIPGLEETLKVKLNEF KMQLSEGVTRIFGMDYHYELPSLKEGEESKGGYRLASELGREYLEETAALREDLDKTIN DVLMYRNNDAVDVVNRIYTLNKLTRTLKRTQRILQGMEEENPAPSNHPIKMTNLCP" /locus_tag="LOCUS_2500" /note="WP_012870015.1 dynamin family protein (Thermanaerovibrio acidaminovorans) [pid:28.4%, q_cov:66.8%, s_cov:78.4%, Eval:2.7e-30, partial hit]" /note="MGA_334" CDS complement(2194..2853) /product="GntR family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011391621.1" /transl_table=11 /codon_start=1 /translation="MKIDMEKDRGSSLPQDLFNKLRDDILQKKIKPGEKLTEQRICQEY QVSRTPVREAFQKLELDGLIEIIPNRGAFVLGLTRQDIEDMYELRSAYESIAVKWAIDR MTKEEFDEMQEAFELMEFYTMKQDPAKMLAMNTRFHQIIYNGTKNRMLQHTLTSYQVYT KNTKYSPEYIKEYMDEVLEEHRQIFLAFQAKDKEAASRAAVQHMSNGKHRAGFGTD" /locus_tag="LOCUS_2510" /note="WP_011391621.1 GntR family transcriptional regulator (Moorella thermoacetica) [pid:34.3%, q_cov:91.8%, s_cov:86.6%, Eval:1.8e-31]" /note="MGA_335" ORIGIN 1 caaaaacact caaccacatt atatagtatt taggccttcg attcaaccat agaaaaagac 61 ccgccgcagc gggccttgcg atcatctgca gttgtcgaca aagtagtcga acagtttata 121 gcccgggttg tcgggcagca gttcggggtg cccctccaga ccgaagatgc actttttctc 181 cggcatgtac acgccttcga tgatgccgtc ggggcacatg gcgcagacct cgatgccttt 241 gccgggtttc tttacggcct ggtgatgcca ggacgtgatc tctagttcgt cgatgcccag 301 cacctgctgc agcagcttgc ccggcagcag atccacggga tgggcgacgg gggaatggct 361 ctcggagttg tccgcgtgct tgaagtccgt ggcgccctgc aggttgatgt cctggtacag 421 cgtgccgccg caggcgacgt ttaagacctg actgccgcgg caaatgccca tcaggggctt 481 gtcgttttca atggcgaggc gcgccagttc cagttcgaac acgtctctct cgtggttcac 541 gtggccgcag taatacttga tctgctcgcc atagatattg ggatggatgt ccgggccgcc 601 gcacagcagg atgccgtcca cggaatcgaa cagttcccgg atgcgctccg gctccatggt 661 gacgggcagc agcaccggaa tgccgccgcc gtgcatcacg gcttcggtgt aggtggtacg 721 gatgttcatc tccttatgtt cgcggtcgta gctcgtcgta atgccgatga ggggtttttt 781 gttcatgcga tgtcctttct atgccgagtg acccgatcag gggcacagat tcgtcatttt 841 gatgggatgg ttgctgggcg cggggttttc ttcctccatg ccctgcagga tgcgctgggt 901 gcgctttaag gtgcgggtga gcttgttgag ggtatagatg cggttgacca cgtccacggc 961 gtcgttgttg cggtacatca gcacgtcgtt gatggtcttg tccagatcct cgcgcagcgc 1021 ggccgtctcc tccaggtatt ccctgcccag ttcggaggcc agccggtagc cgcccttgct 1081 ctcctcgcct tccttcaggc tgggcagctc gtaatggtag tccatgccga atatgcgggt 1141 cacgccttcc gacagctgca tcttgaattc gttcagcttt accttgagcg tttcctccag 1201 ccccgggatg atgatgtcgc ggtccgcctc gagctcgtgc acggtcttcg cggtctcttc 1261 gcccgcatcg gccagcatgg tcttgaggtc tgccagactg ccccgcagct gtgcgggcgg 1321 catcagcagc accttccagt acagttcgat ctgggacagc gcctgggaga tgatgtcctt 1381 cagcttaagg cgcgcgctct cctccaggat ctcccggacc ttggcccgca ggtcgcggtt 1441 gagggcggtc ttcaggtctt ccaggccggt gccctctttc gcgctgatgg ggaacagcac 1501 cacgtcgtcc acgcccatca gggtgcacaa cagattgcgg cagtagttga tatacgcctc 1561 ccggtcggca tcaccgatgg tgtcgatctt gttgaccgca aagaaaaact tggcggcata 1621 ttccttcgtg ttgcgaagga tgtcgatctc gatctcgttg atgggagagt ccacggacag 1681 cataaagatg acggcgtcgc tctccttgat gaacgcgtag gccgcatccg tgttgttctt 1741 gtgataggag ccgatgcccg gcgtgtcgac gaacgtaagg ccgtccttta ggaagtcgga 1801 ctccgcggtc atgtccacgc agtccacacc caggaggttg cccgggtttt cctgctcgtt 1861 gatgtaatgg gacagctccg cttcgctcac gggcttgacg acgccgttaa agaagcgcac 1921 gctgcaggaa ggcttcccgt agcggatctt cgtcgcggcg gacgtgatgg gtacgatgcc 1981 ggtgggaagg atatcttcgc ccagcagcgc gttgacgagg cagctcttgc cccgcttaaa 2041 ctgtccgatg acggacacgg taatgctctg atcctccagt ttttcctgca gcgctgccgc 2101 tctggcagtc tgcgcaccca ggatctcgga ggtcgcgagg agctcccggg tctcttttac 2161 gtattctaag atattacgtt ccatataaaa agtttaatcc gttccgaagc ccgcccggtg 2221 cttgccgttg ctcatgtgct gcacggcggc gcggctggcg gcttctttgt ctttcgcctg 2281 gaaagccagg aagatctgcc tgtgctcctc caggacttcg tccatgtatt ccttgatgta 2341 ctcagggctg tacttcgtgt tctttgtgta gacctgatag gacgtaaggg tgtgctgcag 2401 catccggttc ttcgtgccgt tgtagatgat ctggtggaac cgggtgttca tggcgagcat 2461 cttggcgggg tcctgcttca tggtgtagaa ctccatgagc tcgaacgctt cctgcatctc 2521 gtcgaactcc tccttggtca tccggtcgat ggcccacttc accgcgatgg attcgtaggc 2581 ggagcgcagc tcgtacatgt cctcgatgtc ctggcgggtg agcccgagaa cgaaggcgcc 2641 ccggttgggg atgatctcga tgagcccgtc cagctccagc ttctggaacg cttcgcgcac 2701 gggtgtgcgg ctcacctggt attcctggca gatgcgctgt tccgtcagct tttcgccggg 2761 ttttatcttc ttctgcagga tgtcgtctct cagtttgttg aacaggtcct ggggaagcga 2821 gcttcccctg tccttttcca tgtcgatctt caaagtcgta tgcctttctg cgggtctatc 2881 tgggttctgc gtaaatgttc tcgccttcca cgcggaagtc cacgaagttg gagttgatgt 2941 attcgccgga agcgtctctc atctggaaga ccagggtgta ggtgtcgtcg ggcagccagg 3001 cttcctcgaa gcgcgtatcc ttgccgtacg tgatggtcgc cacgctgtag ggctcgaaat 3061 ccgtcgtgcc ggcgggtgcc atgtaccaga tgagatcgat gctgtcgcct tcctccaggc 3121 tgtagaggtt cttgtccgcc atgccgttgg catccacggg cttgcgggcg cccagcaccg 3181 tccaggtctc agtcttgaag tcgtagacca cgtccagctt atattcttcc ccgttgatca 3241 gcacgggcac ggcgtacagg ttgtaatctt cgccctcgta ggacagctcc ataaatacga 3301 gctgaccgcc gagagagccc cagctgccgc ggaagttatc ggtaaagacg cccttctccc 3361 agtcggcgaa gatgtcgttg tccgtgccca tccagagcac ggtgccgctc ttctcgtcgg 3421 acagatacag ggagaagctg atgccggcca gcaggtcgtt ggcttccgga ccgagggtga 3481 gcacggcgct gccctcgtcg ttgaccttca gagacttgcc ttcccagccc atatccttca 3541 tggtcttggg tgcagcgggc gcttccacgg gcgcttcgct caggcccttc acgtaagcca 3601 ggccttcgtc cgtcagtttg cctgtcagac cgtactggta gaaatacggg aacgactggc 3661 tggcggagat gccggcgtag gcgttgaagg tcttcatgtc gttggtgtac gggaagaaga 3721 aggacaggcc cgtcgcattg ctgcggtatc tgccgttgat ctcatacagc acgcagtcgt 3781 ccaatgcagc cgttaccgac ttggccgaag ccagcagag // LOCUS sequence062 3808 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence062 VERSION sequence062 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3808 /mol_type="genomic DNA" /organism="" /note="sequence062" CDS complement(304..1107) /product="NAD(+)/NADH kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003418878.1" /transl_table=11 /codon_start=1 /translation="MKTVYVYHYAGSKESGAVAEQLKEKLRNAGFTVAEEFGPSVEFAC VVGGDGTFMHGLRECGFPDIPFVGVNTGHLGFFQEFQPDSLDQLVDLIRTGDYRVQRHS LLQASVRTEGGKTYDFKGLTDVIFRGSISKVTHLNLAIGDNFIEKFSGDGILIASSAGS TAYNYSLGGSLVDPRVDLLQITPMAPMNTTVYRSFTSSLLVPPGLDIHIFPDRNYKDSG YLIVDGEEYFFEHVEDISVDLSKDEIQLVRLSDYDFWGKVMSKFL" /locus_tag="LOCUS_2520" /note="WP_003418878.1 NAD(+)/NADH kinase (Clostridioides difficile) [pid:42.3%, q_cov:100.0%, s_cov:100.0%, Eval:5.0e-59]" /note="MGA_338" CDS complement(1109..2899) /product="oligoendopeptidase F" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_015944353.1" /transl_table=11 /codon_start=1 /translation="MARDRKNTPIEYTWNVEAMYEMASGCEKDLQNCLQLAEKFKEYKG SLDNGPKTLLAALRDRDIVIRKLRKASEYAFLRKCEDNRVPEFQALADKAAMIGARVSE ITSFFTPELAAIPGDKLRSWIEAEPGLAVYAHFLDEIQRNRPHILSKEEEKLLAQLSEI SGVMGDTFDMLSDADFKFGTILNEKGEETEVTHGSYIGLVSCKDRSVRKEAYEHMYAQY EAYRNTVASLYTYSVKQDVAMARIRNFGSALEASVFDDNVSADVYNNLIDVVNAHLPAM HRYVALRKKLLGLDDLAMYDIYVPVLDEPETDIPYEEAQKIIDEALVPLGEEYRGIVKQ AFASRWADVYENEGKTSGAFSAGCYDSIPYILLNYNNKLDDVFTVIHEMGHSMQTWYSN HNQEPVNADYPIFTAEVASTVNESLLYRHLIDHADSDLRKAYLINQYLDGFKGTLFRQT QFAEFERDVHAMVEAGDMPTCESLCKLYGDLNAKYYGPDVNYDEHIAIEWARIPHFYGA FYVYKYATGYSAATAISKKILEEGQPAAENYIKFLRSGGCDYPLELLKLAGVDMSTPAP IEAAMQTFEELLDELERLIG" /locus_tag="LOCUS_2530" /gene="pepF" /note="WP_015944353.1 oligoendopeptidase F (Desulfitobacterium hafniense) [pid:48.2%, q_cov:99.5%, s_cov:99.0%, Eval:4.9e-163]" /note="MGA_339" CDS 3004..3522 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTKEELYDLLEIDTPADLEYFEQMADLLETEEEISWDLFRHALSE IRAENAGEFAENYVGELMNAVPDGVPADGLTEALDAMQQRLMLLAEDLDEAQAREDFAE ELYKLRNWLHDEEGVLVDGEPLPMLQAFTEMRAEKLGAASHTYDLERFPELTPEEISYS LGRFEKIEM" /locus_tag="LOCUS_2540" /note="MGA_340" ORIGIN 1 atgcaccacg aggaacggct gcttgtttac gacgagcagg tcgtcgtcct cgtagaccac 61 gtccagtggg atgttctcgg ggtcaaagta actgctttcc ttcggaaacg atatcgtaag 121 catctgcccg ggacgtccct tgtcccggag ccgcgccttt tggccatcca gggcgatctg 181 tcccgacacc ttgatcttgc gcatcagacg cgaggagagc gaaaagcggc gctgcagcac 241 ttcctttacg tagagacctt cgtcggcctc cgttaaccgg taggtgatgt cgtttgccat 301 ggtctacagg aacttggaca tgaccttgcc ccagaagtcg taatccgaca ggcgcaccag 361 ctggatctcg tccttggaga ggtctacgga gatatcttct acgtgttcga agaagtactc 421 ctcgccgtcc acgatcaggt agccgctgtc cttatagttg cggtccggga agatatggat 481 atccagcccc ggaggcacca gcaggctgct ggtaaagctg cggtacaccg tcgtgttcat 541 gggcgccatg ggcgtgatct gcagcagatc cacccgggga tcgaccaggc tgccgcccag 601 ggaatagtta taggcggtgc tgccggcgga agatgcgatc aggatgccgt cgccggagaa 661 cttctcgata aagttgtcgc cgatggcgag attcagatgg gtgaccttcg agatgctgcc 721 ccggaagatg acatccgtca gtcccttgaa atcgtaggtc ttgccgcctt cggtgcgcac 781 cgacgcctgc agcaggctgt ggcgctgcac ccggtagtct ccggtgcgga tgaggtccac 841 cagctgatcc aagctgtcgg gctggaactc ctggaaaaag cccaggtggc cggtgttgac 901 ccccacaaag gggatgtcgg gaaagccgca ttcgcgcagg ccgtgcataa acgtgccgtc 961 tccgccgacg acacaggcga attccaccga agggccgaat tcctctgcga cggtaaaccc 1021 tgcgttcctg agtttttcct tcagttgttc cgccacggca ccggactctt tcgaaccggc 1081 atagtggtat acgtaaacag tcttcatgtt aaccgatcag tctttccagc tcgtccagca 1141 gttcttcaaa ggtctgcatc gccgcttcga tgggagcggg ggtgctcatg tccacgccgg 1201 cgagcttgag cagttcgagc ggatagtcgc agccgccgga tctcaggaat ttgatatagt 1261 tttccgctgc cggctgccct tcctccagga tcttcttgga gatcgcggta gcggcggagt 1321 agccggtcgc gtatttatac acgtaaaatg cgccgtaaaa atgcggaatg cgggcccact 1381 cgatggcgat atgctcgtcg tagtttacgt cgggtccgta atacttcgcg ttcaggtcgc 1441 cgtacagttt gcacagggat tcgcaggtcg gcatgtcgcc ggcttccacc atggcgtgga 1501 cgtcccgttc gaactctgcg aactgggtct ggcggaacag cgtgccctta aagccgtcca 1561 gatactggtt gatgagatat gccttgcgca gatcgctgtc cgcgtgatcg atcaggtggc 1621 ggtacagcag cgattcgttc accgtgctgg caacttccgc cgtaaagatc ggatagtccg 1681 cgttcaccgg ctcctggttg tggttggaat accaggtctg catggagtgg cccatctcgt 1741 ggatgaccgt aaagacatcg tccagcttgt tgttatagtt cagcaggata tagggaatgc 1801 tgtcgtagca gcctgcagaa aaggcgccgc tcgtcttccc ttcgttctcg tagacgtcgg 1861 cccagcggct ggcaaaggcc tgctttacga tgccgcggta ttcttctccg agaggtacca 1921 gcgcctcgtc gatgatcttc tgcgcttcct cgtaggggat gtccgtctcc ggttcatcca 1981 gcacgggcac gtagatatcg tacatggcca gatcgtccag gcccagcagt ttcttgcgca 2041 gcgctacgta gcggtgcatg gcgggcagat gggcgttgac cacgtcgatc aggttattgt 2101 aaacgtccgc ggagacgttg tcatcgaaaa cagatgcctc cagcgcggaa ccgaaattcc 2161 ggatgcgggc catggcgacg tcctgcttta cgctgtaggt gtagaggctc gccacggtgt 2221 tgcggtacgc ttcgtactgg gcgtacatgt gctcgtaggc ctctttgcgg acgctgcggt 2281 ccttgcagga caccagcccg atgtagctgc cgtgggtcac ttccgtctct tcgcccttct 2341 cgtttaagat ggtaccgaat ttaaagtcgg cgtcggacag catgtcgaag gtatcgccca 2401 tgacgccgga gatctccgac agctgcgcca gcagcttttc ttcctctttg gagaggatgt 2461 gaggacggtt gcgctggatc tcgtccagaa aatgcgcata aacggcaagg ccgggctccg 2521 cttcgatcca gctgcggagc ttatccccgg ggatcgccgc cagttccggc gtaaagaaac 2581 tggtgatctc gctcacgcgg gcaccgatca tggccgcctt atccgccagc gcctggaatt 2641 ccggcactct gttgtcctcg cacttgcgca ggaacgcata ttccgacgct ttgcgcagct 2701 tgcggatgac gatatctctg tcccggagcg ccgccagcag cgtcttggga ccgttgtcca 2761 ggctgccttt gtattccttg aacttctcgg ccagctgcag gcagttctgc agatcttttt 2821 cacagccgga agccatttcg tacatcgctt ccacgttcca ggtgtattct atgggcgtat 2881 tttttctgtc tcttgccatt gtatccgacc tccacgggca aaattaacca aataagtata 2941 ccataaaaga acgcacaatg gtataatttt aaacagtttg aggactttca ggagaaaaag 3001 gacatgacga aagaagaact gtacgatctg ctggagatcg acaccccggc ggatctggaa 3061 tatttcgaac aaatggcgga cctgctggag acagaggaag agatctcctg ggatctgttc 3121 cgccacgccc tctcggagat ccgggcggaa aacgcaggcg aattcgccga aaactacgtg 3181 ggcgagctga tgaacgcggt gccggacggc gtgccggcag acggacttac cgaggcgctt 3241 gacgccatgc agcagcgcct gatgctgctg gcggaagatc tggacgaagc gcaggccaga 3301 gaggacttcg cggaagaact atacaaactc agaaactggc tgcacgatga ggaaggcgtg 3361 ttggtggacg gagagcctct ccccatgctg caggccttta cggagatgcg tgccgaaaaa 3421 ctgggcgcgg caagccacac ctacgatctg gaacgtttcc ccgagcttac gcctgaggag 3481 atctcctaca gcctgggaag attcgagaag atcgagatgt gatcatccga tattccacgt 3541 gctttttccg ctgcgggaga aaaacagata gtcgatcagg cctttctgat aagggataaa 3601 gctcccgtcg tctatcatgg cctcgatctc cgtctgactt gcccaccgga ccgcagcgac 3661 ttcttcctgc tgcagggtca gcccttcggc atccacatcc atcggcagca cataaaaatc 3721 gtcgaaccct tccgggaaat ggaccgtcag ggcaggctgt atcgcatcga actcgatcga 3781 aagaccgagt tcttcttttg tttcgcga // LOCUS sequence063 3802 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence063 VERSION sequence063 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3802 /mol_type="genomic DNA" /organism="" /note="sequence063" CDS 1993..2310 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSLESMKMVEKAELDAKKLIAEEKARAKTAAEQAAAAGRQKLEEE SEKARKSAAEVIENAKLVGKASCTDIDRASEDAIARLRSAAEHKLPDAARFIAERIAEN L" /locus_tag="LOCUS_2550" /note="MGA_343" ORIGIN 1 catacctgct ggatgagacc agccaggatg aaggatacga atgcaacacc ggcaaccgtc 61 agtgcgtagg gcagctgcgt gaacacgtgg ttcaggtggt agcagtgtgc gcctgcggaa 121 gccatgatgg tggtatcgga aatgggggag cagtggtcgc ccataacgcc gccggagcag 181 gctgccgcca gaccgatggt gcagaggacg ggctctacgt cgtagtcgaa tacggatacg 241 acgatcggcg ccatgatgcc gatggtgccc caggaagtac cggtcgcgaa accgatggct 301 gcgccgatga cgaagatcac ggcaggcagg aagttcttca gggagcctgc attggcaagt 361 gccgcgctta cgtagtcagc agagtacatg gcgtatctgg tgaaggagca cagcgtccag 421 gccagggtga ggatgaggat gggggatacc atctggatga agcccttggg aacggagtcg 481 aagctctttt cgaagccgat caggcgtctg caccagaagt acaggaaggt gaagatcatg 541 cccagggtgc cgccgatgga caggcccaga gctgcatccg catctgcgaa ggaatcggtg 601 aaggctgcgc cgtcgaagaa accgccggtc cagatcatgc cgatgatgca gaagatgatc 661 agaacgataa cgggtacgag caggtcggca acagaggtct tcttgtcgga aggtgcttcg 721 taatcgtctg cgccttcgaa cggacggtgt tcggtggtga acaggtcgcc cttgacctga 781 gcgttgtact cgtgctggag catgggaccg tagtcgatgt tcttgatgga gatgaccacg 841 atcatgacca gcgtgaggat gcagtagtag ttccagggga tctgcttgat gaacagctgg 901 aagccgttta cgttgtcgct gttaacgtag ccggaaacag cagcagccca ggaggagatc 961 ggtgcgatca tgcagaccgg agctgcagta gcgtcgataa cgtaagccag cttcgctctg 1021 gagatgttgt gggactcggt gaccggtctc ataacggcgc ctacggtgag gcagttgaaa 1081 tagtcatcta cgaagatgag aacacccagc agcatggtga tgagctgtgc ggatgctctg 1141 ctcttaactc tggtcttggc ccagcgtccg aatgcttcgg agccgccgcc cttgttcatc 1201 aggtcggaga tgataccaag ttcgaccagg aagatgatga tgcccatgtt ccaggagtcg 1261 cacagaacgg acagcagacc gtagtcagaa ccgacgagag ccaagatggt ctcccaggga 1321 cggaactgtg tatacagcaa tgcgccgata aggcagccga agaacaggga ggaatacact 1381 tccttagaga tcagtgccag tgcaatggcg cagatcgggg gaagcaggga ccagaacgtt 1441 cccgcgaacg gagtctcagc atcttctacg atgatgggct tgttcgcata agacgtgccc 1501 aggaaagcca gcagtgcgat gatgatgact acggctacca gataggcggt cttggtgctt 1561 ttcttttcca tagaaaataa cctcctaaaa ataaagataa aaattgcgac aggtttctaa 1621 caggtcgttc aaaaaatacg gcacacctgt acgaatatat tataccaaat atttgggttt 1681 tgtgaacaaa aaagagaagg agaacgacat tgtttctgtt tgtcgcttta aagttctgca 1741 tatccttcac gatttgttgc aatttgtcat atatttcaca aatagtttgt tgaaacaaaa 1801 caacagtgat gctattttaa taaacagttg acaaatatac cacacctgtg gtaatgtgta 1861 cccggacaaa tcttctaccg caaggtgaga gattgtgata tactaatgca gataagaagc 1921 aagaggcgca gaggacggta tcgttttttt tgcggccttt ttctatattc tcacgcaagg 1981 agagtgaagc gaatgtcact ggaatccatg aaaatggtgg aaaaggcgga actggacgcg 2041 aagaagctca tcgcggaaga gaaggccaga gccaaaacgg ctgcggaaca ggcggctgct 2101 gccggcagac agaagcttga ggaggaatcc gaaaaggcca ggaagtctgc ggcggaagtc 2161 atagagaacg cgaagctcgt gggcaaggcc tcctgcacgg acatcgaccg ggcttcggaa 2221 gatgccatcg cccggctccg cagcgcagca gagcacaagc tccccgacgc tgcccggttc 2281 atcgcggaaa ggatcgcgga aaatctatga gcattcagaa gatgaagcga gtccgtctga 2341 tcggactgcg cagcgaaaag gatgcgtttc tggacgatct gctccgcttt ggtaaagtcg 2401 agatctcgga ttatccccag gcggaaggcg acgtcgtggt gttcagtacg aacaactacg 2461 ataagaccgg ccttcctgca gacatgctgg tggtcaacca gaacaagctg agtgcggctc 2521 tggacatcat gcagcggtat ttcccggaga aaaagggact gctggatccc aaacccgagg 2581 cgccgctgga aagctttctc agcgatgccc ggctcaacag ctgcctgcac agcgcaaacc 2641 gcgtcatccg gctggacggc gagatcaagg gatggaacaa cgagatcggg gaactgcaga 2701 cgcaaaagac ggcgctgcag ccctggctta cgctggacat gccgctggaa tacgagggca 2761 cggagcacgt ttcgtttacg ctctgcagcc ttcccgcgga cgccccgaag gcggatgtgg 2821 aaagcgcgct ggcgctggca gctccggaga gcgaactcat tcccgtctct tcggataagt 2881 tcctgcagta ttgcctgctg gtctgccaca gagacgaatt cgatgcggcg gaggatgccc 2941 tgcgcaattt cagctataac ccgatggagc ggatgaacct cacagggacc ccgcaggaga 3001 acgtcgaacg catcgacaac gaagtcgaat acgacgagat caagatcgag cgggccaagg 3061 gcaagctgat gagcgaaacg gcttaccggc agtacatcca gcagagctgg gacagcctgg 3121 ccacgaagct gtacgagacg gagagccgca gccgcatgct caactccgag agctccttcg 3181 ccatggaagg ctgggtgccg gaggaggatg tcccaggact ggaggcggtc ctcggcaact 3241 acgtcgtcca cgcggagttt gaagatccgg cgccggaaga gtatccggac gttccggtca 3301 aactgaagag caacatcctc acccgctgca tgaacatgat cacgaacatg tactccctgc 3361 cggcttacga cggggtggat cccaacccgc tcatggcgcc tttcttcatt attttttacg 3421 gcatgatgat ggcggacatg ggctacggca tcctgatgtt cgcggcaggc atgctcatga 3481 taaagaagat gaaagccaga ggcggcacga gagatttcgg cgaactgctg gtctggtgcg 3541 gcatctccac cttcctgtgg ggcgctgcga ccggcggttt cttcggagat tttatcccgc 3601 aggccatcaa gatcttcaac ccggagagca cctttaccat gccggcgctg ttcacgccgc 3661 tggaagacac catcgccatc ctgttcggat cgctggcgct gggcatcgtg cagatcttta 3721 ccggcatgat cgtcagcgtc aaggagaagt tcaagagagg ggagttcaag agcgccctgt 3781 tcgacgaatt cgcctggtgg gc // LOCUS sequence064 3792 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence064 VERSION sequence064 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3792 /mol_type="genomic DNA" /organism="" /note="sequence064" misc_feature <1..1253 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_118838626.1:amidohydrolase" /note="WP_118838626.1 amidohydrolase (Salinibacter ruber) [pid:30.1%, q_cov:98.6%, s_cov:73.3%, Eval:6.8e-41, partial hit]" /note="MGA_345" /locus_tag="LOCUS_2560" CDS 1268..2113 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKIAVTYENGQVFQHFGHTEQFKVYEVEDGKVVSSQVFGSDGTGH EALAVLLSQRAIDVLICGGIGGGAQAALQEQGIELCAGASGDADAAVQAYLRGELVNTG ANCDHHDHHGEGHECGDHSCGGHEGGCGGCHGPRMEGPNVGKKVRTHYRGTFNDGTQFD SSYDRGEPLEFICGAGMMIPGFDKAVADMKPGEIRNVHLMPEEAYGIRDLNNVLTLEIQ QLPGSQDLNVGERAYLQTMDGRPFEVQVIAKDDKNITLDANHEMAGKELNFEIELVEVE " /locus_tag="LOCUS_2570" /note="WP_010933554.1 peptidylprolyl isomerase (Chlorobaculum tepidum) [pid:45.6%, q_cov:48.4%, s_cov:95.1%, Eval:9.9e-29, partial hit]" /note="MGA_346" CDS 2141..3271 /product="amidohydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010972927.1" /transl_table=11 /codon_start=1 /translation="MDKTLFDKAVELRHEIHAHPDLSNQERPTFERIIAFLRENAPSIE ILDRGHYVLARYKAADPKKPPIAFRADVDAILVYDDIDKPWKSTIDGVGHKCGHDGHAA ALAALAMQLDKDGADRDVYMIFQPAEENGTGSAMCTDFLTEFGIAEIYGFHSQAGAPKY TVMLRDGLYCCASKGMTITMTGSPAHASQPEDGKNPSEAIAKTVLAVSKIADQANYKGL VLATIVQIDVGEKEAFGVAASKGKLLMTIRGEIEAEMDLLQARLEDEAMKNAAEYGLAC QFSYCDAFPETVSTPACNEKLRKACDALGYKWWDRPMFYRGSEDFGNFTKVVPGAMFFI SNGEDGECDGCHTLHFDFNDELIDMVVNIEMELIRA" /locus_tag="LOCUS_2580" /note="WP_010972927.1 amidohydrolase (Agrobacterium tumefaciens complex) [pid:33.0%, q_cov:97.3%, s_cov:95.6%, Eval:1.9e-47]" /note="MGA_347" ORIGIN 1 atctggaccg catctccacc gagatccccg tggccatcgt ccggggctgc gagcacgcag 61 gtgccgtgaa ttccgtgctg ctggctgcca tggggctcga taaggatcac catacgatcg 121 agggcggcga agtcgtcctc ggcgaagacg gcgaacccaa cggctacctg aaggaggccg 181 ccatccgcgc catctacggc tacatcccca acctgtccga cgaggaactg gaggaggcca 241 tcctgacggc gatgcgctac tgcgcttcct ggggtatcac cacggtgcag agcatggatc 301 tgggcaccta tctgcccaac tggacgccca actaccgcgt gctgaagggc atttacgaga 361 agggcgagga tctggtccgc tatacgggtc agacgtcctt tgctaccgtg gaagacttta 421 aggcctacgt ggacggctcc tacggcgaaa cgcccgacgg cttcccgttc aaggaagtgg 481 tcgcagacga ccgcatgcac atgggcccgt tgaagctggt gcgcgacggc gctctgggcg 541 cccgcacggc catgatgcgc cgcgaatact gcgatgaccc gggcaactac ggcatcgatt 601 ccatgtcgga cgagtcctat caggcctatg tggatgtagc agctgcagca gggctgcaga 661 cggtcaccca ctgcatcggc gatgaggcca tcgagcgctg cacgaagcag tggaacaaga 721 ccggcagaaa agacttgcgc ttcggcgtgg tgcacaacca gatcacggat gtaccgctgc 781 tgcagttcct gaaggattcc ggctgcgtta tcgcttacca gcccatcttc ctggacagcg 841 acatgcatgc ggtggagagc cgctgcggca aggaactgag ttccacgtcc tacgcgttta 901 aaacggcgcg ggagatgggg ctgcgctgct cctacggcac ggatgcgccg gtggtggatc 961 cgaatccctt tgacaatctc tactccgcgg tgacccgcaa ggatctgaag ggctggccgg 1021 aagagggctg gaacccccag gagtgcgtgg accgggagac cgccgtcgac tgctacacgg 1081 aggacagcgc gtactttgaa ttccgggaga ccgtaaaggg ccggctgaag cccggcttct 1141 acgcggacct caccgtgctg gacaaggact tctttacctg cgcggaggac gagatccggg 1201 gcatccgtcc cgtgctcacc atgtgcgccg ggaaaataac atatcgtaaa taagagagga 1261 aatatctttg aaaatcgcag ttacttatga aaacggccag gtgtttcagc actttggcca 1321 cacggaacag tttaaagttt atgaagtaga agacggcaaa gtcgtgtctt cccaggtctt 1381 cggatcggac ggcaccggcc atgaagcgct tgccgtgctg ctgtcccaga gggcgatcga 1441 cgtcctgatc tgcggcggca tcggcggcgg tgcacaggcg gcgctgcagg agcagggcat 1501 cgaactgtgc gcaggcgcca gcggcgatgc ggatgcagcg gtacaggcct atctgcgagg 1561 cgagctggtc aataccggcg cgaactgtga ccaccacgat catcatggcg aaggccacga 1621 gtgcggcgat cacagctgcg ggggtcacga aggcggctgc ggcggatgcc acggtccccg 1681 gatggaaggc ccgaacgttg gcaaaaaggt ccgcacccat taccgcggca ccttcaacga 1741 cggcacgcag ttcgattcgt cctacgaccg gggcgaaccc ctggaattca tctgcggcgc 1801 agggatgatg atccccggct tcgataaagc cgtcgcagac atgaagcccg gcgagatccg 1861 caacgtgcat ctgatgccgg aggaagctta cggcatccgg gacctgaaca acgtgcttac 1921 gctggagatc cagcagctgc ccggttccca ggatctgaac gtaggcgagc gggcctacct 1981 gcagacaatg gacggacgtc cgttcgaggt gcaggtcatc gcgaaggacg acaagaacat 2041 tacgctggat gccaaccacg agatggccgg caaagagctc aactttgaga tcgaactggt 2101 ggaagtagag taactgggat cacagataag gaggcaatct atggataaga cacttttcga 2161 caaggcggtg gaactccggc acgagatcca cgcgcatccc gacctttcca accaggaaag 2221 accgactttt gaacggatca tcgccttttt aagggaaaat gctccgtcga tcgagatcct 2281 ggacagaggg cattacgtgc tggcccgcta taaggctgcc gatccgaaga agcctcccat 2341 cgctttccgg gcggatgtgg acgccatcct ggtgtacgac gacatcgata agccctggaa 2401 gagcaccatc gatggcgtgg gtcacaagtg cggccacgac ggccacgcgg cagccctcgc 2461 agccctggcc atgcagctcg acaaggacgg cgcggacaga gatgtctaca tgatcttcca 2521 gcccgccgag gagaacggta cgggatccgc catgtgcacg gacttcctga ccgaattcgg 2581 catcgccgag atctacggct tccacagcca ggcgggagcg cccaaataca ccgtcatgct 2641 gcgcgacggg ctctactgct gcgccagcaa ggggatgacc atcaccatga ccgggtcacc 2701 cgcccacgca agccagccgg aagacggcaa aaatccatcc gaagccatcg ccaaaacggt 2761 gctggctgtc tcgaagatcg cggaccaggc caactataaa ggtctggtgc tggccaccat 2821 cgtgcagatc gacgtaggcg agaaggaagc cttcggcgta gccgcctcca agggcaaact 2881 gctgatgacc atccgcggcg agatcgaggc ggagatggat ctgctgcagg caaggctcga 2941 ggatgaagcc atgaagaacg ccgcggaata cggtctggcc tgccagttca gctactgcga 3001 cgcgttcccc gaaacggtga gcacgcctgc ctgcaacgaa aagctccgca aagcctgcga 3061 cgccttggga tacaagtggt gggaccgtcc gatgttctac cggggatccg aggatttcgg 3121 caactttacg aaggtcgtgc ccggcgccat gttcttcatc tccaacggcg aggatggcga 3181 atgcgacggg tgccatacgc tgcatttcga cttcaacgac gaactgatcg acatggtcgt 3241 gaacatcgag atggaactga tccgcgcata atacccattt aatgtaaatt gtatccatgt 3301 aaataaattg cacggaatca cgcaaatcgt atacaatctc tgcccgtagt gctatactaa 3361 aagagcatag aactacgggc atttttatgc cttcgctata gtaaaaaaag aaaaggagag 3421 acaaatgatc cagctgcatg aacagggcgt cttcctcgta gacggcaagc cttgcgatca 3481 gggcttagaa ccgaaggaag aggccaagaa gaagaccatc gcttacggca ttcttcaggc 3541 tcacaacaga tcggaagatc cggagaaact gcagatcact ttcgatgcca tggtttccca 3601 cgacattacc tatgtcggga tcatccagac agcaagaggc tccggcctga aagaattccc 3661 catgccgtac gctatgacca actgccacaa ttccctttgt gcagtaggcg gaacgatcaa 3721 cgaagacgac cacgtgttcg gactttccgc ggccaagaag tacggcggta tttatgttcc 3781 ggccaatatg tc // LOCUS sequence065 3784 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence065 VERSION sequence065 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3784 /mol_type="genomic DNA" /organism="" /note="sequence065" CDS 438..806 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKSSLDNLVEISMLMDFYGALLSERQQQIVTLYHEENCSLQEISE ELGVSRQGVHEALKKAEKSLQGFEEKLGLVARFRSQEQVLQNALASVDELLGRCEDPGV RQGLLRIKNDINSIEEQV" /locus_tag="LOCUS_2590" /note="WP_003393779.1 putative DNA-binding protein (Clostridium botulinum) [pid:40.7%, q_cov:74.6%, s_cov:82.7%, Eval:7.0e-15, partial hit]" /note="MGA_350" CDS 809..2146 /product="signal recognition particle protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005813193.1" /transl_table=11 /codon_start=1 /translation="MAFESLSEKLSGVFKKLRGKGVLTESDINEAMREVKLALLEADVN YKVVKEFVADVKEKALGEEVLKSLTPGQQVVKIVNDELVALMGGGSSKLTYSPSGFTTI LMVGLQGTGKTTTCAKLAAYLKKQGKHPMLAACDVQRPAAIDQLEVVGGQVDVPVFCDR ESKDPADIALRARKEAERKGLDMLIVDTAGRLHVDEALMEELKEVKKAVKPHEILLVVD AMTGQDAVTAAEAFHEAMGIDGIVMTKLDGDTRGGAALSVKSVTGRPIKFIGMGEKLDA LEPFYPDRMASRILGMGDVMSLIEKAQEAVDEEKAAELEKRLAKNQFTLEDFLDQIGQI KGMGGLGKVLNMLPGVQGKVSEDDMDAGEKEFRTMEAIIQSMTPEERKKPDLLNASRRK RIAAGAGVTVAKVNQLIKKYEDTRKLMKQLNNGKFGKRFGRRFPGF" /locus_tag="LOCUS_2600" /gene="ffh" /note="WP_005813193.1 signal recognition particle protein (Desulfitobacterium hafniense) [pid:62.2%, q_cov:95.7%, s_cov:93.4%, Eval:4.8e-149]" /note="MGA_351" CDS 2196..2438 /product="30S ribosomal protein S16" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003720111.1" /transl_table=11 /codon_start=1 /translation="MVKIRLRRMGAHKKPFYRVVVADQRTARDGKSIEEIGTYNPLTNP VEINIDAEAAKKWLANGAVPTDTCRALLKKAGILE" /locus_tag="LOCUS_2610" /gene="rpsP" /note="WP_003720111.1 30S ribosomal protein S16 (Listeria) [pid:65.8%, q_cov:98.8%, s_cov:87.8%, Eval:1.2e-24]" /note="MGA_352" CDS 2452..2688 /product="KH domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003362589.1" /transl_table=11 /codon_start=1 /translation="MTGLVETIARSLVDSPDEVQVRELPGKDPGVTVVELKVAASDMGK IIGKQGRIVKALRTVVKAAAVKQNKKVVVEIVS" /locus_tag="LOCUS_2620" /note="WP_003362589.1 KH domain-containing protein (Clostridium) [pid:61.0%, q_cov:98.7%, s_cov:100.0%, Eval:2.7e-19]" /note="MGA_353" CDS 2747..3235 /product="ribosome maturation factor RimM" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003384687.1" /transl_table=11 /codon_start=1 /translation="MDTIKLGKITAPQGIKGEVRVYPYTDELTRFSEIEAVLLDGQKRK IQNARYMKNMAVLKLEGVDDRNMAESLRNKELLLAKEDLWEQPEDTYFIDDLVGCTVIS EDGAPVGMLKSIISRPAQDLYEIERADGSTFLLPAVKEFIKNVDLDNKTITIHLINGL" /locus_tag="LOCUS_2630" /gene="rimM" /note="WP_003384687.1 ribosome maturation factor RimM (Clostridium) [pid:40.5%, q_cov:94.4%, s_cov:92.1%, Eval:4.9e-31]" /note="MGA_354" ORIGIN 1 ccatcgaatt cgagaactac gaaaagatgt gggcccgcat gcgctccatc ctgtgcccga 61 acaaggccat cgtcaaggaa tgggcggaca aagaaccgca tctggaactg atcggcgatc 121 cctggggcac tacctgcctc atccgctacg actacgacgt ggattccgag actctggcga 181 aggacgctat ggaagacgag agaaagatcc tgttcgtccc cggcgactat ttcgacatcc 241 cgaagaccat ccgcgtaggc tacggcgcct tccgcgatcc cgaggtgctg aaggccggcc 301 tggcccagtt ctccgattac ctgaagaagt gggagaagta gttctccgat ccctctgaag 361 gcctataaat tcttttatgc gggttgtcaa gttttttgct tgacaacccg ttttcgttat 421 gatatcatcc ccaaggtatg aagagcagtc tggacaattt agtggagatc agcatgctga 481 tggacttcta cggcgcgctg ctttccgagc ggcagcagca gatcgtaacg ctgtaccatg 541 aagagaactg cagtctgcag gagatctccg aagagctggg cgtttcccgg cagggcgtgc 601 acgaagcgct caagaaggcg gaaaagtcgc tgcaggggtt cgaggaaaaa cttggcctgg 661 tggcgcggtt tcgttctcag gaacaggtgc tgcagaatgc actcgcgtcc gtggacgaat 721 tgctgggtcg gtgcgaagac cccggcgtcc ggcagggatt gctccggatc aaaaacgata 781 tcaactccat cgaggaacaa gtataaacat ggcttttgaa agtctttcgg aaaaattaag 841 cggcgtattt aagaagctgc gcggcaaggg cgtccttacg gaaagcgaca tcaacgaagc 901 gatgcgcgaa gtcaagctgg cgctgctgga agcggacgtc aactataaag tcgtcaagga 961 attcgtcgcc gacgtcaagg aaaaggccct gggcgaagag gtcctgaaga gccttactcc 1021 gggtcagcag gtcgtcaaga tcgtaaacga cgaactggtt gccctcatgg gcggcggcag 1081 cagcaagctc acgtattccc ccagcggatt tacgaccatc ctgatggtgg gtctgcaggg 1141 caccggtaag accacgacct gcgcgaagct ggcggcttac ctgaagaagc agggcaagca 1201 ccccatgctg gcagcctgcg acgtgcagcg tcccgcagcc atcgatcagc tggaagtggt 1261 gggcggacag gtggacgttc ccgtgttctg tgaccgcgag agcaaagatc cggcggacat 1321 cgcgctgcgc gccagaaaag aggcggagcg caagggcctg gacatgctca tcgtggatac 1381 ggcaggccgt ctccacgtgg acgaagccct catggaagag ctgaaggagg tcaaaaaagc 1441 cgttaagccc cacgagatcc tgctggtggt ggacgccatg accggtcagg acgccgttac 1501 ggcggcggaa gccttccacg aagccatggg catcgacggc atcgtcatga cgaagctgga 1561 cggcgatacc agaggcggcg cggcgctctc cgtcaagagc gtaacggggc ggcccatcaa 1621 gttcatcggt atgggcgaaa agctggacgc cctggaaccg ttttatccgg accgcatggc 1681 cagccgcatc ctcggcatgg gcgacgtcat gtctctcatc gagaaggcgc aggaagctgt 1741 ggacgaggag aaggcggcgg aactggaaaa gcgcctggcg aaaaaccagt tcaccctgga 1801 ggatttcctg gatcagatcg gacagatcaa gggcatgggc ggcctgggca aggtgctcaa 1861 catgctgccc ggcgtgcagg gcaaggtgag cgaagacgac atggatgcgg gcgagaagga 1921 gttccgcacc atggaggcga tcatccagtc catgaccccg gaagagcgta aaaagccgga 1981 cctgctgaac gcgtcccgca gaaagcgcat cgcagccggt gcgggggtca ccgtggcgaa 2041 ggtcaaccag ctcatcaaaa aatacgaaga caccagaaag ctgatgaaac agctcaacaa 2101 cggtaaattt ggcaagagat tcggaagaag atttcccgga ttttaacgca taaacaagtt 2161 caatcgatcg atatctataa ttttggaggt aacaaatggt taagatcaga ttaagaagaa 2221 tgggtgctca caagaagcct ttctacagag tcgtcgttgc agatcagaga acggcaagag 2281 acggtaagtc catcgaagag atcggcactt acaaccccct caccaacccc gttgagatca 2341 acatcgacgc agaagctgcc aagaagtggc tggccaacgg cgcagttccc accgacacct 2401 gccgcgctct gctgaagaag gccggcatcc tggaataacc gggggccttc tatgacaggt 2461 ttggtagaaa cgatcgcaag atccctcgtg gacagcccgg acgaagtcca ggtccgcgag 2521 ctgccgggaa aagatcccgg cgtgactgtg gtcgaactga aggtggccgc gtccgacatg 2581 ggcaagatca tcggcaagca gggccgtatc gtgaaggcgc tgcgcaccgt cgtcaaggca 2641 gccgcagtca aacagaacaa gaaagtcgtc gtggagatcg tctcttagga ctctcccgga 2701 gaaaaggcgg ggcagacccg ccttttttca aaacggaagg agaccgatgg ataccatcaa 2761 actgggaaaa ataacggcgc cgcagggcat caagggcgaa gtgcgggtct atccgtacac 2821 ggacgagctc acccgcttct ccgagataga agcggtgctt ctggacgggc agaaacggaa 2881 gatccagaac gcccgctaca tgaagaatat ggctgtcctt aagctggaag gcgtcgacga 2941 ccgcaacatg gcggaaagcc tgcgcaataa ggaactgctc ctggcgaagg aagacctgtg 3001 ggagcagccg gaggatacgt atttcatcga cgacctcgta ggctgcactg tgatctccga 3061 agacggggct cccgtaggta tgctcaagag catcatcagc cgccccgccc aggatctcta 3121 cgagatcgaa agggcagacg gcagcacgtt cctgctgcct gcggtcaagg agttcattaa 3181 aaacgtcgat ttagacaaca aaacgatcac cattcacctg atcaatggat tataagcgta 3241 tgaaagtcac gatcctcaca caatttcccg acatgttcgg gccggtgacc accagcatcc 3301 tcggcagagc tgccgaaaaa ggcctgctgg agctggacat cgtcaatatc cgggactata 3361 cgctggacaa acacagaaag accgacgaca cgcccttcgg cggcggcgcc ggcatggtga 3421 tgaccccgca gcctgcgttc gacgcgctgc gcagtctcgg ggcgcagggt aagcgcatcc 3481 tgtacatgtc ccccagagga cctatcctgg accagaatct ggccgaggac ctggcgtcgg 3541 aggaggagtt ctttattctg tgcggtcatt acgaaggggt tgacgaacgc atcctcaaag 3601 cctggaacat ggaggaggtc tccataggcg attatatcct gacgggcggt gaactggctg 3661 ccatggtcct cgtcgactgc gtgtcgcggc tcggtcccgg cgtgctggga agcggcgatt 3721 cgctgtccga ggaatccatc tacagcggcc tgctggaata tccccagtac acgaagcccc 3781 gcag // LOCUS sequence066 3782 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence066 VERSION sequence066 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3782 /mol_type="genomic DNA" /organism="" /note="sequence066" misc_feature <1..1127 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011837459.1:peptide ABC transporter substrate-binding protein" /note="WP_011837459.1 peptide ABC transporter substrate-binding protein (Streptococcus sanguinis) [pid:26.2%, q_cov:83.7%, s_cov:48.6%, Eval:2.8e-19, partial hit]" /note="MGA_356" /locus_tag="LOCUS_2640" CDS 1251..2195 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKYILKRFGAALLSLFIIITLIFCLLRLMPIEGYLGPNVDKLSE EVIAAKLAAKGLDKPVPVQLFNFYRNLARGDLGKSWIYRENVDIVKIIKPKIKISAKLG AMAMGLSLLIGIPLGAVMARSKGKWPDKLGTGFIVFLQAAPSAVYFLFIQMYATKGTGL PMLYNDSKPISWILPIISLALPSIANYGMWMRRYMVDQMNQDYVKLARAKGVSNKAVMM KHVFRNAFVPMVQTIPSSLLFTIMGSLYVESIYSVPGMGGLLIDVIQRQDNTMVQALVL IFASVGIIGLFLGDILMVLVDPRISLTGKEESR" /locus_tag="LOCUS_2650" /note="WP_002902452.1 ABC transporter permease (Streptococcus) [pid:41.5%, q_cov:68.2%, s_cov:43.4%, Eval:4.1e-42, partial hit]" /note="MGA_357" CDS 2195..3241 /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002893621.1" /transl_table=11 /codon_start=1 /translation="MSLFRKGAVMEKASEGMADQLEKALRDSLPDDLTPEQVAALDPSR FEMAEYDDTLAEKTGYSSYSYWRSTFRAFWNNRLARFLLVALLLLIAFTIIQPHLPGQR PPAQIYDFDDGSVMRNLPPSHDFWFGTNAVGQDLWARVWSGTRTSLLIALIVAISDNVI GITIGILWGYVRKLDAFLTEVYNIIDNIPRTIILILISYILRPGMATMIISMCCVGWLG MARFIRNQILMIRDRDYNLASRCLGTSTGKIMIKNLLPYMVSVIMLQTALAIPSVISDE VFLTYCGLGMPKNIASLGNLVEEGRKMMMTSSRYQLIFPALVVTFITVSFYLIGNTFAD ASDPRNHV" /locus_tag="LOCUS_2660" /note="WP_002893621.1 ABC transporter permease (Streptococcus sanguinis) [pid:37.8%, q_cov:89.1%, s_cov:99.7%, Eval:6.7e-60]" /note="MGA_358" ORIGIN 1 ataacgctca ggcagactcc atcgctccgg aaatgttcct gcgcggcgag atcgactcct 61 gctccgtcac caccaacatc ctggatgaat ggctcaacgg cgacaacgcc cagtacgtcc 121 accagtccaa gaagctgggc accatcatgt acatgctgtt caacttcaac ccgaagatgg 181 atgacgaagc agcaaacgaa gcctacagag cagccgtcaa caacaagaac tggcgtatgt 241 ccatcgtgta cggtctcaac aaggcttact gcctgtccgc ttacgacccc tactatgcgg 301 aagaacgcgt tacgaatctg atgatccccg cagacttcgc gatggtcgac ggtaaagact 361 acaccgagtt cggcaacctg cccgaactgt ccaagggctt ctatgacgaa gccaaggctc 421 tggaattcag agatgctgcc aaggccgaac tggaagccgc cggcgtgccc ctgcccatcc 481 agatccccgt attctacaac ccctccacgc cgaacatgga caactccttc cagctgatcg 541 aaaagcagct cgaagaactg ctcggcaccg actacatcga cattacggtc tacgccggcc 601 cgaccacgaa cttcatcggt gaagtccgcc gtcccggcaa gtggggcctc tacgaacagg 661 gctggtcccc ggactacgca gatcccgcga cctacttcga acccttcggt tacggctgga 721 ccttcggttc tcaagaatac atcgaaggcg atgaatacaa gaccggctac atctataccg 781 aagaagatta cgccaacaac gtgatcgacg acgaagaact ggtcggaacc ccgcagatgg 841 tcttcaactc cctggtcgaa gcggccagag ccgaaaagga actgaacgcc cgctacgaac 901 tgttcgccaa ggcggaagaa tacgccctga ccgaaggcct gatgatccct tatcagcagt 961 acaacgacgg ctacgttgcg tccaagctcg ctctctacga agcagagaac gcgatggccg 1021 gtatctgcgc gtacaagtat aagggcatgc acctgctcga aaagtcctac tccatggatg 1081 aattcgaaaa ggctaccgag gcctgggaag ccgacaaggc aaagtaagac gctttgagat 1141 ctccaaatct caatagaaaa gcgcaataaa gtggagggtg tcccaaaagg catgccaatg 1201 ctgaagggac accctctttt ctcaatcaaa cacagaagga ggatgaaaag gtggcgaaat 1261 acatactcaa gcgcttcggc gcagcccttc tcagcctttt tatcatcatt acgctcatct 1321 tctgtctgct gcgcctgatg cccatcgaag gctatctggg accgaacgtg gataagctga 1381 gcgaagaagt catcgcagcg aaactggctg cgaagggact ggacaaaccg gttcccgtgc 1441 aattattcaa cttttaccga aatctcgcgc ggggcgacct gggcaaatcc tggatctacc 1501 gcgaaaacgt ggacatcgtc aagatcatca agccgaagat caagatctcc gcgaaactgg 1561 gagcgatggc catgggcctc tccctcctca tcggcatccc tttaggcgcg gtcatggcgc 1621 gaagcaaagg caagtggccc gacaaactgg gcaccggctt tatcgtgttc ctgcaggctg 1681 ccccttccgc cgtgtacttc ttgtttatcc agatgtacgc gacaaaagga acaggcttgc 1741 cgatgctata caacgacagc aaacccatct catggatcct tcccatcata tccctggccc 1801 ttccctccat cgccaactac ggtatgtgga tgcgccggta tatggtggac cagatgaacc 1861 aggactacgt aaaactggcc cgcgccaagg gcgtatccaa caaggcggtc atgatgaagc 1921 acgtgttccg caacgccttc gtgcccatgg tccagacgat cccctcgtcc ctgctcttca 1981 ccatcatggg ttccctatat gtggagtcga tctactccgt tcccggcatg ggcggtctgc 2041 tgatcgacgt catccagcgc caggacaaca cgatggtgca ggcgctggtc ctcatcttcg 2101 cctcggtggg catcatcggc ctgttcctgg gcgacatcct catggtgctc gttgacccgc 2161 gcatcagtct taccggaaag gaggagagcc gctgatgagt ctgtttagaa aaggcgccgt 2221 catggaaaaa gcctcggaag gcatggcgga tcagctcgag aaagcgctcc gggattccct 2281 tcccgacgat cttacgcccg agcaggtcgc cgcgctcgat ccttcccgct tcgagatggc 2341 ggaatacgac gataccctgg cggagaagac cggctactcc agctattcct actggcgcag 2401 cacgttccgc gcgttctgga acaacaggct ggcgagattc ctgctcgtcg cgctgctgct 2461 cctcatcgca tttacgatca tccagcccca tctgccgggt cagcggcccc ccgcccagat 2521 ctacgatttc gacgacgggt ccgtcatgag aaatctcccg cccagccacg acttctggtt 2581 cggcaccaac gccgtcggcc aggatctgtg ggccagagtg tggagcggca cgagaacgtc 2641 gctgctgatc gcactgatcg tcgcgatcag cgataacgtg atcggcatca cgatcggcat 2701 cctgtggggc tacgtccgca aactggacgc cttcctcacg gaagtctaca acatcatcga 2761 taacatcccg agaacgatca tcctcatcct gatctcctac atcctgcgtc cgggcatggc 2821 cacgatgatc atctccatgt gctgcgtggg ctggctgggc atggcccggt tcatccgcaa 2881 ccagatcctg atgatccgcg acagagacta caacctcgcg tcgcgctgcc tgggcaccag 2941 caccggcaag atcatgatca agaacctgct gccttacatg gtgtccgtca tcatgctgca 3001 gaccgcgctg gccattccgt cggtcatctc cgacgaggtg ttcctcacct actgcggcct 3061 gggcatgccg aagaacatcg cctccctggg caacctggtg gaggaaggcc gcaagatgat 3121 gatgaccagc agccggtacc agctgatctt cccggctctg gtggtcacgt tcatcaccgt 3181 atcgttctat ctgatcggca acacgttcgc ggacgcgtcc gatccgagaa accacgtata 3241 gaaaggaggc aaagacatgt taaacaacgg agatatcatc ctctccgtaa aggatctgca 3301 tgtaaagttc agcctccgcg gcaaagtgct caacgcgatc cggggcatct ccctggacct 3361 gcacaagggc gaatccctgg ccatcgtcgg cgaatccggc tccggcaaat ccgtcttcac 3421 caagaacttc atcggtcttc tggacaagaa cggctgggtg gactccggcg agatctggta 3481 ttacggcatg gatccggaac atcccgtcga cctggcgaaa tacaagaccg aggaacagtg 3541 gcagaccata cgcggcaagg aagtcgccat ggtgatgcag gacccgatga cctccctcaa 3601 ccccttgaag accataggct ggcagatcga agaagccctt aagctccacc aggggttaaa 3661 gggcgaagcg gccagcaaaa aggcggtgga gatcctgcag gacgtaggca ttcccgaggc 3721 ggaacgccgc gccaagcagt atccccacga gttctccggc ggcatgcgcc agagagtcgt 3781 ca // LOCUS sequence067 3770 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence067 VERSION sequence067 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3770 /mol_type="genomic DNA" /organism="" /note="sequence067" CDS complement(393..1172) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIRDFFLRGRTGHPLLPELKQYRYAHRGYHDKPQIPENSLPAFRR AIERGWGAELDVHLLKDGTLAVFHDSDLKRCTGEEGTIEDLDLAQLKQLRLEGTQEQVP LFDEVLALFEETKPLIIELKTYKGNHRALAEAVCKRLDSYKGLFCIESFDPRAVADVRQ LRPDIVRGQLVSNFLKDPEGLPRYQRIVLTNLLFDCKARPDFIACKFEDRGVSSIRRTV DKLGVQEVCWTIRRMEDLKTCEAAGAIPIFEKFDPEG" /locus_tag="LOCUS_2670" /note="WP_013363043.1 glycerophosphodiester phosphodiesterase family protein (Bifidobacterium bifidum) [pid:34.1%, q_cov:86.1%, s_cov:72.9%, Eval:3.8e-24, partial hit]" /note="MGA_361" CDS complement(1172..2506) /product="SLC45 family MFS transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010867389.1" /transl_table=11 /codon_start=1 /translation="MKLNNKRTVLVGLAFLSICAFWQMYDNVVPLILTNTFHLNETFSG AIMAGDNILALFLLPFFGGLSDRTDTKIGKRMPYILLGTAAAVVLINVLPLLDNGYYAA PSSFKLVSFVITLGLLLVAMGVYRSPAVALMPDVTPKPLRSKANAIINLMGAVGGMIYL AIAAVLYPNEKVKGLAHVDYRPLFVIVSAIMLAAVIILFVTIKEPKLTAENRALEEQHP EWNLAEDDGSGGEILPPPVKRSLGFLLASIALWFIGYNGITTWFTTYVSQVMGQALGGA SKCLLIATVGAIISYIPIGVLASKIGRRRTIMGGIVLLAVCFALGYVLTTTYSSINAIM FIVFALVGLAWAAINVNSLPMVVEMCKGSDIGKFTGYYYTASMAAQIVTPILAGTLMRN ISYKILFPYAALFVALSFLTMTQVHHGDNRPEAKKGLQAFEEMDD" /locus_tag="LOCUS_2680" /note="WP_010867389.1 SLC45 family MFS transporter (Pyrococcus abyssi) [pid:33.1%, q_cov:100.0%, s_cov:99.6%, Eval:1.8e-63]" /note="MGA_362" CDS complement(2503..3330) /product="HAD-IIA family hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004082267.1" /transl_table=11 /codon_start=1 /translation="MALKDKKLFLLDMDGTLYLSDRLFDGTLDFLDHVKRTGGRAVFMT NNSSRGLDAYIRRMAGFGIACGPEDFVTSTDATIRYLKGAYGPKTRYFVCGTESLKQQL RAAGLILAEENGAPEADPGDLADVVLLGYDKELTYRKLEVCCILLSRGADYIATHPDLV CPTWYGSAPDCGSIIALLKTATGREPLVLGKPQPAMVQLAMEKTGFSPDQTVVIGDRIY TDIACGVNAGVDTVFVLSGEGVPSDIEKYDIHPIYVYNGIRDVLNALEKESDV" /locus_tag="LOCUS_2690" /note="WP_004082267.1 HAD-IIA family hydrolase (Thermotoga maritima) [pid:41.1%, q_cov:96.0%, s_cov:98.1%, Eval:1.6e-55]" /note="MGA_363" ORIGIN 1 gcccggcttt gtacggcgcg aagtacaagg gcattgtcgc gaaccgcgcg gacgaaccgg 61 ccgacgagac cgttacgatc tgcggcaagt gctgcgaagg cgactccgac atgatcatca 121 aggacgcccc gttcgcgatg cccaaaaccg gcgacatcat cgcggtgttc tccaccggcg 181 cttacggcta ctccatggcc aacaactaca accgcaaccc catccccggc gtcgtgctgg 241 tggaaaaagg caaggcggaa tggatggtaa agccgcagac ctacgagcag atgatctgct 301 gcgacgtaat gcccgaatcg ctgaaataaa cagcacacct atcatggaca cgaaaaaacc 361 ggccgtttgg ccggtttttt atgcttttga tcttaccctt ccggatcgaa cttctcgaag 421 atggggatgg cgcctgccgc ttcgcaagtc ttaaggtctt ccatgcgccg gatcgtccag 481 cagacctcct gcacgcccag tttatccacc gtcctgcgta tgctggatac gccgcggtct 541 tcgaacttgc aggcgataaa atccggacgc gccttgcagt cgaacagcag attcgtaagc 601 acgatgcgtt ggtaacgggg cagaccctcc ggatccttca gaaaattcga tacgagctga 661 cccctaacaa tgtccggccg cagctgcctt acatctgcga cggctctggg gtcaaacgat 721 tcgatgcaga acaacccctt gtaggaatcc agccgcttac agaccgcctc cgccagcgcc 781 cgatggttgc ccttgtaggt cttcagttcg atgatgagcg gctttgtctc ctcgaacagc 841 gccaatacct catcgaacag aggcacctgc tcttgtgtgc cttccagccg cagctgcttc 901 agctgcgcga ggtccagatc ctcgatcgtg ccctcctcgc ccgtgcagcg tttcaggtcc 961 gaatcgtgga acacagccag ggtgccatcc ttcagcagat gcacgtccag ttccgcgccc 1021 catccccttt cgatggctct gcggaatgcc ggcagcgaat tctccgggat ctgcggttta 1081 tcgtgatagc cccggtgggc gtagcggtat tgctttaatt ccggcagaag cggatgcccc 1141 gttctgcctc tcagaaagaa gtcgcgtatc atcagtcgtc catctcctca aacgcctgca 1201 ggcccttctt cgcttccggg cggttgtcgc cgtgatgcac ctgggtcatc gtcaggaaac 1261 tcagcgccac gaacagcgcc gcgtagggga acaggatctt gtagctgatg ttgcgcatca 1321 gcgtgcccgc caggataggc gttacgatct gcgccgccat ggacgcggtg tagtagtaac 1381 cggtaaattt accgatatcc gagcctttgc acatctccac gaccatgggc agggagttga 1441 cgttgatggc agcccaggcc aggccgacca gcgcaaacac gataaacatg atcgcgttga 1501 tggagctgta agtcgtcgtg agcacgtaac ccagagcgaa gcacacagcc agcagcacga 1561 tgccgcccat gatggtgcgt ctgcggccga tcttcgatgc cagcacgccg atggggatat 1621 aggagatgat ggcgccgact gtggcgatca gcaggcactt ggacgcgccg cccagcgcct 1681 gtcccatcac ctggctcacg tacgtcgtaa accaggtcgt gatgccgttg tagccgatga 1741 accacagcgc gatggatgcc agcaggaagc ccaggctgcg ctttaccggc ggaggaagga 1801 tctcgccgcc ggacccgtcg tcttccgcca ggttccattc gggatgctgt tcttccagcg 1861 cccggttctc cgccgtaagc tttggctcct tgatcgtgac gaacaggatg atgaccgccg 1921 ccagcataat ggcggagacg atgacgaaca gaggccggta atccacgtga gccaggcctt 1981 tcaccttctc gttgggatac agcaccgcag cgatcgccag atagatcatg ccgcccacgg 2041 cgcccatcag gttgatgatg gcgttggcct tggaacgcag aggcttggga gtaacgtccg 2101 gcatgagcgc tacagcagga gagcggtaga cgcccatggc cacgagcaaa aggcccagcg 2161 tgatgacgaa ggacacgagt ttaaagctgc tgggggctgc gtaataaccg ttgtcgagaa 2221 gcggcagcac gttgatgagc acgacagctg ccgccgttcc cagcaagata tagggcatgc 2281 gtttgccgat cttcgtatct gtcctgtcgg acaggccgcc gaagaacggc agcaggaaca 2341 gcgccagaat gttgtcccct gccatgatgg cgccggagaa cgtctcgttc aggtggaacg 2401 tattcgtgag gatgagaggc acgacgttgt cgtacatctg ccagaaggcg cagatggaca 2461 ggaaggcaag gccgaccagc accgttcgtt tgttgttcaa tttcatacgt cagactcctt 2521 ctccagggca ttcagcacgt cccggatgcc gttgtacaca tagatggggt gtatatcata 2581 tttttcgata tccgaaggca ccccttcccc ggacagcacg aagacggtat cgacgccggc 2641 atttacgccg caggcgatat ccgtatagat gcgatcgccg atgaccacgg tctgatccgg 2701 agaaaaaccg gtcttctcca tggcgagctg caccatggca ggctggggtt tgcccagaac 2761 aagcggttcc ctgcctgtcg ccgtcttcag cagcgcgatg atgctgccgc agtccggcgc 2821 actgccgtac caggtcggac agaccagatc gggatgggtc gcgatgtaat ccgcgccgcg 2881 gctgagcaaa atgcagcaga cctccagttt gcggtacgtc agctctttat cgtatcccag 2941 cagcacgaca tccgcgagat cgcccgggtc agcctccggc gcaccgttct cctccgcgag 3001 gatcagcccc gcagcccgca gctgctgctt taaactctcc gtgccgcaga cgaaatagcg 3061 ggtctttggt ccatacgcgc ctttcaggta acggatcgtg gcgtccgtcg acgtcacaaa 3121 atcctccggg ccgcacgcga tgccaaaccc ggccatacgg cggatatagg cgtcgagtcc 3181 ccgggaggag ttgttcgtca taaagaccgc cctgccgccc gtccgcttaa catggtccag 3241 aaagtccaat gtgccgtcga acaggcggtc gctcaggtag agcgtgccgt ccatgtcgag 3301 cagaaacagt tttttatctt ttaacgccat gctactctcc cggacggtag aacttcgcca 3361 gaccgccctc tgccgtctcc cggtaacggg cgttcatgtc cagaccggtc tggtacatgg 3421 tctccacgac ggtatcgaag gagatcttgc gggagctggt gaggaacgtg gcgatggata 3481 cggcattgat ggaccgcatg gccgccacgg cgttgcgttc gatgcagggg atctgcacga 3541 gaccgtcgat ggggtcgcaa gtgagcccca gcatatgctc catggaaacc tccgcggagt 3601 actcgatctg ctccagctcc agaccccgga tctccgcgag agccgccgct gccatgcagc 3661 aggcggtgcc gacttccgcc tggcagccgc attccgcgcc ggagatggag gcgttcgtct 3721 tgacgacgtt gccgatgacc cctcccgttg ccagcgcctg caggatgacc // LOCUS sequence068 3757 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence068 VERSION sequence068 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3757 /mol_type="genomic DNA" /organism="" /note="sequence068" CDS 448..1389 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEFQTYNIVNERPRTIRALARQALQGRWTEAFVLLLVVTAIEQVP VSLVNSIAKQGSILGFIASIYSLLIAGPLAMGVAYYFIKLFRQRNGGLDDLKYGFGYAQ KAIVLHLNIIIRVFLWALLFIVPGIIAGIRYSMANYILADDPSKSPQQCLFESSAMMRG NKMNYVVLMISFVGWLIVASIPSGIVESILVRPAQAFLNSTDPSQYYAALSQAANHPLA LLASVPTLIVNAYMNTATACFYDLANGNLSVGGYDYAAAQGSVEDPFTGKDVTFTDVPT EVTHEDLPETFEDPELKAAEDKYTGDDNIYGE" /locus_tag="LOCUS_2700" /note="WP_008760815.1 DUF975 family protein (Bacteroides) [pid:36.8%, q_cov:55.3%, s_cov:78.7%, Eval:3.4e-20, partial hit]" /note="MGA_366" CDS 1389..2894 /product="UDP-N-acetylmuramoyl-L-alanyl-D-glutamate--L-lysi ne ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002285962.1" /transl_table=11 /codon_start=1 /translation="MKKQTFLYEYVELLRGEGLLDAEPSKDLQFAPVQQLTFDSREAAP GTLFVCKGEAFKPEYLEKAFEAGAFCYVSEVRYAGEHLAILVSDIRRAMALMAELFYGT EERSFKLIGLTGTKGKSTTLYFIKNVLDAWYEKDGKRVGFLSTIDSYDGVNEFESHLTT PEAFTLHEHFWHAEEAGLPAFVMEVSSQGLKYDRTYGVSFDAGAFLNYGIDHVGKGEHT DEEDYISSKLRFFGQCKNVFLNLDTDRLDRIYGAAKDAGCFIHTYSAKGNPDADFRAED VRRENGYTLFTLKNREGETVYDFALSIPGSFNVENAMAAILLCRWLGVPHDAIAEGLKD ARAKGRMEVFENKEREVVVISDYAHNILSFEKLYEAVKEDYPGWRIEGLFGCPGGKGLS RREELPRAVSKYADFVWVTEEDPGLDDVSAICRTLSENLAKHGCPCRIVEDRTEAIETA IREAAPKTVIVMTGKGREEYMHRGNAYEPITSDSALAEKFLTE" /locus_tag="LOCUS_2710" /EC_number="6.3.2.7" /note="WP_002285962.1 UDP-N-acetylmuramoyl-L-alanyl-D-glutamate--L-lysine ligase (Enterococcus) [pid:36.5%, q_cov:93.2%, s_cov:92.4%, Eval:2.0e-74]" /note="MGA_367" CDS 2907..3263 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSRFSVIAGRGGESRLVGRYETFEDCCAAAESMLRQGSGLGFHFK CNILCDDKEFFWVNSDAIGTGELVDLLDEWEQLGDEPGYAGADRDGKRAWVREALKSGR LVATGEAVALIPEE" /locus_tag="LOCUS_2720" /note="MGA_368" ORIGIN 1 aaggagagcg gcaaggagcc cgaaagacat ctgtacatgc agttcacctg tttcgaggaa 61 gtgggtcacg gcgctgccag ctactgcccg aagggggtca ccgagatgct gtccgtcgac 121 atgggctgcg tcggcgaagg ccttacctgc accgagcaca tggtctccat ctgcgcgaag 181 gacagttccg gaccgtacaa ctatgcggtc gtaaaagggc tggaagaagc ggcgatccgc 241 gcgaaggcgg actacgcggt ggacatctat cccagctaca gctccgacgc atctgtcgcg 301 gtctgcgcgg gattcgacgt ccgtcacggg gtcatcggcc cgggcgtcta cgcttcccac 361 ggctatgaga gaagccacaa ggacggcgtc tgcaacacgc tgctcctgct cgacgaatac 421 atccagtaac acgggaggga tcacaacatg gaatttcaga cttacaacat cgtaaatgaa 481 cggccgagga ccatccgggc cctggcgcgt caggcgctgc aggggagatg gacggaagcc 541 ttcgtcctgc tgctggtggt gaccgctatc gaacaggtgc ccgtttcgct ggtcaacagc 601 atcgcgaagc aggggagcat cctcggcttt atcgccagca tctattcgct gctgatcgca 661 ggccccctgg ccatgggcgt cgcctactac ttcatcaagc tgttccgtca gagaaacggc 721 ggcctggacg atctcaaata cggcttcggc tatgcgcaga aggccatcgt cctgcacttg 781 aacatcatca ttcgcgtgtt cctgtgggcg ctgctgttca tcgtgcccgg gatcatcgcc 841 ggcatccgct acagcatggc aaattacatc ctggcggatg accccagcaa gagcccgcag 901 cagtgcctct tcgaaagctc cgcgatgatg cgcggcaaca agatgaacta cgtcgtcctg 961 atgatcagct ttgtcggctg gctcatcgta gcgagcatcc cctccggcat cgtcgaatct 1021 attctggtaa gaccggcgca ggcgttcctg aactctacgg atccgagcca gtattatgcg 1081 gcgctttccc aggcggccaa ccatccgctg gcgctgctgg cttccgttcc gacgctcatc 1141 gtaaatgcct atatgaatac ggcgacggcc tgcttctacg atctggccaa cggcaatctg 1201 tccgtcggcg gctacgatta tgccgcggcg cagggcagcg tggaagatcc gtttacgggg 1261 aaagacgtaa cgtttacgga cgttcccacg gaagtgaccc acgaggatct gccggagacg 1321 ttcgaagatc cggagctgaa ggctgcggaa gacaaatata ccggcgacga taacatctac 1381 ggcgaataat gaagaaacag acctttcttt acgaatatgt ggagctgctg cggggtgaag 1441 gcctactgga cgcggagccg tccaaggacc ttcagtttgc cccggtacag cagctcacct 1501 tcgattcccg ggaggctgcg cccggcacgc ttttcgtgtg caaaggcgaa gcgtttaagc 1561 ccgagtatct ggagaaagcc ttcgaggcag gagcgttctg ctacgtgtcg gaggtgcgct 1621 acgcagggga gcatctagcg atcctcgtga gcgacatccg gcgcgccatg gctttgatgg 1681 cggaactgtt ctacgggacg gaggaacgca gttttaagtt gatcggtctt accggcacca 1741 agggcaaatc cacgacgctg tactttatca aaaacgttct ggatgcttgg tacgaaaagg 1801 atggcaagcg ggtcggcttt ctgtccacca tcgattccta cgacggtgtg aatgaattcg 1861 agtcgcactt gacgacgccg gaggcgttta cgctgcacga gcacttctgg catgcggagg 1921 aagcgggcct gcctgcgttc gtcatggaag tttcgtctca ggggctgaaa tacgaccgca 1981 cctacggcgt gtcattcgac gccggcgcgt tcctgaatta cgggatcgat cacgtgggca 2041 agggcgagca tacggacgaa gaggactaca tctcttcgaa gctgcgcttt ttcggccagt 2101 gcaaaaacgt gttcctcaac ctggatacag accgcttgga ccgcatctac ggcgccgcaa 2161 aggacgcggg ctgcttcatc catacctatt ccgccaaggg aaaccccgac gcggatttcc 2221 gggcagagga cgtgcggcgg gagaacggct acacgctctt tacgctcaag aacagggagg 2281 gcgagacggt ctacgatttc gcgctcagca tccccggctc cttcaatgtg gagaacgcca 2341 tggctgccat cttattgtgc cgctggctgg gcgtgcccca cgatgcgatc gcggaagggc 2401 tgaaggacgc ccgggccaag ggccgcatgg aagtgttcga gaataaggaa agagaagtcg 2461 tcgtcatctc cgactacgct cacaacatcc tgagctttga gaaactgtac gaagccgtga 2521 aggaggatta cccgggctgg cgcatcgaag gcctgttcgg atgccccggc ggcaaagggc 2581 tttcccgtag agaagaactg ccgagggcag tcagcaaata tgcagacttt gtgtgggtca 2641 ccgaggaaga ccccggtttg gatgacgtat cggccatctg ccgcacgctt tcggaaaatc 2701 tggcaaagca cgggtgcccc tgccgcatcg tggaggaccg caccgaagcc atcgaaacgg 2761 cgatccggga ggcggcgccg aagaccgtca tcgtcatgac cggcaaaggc cgggaagaat 2821 atatgcaccg tgggaacgcg tatgaaccca taacatccga ttccgccctg gcggaaaagt 2881 tcctgacaga gtaaggagga ggaaagatga gcagattcag cgtaattgcg ggccggggcg 2941 gcgagagccg tctggtgggc cgctacgaga cctttgagga ctgctgcgcc gcagcggaaa 3001 gcatgctgcg gcagggaagc ggcttgggtt ttcacttcaa gtgcaatatc ctgtgcgacg 3061 acaaggagtt cttctgggtg aattccgacg ccatcggcac cggagaactg gtggatcttc 3121 tggacgagtg ggaacagctt ggtgatgagc cgggctacgc tggagcggac cgggacggca 3181 agcgcgcctg ggtgcgcgag gcgctcaagt ctggacggct ggtggctacc ggcgaagccg 3241 tggcgctcat cccggaagaa taaaaagcaa aacactgggg ggacaggtac atcgtgcaca 3301 gcacagcgga tctgtccccc tgtatttttc agttattgtt acgcagtctt gattgagaga 3361 gaaagtttat ggctcagaaa aaagaagtga tcgatcttta tacggcagac cgcatcccga 3421 cgggtcagac catcctgcgc ggcgacaaac cgccggcagg cacgtaccgc ctggtcgtac 3481 atgtctgcat ctttaacagc aagggcgaga tgctcatcca aaagcgcaaa gacgatatcg 3541 tgcgctggcc gggctactgg gatgtgagcg tcggcggcca tgcgtcttcc ggcgatacga 3601 gcagggcggc tgcccatcgc gaaacaaaag aagaactcgg tctttcgatc gagttcgatg 3661 cgatacagcc tgccctgacg gtccatttcc cggaagggtt cgacgatttt tatgtgctgc 3721 cgatggatgt ggatgccgaa gggctgaccc tgcagca // LOCUS sequence069 3728 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence069 VERSION sequence069 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3728 /mol_type="genomic DNA" /organism="" /note="sequence069" CDS 217..768 /product="LemA family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011085281.1" /transl_table=11 /codon_start=1 /translation="MILIIILVIILLCILYVFGFYNGCIKLRNQIEEAFSTMDVYLKQR YDLIPNLVNTVKGYAEHEQETLTALTEARTKAMAAQTAEQKVAGEQGLQSALGRLLAVA EAYPELKANQNFLNLQDQLKAQEDNIANARKYYNAVVREFNTKIEKMPGALFAGMFGFV KQPLFDIGDVTQRENVTVQF" /locus_tag="LOCUS_2730" /note="WP_011085281.1 LemA family protein (Bradyrhizobium) [pid:50.3%, q_cov:89.1%, s_cov:87.6%, Eval:6.2e-42]" /note="MGA_371" CDS 780..2525 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKSTKRRHGFACLLCMVIVLLAAVPASAVSFTTDGFFTTLDVGED SSMHVTEEIYVTFTSPGHGIYRQIPNSGTHSYFMHGGELVEAPLPYVIRNVKCEGQEVE TDSEDGFLSVRIGSADVTVSGAQKYKLEYDIVMYEDGIDYLDQLYWNVIPAYWETDIDF AGFTVNMPKAFDASSADVITGPIGSGDDSTASWDVEEDGTVLAGHVDALPRREGVTVRI VLPEGYWTGVKSNAKQWWIAEGILGAITLLVLGLFLVKGRDPKTVKTVEFYPPENLSPA EIGYIYDNMVNDKDMTSLVMWFASKGYLKISAAPGEKKFLRKEQPIIILEKRRDLPADA PAYQKHFFDGLFEYGREANLKNLAVSTSFADSYEAAKESLQDRYGKTSPNRRLQEGQGY TAVGCLAGFIMLMVFGLATVFLYSYGGQFLKFLAVMVVCSIIVFLCVIHMSRPTPYRQK MLGRIQGFRDFIAAAELDRINQLVEQDPDYYYDILPYAYVFGLTDKWAKNFEALAPKAP DWYSGPDYYMMSPVVFCDSIGGSVRSSLSESAIHSTSASDFSGGSSGGGGFSGGGGGGG GGGGW" /locus_tag="LOCUS_2740" /note="WP_037392706.1 DUF2207 domain-containing protein (Sinorhizobium fredii) [pid:26.4%, q_cov:73.8%, s_cov:65.3%, Eval:5.7e-23, partial hit]" /note="MGA_372" CDS 2593..3174 /product="xanthine phosphoribosyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948791.1" /transl_table=11 /codon_start=1 /translation="MKKLEERILKDGILIEDRILKVDSFINYQIDVELTNEMGLEFARI FKYCGATKVLTVETSGLPLAYAVARHLGDLPLLFAKKNKPNTNIDEDYCAEVRSFTKEV VNQIRVPKKYLNAGEKVLIIDDFLASGAASLGLLDLIDQAGASCVGVGVAVEKEFQGGR ALLEAKGLRVVSLAHITKMKDGKIEFNYTE" /locus_tag="LOCUS_2750" /EC_number="2.4.2.22" /note="WP_011948791.1 xanthine phosphoribosyltransferase (Clostridium botulinum) [pid:47.9%, q_cov:97.9%, s_cov:99.5%, Eval:1.1e-42]" /note="MGA_373" ORIGIN 1 cggcggaggt ggcggccgca gcagttcttc cggcggaggc ggcggatcgt ccgggggcgg 61 gttctccggc ggaggtggtg gcggcggagg cggcggcgcc tggtaaagcc tgaccctgcg 121 atggctgctc gcttgcgtac gctttgtttt caagtataat ataatataga aacactgtta 181 ttgttcgccc tatcctgaac aggaggtaac aaaaccatga tccttatcat tattcttgtg 241 atcatcctct tatgcattct ctacgtcttc ggtttctaca acggctgcat caagctgcgc 301 aatcagatcg aagaggcgtt ctccacaatg gatgtctatc tgaagcagag atacgacctg 361 atcccgaacc tggtgaacac cgtcaagggt tatgcggagc acgagcagga gacgctcacc 421 gcgctcaccg aagcccgcac gaaggcgatg gcggcgcaga ccgcagaaca gaaagtcgcg 481 ggagaacagg ggctgcagtc cgcgctgggc agattgctcg cggtcgcaga agcttatccg 541 gaactgaagg cgaaccagaa cttcctcaac ctgcaggacc agctgaaggc gcaggaagat 601 aacatcgcca acgcccgcaa gtactacaac gcggtcgtaa gagagttcaa cacgaagatc 661 gaaaagatgc ccggtgcgct gtttgccggc atgttcggct tcgtaaaaca gccgctcttc 721 gacatcggcg acgtaacgca gagagaaaat gtaaccgttc agttctaaag gaaaacgata 781 tgaaaagcac aaagagaagg cacggttttg cgtgcctttt gtgcatggtg atcgttcttc 841 tcgccgctgt tccggcttcc gccgtcagtt ttacgacgga cggtttcttt acgacgctgg 901 acgtggggga agattcctcc atgcacgtaa ccgaagagat ctacgttacc tttacttctc 961 cgggtcacgg gatctaccga cagatcccca attcggggac ccattcctat tttatgcacg 1021 gtggcgagct ggtggaagcg ccgcttccct atgttatccg caacgtgaag tgcgaaggtc 1081 aggaagtcga aacggattcc gaggacggct ttctgtcggt ccggatcggt tctgcggacg 1141 taacggtctc cggcgcccag aaatacaagc tggagtacga tatcgtgatg tacgaggacg 1201 ggatcgatta cctggatcag ctgtactgga acgtcatccc ggcttactgg gaaacggaca 1261 tcgattttgc cggctttacc gtcaacatgc ccaaggcgtt tgacgcatcc tctgcggatg 1321 tcatcaccgg tcccatcggc agcggagacg acagtacagc ctcctgggat gtggaagagg 1381 acggcacggt cctggcgggt cacgtggacg cattgcctcg cagggaaggc gttacggtcc 1441 gcatcgtcct gccggaaggc tattggacag gcgtaaagag caacgcgaag cagtggtgga 1501 tcgcggaggg gatcctgggt gcgatcacgc tgctggtgct ggggctcttc ctggtaaagg 1561 gccgtgaccc gaaaacggtc aagaccgtgg aattctaccc gccggagaat ctgtctcccg 1621 cagagatcgg ttacatctac gacaacatgg tcaacgacaa ggatatgaca tctctggtga 1681 tgtggttcgc gtcgaaggga tatctgaaga tctcagcggc tccgggcgaa aagaaattcc 1741 tacggaaaga acagccgatc atcatcctgg aaaagcgccg ggatctgccg gcggatgcac 1801 ctgcctacca gaaacacttc ttcgatgggt tgtttgaata cggcagagag gcgaatctga 1861 agaatctggc ggtgtccacc tccttcgcgg acagttacga ggcagcaaag gagagcctgc 1921 aggaccgtta cggcaagacg agtcccaatc ggaggctgca ggagggacag ggctatacgg 1981 cggtaggatg cctggcaggg tttatcatgc ttatggtgtt cggccttgcg acggtctttc 2041 tgtattccta cggcggacag ttcctgaaat tccttgcggt tatggtcgtc tgcagtatca 2101 tcgtcttcct ctgcgtcatc cacatgagcc gtccgacgcc gtaccggcag aagatgctcg 2161 ggcgcatcca gggcttccgt gactttatcg cagccgcaga actggaccgg atcaaccagt 2221 tggtggaaca ggatccggat tactattacg atatcctgcc ctatgcctac gtattcggac 2281 tgacggataa gtgggcgaag aacttcgaag cgctggcacc aaaagccccg gactggtaca 2341 gcggcccgga ctattatatg atgtcgcccg tagtcttctg cgattccatc ggaggcagcg 2401 tgcgttcgtc cctttccgaa agcgccatcc attccacctc ggccagcgat ttctccggtg 2461 gcagcagcgg tggcggcggt ttttccggcg gcggcggagg cggcggagga ggcggcggat 2521 ggtaatgctt gtttgttttg ccgcatacga tttgccccag tatttttgat cctattttag 2581 tgaattgaac ccatgaaaaa actcgaagaa agaattttaa aagacggcat cctcatcgag 2641 gaccgcattc tgaaggtcga ctcctttatc aattatcaga tcgacgtgga actgacgaac 2701 gagatgggac tggaatttgc ccgcatcttt aaatattgcg gcgctacgaa ggtccttacg 2761 gtggagacgt ccggtctgcc gctggcttac gccgtagcgc ggcatcttgg cgatctgccg 2821 ctgctgttcg ccaagaagaa caagcccaac acgaacatcg acgaagatta ctgtgcggaa 2881 gtgcggtcct ttacgaaaga ggtcgtaaac cagatccgcg tgccgaagaa atacctgaac 2941 gcaggtgaaa aagtcctcat catcgacgat ttcctggcgt ccggcgctgc ttccttagga 3001 ctgctggatc tgatcgacca ggcaggcgct tcctgcgtcg gcgtgggcgt cgccgtggaa 3061 aaggagttcc agggcggacg ggcgctgctg gaggcgaagg gacttcgcgt cgtttcgttg 3121 gctcacatca cgaagatgaa ggacggcaag atcgaattca actatacgga gtagaagggc 3181 agggacccca tgaagaagac gcagcgcatc tgcattatta cgcacatcct gacggaaaat 3241 cccaaccggg actattccct cggcaccttc gccgagatgt ttggctgcgc gaaatccagc 3301 gtgagcgacg acatcaagct ggtgagagaa gccatcgatg cagcaggcct cggctatctg 3361 gagaccacgt ccggcgcaaa gggcggtgtg cgctacgtgc cgtatatctc ccgtcaaacg 3421 gcggcggaag cgctggagga actgcggaaa gcttttgaag agccgtcgcg catgctgggc 3481 agcggattcg tctatacctc ggacatcatg ttcaatccga ggctcatccg cggcgcggcc 3541 atggtattcg ccaagcggtt tgccagcgcg gaagcggata tggtggtgac ggtggagacg 3601 aagggcattg gcgtggcgct gtttacggcg cggctgctca atatccctct tgcggtcatc 3661 cgccacgaga gcaaggtgtc ggaaggctcc tccatcaaca tcaactactt ttccgggtcg 3721 acggaccg // LOCUS sequence070 3727 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence070 VERSION sequence070 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3727 /mol_type="genomic DNA" /organism="" /note="sequence070" misc_feature <1..1201 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_196793289.1:PAS domain-containing hybrid sensor histidine kinase/response regulator" /note="WP_196793289.1 PAS domain-containing hybrid sensor histidine kinase/response regulator (Oxalobacter formigenes) [pid:35.5%, q_cov:100.0%, s_cov:49.5%, Eval:9.2e-72, partial hit]" /note="MGA_375" /locus_tag="LOCUS_2760" CDS complement(1449..2408) /product="D-cysteine desulfhydrase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001046622.1" /transl_table=11 /codon_start=1 /translation="MKKIEDFPRIPLAVLPTPIQKLENISRILGTNVYIKRDDMTGIGL GGNKVRKLEFLLADAKNKGAEIVFTTGGAQSNHAMLTAACCKKLGMTPILILKKRGVTD RKGNILLEYLMNTDVRFLDTDDSADVYREMDRVGQESGKVYYKIPTGGSNALGALGYVN CVKEISEQTDIKFDYICCAEGSGGTHAGVAMGAKLFMPETKVIGMMVDTDPFEEITTNI MKGLAELLELDFVPTVDDVHLVDVCGAGYAIPSPEGNEAIRMMAENEGLFLDPVYTGKA FGGLIKMAREGKFGPDDNILYLYSGGAGGLFAIDVNLD" /locus_tag="LOCUS_2770" /EC_number="4.4.1.15" /note="WP_001046622.1 D-cysteine desulfhydrase (Bacillus cereus) [pid:41.1%, q_cov:96.2%, s_cov:96.7%, Eval:1.2e-57]" /note="MGA_376" CDS 2596..3453 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTEFFRPESIAQALSLLEQYRQDAAVVNGGSDIVIDLTKQRIHPA AIISIGQIAQLQQICLQDDYLCIGGAVTYKQMLSNADCCAFRGLVQAVSQVGSPAIRAV GTPAGNLVTAAPAADCATMLLALGADAVLQSTAGTRTVPLTEFYYSRGKTERRPNELLT EIRIPALAPDEGTGYFRVARRKAQDIGKVLAGCRITLADGVICQASISLGAVNACPVRA ESLEQAILGKSAEEAVEICRRTFPAEAGLRESYFKEYKEAVVPAVAAKAVALALEDAAE RSGR" /locus_tag="LOCUS_2780" /note="WP_013528241.1 xanthine dehydrogenase small subunit (Mesorhizobium ciceri) [pid:30.2%, q_cov:75.1%, s_cov:43.4%, Eval:4.1e-22, partial hit]" /note="MGA_377" ORIGIN 1 catcggcgac cagatgaagc tgcggcaggt gctcatcaac atcctgggca acgcagtgaa 61 gtttacgccg gagggcggca aagtggaact gaccgtggag cgcaccgcac agatggacaa 121 tcactccacg ctgcagttta agatctccga taccggcatc ggcatgagcg aggacttcct 181 gccccacatt ttcgatacct tcgcccagga ggattcctcc acgacgaacc ggtacggcag 241 ctccggactg ggtctcgcca ttaccaagcg catcgtcgag atgatgaacg gctccatcga 301 agtggcgagc gaaaagggca agggctccgt ctttaccgtg accgtgccgc tgatggattc 361 cgtgcgcaag ggcgcggaag gtgacccgga cgagatccgt ccgcaggaca tgagcgtgtt 421 gatcgtcgat gacgaccccg tcgcctgcca gcacggcaaa ctggtgctgg agaaggtggg 481 catcgcctcc gagatcgcat cctccggagc ggaagcggtc gagatggtcc ggctgcgcca 541 cgcgcgccgc gacccgtaca atctcatcct ggtggactgg cagatgccgg agatggacgg 601 cgtggagacc acgcgccaga tccgcagcat cgtcggaaac gaatccgcca tcatcatcct 661 gacggcctac cgctgggacg atgtgctgga ggaagccctg gaagccggcg tggacagctt 721 tatctcgaag cctctgttcg cccagaatct gatcgaagaa ttccgctccg cgttaaagag 781 aaagaacgta acggcgaaga agaccgcagc aaaggcggac cttaccggcc gccgcatcct 841 gctggccgaa gacgtggcga tcaacgcgga gatcatcgcc atggtgctgc agtcgaaaca 901 gatgacgtcg gaactggccg taaacggacg cattgccgtg gacatgttct ccgaacatcc 961 cgcaggatat tacgacgcga tcctgatgga tatgcgcatg ccggagatgg acggtctgga 1021 agccacgcgg acgatccgcg ctctggaccg ggaagatgcg aagaccatcc ccatcatcgc 1081 cctcacagcg aacgccttcg acgaagacgt acagcgcagc atgcaggcgg ggctcaatgc 1141 ccacctcagc aagccggtgc agccggaact gctgtttgag actctggagg ggctcattta 1201 aggataacgc ttgccaaacg cgccgcgatt cagtataata gtcgagcatg agccgcgccg 1261 ggagaccggc cgggccctgc gcaagagaca cctgtgaacc tggtcaggtc cggaaggaag 1321 cagccataaa cgggcccgtc tttgtgccgc agatcagtct ggccggtctc ccggcgcggt 1381 tcgtttttca tcacaacaaa aagagttccg gacaatgtgc cggaactctt cgtttattct 1441 gccggggatc agtcgaggtt gacgtcgatg gcgaacaggc cgccggcacc gccggagtac 1501 aggtacagga tgttgtcatc cggcccaaac ttgccttctc ttgccatctt gatgaggccg 1561 ccgaacgcct tgccggtgta gaccggatcg aggaacaggc cttcgttctc cgccatcatg 1621 cggatggctt cgttgccctc gggagatggg atcgcatagc ctgcgccgca gacgtctacg 1681 aggtggacgt cgtccacagt tggtacgaaa tccagttcca gcagttctgc cagacccttc 1741 atgatattcg tcgtgatctc ttcgaacgga tcggtatcga ccatcatgcc gatgaccttc 1801 gtctcgggca taaacagctt cgctcccatc gcgacgcccg cgtgggtacc gccgctgcct 1861 tccgcacagc agatgtagtc gaatttgatg tcggtctgtt cggagatctc tttgacgcaa 1921 ttgacgtagc ccagcgcgcc cagcgcattg gaaccgccgg tcgggatctt gtagtagacc 1981 ttgccgctct cctggccgac tctgtccatt tctctgtata cgtctgcgga atcgtcggtg 2041 tccaggaagc ggacgtccgt gttcatcagg tattccagca ggatgttgcc cttgcggtcc 2101 gttacgcctc tcttcttgag gatgaggatc ggggtcatgc cgagtttctt gcagcaggct 2161 gccgtcagca tggcgtggtt ggactgcgca ccgccggtgg tgaacacgat ctcggcgcct 2221 ttattcttgg catccgccag caggaattcc agcttgcgga ctttgttgcc gcccagaccg 2281 atgccggtca tgtcgtcgcg cttgatgtag acgttggtgc ccaggatgcg gctgatgttt 2341 tccagcttct ggatcggcgt cggaagcaca gccaggggga tgcggggaaa atcttctatt 2401 tttttcatgt tacgctcctt tgtcctgtga cccgggcaga tcggcccggt cctgtttgct 2461 tatctctatt atagaacacg ttggccgcga tggcgaggtg gttttctctt ctgctgcttt 2521 acatttcagg gaccgcaaga ataaaataaa ctgtgtagta ccgacagacc tcttcgttgg 2581 aaaggagaca ggaaattgac ggaatttttc cggcctgaaa gcatagcgca ggccctctcc 2641 ctgctggagc agtaccggca ggacgcagcc gtcgtcaacg gcggcagcga tatcgtaata 2701 gatcttacga agcagcgtat ccacccggct gcgatcatat ccatcggcca aatcgcgcag 2761 ctgcagcaga tctgcctgca ggatgactat ctgtgcatcg gcggcgctgt aacgtataaa 2821 cagatgctct cgaatgcgga ttgctgcgcc ttccgcggtc ttgtgcaggc ggtttcccag 2881 gttggaagcc ccgcgatccg ggccgtcgga acgcctgccg gcaatctggt gaccgcagca 2941 cccgccgcag attgtgccac catgctgctg gctctcggcg cagatgccgt gctgcagagc 3001 acggccggca cccgcaccgt tcctctcacc gaattctatt attcccgcgg aaagacagag 3061 cgcagaccga atgagcttct tacggagatc cgcatccccg cccttgcacc cgatgaaggc 3121 accgggtatt tccgcgtggc gcggcgcaaa gcccaggata tcggaaaggt cctggcaggc 3181 tgccgcataa cgctggcgga cggtgttatc tgccaggcaa gcatctccct gggcgcggtc 3241 aacgcctgcc ccgtgcgggc agaaagcctg gaacaggcaa ttctgggcaa gtccgcggaa 3301 gaggctgtcg agatctgcag gcgcaccttc cctgcggagg ctggcctgcg ggaatcctat 3361 ttcaaagaat ataaagaagc ggtagtcccg gctgtggcag cgaaggctgt tgcactggcg 3421 ctggaagacg ctgcggaaag gagcggacga tgatcccggt atcctttatt ctgaacggaa 3481 agccggtccg ctgcgaagtg ccggcggaag agacgctggt ggatacgatc cgcaaccgct 3541 tccgcctcac cggcacgaag aaaggctgcg gcaccgggga ctgcgggtcg tgcaccgtgc 3601 tgctggacgg cacggcggtg cgttcctgca cgctgctcac cggtatggtg gagggcagga 3661 gcataaccac catcgagggc gtgggcacca tggagaagct gcatcccgtg cagcaggcct 3721 tcgtgga // LOCUS sequence071 3723 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence071 VERSION sequence071 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3723 /mol_type="genomic DNA" /organism="" /note="sequence071" CDS 1541..2128 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MHFKKVLALLMAACLIFAAAGCKKESEEPSYVPANPNEEFILEIY APSELMAVMTDVANRYSTTVAPRASVRITFDDGVIQTAKIEAGTPCDIFVADEERFMDW LDAECDEEANPNKNDKIVSSTRHDFVTGPGNEDYMPEDMELAEGEVYNTTYSVAVCRAT ALSYESEQFVNYMLSDEVKDIYEVYGFETVEE" /locus_tag="LOCUS_2790" /note="MGA_380" ORIGIN 1 agtgtcgtag ccgtccggga agccgctgat gaattcctcc gcctgggcca gcacgcaggc 61 tctgcggatc tcctcgtccg tcgcgtccgg tttgccccag cgcaggtttt ccttgatggt 121 gcccgcgaac agcacgttct tctgcagcac catggccacg ctgctgcgca ggacttccag 181 gtcgtagtcc ctgacgtcca cgccgcccac ctttacgctg cccttgcgga cgtcgtagag 241 ccggggaatg agctgcacca tgctggattt gccggagccg gtgccgccga tgatgccgat 301 ggtctcgccg gatgccgcct cgaacgaaat gtttttcagg atatgtttgt tgctgccgta 361 gccgaaggag acatcggtga acacaacaga accgtccccg acggtccgga ccggatcttc 421 cggagagacg atgtcgggct gttcgtccag aacggcgcag atgcgctctg ccgccgcttt 481 ggcgatcgtc agcatcatga cgatcatgga cagcatcatc aggctcatca ggatctgctg 541 cacataggtc atgacggaca tcagctggcc ggtggtcatg gtgctggaga ccaccatctt 601 cgcgccgatc caggagatga gcagcatgca cacgtacatg caggtctgca tcagagggcc 661 gttgaacgcg atgatgcgct ccgcccgcac gaagttgctg tacagttcgc cggagacgtt 721 ctggaacttt tccttctcct cttcctcccg gacgaaggcc ttgacgaccc ggatgccccg 781 caggttttcc tgaaccacgg cgttcaggcg gtcgtagatg ccgaacacct tttccatgat 841 gggaaatgcg tgggtcatga tataggcgat gccgaagccc agaatgggca gcaccgccag 901 gaacaccagg gagagcctgg cgctctgccg gaaggccatc accagggcga acaccagcgt 961 gcagggcgaa cggaacgcca tgcgggtgag catcataaag gcctgctgca cgttcgtcac 1021 gtccgtggtc atgcgggtca cgaggccggc tgtagagaat ttatcgatgt tggagaagga 1081 gaaatcctgg atatgatgat acatatcgtg ctgcagatta ctggcgaagc cggcggatgc 1141 ccgggacgag aacagcccgc ccaggatgcc aaacgtcaga gacagcagcg cgtacaccac 1201 gagctttaag ccgatcgtgc ggatgtagtc caggtcgccc aattcgatgc cgtagtctac 1261 cagatctgcc atatggtaag ggatgagcac ttccatgacc acctccagta ccatgcagat 1321 cggggtgagg aacgtcagca gcttatactg ccggacgcat cctgccagtt tttttatcat 1381 aggacttgaa cacctttcgg attttatggt ataaattagg ttgtacgttt acgggaaagt 1441 tacctgacca ttttacagcg ccttgttttt ttacacaaga aaaaccgcag gcatttcacg 1501 aaatatacat tttataagaa tttaccggag gtttccatat atgcatttta agaaagttct 1561 cgcactgctg atggctgcat gccttatttt tgctgccgcc gggtgcaaga aagagtccga 1621 agaacccagc tacgttcccg caaaccccaa cgaagagttt atcctggaga tctacgcccc 1681 ttccgagctg atggccgtca tgaccgacgt cgccaaccgc tactccacca ccgtggcgcc 1741 gagagcatcc gtgcgcatca ccttcgatga cggggtcatc cagaccgcaa agatcgaagc 1801 cggcacgccc tgcgacatct tcgtcgccga cgaagagcgc tttatggact ggctggacgc 1861 ggaatgcgat gaggaagcca atccgaacaa gaacgacaag atcgtctcat ctacaagaca 1921 cgatttcgtc accggcccgg gcaacgagga ctatatgccc gaagacatgg aactggcgga 1981 aggcgaagta tacaatacga cctacagcgt cgccgtatgc cgtgcgaccg ctctttccta 2041 cgaatccgaa cagttcgtca actacatgct gagcgacgaa gtcaaggata tctacgaagt 2101 ttacggattc gagaccgtag aagaataaaa ccgttttcag cggcaggcaa tctcgcctgc 2161 cgttccttac atatccaatt tcataaaaac caaaggagaa ttgtcatgaa gaaaagattc 2221 atcgcaatgg tactggcatt cgtaatggtg cttgcattgg gcgcgtgcac aagcgagaca 2281 cccgcaaacg atcccggaac ggaaactccc gaggctacag gtggaatggt cgaaggcgga 2341 gagatcaccg tcggcctcta caacgatctg gacgcaagtc ttgacccgca catgtcttca 2401 tcgtcggcag gaacccgcga gatccttttc aatatctttg aaggcctcgt caagcccaac 2461 agcgacggtg aactggtgcc ggccatcgcg gaaagctatt ccgtcaacga cagcgccgat 2521 cagtacacct ttaagcttcg gcaaggcgtt aaattccata acggcaagga cgttaccatt 2581 tccgacgtcg tctggtccct gtccagagcc gcaggtctgg agaccggcga acctctggtg 2641 agcgacgtag cgaacattgc cgcggtcacc gcgacggacg atacgaccgt cgtcatcgac 2701 ctcaagaagc ccgacaccga attccttgcg catatcacca ccgccatcat ccccgaaggc 2761 atcgatcctc tgagcgaagt cgtaggcacc ggtccgttta aattcgtgtc ccgcgtcgtg 2821 cagagcgaga tcgtgctgga gaagttcgac gaatactggg gcgaaccggc acatctggac 2881 aaggtgaccc tcaagatcat cgaaaatccc gagaccctgg tgatgagcct gcgttccggc 2941 gccgtggaca tggctgtccg gctcaacgcc aaccagatca agaccctcac caacctgaaa 3001 gtgctggagg gaagcagcaa tatcgtgcag gccctctatc tgaataatgc cgtaaagccc 3061 ttcgacgacg tgcgcgtgcg ccaggcgctg tgctatgccc tggacaagca cgagatcatc 3121 gatctggcat ccgacggcta cggcagccct gtcggcagca gcatgttccc cgcctttggt 3181 aaatacttca tgcccgaact gacggattac tacaccaagg acctggacaa ggcgaaagaa 3241 ctgctgacgg aagccggtta tcccgacggc tttgaattca ccatcaccgt accctccacc 3301 atgcagaccc acgtggacgt cgcacagacg atcgtcgaac tgctgcgccc catcggcgta 3361 acggccaaag tggatcaggt ggaatgggcg acctggtatt ccgacgccta tcagaaccgc 3421 cagttcgaag cgaccgtcgt cggcatggat gcccacggcg tagctgcctc cgacatgctg 3481 gccagattcc agagcaccca cgcaaagaac ttcatcaact tcaactctcc caaatacgac 3541 gagaccttcg cggccgccgt atccaccacg gacgatgcgg agcagacgag actgttcaag 3601 gaatgcgaga ccatcctcgc ggaagaggca gccaacgtct acatccagga cggcgcatcc 3661 ttcaccgcca tggcaacgga tctggaaggc atggagttct atccgctcta cgtcctcgat 3721 cta // LOCUS sequence072 3719 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence072 VERSION sequence072 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3719 /mol_type="genomic DNA" /organism="" /note="sequence072" CDS 885..1418 /product="ribosome-associated translation inhibitor RaiA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966132.1" /transl_table=11 /codon_start=1 /translation="MFIEITGKNLNPSDKLQATIEKKFSKLDKYFSGESKAAIMCSEVK TGLCKLEATIYAAGMIFRAEESSNDIYYCLDKVIDKLSTQMSRFKTRLIRRHNTQKDIL FAEIPDTAAAPEEEKGIVRTKRFKLNPMTSEEAILQMELLEHNFFIYKDGESGGINVVY KRADGSYGLLETEE" /locus_tag="LOCUS_2800" /gene="raiA" /note="WP_010966132.1 ribosome-associated translation inhibitor RaiA (Clostridium) [pid:46.0%, q_cov:99.4%, s_cov:99.4%, Eval:4.0e-35]" /note="MGA_383" CDS complement(1483..2349) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLSYERFKQAVRTELKHYLPEDYAEHRLVEKKLYKINRCVDTFRL QPPGPVSAVPMPTLNYQDLYRSIVAGAKLESVLRSAAQAMQYRLPPEIEEECLQLQEDK PDPETIHLALINRKRNRQLLKNVPHQDFLDLAAIAVIEEGPGSGYLCVVTKEILKDLDM TQEELLKLACGNTFREYPSVLEQSQLGLNAWCEGSTFGAVCLLDKDMLREAAERLDSDV YVLPDSLHLLFLIAVKSIPRAIVLETFRRATLLEPDALDYLSDNIYYYDREQDCLKILS EHTKLPA" /locus_tag="LOCUS_2810" /note="MGA_384" CDS 2523..3542 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDAGSISVIPRYLFFIALLLLGGAYFAAAETAFASVSKIRMISDA DDGDERAQKALYVLDHFDKALTTLLIGNNVMHIACSSAATLLASKLWGNRAVTACTFVT AFVVFLFAEMIPKSYAKACSETLAPRVAGSLIFFMKVLTPVSFLFSGISHAVTKIVGTD GSDEPTVTEEELFDIIESIDGEDKIDEDAAELVQSALEFTVKTVNFVLTPWNATVKISR SMSDDEILQVITEGHFSRLPVVDENGELEGILHIRKFLKAKIRGRKALQSRSMLDKPFY LPLYMPIDEALDALSSNRAHMAIVQRGDGSIAGIVTVEDILEELVGEIYDEEEGGLPK" /locus_tag="LOCUS_2820" /note="WP_012869172.1 hemolysin family protein (Thermanaerovibrio acidaminovorans) [pid:31.2%, q_cov:92.6%, s_cov:73.2%, Eval:4.8e-39, partial hit]" /note="MGA_385" ORIGIN 1 agctcctcgc gcaccttcag ctgtccgccg gtgagcttga tccaggtgag ccgcgcgccg 61 tcttcggcgc gggtgatctt aatgacgcgg cctctcaggt ccgcaggcca gcgcttttct 121 tcgatgcagt ccttcaggcc gtccaggaat tcctgcacgc cttccagctt caatgcggaa 181 ccgaaccagc aggggaacac cttgcgctcg cggacgaggc gccggactgt gttctgcggg 241 agggttccgc ccgccagata ttcttccagg gcgtcttcgt cggtcagtgc gatcgcctct 301 gccgcgtccg ctgcggccat gtcgacgcag tggggggaca gcttgccctg cagcagctgc 361 aggatctcct gtctcgcatc gtttcctctc gccgtttccg ccaggtccat cttattgacc 421 cacaggaacg tgggcacctg atagcgcttt aaaagcgccc agaccgtcgc ggtgtgggcc 481 tgcacgccgt ccggtccgga gatgacgagg atcgcgtagt cgagcacgga gagggtgcgc 541 tccatctcgg cggaaaagtc catgtgaccc ggcgtgtcca gcagggtcac gcgggtatcg 601 cccaggtcga agaccgcctg tttggagaat atggtaatgc cccggcggcg ctccagccgc 661 tgggtgtcta aaaacgcgtc cttatggtcg acccgtccca gggtcttgat ggcgcccgtc 721 cggtacagca tggcctccgc catggaggtc ttgcctgcgt ccacgtgggc gaggatgccg 781 atcgccgtgt gtttcatggg actattgtag cacacgcggg ctcttttatg gtataatgac 841 cttgaggcga aggcctcgca aaaaccaaac aaggaggttt tgttatgttt attgaaatca 901 ccggcaagaa tcttaacccg agcgacaagc tgcaggctac catcgaaaag aaattctcca 961 aactggacaa gtacttttcg ggcgaatcca aagctgccat catgtgcagc gaggtgaaga 1021 ccggcctctg caagctggaa gctaccatct atgctgccgg catgatcttc cgcgcagaag 1081 aatccagcaa tgacatctac tattgcctgg acaaggtcat cgacaaactc tccacgcaga 1141 tgtcccgttt caagacgaga ctcatccgcc gtcacaacac gcagaaggat attctcttcg 1201 cagagatccc cgacactgca gccgcaccgg aagaagagaa gggcatcgtg cgcaccaagc 1261 gcttcaagct caaccccatg acttccgaag aggcgatcct gcagatggag ctgctggagc 1321 acaacttctt catctacaag gacggcgaga gcggaggtat caacgtagtc tacaagagag 1381 cggacggatc ttacggtctg ctggagacgg aagaatagac ctcttctgac gcaatacagt 1441 aacgaaacgg gccctgcgca agcagggcct ttcctgttgc cgtcaagccg gcagtttcgt 1501 gtgttcgctc aggatcttca ggcagtcctg ctcgcggtcg taataataga tgttgtcgga 1561 cagataatcg agggcgtcgg gctccagcag cgtcgcccgg cggaacgtct ccaggacgat 1621 ggcccgcgga atgctcttga ccgcgatcag aaacagcagg tgaaggctgt ccggcaggac 1681 gtagacgtcc gaatccaggc gctcggctgc ttcccgcagc atatccttgt ccagcaggca 1741 gacggcgccg aacgtgctgc cttcgcacca ggcgttcagc ccgagctgcg actgttccag 1801 cacgctcggg tactcccgga acgtattccc gcaggcgagc ttcagcagtt cctcctgggt 1861 catgtccagg tcttttaaga tctccttcgt gaccacgcac agatatccgc tgccgggtcc 1921 ctcctcgatg accgcgatgg ccgccaggtc caggaaatcc tgatgcggca cgttcttcag 1981 cagctggcgg ttgcgcttgc ggttgatgag cgcgaggtgg atggtctccg gatccggctt 2041 gtcttcctgc agctgcaggc attcctcttc gatctcgggc ggcagccggt actgcatcgc 2101 ctgggccgcg ctgcgcagca cgctttccag tttcgctccg gcgacgatgc tgcggtacag 2161 gtcctggtaa ttcagcgtag gcatgggcac agcggaaacg ggaccgggcg gctgcaggcg 2221 gaacgtgtcg acgcagcggt tgatcttgta cagtttcttt tcgaccaggc gatgttcggc 2281 gtagtcctcg ggcaggtagt gtttcagttc cgtgcggaca gcctgtttga atcgttcgta 2341 agagagcatg gcatcctcct tttagataaa tggtaatatt tgtaaatatc atacaataac 2401 tgttaaaatc tgtaaagcaa atttttacca tttttctgtc gggatttcct cccgcccatt 2461 gtacgggaga ggggagtatg ctataatact ctaagtttga acacaggagg tgattcgtcc 2521 ttatggacgc cggaagtatt tccgttattc cgcgatattt gtttttcata gcgttgctgc 2581 ttttgggagg cgcgtatttc gccgcggccg agactgcttt tgcgtcggtc agcaaaatac 2641 gcatgatttc cgatgcggac gacggtgacg agcgcgcgca gaaggcgctt tacgtgctgg 2701 atcatttcga taaggctctc accactctgc tgatcggaaa taacgtaatg cacattgcat 2761 gctcctccgc ggcaacgctt ttagcatcca aattatgggg caacagggcg gtgacggcct 2821 gtacgttcgt caccgctttt gtcgtgttcc tgtttgcgga gatgatcccc aaatcctacg 2881 cgaaggcctg cagcgagacg ctggcgccgc gggtggcagg gtccctcatc ttctttatga 2941 aagtcctcac cccggtcagt ttcctgttct ccggcatcag ccacgccgtg acgaagatcg 3001 tgggaacgga cggttcggac gagccgaccg ttacggagga ggaactgttc gatatcatcg 3061 agagcatcga cggggaggac aagatcgacg aagacgcggc ggaactggtg cagtccgcgc 3121 tggagtttac cgtcaagacc gtcaatttcg tgctgacgcc ctggaacgcc acggtaaaga 3181 tcagccgctc catgagcgac gacgagatcc tgcaggtcat caccgaaggg catttctccc 3241 gcctgcccgt cgtcgatgaa aacggcgagc tggaaggcat cctgcacatc cgcaagttcc 3301 tgaaggcgaa gatccgcggc cgcaaggctc tgcagtcccg ttccatgctg gacaagccgt 3361 tctatctgcc gctgtacatg cccatcgacg aagcgctgga cgccctcagc agcaaccgcg 3421 cgcacatggc tatcgtgcag agaggggacg gcagcatcgc gggcatcgtc acggtcgagg 3481 acatcctgga ggaactggtc ggagagatct acgacgaaga ggaagggggt ctgccgaaat 3541 gacccgcagc atcatgttca tcgtgcttct gatcctgctt tccgcgtttt tctcgggttc 3601 cgagatctcc tacgcgggcg ccagcgaagt caagctgcgc aaggcggcgg aaaacgctgc 3661 gaagaaaaga agcagagaaa aatacgcaaa tgctataaaa gagaattacg aagaggcgc // LOCUS sequence073 3702 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence073 VERSION sequence073 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3702 /mol_type="genomic DNA" /organism="" /note="sequence073" ORIGIN 1 cggacagcag attcatgttc tgcagcttct ttccgggcgg ctgcgcctcg atctcgatgg 61 cggattccag ggggttgttc gggtcatcca gcgtaagccg tgcgtgaccg cccttgaaca 121 gctccgtaaa cgtcgcctcg aaattctcga ccaccgcgtc gaagctttcc ttaaagcggg 181 ctttgatggt ggcatcgatg tcgcggatga cggcatttag ctcgtcgatg gcctggttga 241 ggtcgtccct ctgggccgtc aggaaggcgt agcgctcgct cacagccttg tattcctcga 301 tggcgccgat gttcacgtct cccagcgccc gcagtctttc cttgtattcc ctggattcct 361 tcatgccgcg ggacattacg aagtccggat ccgcgaagtc cttcgcctgc gcgtaggaca 421 tctcgaactc ctcccagagt ttttccttca gggattcggt ctgggcgtcg aaacgggcaa 481 ggcgtacttc cgcatcgtgc ttgctcacct ggtgctcata cagcacgctg tcacagcgga 541 tgcggtcttc ctcgagcgcg tccgccttcg cctgatcgtc tctgcggcgg gcggagagct 601 ccgtttcctt cgcttccaat tcgctgcggc tgtcctgttt ttcctttaag ccggctttcg 661 cctcttccgc aaaggattcg atctcgcgct tctgcacgcc gatatcctca agcgcctgtt 721 ctttgctgtg ctgcagcgcc tgaagctccg ccagagatgt gcgtaccctg tcttccaaat 781 cctgtgcgcc ctggagcttt acggcggcag cgttttcctc catgcgggct gccgtgttgg 841 cggcctgcgc ctcttcgaag agactgcgga cctgttcggc ttcttctgcc agacggtctg 901 ccgctttctg cgcctcgctt ctggaggatt cctgctcgga ggatctgccg cgcagcgctg 961 cgatattgcg atccgcttcc gcgatctcct tctccagatc cgcctgttcc gccaaccgtc 1021 tgccggctgc gtctctggcg tcttcgcgct gcagtttcag ctgctgcgcc tccttttcca 1081 ggacggcgac cgtacggtct gccgcggcga tacccatctg cagttcctga acgtcctgca 1141 ggcatccgga aagtctttga cggcaggcgt ctctttcttc ctgcgcgttc tgcagatctt 1201 tggcgctctg ccggatctgc ttctccagtt cctctttttc ggctttccgc gagatgatgt 1261 tggctgtatt gtttttaaag gatccgccgg taatggcgcc ggccggattg atgtgttcgc 1321 cttccagggt cacataacgg agcgttccgc ccttcttgga cagttttaac gcgctgtcca 1381 gatcccggca cacgacgacc ttgcccagca ggtactccac gatgttctcg tatccgcccc 1441 ggcaggtgac ccgttcagaa gccagtccca ggaagccgtc catgccctgg atggcggaca 1501 gatccgcagg ttttccggcc ttgatgctgt ctgccggcag gaatgtgagg cgtccggcct 1561 tcttcgcctt cagccgttcg atggcctttt tcgcggatgc gtcgctgtcg cagatgatgt 1621 tctgcacgtt gccgcccaat gccgtctcca cggcgacttc ccagcccttg ggaacggaca 1681 gcagttcgcc caccgtgccg acgatgccgg atacgccctc ctgcatcata aagcgcacgg 1741 cgccgttata tccctcgtag gagcgttcga gctcctccag aagcttatgt cttgcagcga 1801 gttcgccggc ttttacgcgg atctcttcaa tcgcagcagc cgacgccgcc agtcccttat 1861 ccagagacgc ccgcttttcc gaagcttcct gcaagtcttt ctgcagacgc gccttggaat 1921 ccttcgcttc ctgcaggtct tcctccgcct gttccaggcg ggataccagt ccgtcgctct 1981 ccgcggtctc cccgtcttcc tgcagacgct gcagtcttct ctgcagcgtc tgcttcaggt 2041 tctccatgct ggagacttcc gctcctgcgg cgctgatggc tgcggtcagt tccaggatgg 2101 acgctttcgc ctcctccagt tccgcttcct tggcggtcag ctgtttctgc acgctctctg 2161 cggcagcttc ggcctcctcc gctttcttcc gggcggcagc ttcctctccg gaaacggcag 2221 ccttcgtctg ctgcatctcc tgcagattgg cggtctcccg ttctatcttt tcgatcgtct 2281 cgctccgctc gccctccagg cgcacgcggt cgcgttccaa tgcggcgtaa cgctcgttat 2341 tgaggccttc ccggctctcg atgaagtgga tctcctccgt cacacggccg atctgccggc 2401 gcaggtcgtc cagcttcagc tctgtttcgg cgctggcggc gcgcatcgcg cggagatcgt 2461 tttccacggt ctcccgtctg gtgcggtcct cgtccagaat cttgtccagt tcctccatct 2521 ccgtgcggac agcttccgtt ttaccgtccg ccgcatcgat gttcttcagg atgatgttga 2581 tctcgacgtc cttgtatctg tcccggatct gcagatattc ctgcgctttt tcggaatccc 2641 gctttaagcc gtcgatacgg ccttcgatct cggaggcgat gtcgttcacc cgtgcgagat 2701 tctgcgatgc gctctccagc ttgcgttcgg tctccgcttt gcggttgcgg tattttacga 2761 taccggccgc ttcttcgaag atctcgcggc ggctgtccat cttgttgctg atgatgtccg 2821 cgatcttgcc ctggccgatg atggaatacc cttccacgcc gatgcccgta tccatgatga 2881 gttcccggat gtcgcgcaga cggcagggcg tccggttgat catatattcg ctctcaccgc 2941 tgcggtacat gcgccgcgtg atgccgactt ccgtatagtc gatgggcagc gtatgatcgg 3001 aattgtcgat gacgagggtc acctccgcaa ggcccttggg cttgcggctc tgcgtgccgg 3061 cgaagatgac ctcttccatc ttgccgccgc gcagcatctt cgggctctgc tcgcccagca 3121 cccaccggat ggcatcggaa atattggatt ttccggatcc gttcgggccg acgatgcagg 3181 tcattccctc ggtgaattct attgtgaccg gatctgcaaa ggatttgaat ccattgagtt 3241 ccatgcgttt gaagtacata actacccctt ggtctgaatg gcgttcagcg ccacggctgc 3301 tgcgtgctgt tccgcctctt ttttgctctt tccgctgccc tcacccatca gttttccgta 3361 ggcatatacg gcagccgtaa acgttttggc gtggtccgga ccgctctcgg acaggatctc 3421 gtaatggatc tggggtgcgc cctcctccgc agtcctgtga ctcagcactt cctgcagcgt 3481 cgttttggca tccttaggca gctgtcccca ctcgcagagc tgcgccgttt cggtaagaca 3541 ggtcctcacg accgtattcg ccgcatcgaa gcctccgtcc agataggcgg cgccgatgat 3601 cgcctccatg cagtccgcga tgatggagat gcggtctctg ccgccgccgc tctcttcgcc 3661 gcggctcagc aacagaaatt cgttgatgcc gagttttctg cc // LOCUS sequence074 3683 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence074 VERSION sequence074 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3683 /mol_type="genomic DNA" /organism="" /note="sequence074" misc_feature <1..842 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011393917.1:preprotein translocase subunit SecY" /note="WP_011393917.1 preprotein translocase subunit SecY (Moorella thermoacetica) [pid:51.6%, q_cov:100.0%, s_cov:65.2%, Eval:5.5e-80, partial hit]" /note="MGA_389" /locus_tag="LOCUS_2830" CDS 853..1500 /product="adenylate kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860634.1" /transl_table=11 /codon_start=1 /translation="MKRVVLLGPPGAGKGTQATRIAEKYNILHISTGDIFRANVKEGTP LGKKAKEYMDQGLLVPDELVCDLVEDRVSKEDCANGYLLDGFPRTVFQAEHFDAFLERT GAELDKTVDIEVAEDILLPRMIGRRVCRQCGRPYHVVTMPPKVEGVCDACGGEVYQRAD DREETVLNRFRVYQEQTSPLIEYYQKSGRLAVIDGSKTPDEVFDDICALLGE" /locus_tag="LOCUS_2840" /EC_number="2.7.4.3" /note="WP_011860634.1 adenylate kinase (Clostridioides difficile) [pid:65.6%, q_cov:98.6%, s_cov:98.1%, Eval:2.3e-79]" /note="MGA_390" CDS 1504..2253 /product="type I methionyl aminopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003421130.1" /transl_table=11 /codon_start=1 /translation="MIVLKSHEEIELMAKAASVTAAMLEEIPNILMPGMTTLELDHWCE DYILRHQMKPAFKGYGGFPGTACVSVNEEVVHGIPTKRRVLQEGDIVSVDLGTVYKGFY SDAARTYPVGKVSAEAQKLMEVCEASFFEGLKFCKKGHRLGDVAHAIQTYVESNGFSVI RDYTGHGVGRDLHEDPQIPNYGRANHGPQLVPGMVIAVEPMIAAGDYDVEVLSNGWTAV TLDRSLAAHYENTIVITEDEPRLLTKL" /locus_tag="LOCUS_2850" /gene="map" /EC_number="3.4.11.18" /note="WP_003421130.1 type I methionyl aminopeptidase (Clostridioides) [pid:56.6%, q_cov:100.0%, s_cov:100.0%, Eval:7.0e-81]" /note="MGA_391" CDS 2278..2496 /product="translation initiation factor IF-1" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003421127.1" /transl_table=11 /codon_start=1 /translation="MAKKDSIEVFGTVLEALPNAMFKVKLENDFIVMAHISGKMRMNFI RILPGDRVRMELSPYDLSKGRITWRDK" /locus_tag="LOCUS_2860" /gene="infA" /note="WP_003421127.1 translation initiation factor IF-1 (Clostridioides) [pid:75.0%, q_cov:100.0%, s_cov:100.0%, Eval:5.8e-25]" /note="MGA_392" CDS 2762..3130 /product="30S ribosomal protein S13" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005810116.1" /transl_table=11 /codon_start=1 /translation="MARIAGVDLPREKRVEIGLTYIYGIGLPTSKLILEKANINPDTRV KDLTEEEVGAIRKIIDSEYVVEGDLRREVSMNIKRLMEIGCYRGIRHRRNLPVRGQNTK NNSRTRKGPKKTVGRKKK" /locus_tag="LOCUS_2870" /gene="rpsM" /note="WP_005810116.1 30S ribosomal protein S13 (Desulfitobacterium) [pid:74.8%, q_cov:87.7%, s_cov:87.0%, Eval:6.0e-43]" /note="MGA_393" CDS 3151..3546 /product="30S ribosomal protein S11" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003421122.1" /transl_table=11 /codon_start=1 /translation="MATVKKTVRKKRRERKNIESGQAHIQASFNNTLVTLTDLNGNALA WSSAGSLGFKGSRKSTPFAAQMAAEEAAKGAMEHGLKTVEVYVKGPGSGREAAIRALQT AGLNITMIKDITPIPHNGCRPPKRRRV" /locus_tag="LOCUS_2880" /gene="rpsK" /note="WP_003421122.1 30S ribosomal protein S11 (Clostridioides) [pid:75.6%, q_cov:93.9%, s_cov:93.2%, Eval:9.3e-52]" /note="MGA_394" ORIGIN 1 ggatcgtcat aatactgacc ctggtggcag gtacagcctt ccttatgtgg ctgggcgaac 61 agatcaacga gcacggcata ggcaacggca tatctctgat aatctttgcc ggtatcgtat 121 cccgcatccc gacgagcatc tccagaacga tcaagaacct gtccgcaggc acgctctcca 181 tcgtgagcct gatcatcttc ctggtatttg ccctggcggt catcgtcggc atcatcatga 241 tccaggaagg caaccgcaag atccccgtgc agtatgcaaa gagagtcgtt ggccgtaaga 301 tgtacggtgg ccagtccacc cacattcctc tcaaggtcaa ccaggccggc gttatccccg 361 tgatcttcgc catctccctg ctgcagatcc tgccgacgat cgcgtacatg accggcagcg 421 acaccggctt tgccaagttc gtgaccaagt atctgacctc gagcggcaac cccggcgtat 481 ggatctacct ggtactggat atcctgctca tcatcttctt cacgtatttc tacggttcca 541 tcacggtcaa ccccgtagag atcgcggaca acatgagagc gaacggcggc ttcatccccg 601 gcatccgccc gggcaagccg acgtcggatt acatcgcgaa ggttctgtcc agactgaatt 661 tcgcaagcgc gatcttcctg gccatcatcg ccgcgatccc catcctgatc ggacatttca 721 ccagtttctc ttccgcgttt ggcggaacgt ccctcatcat cgccgtgggc gttgccctcg 781 acaccatgaa ggcgctcgaa acgcagatgg tcatgagaaa ctacagcggt ttcttaaagt 841 aggaggcaag ctatgaagcg cgttgtactg cttggaccgc cgggagccgg caaaggcacc 901 caggcgacga gaatcgctga aaaatacaac attctgcaca tctccaccgg agacatcttc 961 cgcgcgaacg tcaaggaagg cactccgctg ggcaaaaagg ccaaggaata tatggaccag 1021 ggcctgctcg tccccgacga gctggtgtgc gacctggtgg aagaccgggt cagcaaggaa 1081 gactgcgcaa acggttacct gctggacggc ttccccagaa ccgtcttcca ggcggagcac 1141 ttcgatgctt tcctcgaaag aacaggtgcc gagctggata agaccgtaga catcgaagta 1201 gcggaagaca tcctgctgcc gagaatgatc ggcagaagag tctgcagaca gtgcggacgc 1261 ccctaccacg tcgtcacgat gcctcccaaa gtggaaggcg tatgcgacgc gtgcggcggc 1321 gaggtctacc agagagcgga cgaccgcgag gagaccgttc tcaaccgctt ccgggtctat 1381 caggaacaga cgagtcctct gatcgagtac tatcagaaga gcggaagact ggctgtcatc 1441 gacggcagca agactcccga cgaagtgttc gatgacattt gcgccctcct gggagagtaa 1501 gacatgatcg tactgaaatc ccacgaggag atcgaactca tggcaaaggc cgcttccgta 1561 acggccgcca tgctggaaga gatcccaaac attctcatgc ccggcatgac gaccctggag 1621 ctggaccatt ggtgtgaaga ctacatctta agacatcaga tgaagcccgc cttcaaaggc 1681 tacggcggat tccccggcac ggcgtgcgtc tccgtcaacg aggaagtcgt tcacggcatc 1741 ccgacgaagc ggcgcgtgct gcaggaaggc gacatcgtaa gcgtcgacct ggggaccgtc 1801 tacaagggat tctactccga cgcggcgagg acctaccctg tgggcaaggt ctccgcggag 1861 gcgcagaaac ttatggaagt ctgcgaggca agcttcttcg aaggtctgaa gttctgcaaa 1921 aagggccatc gccttggcga cgtggcgcac gcgatccaga cgtacgtgga aagcaacggc 1981 ttttccgtca tccgggatta cacgggtcac ggcgtgggca gggacctgca cgaagacccg 2041 cagatcccca actacggcag ggcgaaccac ggtccgcagc tggtccccgg catggtgatc 2101 gctgtggagc cgatgatcgc cgcaggcgat tacgacgtgg aagtgctgag caacggctgg 2161 accgcggtca cgttggaccg ctccctggcc gctcactacg agaacacgat cgtcatcacc 2221 gaagatgagc caagattgct cacgaagctt taaacgcgca aaggaggaga gcccgctatg 2281 gcgaaaaaag acagcatcga agtattcggc acagtgctgg aagctctgcc caatgcgatg 2341 ttcaaggtaa agcttgagaa tgatttcatc gtgatggcgc acatttccgg caaaatgagg 2401 atgaatttta tccgtatcct tcccggcgac agagtccgca tggagctcag cccctacgac 2461 ctgtccaagg gccggatcac ctggagagat aagtagtcct gtaacaggag gaacaataca 2521 aatgaaagtt agagcatcag tcaagcccat ctgcgaaaag tgcaaggtga tcaagcgcaa 2581 tggcaaagtc atggtcatct gcgaaaaccc caagcacaag caggtgcagg gctaatatgg 2641 caggaagaag catcttcctc caatagttta ctgtgttccg gcagtccggt gctgcaagcc 2701 ggacccttac ggaacgtaaa ttatacaaat ctatagttgc agtacaatag gaggtaaatc 2761 tatggctcgt atagccggtg tcgatctgcc cagagaaaaa agagtggaga tcggccttac 2821 ctacatctat ggtatcggtc tgcctacgtc caagctcatc ctggagaagg caaacatcaa 2881 tcctgacacg agagtcaagg atctgaccga agaagaagta ggtgcaatca gaaagatcat 2941 cgattccgaa tatgtcgtgg aaggcgacct cagaagagaa gtttccatga acatcaagcg 3001 cctgatggag atcggctgct acagaggaat cagacacaga agaaacctgc ccgttcgcgg 3061 acagaacacg aagaacaaca gccgcacccg caagggtccc aagaagacgg ttggccgcaa 3121 gaagaagtag ggagaaggag gtaagctaac atggcaacag taaagaagac tgtacgcaaa 3181 aagagaagag agcgtaagaa cattgaaagc ggtcaggctc atatccaggc ttccttcaat 3241 aacaccctcg ttaccctgac ggacctgaac ggaaacgcac tggcatggtc cagcgccggt 3301 tccctcggtt tcaagggttc cagaaagtcc accccgttcg ccgcgcagat ggctgccgaa 3361 gaagctgcca agggcgcgat ggaacacgga ctcaagacgg ttgaagtata tgtaaagggt 3421 cccggctccg gcagagaagc tgccatcaga gcgctgcaga ctgcaggcct taacatcacg 3481 atgattaagg acatcacacc cattcctcac aacggctgca gaccgccgaa gagaagaaga 3541 gtttagtaag ggaggaacga acatatatgt caagttaggg aaacatatag gggacacact 3601 gattctgtac ataaaattaa tttccagcca tttacaaatt attttgcctc agcaagctca 3661 gacaaatcta tttcaatttg gga // LOCUS sequence075 3657 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence075 VERSION sequence075 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3657 /mol_type="genomic DNA" /organism="" /note="sequence075" CDS 364..990 /product="translation initiation factor IF-3" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005808206.1" /transl_table=11 /codon_start=1 /translation="MRPLFIFLPEDKAISKESLINEEIRAKEVRLIDAEGTQVGIVPIQ EALAKAAEANLDLVNISPNAAPPVCRIMDYGKYRYEQQKKEKEARKKQKTMEVKEMRLG IFTEEHDLETKAKLVAKFLEGGDKVKISMRFRGREMGYVKKGEETMLNFAGLFAELGNL ERAPKLEGRNMSMTIAPKSEREKEKIAKAKKQAAEKAAAENAPEE" /locus_tag="LOCUS_2890" /gene="infC" /note="WP_005808206.1 translation initiation factor IF-3 (Desulfitobacterium hafniense) [pid:52.1%, q_cov:80.3%, s_cov:87.4%, Eval:5.2e-41]" /note="MGA_396" CDS 1029..1232 /product="50S ribosomal protein L35" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003429729.1" /transl_table=11 /codon_start=1 /translation="MAKNKMKSHRGAMKRFKLTGTGKVKRNKAYKSHILTKKTAKRKRG LRQSTILGHADHKRIKSVLVGK" /locus_tag="LOCUS_2900" /gene="rpmI" /note="WP_003429729.1 50S ribosomal protein L35 (Clostridioides) [pid:63.3%, q_cov:89.6%, s_cov:93.8%, Eval:9.0e-15]" /note="MGA_397" CDS 1246..1599 /product="50S ribosomal protein L20" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003429730.1" /transl_table=11 /codon_start=1 /translation="MARVKKGMNAKRKHKKILKLAKGFYGSKHKIFSAANPAVMRSLRS AQMGRKLKKREYRRLWIARINAAARANDISYSRLMNGLKKAGIEVNRKMLSEMAIHDPA GFTKMVDAAKAAL" /locus_tag="LOCUS_2910" /gene="rplT" /note="WP_003429730.1 50S ribosomal protein L20 (Clostridioides difficile) [pid:65.0%, q_cov:100.0%, s_cov:99.2%, Eval:7.1e-36]" /note="MGA_398" CDS 1669..3078 /product="MATE family efflux transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_023355052.1" /transl_table=11 /codon_start=1 /translation="MNSNPNALSGESRGSYLKKIFAIVLPIALQNLLGCAMGIVDTAMV GRMGVAPLAASGAASMVAIVLFNFMYGFLSGSGAFISQYWGIRDIETIRKVLGVIYRAS IFVSLIFSIVGELFAPQIIWLIDRDPEVIDLGVQYLRVIAPSYALAMLSYSFMVSSRCV QRLRAATIIDICAILLNSLLNYMFIWGKFGAPAWGIKGAAFATVLSRVFECSAFIIYSY AVKDHPLAFRHLSELSGYTKEFRNRILKTAIPVGFSDGLWGVTCTVYLSIYGMIGTAAV AAVQVINIVNECFQSVFYGVGSAAAVLIGEQLGQANLKRAKKSAVQFLWTGVALSALMS LFMLLISPFLIGFYHFDEATNQVLSSGLSITAWTIIMRMMCYIIMCGVLRPGGDTTFPM VVDMVCNWALIIPAMLIAVRVFHADLRTTMFLCYLGEGIKGVICYFRYRGGQWINVLTG VESSEAAADVV" /locus_tag="LOCUS_2920" /note="WP_023355052.1 MATE family efflux transporter (Catonella morbi) [pid:30.9%, q_cov:86.4%, s_cov:90.6%, Eval:3.8e-59]" /note="MGA_399" ORIGIN 1 gatacggcga acaacggcga catcgtcgtc gcgcagatcg acggcatgga gagcgaagcg 61 acggtcaaag ccttctataa ggagaacggc cacatccgcc tgcagcccag aaattccgag 121 atggagccca tcatcgtcga cgactgcaag atcatcggtc tcgtcaaggg cgtgttccgt 181 tatctgcact aggcagggat ggcttaaaaa gcgcgaaaaa tgttgaaaat tgcgcttgac 241 atgcccaccg tgcccctata tactatttga gtactaagca gaagtccgct tctcaccttc 301 aggcagtgcc gaaaaggtca acacagtaaa ttgtcagctg atggcgattt ttggagcgga 361 aatttgcgtc cgctctttat ttttttaccg gaggataaag caattagcaa ggaaagcctt 421 atcaacgaag aaattcgtgc aaaagaggtc cgcctgatcg acgcggaagg aacccaggtg 481 ggtatcgtac ccattcagga agcgctggca aaagctgccg aagcgaatct ggacctggtg 541 aatatctctc ccaatgccgc tccccctgtc tgccgcatca tggattacgg taagtaccgt 601 tacgagcagc agaagaagga aaaggaagcg cgcaagaagc agaagaccat ggaagtcaag 661 gaaatgcgcc tcggcatctt caccgaagag cacgacctgg aaacgaaggc gaaacttgtc 721 gccaagtttc tggaaggcgg cgacaaggtc aagatcagca tgcgcttccg cggccgcgaa 781 atgggctacg tcaaaaaagg agaagagacc atgctgaact ttgccggtct ttttgcggaa 841 ctgggcaatc tggaacgggc tcccaaactg gaaggccgca acatgtccat gaccatcgcg 901 cccaaatccg agcgcgaaaa ggaaaagatc gcgaaggcaa agaagcaggc agccgaaaag 961 gctgcggcgg aaaatgctcc ggaagaatag cgggcagacg ctgaagaata acaggaagga 1021 agtaaatcat ggcaaagaac aagatgaagt cccacagagg ggcaatgaag agattcaagc 1081 ttaccggaac cggcaaagtt aagagaaata aggcgtataa gagccatatc cttaccaaga 1141 agaccgccaa gagaaaaaga ggccttcgcc agtccacgat tctcggccat gccgaccaca 1201 agagaatcaa gagcgtatta gtaggaaagt aggaggtaag agacaatggc aagagttaag 1261 aagggcatga acgctaagag aaagcataag aagatcctga agctggcaaa aggcttctac 1321 ggttccaagc ataagatctt ttccgcagcc aatcccgctg tcatgagatc tctgcgcagc 1381 gctcagatgg gccgcaagct caagaagaga gaatacagaa gactctggat cgcccgtatc 1441 aatgcggcgg caagagcaaa cgacatctcc tacagcagac tcatgaacgg tctgaagaag 1501 gccggtatcg aagtcaacag aaagatgctg tccgaaatgg ctatccacga tcccgcaggc 1561 ttcaccaaga tggtggatgc tgccaaggct gcgctgtaag ccttcctttc caagaaaact 1621 atcatccctc cggccgtttc gtccggaggg attttttaga gactactgat gaattccaat 1681 cctaacgcac tgagcggcga gtcccgcggc tcctatctga agaaaatatt cgccatcgtg 1741 ctgccgatcg cgctgcagaa tctgttaggc tgcgccatgg gcatcgtgga taccgccatg 1801 gtgggccgca tgggcgtcgc gcctcttgcg gcttccggcg ccgcttccat ggtggcgatc 1861 gtcctgttca acttcatgta cggcttcctc agcgggtcag gggcgttcat ctcccaatac 1921 tggggcatcc gggatatcga gaccatacgg aaggtgctcg gcgtcatcta ccgggcgtcc 1981 atcttcgttt ccctcatctt ttcgatcgta ggggaactct tcgcgccgca gatcatctgg 2041 ctcatcgaca gagatcccga ggtcatcgac ctgggcgtgc agtatctgcg ggtcatcgcg 2101 ccgtcctatg cgctggccat gctcagctac agctttatgg tgtcgtcccg ctgcgttcag 2161 cggctgcggg ctgcaacgat catcgacatc tgcgccattt tgctcaattc gctgctcaac 2221 tacatgttta tctggggcaa gttcggcgcg ccggcctggg gcatcaaagg tgctgccttt 2281 gcgacggtgc tctcccgcgt cttcgaatgc tccgctttta tcatctattc ctatgcggtc 2341 aaagatcatc cgctggcgtt ccggcacctt tcggaactct ccggttatac gaaggagttt 2401 cgaaaccgca tcctgaagac tgcgatcccc gtcgggttct ccgacggact gtggggcgtc 2461 acctgcacgg tctacctgtc catctacggc atgatcggca cggcggcagt agcggcggta 2521 caggtcatca atatcgtcaa cgaatgcttc cagtccgtgt tctacggcgt gggcagcgcg 2581 gcagcggtgc tcatcgggga gcagctgggc caggcgaatc tgaagcgggc gaaaaaatcc 2641 gccgtgcagt tcctgtggac gggagtggca ctgtctgcgt tgatgtcact gtttatgctg 2701 ctcatcagtc cgttcctcat cgggttctac cacttcgacg aagcgacgaa tcaggtgctc 2761 tcctccggcc tctccattac ggcctggacc atcatcatgc gcatgatgtg ctatatcatc 2821 atgtgcggcg tgctgcgccc cggcggcgac accacgttcc ccatggtcgt ggatatggtc 2881 tgcaactggg cgctcatcat cccggcgatg ctcatcgcgg tgcgcgtgtt ccatgcggat 2941 ctgcgcacga cgatgttcct gtgctatctg ggcgaaggga taaagggcgt catctgctat 3001 ttccgctatc gcggcggaca gtggatcaac gtgctgacgg gtgtggaatc ttccgaagcg 3061 gccgccgatg tggtataata tcttattatg attcgcatct ttgaagacct gccggtggat 3121 gcagggttta cctgcaaacc ggcggacgga aaagtgtata gatcggaact gctgaagaaa 3181 gcgccggtcg tgcggctatc cctggtgcac ggcagcgaga tcgccgtcat ccggagcatg 3241 cagccggaag gggctgcgcc gctgcgggcg gataccgacg aagggtatct ggacgtctac 3301 gacgcggacg gagcggtcac ggatctgccc ggcgtctatc tgacgacgac acacggcgat 3361 tgcgtgccga tctggacctg tgacccggtc aaaggcgtcg tcggcgtggc acacgcgggc 3421 tggcggggca cgttgaaggg cgtcgcggtt tccctggtgc ggaccatggt ccgcgcatac 3481 ggatgcgatc cggcggacat aagagctgcg gtcggccccg ggatcggcgc ctgctgcttc 3541 gaggtcggtc cggacgtggc ggaacagttt acggatgcgt tctggtgggc ggaagactac 3601 gtatactgcc atcccggcgg aaggccgcgg ctggatctca aagggatcaa cgccgaa // LOCUS sequence076 3654 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence076 VERSION sequence076 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3654 /mol_type="genomic DNA" /organism="" /note="sequence076" CDS 73..600 /product="nitroreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008765867.1" /transl_table=11 /codon_start=1 /translation="MENESIKTLLTRRSVRKYKPEHITEEEMEIILEAGKFAPTGKGTQ CTKFVVVRNKAVRDKLSEINAEILGTASDPFYGAPDLIAVFANSAATGTWIEDGSLAMG NLMNAAHAIGVASCWINRARQTFDSPDGRAMATAWGIPESYKGIGYCILGYADGEEPLP KPRKEDFVVYVD" /locus_tag="LOCUS_2930" /note="WP_008765867.1 nitroreductase (Bacteroides) [pid:35.5%, q_cov:88.6%, s_cov:88.4%, Eval:6.4e-22]" /note="MGA_401" CDS 681..1673 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLVSTILCIALLAALFAGCTKQESETAPSAKPDSVLTPQDEVL SYTVGEIQEFGRNDASVWELLQDLLPNLIVYRGAGGVFQYASIDRTLPQSDYDWSNLVE VNETPREVEYAVDGETVSIKGIDVSAYQGEIDWEKVAASGVKYAFIRLGYRGYESGLLV KDDRFEENIRGALQNGVAVGVYFVTQAISVEEAVEEAQFVMENIRPYNVTWPIVLDIED AASATARTAELSQQARTDHAIAFCETVKESGYTPMLYCNIRWFIEKLDITRITDYDKWF AQYFRKPFFPYAFQVWQYSSTGRIDGIEGNVDYNISFVDYGNLPEETGD" /locus_tag="LOCUS_2940" /note="WP_011976242.1 glycoside hydrolase family 25 protein (Sinorhizobium medicae) [pid:31.3%, q_cov:58.8%, s_cov:72.8%, Eval:2.1e-15, partial hit]" /note="MGA_402" CDS 1715..2410 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="METKRLYKSSTDKAIFGVCGGFAEYFGIDSLIIRLVLVLFTLAFG AGLLFYLIAALIMPKRPEDGGMPVQPAQPGSYNATGTTYVNRASYAEPMPEHVSRSAAP MPQEVKAEEPADPVSKAWAKERETQETRGAAAGAPKQEAPKQEMPKPEATKQEAPRPER PYQAYQQPQRTQSAPRSSGDKTRLLLGVILILIGLFVLVRVFLPRFDTRILFAVCVIVA GAVLILKRD" /locus_tag="LOCUS_2950" /note="WP_003722617.1 PspC domain-containing protein (Listeria monocytogenes) [pid:56.1%, q_cov:24.7%, s_cov:86.4%, Eval:6.7e-11, partial hit]" /note="MGA_403" ORIGIN 1 cgcatcctgc ggggcgagga ggctgccaat ccggcttatc aataaacatc ccggatcgga 61 aggaggagac ccatggaaaa cgaaagcatc aaaaccctgc tgacgagaag aagtgtccgc 121 aaatacaagc cggagcacat cacggaagag gagatggaga tcatcctgga agctggcaaa 181 ttcgcgccca caggaaaggg cacccagtgc acgaagttcg tcgtcgtgcg caataaggcg 241 gtgcgcgaca aactgtcgga gatcaatgcg gagatcctgg gcacggcgtc tgatccgttc 301 tacggcgcgc cggatctgat cgccgtattt gccaacagcg cggcaaccgg aacctggatc 361 gaagacgggt ccctcgccat gggcaacctg atgaacgcgg cccacgccat cggcgtcgca 421 tcctgctgga tcaaccgggc cagacagacc ttcgacagcc ccgatggaag agccatggcg 481 accgcctggg gcattcccga gagctataag ggcatcggct actgcatcct gggctatgcg 541 gacggagaag aacccctgcc gaaacccaga aaagaagatt ttgtggtgta cgttgactaa 601 acggttaaga gagtgttaat tttctgtgac aggcctcccg caggcctgtt ttttttcttt 661 aggtatggta caatatccgc atgaagaaac tagtatcaac aatcttatgc atcgctcttc 721 tcgccgctct gtttgcaggc tgcacaaagc aggagagcga aacagctcct tccgcgaaac 781 cggactccgt gcttacgccc caggatgagg tgctttccta caccgtcggc gagatccagg 841 agttcggacg gaacgacgct tccgtctggg aactgctgca ggatctgttg ccgaacctca 901 tcgtctaccg gggggcgggc ggcgtgttcc agtatgcttc catcgaccgc accctgccgc 961 agtccgatta cgactggagc aacctggtgg aggtgaacga aacgccgaga gaagtagaat 1021 atgccgtgga cggcgagacc gtctccatca agggcatcga cgtctccgcc tatcagggag 1081 agatcgactg ggagaaggtg gcggccagcg gcgtaaaata cgcatttatc cgcctgggtt 1141 accgcggcta cgagagcggc cttctcgtga aggacgaccg gttcgaggaa aacatccggg 1201 gcgcgctgca gaacggcgtc gcggtgggtg tctatttcgt gacccaggcc atctccgtgg 1261 aagaagcggt ggaagaggcg cagttcgtca tggagaacat ccggccgtat aacgtcacct 1321 ggcccatcgt cctggacatc gaggacgccg ccagcgcgac ggcaaggacg gcggagctct 1381 cgcagcaggc gcggacagac cacgccatcg cgttctgcga gaccgtaaaa gaatccggtt 1441 acacgccgat gctctactgc aacatccgct ggttcatcga aaaactggac attacgcgga 1501 tcacggacta cgacaagtgg ttcgcccagt acttccgcaa gccgttcttc ccgtacgcct 1561 tccaggtgtg gcagtacagc agcaccggac ggatcgacgg catcgaaggc aacgtggact 1621 acaacatcag ttttgtcgat tacgggaatc tgccggagga gaccggcgat tgacccggat 1681 ccaatagaag ggaaaagaaa ggattagaaa ggaaatggaa accaagagat tgtacaagtc 1741 ctctacggac aaggcgatat tcggtgtatg cgggggcttc gccgaatatt tcgggatcga 1801 ttcgctcatc atccgcctcg tgctggtgct gtttacgctg gcgttcggcg cgggactgtt 1861 gttttatctg atcgcggcgc tcatcatgcc caaacgcccg gaagacggcg gcatgcccgt 1921 gcagccggcg cagcccggtt cctataacgc tacgggcacg acctatgtaa accgggcgtc 1981 ctatgcggaa cccatgccgg agcatgtttc ccgcagcgca gcgcccatgc cgcaggaagt 2041 gaaggcagaa gaacctgccg accccgtgag caaagcctgg gcaaaggaac gggagacgca 2101 ggagacgcgc ggcgcagccg caggcgctcc gaagcaggag gcccccaaac aggagatgcc 2161 gaaaccagag gctacgaagc aggaggcacc ccgtccggag cggccgtatc aggcttacca 2221 gcagcctcag cggacgcaga gcgccccgcg gagcagtggc gataagacca gactgctgct 2281 gggggtcatc cttatcctca tcggcctgtt cgtgctcgtg cgcgtattcc tgccccggtt 2341 cgacacccgt atcctgtttg cggtgtgcgt catcgtcgca ggcgccgtcc tcatcctgaa 2401 gagagattaa accattcacc gtaaccaatt tataaattat cacctatgga caccggaaaa 2461 agaaatctga gaacgaagct gttttatggg gcagggtacc tgccggaccc gtgcttttac 2521 cagtttatcg catcttttca gatcgtattc ctcaccggtg tcgtagggct ttctcctgcg 2581 gtcgcgggaa cgatctcgtc cgtcaccatc atgtcggacg cggtcttcag catcgtggtg 2641 ggaaagtggt ccgacaatgt acggagccgc tttggcagga ggcggccctt tttgcttgct 2701 gtttacctgc tgatgccggt ctcctttgcc atgatgttcc ggaccgccgg cggcggagaa 2761 accttcaagt tctggtatta catgctgtgg ggcttcgtgt tctggatcgc ctatgctgcg 2821 tttttcgtct gctatgtagc cctcggcgcg gatgtggcga cggattatga agaccgcatc 2881 cttctgaaca gttacacccg tctgtttacg ctgggcggcg gcattctggg aacggcgatt 2941 cctctcactg ccatcgcagc cctcacttcc cgggggatgg aaacggaaaa cgcctggttc 3001 ctgtttgcgg cagctctggc ggccctcgtg ctgctgggcg gcttcctctg ctggaacgcc 3061 acccggggac tggagcagcc cgtctgggac gaaccggaat cccagggcat cgcaggattc 3121 ttccatgact gccggcagct cctcacgctg cggccttacc ggaaagtcat cttttccaag 3181 gtcttcagca acgtggccta cacgttctac accggtacgc ttatctttta catgcagttc 3241 gtgctgcaga tcgatacccg gttctccgcg gtcatctacc tgctgagcaa cgtcgtcagc 3301 ctggtgctgg tgccctttat cgccaagatg gcctttaagc tgggaaagcg caagtacatg 3361 gcttacgccc agttcgtgtg cgccggtctc agccttctga tggggctcgt gggcgtgcgg 3421 tcccgggctc tgctggtcct ctacatgctg atctatatct acgggcaggc gagcttctgg 3481 cagctgtgca acacgaacct gtacgacatt accgacctgg acgagtaccg cttcggcgtg 3541 cgccgggaag gcaacatcat ggcgctgcag agctttatca acacgggatt tacttcggtg 3601 agcctgaaag tgctgacggg gcttctcgcc gcatccggct tttccgcaac ggcg // LOCUS sequence077 3651 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence077 VERSION sequence077 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3651 /mol_type="genomic DNA" /organism="" /note="sequence077" CDS complement(726..2069) /product="replication-associated recombination protein A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003562821.1" /transl_table=11 /codon_start=1 /translation="MNKDQLTIFEHDMPQPLPARMRPQTIDEIVGQQHLLGPGRVLSRI IEQDAVSSMIFWGPPGVGKTTLAGVIANHTKARFINFSAVTSGIKEIKEVMKEADESRR FGEKTIVFVDEIHRFNKAQQDAFLPFVEKGAIILIGATTENPSFEVNGALLSRCKVFVL KALTEEDIVTLLQRALDSPQGFGNQLVEVEEGVLPMIARFCSGDARTALSTLEMAVLNG EPAGTDEHPEAVRVTREVLEQCTSRKSLLYDKSGEEHYNLISALHKSMRNSDPDAAVYW LARMLESGEDPLYIARRVVRFASEDVGLADPRALEMAVAAYQACHFIGMPECSVHLTQA VVYLSIVPKSNALDVAYMEAKRDALSQIDEPVPMQIRNAPTKLMKEVGYGKGYMYAHDY EDRLTTLQCLPDSLVGREYYRPTEQGNEGRFKERLQQIKDWKKEHENK" /locus_tag="LOCUS_2960" /note="WP_003562821.1 replication-associated recombination protein A (Lacticaseibacillus) [pid:65.8%, q_cov:98.0%, s_cov:96.7%, Eval:2.3e-167]" /note="MGA_406" CDS complement(2187..2561) /product="desulfoferrodoxin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004453642.1" /transl_table=11 /codon_start=1 /translation="MSKFYKCSVCGNIIGKIHDSGVPVVCCGKPMDHLEANTVEASFEK HIPDVKVEDGIVKVQVGSVAHPMAEEHFIEWVYLETDKGGARKALKPGDAPEACFALCD ETPKAVYAYCNLHGLWKKDL" /locus_tag="LOCUS_2970" /note="WP_004453642.1 desulfoferrodoxin family protein (Clostridioides difficile) [pid:51.2%, q_cov:98.4%, s_cov:96.1%, Eval:5.6e-33]" /note="MGA_407" CDS complement(2571..3119) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSEKKNPYSGTKTEQNLLAAFAGESQARNKYTYYASKAKKEGFEQ ISALFLKTAENEKEHAKLWFKELNGIGSTAENLADAADGENYEWTDMYEGFAKTAEEEG FPALAEKFRGVAAIAKQHEERDRALLKNVETKQVFEKSSVKVWECRNCGHIMVGEKAPD VCPVCAHPQAYFEVNCENY" /locus_tag="LOCUS_2980" /note="WP_015943945.1 ferritin family protein (Desulfitobacterium hafniense) [pid:67.2%, q_cov:97.3%, s_cov:45.2%, Eval:6.5e-68, partial hit]" /note="MGA_408" CDS complement(3153..3632) /product="pyridoxamine 5'-phosphate oxidase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948533.1" /transl_table=11 /codon_start=1 /translation="MFRPMAAPRAKQQISEEECIQILKEQKRGILCVLGDDDYPYGTPT NHFYNEADGKIYFHSNKKGHKVDAMKKHDKICFVCYDEGFKKEGDWALNIKSVIVFGKV EFIEDKDTIVDIMTQLSHKFTDDEAYIAKEMKAAGGTLLFALKPEHMTGKLVNES" /locus_tag="LOCUS_2990" /note="WP_011948533.1 pyridoxamine 5'-phosphate oxidase family protein (Clostridium botulinum) [pid:39.1%, q_cov:96.9%, s_cov:92.7%, Eval:1.1e-21]" /note="MGA_409" ORIGIN 1 cacgatctcc cgctcttttt ccgtcagatc tttgaaaggc acatccgtgc gaacgccaag 61 ctctctcgcg atatccttca tcagcgacca catcagggtc tgccagggaa gcacggcacc 121 ttcgtcgatc gtcagggatt cgtcgggcac cagcgtggat tcgtccacga tgcgtacgat 181 gccggtgccg ccgcaggtac ggcaggcgcc ctggctgttg aaggccagtt cctccgcgcc 241 ggggccgtag aagtgagctc cgcagaccgg gcacacctgc tcccgttctg ccgccacatc 301 catggaaggc ggcagatagt gtccgttggg acagcggtgg ctggcgagtc gggagaacat 361 caggcgcagg ctgttgagca gttccgttcc ggttccgaag gtgctgcgga tgccgggcag 421 cgccggccgc tggtgcagcg ccagggacgc cggcacatac agaacttcgt ccacggaggc 481 ccttgctgcc tgggtcatgc ggcgacgggt ataggtcgag agcgactcca gataacgccg 541 ggacccttct gcatacagca cgcccagagc gagcgaagat ttgccggagc ccgagactcc 601 ggcgatgccg acgatcttcc ccagagggat atccacgtcg atatttttca gattatgcac 661 gcgggcgccc cgcaccagga tatgatcggg tgcgggagca gcttttcgcg cgtttctgtc 721 tacggtcatt tgttttcgtg ttcctttttc cagtctttga tctgctgcag gcgctcctta 781 aaacgtcctt cgttgccctg ctccgtgggg cgataatact cccggcccac cagggaatcc 841 ggcaggcact gcagcgtggt cagccggtct tcgtaatcgt gggcgtacat atagcccttg 901 ccgtagccca cttccttcat gagcttcgtc ggcgcgttgc ggatctgcat gggaaccggc 961 tcatcgatct gggacaaagc gtcgcgcttc gcctccatgt aggccacatc cagagcgttg 1021 gatttcggca cgatggacag atagacgacg gcctgcgtca gatgcacgct gcattccggc 1081 atgccgataa agtggcaggc ctgatacgcc gcgaccgcca tctccagcgc tctgggatcc 1141 gccaggccca cgtcttcgct ggcaaagcgt accacgcgcc gggcgatgta cagcggatct 1201 tctccggact ccagcatgcg ggccagccag tagaccgccg catccgggtc ggaattgcgc 1261 atggatttat gaagggcgga gatcagatta tagtgctctt cgccggattt atcgtacagc 1321 agggatttgc gggacgtgca ttgttccagc acctcccggg tgacccttac agcctccgga 1381 tgctcgtccg tgcccgcggg ttcgccgttg agcaccgcca tctccagggt ggacagcgcc 1441 gttctggcgt cgccgctgca aaagcgagcg atcatgggca gtacgccctc ctccacctcc 1501 accagctggt tgccaaagcc ctgagggctg tccagcgccc gctgcaggag ggtcacgata 1561 tcctcctccg taagagcctt cagaacgaac accttgcagc gggacaaaag cgccccgttc 1621 acctcaaacg acgggttttc cgtggtggcg ccgatcagga tgatggcccc cttttccacg 1681 aagggcagaa aagcgtcctg ctgcgccttg ttgaagcggt ggatctcatc cacgaagacg 1741 atggtcttct ccccgaagcg ccggctctcg tccgcctcct tcatcacctc tttgatctcc 1801 ttgatgccac tggtgacggc ggagaaattg atgaagcggg ccttcgtatg gttggcgatg 1861 acccccgcca gcgtcgtctt gcccacgccc ggcggacccc agaagatcat ggaggacacc 1921 gcatcctgct cgatgatgcg gctgagcacc cttcccgggc caagcagatg ctgctgtccc 1981 acgatctcgt cgatggtctg ggggcgcatg cgggccggca ggggctgcgg catgtcgtgt 2041 tcgaatatgg ttaactgatc cttgttcatc ggtcgattcc tttaacaaaa gagaacaatt 2101 gttctatttt atcatatcat attttgcccc tgctttcaag gcatagaaaa acgccgccgg 2161 agcatttccg gcggcgcaga tcgtctttac agatctttct tccacagtcc gtggagattg 2221 cagtaggcgt aaacagcttt cggcgtttca tcgcacagcg cgaagcaggc ttccggagcg 2281 tcgccaggct ttaaggcctt gcgggcgccg cctttgtcgg tttcgagata gacccattca 2341 atgaaatgct cttccgccat gggatgcgcc acggagccga cctgcacttt aacgatgccg 2401 tcttccacct ttacgtcggg gatgtgcttc tcgaagctgg cctcgaccgt gttggcttcc 2461 agatgatcca tgggcttgcc gcagcagacc acgggcacgc cgctgtcatg gattttgccg 2521 atgatattgc cgcatacgct gcacttatag aatttgctca ttcgtccctc ctaataattc 2581 tcacaattga cttcgaaata cgcctgggga tgcgcgcaga cagggcacac gtcgggcgcc 2641 ttctcgccca ccatgatatg cccgcagttt ctgcattccc ataccttaac gctgctcttc 2701 tcgaagacct gctttgtctc cacgttcttc agcagcgctc tgtcgcgctc ttcgtgctgc 2761 tttgcgatgg ccgcgacgcc gcggaacttt tccgccaagg ccgggaagcc ctcttcttcc 2821 gcggtcttcg cgaacccttc gtacatgtcg gtccattcgt agttttcgcc gtctgccgcg 2881 tctgccagat tctccgcagt ggagccgatg ccgttcaatt ccttaaacca gagcttcgca 2941 tgctcctttt cgttttccgc cgtcttcagg aacagcgcgg agatctgctc gaagccttcc 3001 ttctttgctt tcgacgcgta atacgtatac ttgttgcggg cctgggactc gccggcaaac 3061 gctgccagca ggttctgttc tgtcttagtt ccggaatagg ggtttttctt ttcgctcata 3121 aagttcctcc ttccatccgt tcactgcacg gatcacgact cgtttaccag tttgcctgtc 3181 atgtgctccg gtttgagcgc aaacagcagc gtgccgcctg ccgccttcat ctccttggcg 3241 atgtaagcct cgtcgtccgt aaacttgtgg gaaagctgcg tcataatgtc gacgatcgtg 3301 tctttatcct cgataaactc caccttgccg aacacgatga cgctcttgat gttaagagcc 3361 cagtctccct cttttttgaa gccttcgtcg tagcacacga agcagatctt atcgtgcttc 3421 ttcatggcat ccactttgtg gcccttctta ttgctgtgga aatagatctt cccatctgcc 3481 tcgttataga agtggttcgt gggcgtgccg tagggatagt cgtcgtcacc taacacgcac 3541 aggatgccgc gcttctgttc cttcaggatc tgaatgcatt cttcttccga gatctgctgc 3601 tttgctctcg gtgccgccat tggtctaaac atgtcgatgt acctccgata c // LOCUS sequence078 3645 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence078 VERSION sequence078 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3645 /mol_type="genomic DNA" /organism="" /note="sequence078" misc_feature <1..2266 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011016931.1:acyl-CoA dehydratase activase" /note="WP_011016931.1 acyl-CoA dehydratase activase (Fusobacterium nucleatum) [pid:51.7%, q_cov:99.5%, s_cov:75.8%, Eval:1.2e-222]" /note="MGA_410" /locus_tag="LOCUS_3000" CDS 2257..3600 /product="2-hydroxyacyl-CoA dehydratase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011016932.1" /transl_table=11 /codon_start=1 /translation="MEIGCASCKSCGLESCSGCEDDKKYIETEKREIETPDNRVIFTKE MKKTYTLLAPTMLPMHFRLFQEVFRKNGYNMELLENEGRKAVDCGVKYVHNDACYPSIC VIGQFIDALQSGKYDVNKVAVIYMQTGGGCRASNYVSLMRKAFARAGFPQVPIVTINIA GLEKHPGFKVTVPMYRDLLNCCLYADLMMTLRNQCRVREVKKGQTDALCDHWVKKLGKE IWDGKMKYSRVKENMRRMAADFALIERKPEQPVRVGIVGEIYVKYSPLGNNYLEEFLYR EGAEAVVPGLLDFMYYCVYNNRLDFELYGMRSDSRLIWKIVCDYFEKKKNDLNEIIRER GVFYGFSSYKHLLELAKEHHCVGVGMKMGEGWLLTSEMLELCEMGVSNIVCCQPFGCLP NHIVGKGMMRPIKARYPDANIVAIDFDPGASRINQENRLKLMMSNARK" /locus_tag="LOCUS_3010" /note="WP_011016932.1 2-hydroxyacyl-CoA dehydratase (Fusobacterium nucleatum) [pid:46.8%, q_cov:89.7%, s_cov:97.8%, Eval:9.5e-105]" /note="MGA_411" ORIGIN 1 agacgccgtg ttcccggaat acggccgttt tgccgtagcg ctgggcgctg cgttctacgg 61 cacgggtcag gaagcccgtt atacctatga acagtggctg tccgctctgg agaacgctgc 121 aggcgcctcc gtcaagaccg aacatgccaa accgctgttc gaagacgagg cggaatatgc 181 ggcattcctc gaacggcaca gccgcgcgaa ggtgccggcc agagacctgg aaggatatat 241 cggcaaagct tacctgggca tcgactgcgg cagcaccacg acgaaactcg tcctcatcga 301 cccggaaggc accatcctgt attcgtacta cggcaacaac aagggcaacc cggtggacgt 361 ggtgcgcgaa catctgggga tcatctatga aaaggccgat gcggggctca ccatcgccgg 421 ctccgcagtt accggctacg gcgaggagct catccagcgg gcattccatc tggacggcgg 481 tctcgtggag accatggcgc actacagcgc agccaggttc ttcaaccccg acgtggattt 541 catcatggat atcggcggtc aggacatgaa atgcctgtcc atccgcaacg actccatcga 601 ttccatcatc ctgaacgaag cctgcagctc cggctgcggc agctttatcg agacctttgc 661 gcgggcgctg ggctatccga tcgcggattt cgcgaagctc ggtctgttct cccgcaaccc 721 cgtggacctg ggcagccgct gcaccgtgtt catgaacagc tccgtcaaac aggcgcaaaa 781 ggacggcgcg gacgtgacgg acatctccgc cggtctctcc atgagcatcg tgaaaaacgc 841 gctgttcaag gtgctccggg tgcagtccgc caaggatctg ggcgagcaca tcgtcgtcca 901 gggcggcacc ttcctcaacg atgcggtgct gcgctccttc gaacgcgaac tgggagctga 961 ggtcacaaga cctgccatcg caggcctgat gggtgccttc ggcgcagcgc tctttgccaa 1021 gaaactcaat gtcgaaacat cctccacggt aagcgcggaa gagctaaaaa cgttcaccca 1081 tacctcggaa acggtcacct gcaacggctg cacgaatcac tgtccgctca cgatcaacac 1141 cttcttcggc gatgagaaat acgtctccgg caacaagtgc gagcggggcg gtctgctggc 1201 gctgggcaag aagcccgaga ccgcggccaa gctgccgaac ctgtaccggt ataaaagaga 1261 aaagctctta aagctgaaag cggacagggg agaaggcccc tataccatcg gcattcccat 1321 gtccctgggc gtcttcgaac tggcgcccat gtggcatact attttccgca aactgggctt 1381 taaggtcgag atgacgggct tttccgacaa acggatctat gcaaatggtc aatacaccat 1441 tccctccgat acggcatgct atccggccaa gctgatgcac ggccacgtgg agagcctgat 1501 ggagaagggt gtggacgcag tgttctatcc ctgccttacg tacaactacc acgagagcaa 1561 cgccacggac aatttctaca actgcccggt cgtggcctat tacagcgaag tgctcaacgg 1621 caacatggac agcctgcatc aggacggcgt caaattcctg tatccctatc tggcggtcaa 1681 cgacaagaag cagctggcca agggtctctg cgaatgcctc aacgaagcgt tcggcggctt 1741 tgcgctgtcg gcagtggaag gcgctgtcga agcgggtcac aaggcgtacg aggaatggat 1801 ggcggacgtg cgcgaagagg gcggcaaggc cctggcctgg gcccgtcaga acggaaagcg 1861 catcatggtg ctggccggcc gtccctacca tgtggacagc ggcatctgcc agggcatgga 1921 ccagctgatc gaatccctgg ggttcgtcat cgtgtccgag gactgcgtgt ccaacctggt 1981 gaccccgcag aaagtcaacg tgctcaacca gtgggtgtac cacgcgagac tatataacgc 2041 tgcgaaatac gtcggtctgc acgacgactg ccaactggtg cagctcgtgt cgttcggctg 2101 cggcctggat gccatcacga cggacgaagt ccgggcgatc ctggagcgct acggcaaact 2161 gtatacgcag atcaagatag acgagatcaa caatctgggc gctgcgaaga tccggctgcg 2221 cagcctggtc ggcgccctgg aggagagaga agcgaaatgg aaataggttg tgcgagctgc 2281 aaaagctgcg gtctggaaag ctgcagcggc tgcgaagacg acaaaaaata tatcgagacc 2341 gaaaagagag agatcgaaac gccggataac cgggtcatct ttacgaagga gatgaagaag 2401 acctacacgc tgctggcgcc cacgatgctg cccatgcatt tccgcctgtt ccaggaagtg 2461 ttccgcaaga acggctacaa catggagctg ctggagaacg aaggccgcaa ggcggtggac 2521 tgcggtgtaa agtacgtcca caacgacgcc tgctatccat cgatctgcgt catcggccag 2581 tttatcgacg cgctgcagag cggcaaatac gacgtcaaca aggtggccgt catctacatg 2641 cagaccggcg gcggctgccg cgcgtccaac tacgtatctc tgatgcgcaa ggcctttgcc 2701 agggcgggct tcccccaggt ccccatcgtg acgatcaaca tcgctggcct ggagaagcat 2761 ccgggcttta aggtgaccgt gcccatgtac cgggatctgc tcaactgctg cctgtacgcg 2821 gacctcatga tgaccctgcg caaccagtgc cgggtgagag aggtaaagaa agggcagacg 2881 gatgcccttt gcgaccactg ggtaaagaag ctcggcaagg agatctggga cggcaagatg 2941 aaatacagcc gcgtcaagga gaacatgcgg cggatggcgg cggatttcgc cctcatcgag 3001 agaaagcccg agcagccggt gcgcgtcggc atcgtcggcg agatctacgt aaagtattcg 3061 cctctgggca ataactacct ggaggaattc ctgtatagag aaggcgcgga agccgtcgtt 3121 ccgggactgc tggacttcat gtactactgc gtctacaaca accgcctgga cttcgaactc 3181 tacggcatgc gcagcgattc caggctcatc tggaagatcg tctgcgacta cttcgaaaag 3241 aagaagaacg acttaaacga gatcatccgc gagcgcggcg tgttctacgg gttctccagc 3301 tataaacatc tgctggagct ggcgaaggag caccactgcg tgggcgtggg catgaagatg 3361 ggagaaggct ggctcctcac gtccgagatg ctggagctgt gcgagatggg cgtctccaac 3421 atcgtatgct gccagccctt cggctgcctg ccgaaccaca tcgtgggcaa gggcatgatg 3481 cggccgatca aggcgcgcta tccggacgcc aacatcgtag ccatcgactt tgaccccggt 3541 gcatcccgca tcaaccagga gaatcgttta aagctcatga tgagcaacgc aagaaagtag 3601 gcataccatg acacccagac agcagcagat agtaaaaaac gtaga // LOCUS sequence079 3641 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence079 VERSION sequence079 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3641 /mol_type="genomic DNA" /organism="" /note="sequence079" CDS complement(364..1446) /product="type IV pilus twitching motility protein PilT" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010880449.1" /transl_table=11 /codon_start=1 /translation="MDENKAYQPMDIKTILEQSVIRDVKDIFVVAGLPITYKIGNTQER MDRPKMLPDDIRLCVDDIYEISRRPKTNLDNGLDDDFSFALNGVGRFRVNIFRQRGSLA AVIRVIRFGLPDPAALSIPESVLSLADTKKGLVLITGSAGSGKSTTLACLIDRINHTRE AHIITMEDPIEYIHQHKRSIVTQREISIDTPGYMESLRSALRESPDVILLGEMRDYDTI SSAITSAETGVLLLSTLHTSSAANTINRILDVFPANQQQQVKIQLAQMLKGIVCQQLVP SVDGNLIPVFEIMKSTTAIQNMIREDKLHQLESAMQAGGAEGMCTMDGSLLKLYKEGRI SRETALMACANYENMAKRLG" /locus_tag="LOCUS_3020" /note="WP_010880449.1 type IV pilus twitching motility protein PilT (Aquifex aeolicus) [pid:44.6%, q_cov:97.2%, s_cov:95.6%, Eval:3.2e-81]" /note="MGA_413" CDS complement(1453..1830) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKHVPIRLGPLALLLAVISICLTILAVLSFTTGQADLRLAQRYAD TVTERYALEAEGQAFLADVCRGNDLQSGLPTVSETIEGENGLSLHIELKQNARGSYGIT AWKFLRDWEEHTDLDNIWTGE" /locus_tag="LOCUS_3030" /note="MGA_414" CDS complement(1827..2327) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKSKHEHITAFYIETLLLIVSFVLVILMLTNVFGLGKRESSRAQD LTNAVRLAETGAEAFAAADGPAELADILDEGNVTLASTSSQYPVPPKDRLPAIIFAYYD NDLNPVAEENAAYRLIISWDADQSTASGDSVLAKGTISVRRPGSEEDIYSLDTAVYIQE VQP" /locus_tag="LOCUS_3040" /note="MGA_415" CDS complement(2324..2794) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTFKEDQKSPLGLYSIGIAALFLLGFFLLVVFGAQNYRNAVAAQH ANNDSRVLLSYVSTCIKGSDQTGCVRIREEDGNTVLVIADEESGYASRLYLSHGNLVED YAETGAALDPENAQIIGQTSVFTVEELTEGLLAVTTDAGRSLIRLRSQGGVL" /locus_tag="LOCUS_3050" /note="MGA_416" CDS complement(2816..3127) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MYQDRVSHKQRNILLIVLCALVLACGYFAFSGSGKDLDEETVTAI RDAIRRSALQCYVVEGVYPPDLAYLQDHYGLQVNTDNYYVVYEAFASNVPPTINVIEK" /locus_tag="LOCUS_3060" /note="MGA_417" misc_feature complement(3131..>3641) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005065941.1:type II secretion system inner membrane protein GspF" /note="WP_005065941.1 type II secretion system inner membrane protein GspF (Acinetobacter) [pid:26.6%, q_cov:73.4%, s_cov:30.9%, Eval:3.2e-07, partial hit]" /note="MGA_418" /locus_tag="LOCUS_3070" ORIGIN 1 ctccgtgccc gcaaggaccg tctccattct ttccagcgca gcatccctgc ggcgggtcac 61 gtttacctcc tcgaagaaat cgtccacgta ttttttattt ccggtcacga caaaacagcg 121 gacacggtcc gtcagatagt ccgaagccgc catcatatcc tgggtatcct gctgcagttc 181 gatgtactgg tccgtggagc gctgcaggat ccggtaaccc gtcatgacgc tgttcgtcgc 241 gtataagagc aggatggcaa gcaggatcgc gacgcccatc ataaacagat gcatccgccg 301 gatcgatatg cttcctgccg ttctgtcgtt tctattctcg tccatacgtt tccgcccgtg 361 cggctatccg agccgcttcg ccatgttctc gtaatttgca caggccatca gcgcggtctc 421 cctgctgatg cgtccttcct tataaagctt taacagactg ccgtccatgg tgcacatgcc 481 ctccgcgcct cccgcctgca tggcggactc cagctggtgg agcttgtctt cgcggatcat 541 gttctggatg gcggtcgtag atttcatgat ctcgaatacc gggatgaggt taccgtccac 601 cgaaggcacc agctgctggc agacgatgcc tttgagcatc tgcgccagct ggatcttcac 661 ctgctgctgc tgattggccg ggaacacgtc caggatacgg ttgatcgtgt tcgccgcgct 721 gctggtatgc agcgtggata gaagcagcac accggtctcc gccgacgtaa tggcggagga 781 gatggtatcg taatcccgca tctcgcccag caggataacg tccgggctct cccgcagcgc 841 gctgcgtaaa gattccatgt agcccggcgt atcgatggag atctcccgct gggtgacgat 901 ggatctcttg tgctgatgga tgtactcgat ggggtcttcc atcgtgatga tatgcgcctc 961 ccgggtatgg ttgatccggt cgatgagaca ggccagcgtc gtggattttc ccgaaccggc 1021 agagccggtg atgagcacca ggcccttctt cgtatccgcc agagagagca cgctctcggg 1081 gatgctgaga gccgctggat cgggcagccc gaaccggatg acccggataa cggcagcaag 1141 agaaccgcgc tggcggaaga tattcacccg gaagcggccg acgccgttga gcgcgaagga 1201 aaagtcgtcg tccaacccgt tgtccaggtt cgtcttcggc cgtctgctga tctcgtagat 1261 atcgtccacg cacaggcgga tatcgtccgg cagcatcttc ggacggtcca tgcgctcctg 1321 cgtgttgccg atcttgtagg tgatgggcag ccctgctacc acgaagatat ccttgacgtc 1381 ccggatgact gactgttcca ggatggtctt gatgtccatc ggctgatagg ctttgttttc 1441 gtccataact tgctattctc ccgtccagat gttgtccaga tccgtatgct cttcccaatc 1501 ccgcaggaac ttccaggcag tgataccgta ggagccccgg gcgttctgtt tcaactcgat 1561 atgcaggctg agaccgtttt ccccctcgat cgtctcgctt acggtgggaa gcccggactg 1621 cagatcgttt ccgcggcaga cgtccgccag gaatgcctgc ccttccgcct ccagcgcata 1681 gcgctccgtt accgtatccg catagcgctg cgccaggcgc agatctgcct gccccgtcgt 1741 aaaggaaagc accgccagga tcgtaagaca gatgctgatg accgccagca acagtgccag 1801 ggggccgagc cttatgggta cgtgtttcat ggctgcacct cctgaatata gacagccgta 1861 tccaggctgt agatgtcctc ttcagaacca ggtcttctta cggagatggt tccttttgcg 1921 agaacagaat cgccggaagc agtgctctga tccgcatccc acgagatgat cagcctatag 1981 gcggcatttt cttctgcaac agggtttaaa tcattgtcgt aataggcaaa gatgatcgcc 2041 ggaagccggt ctttcggggg aacggggtac tgagaggacg tcgatgccag ggtcacgttg 2101 ccctcgtcca ggatatccgc cagttccgcc gggccgtccg ccgccgcaaa cgcttctgcg 2161 ccggtctccg ccaagcgcac cgcgttcgtc aggtcctgtg cccgggagga ctcccgtttg 2221 cccagaccaa acacgttcgt cagcatcagg atgacgagga cgaacgagac gataagcagc 2281 agcgtttcga tatagaaggc ggtgatgtgc tcgtgtttgc tcttcatagc acgcctcctt 2341 ggctgcgaag gcggatgagg ctgcgtccgg cgtccgtcgt gactgccagc agcccttctg 2401 tcagttcctc caccgtaaag acggaagtct gcccgatgat ctgagcgttt tcggggtcaa 2461 gcgcagcccc ggtctcggcg taatcctcca ccagattccc atgggagaga tagagccgcg 2521 acgcgtagcc gctctcttcg tctgcgatca cgaggaccgt gtttccgtct tcctcgcgga 2581 tacgcacgca tccggtctgg tcgctgccct tgatgcaggt ggagacatag gaaagcagca 2641 cgcggctgtc gttgttcgca tgctgagccg ccacggcgtt ccggtaattc tgggcgccga 2701 atacgaccag caggaaaaag ccgagcagga acagcgcggc aatgccgatg gagtataatc 2761 ctaatggact tttctgatct tctttaaaag tcatgcgttc tgagagatct tccgtttatt 2821 tttcgatcac gttgatggtg ggaggcacgt tcgatgcgaa agcctcgtac accacgtagt 2881 agttgtccgt gttcacctgc agcccgtaat gatcctgcag atacgccaga tccggcgggt 2941 atacgccctc gacgacgtag cactgcagcg cgctgcgtcg gatcgcgtcg cggatggctg 3001 taacggtctc ttcgtccaga tccttgccgc tcccggaaaa tgcaaaatac ccgcacgcca 3061 aaacgagggc gcacaggacg atgagaagga tatttctttg tttatgggag accctgtcct 3121 gatacatacg ttatcctacg gaattcatca tgccgatgag gggcagcatg acgctcagca 3181 gcgacagccc caccgtgacc attagaatgc cggaaagcag cggatccaca aagcctacca 3241 gacggtccac ttcgttcgag cagttttcct ccagcagatc ggtgagcctc tccagcacgt 3301 tttccagatt gccgctgcgt tcgcctgcca gcagcatgcg gccgtaagtg ggctcgaaca 3361 gttcctcgtc ataggcagcc tgggcgatgc tgtggccttc cagcatgccg gatgcgacac 3421 gcttgagttt ctcttccaca ggaccgtaat ccgccatggg aatgcttttc tccacggctt 3481 cgtcctgcat gtcaccgctg gcgataaagg tggccagagc ggacgtgaac cggaacatgg 3541 ccatgttctc caggatggac gcgcagacgg gggacttcct cagcagcgct tccacggatt 3601 cccgtttgcc gcctttccac atccggtagc cgatcagcag c // LOCUS sequence080 3615 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence080 VERSION sequence080 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3615 /mol_type="genomic DNA" /organism="" /note="sequence080" CDS complement(552..2255) /product="Na+/H+ antiporter NhaC family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001048829.1" /transl_table=11 /codon_start=1 /translation="MEKKSTRTAYLVAVCAIIVLLVILAMSYKNAPILVEDAASPFAGT FWSLLPPICAIVLALISKEVYSSLFFGCIVGALLYTQFSPWDTLTSLVGADYGLICVLA DSWDMGIIIFLVELGIISDLMNKGGGSEAFGRWAKDKVKSRASAQLLTMLLGVLIFVDD YFNCLTVGAVMRPVTESHNISRAKLAYVIDATAAPVCMIAPISSWAAAVSGYVNSDNVN GFELFIKQIPWNYYCILTLVMIITISLKNIDYGPMLKHEYNAQVKGDLFTTEHRPFAGA DDYEAPSGKKTSVADLLIPVIVLIICCVVGMIWTGGFFDGAAFTDAFADADAAAGLAVG GTLGMIFTFIYFWCRRTIGFDKSFESVPNGFIQMVSPILILTLAWTLSSFTRGALCSAD YVSAALAGAGSLKNFLPAVIFVIGAAIGFATGTSWGTIGIMAPIVVAVFNYDVEPTLCT IGLAAACAGGVMGDHCSPISDTTIMASAGAHCYHLNHVFTQLPYALTVAVVSFISFILA GIIQNAAICLVIGIVLMIGTVIVIGKMERSKHADMFKEMDEAYAKMLAGK" /locus_tag="LOCUS_3080" /note="WP_001048829.1 Na+/H+ antiporter NhaC family protein (Vibrio) [pid:34.4%, q_cov:90.8%, s_cov:98.3%, Eval:3.4e-81]" /note="MGA_420" CDS 2537..2854 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSLEAMRMVEKAESDARKMIADAKAEAKAAADNAAKSGRERMDAE AEKARKAAEDILENAKLVGKASCTDIDRASADAVARLRSAAEGKLPEAAKFIAERITED L" /locus_tag="LOCUS_3090" /note="MGA_421" ORIGIN 1 agcagggcgt ccatgccgtc gaggacggaa gatttgcagg ggatgccgat gacgggcagg 61 gtggtgcctg cggcgacgac gcctgccaga tgggcagcca taccggctgc cgctatgatc 121 acgccgaaac cgttgtctct cgcggcggcc acgaaatcgt ggacctgctg cggggtgcgg 181 tgggcggaat agacgtggac ttcgaaggga acgccgaggg cggtcaaaat gtccgtcgcc 241 ttcttggcga cgggcagatc gctgtccgat cccatgatga ttccgacttt tttcatttca 301 gcctccttat atagagtaag attcctgttt gcacattcta aatgtacctg aacaaactcc 361 atatttcaat gaaatccgga caaatttgga acattaaaaa atgataaaat ccgaacgttc 421 ggattatcag gaacgatggg tttacgttat atgcactatg ttcggttttg caaaattttg 481 caaaagaaaa gaccggatcc cgaaggaccc ggtctttaaa tgtcttgtga caaatgcgct 541 atgttccgga attactttcc agcgagcatt ttcgcatacg cttcgtccat ttccttgaac 601 atatccgcat gcttggatct ctccatcttg ccgatgacga tcacggtgcc gatcatgagg 661 acgatgccga tgaccaggca gatcgcggca ttctggatga tgccggccag gatgaaggag 721 atgaaggaga cgactgcgac cgtcagcgcg tagggcagct gcgtgaacac gtggttcagg 781 tggtagcagt gcgcaccggc ggaagccatg atcgtggtat cggaaatggg ggagcagtgg 841 tcgcccataa cgccgcctgc gcaggcagcc gccagaccga tggtgcagag ggtgggctct 901 acgtcgtagt taaagactgc aacgacgatg ggagccatga tgccgatcgt accccaggaa 961 gtaccggtcg cgaaaccgat cgccgcgccg atcacgaaga tgactgcggg caggaagttc 1021 ttgagggaac ctgcgcctgc cagggcagcg cttacgtagt cagcggagca cagagcgcct 1081 ctggtgaagg agctcagggt ccaggccagc gtcaggatga ggatcgggga taccatctgg 1141 atgaagccgt tgggaacgga ttcgaagctc ttgtcgaagc cgatggttct gcggcaccag 1201 aaatagatga aggtgaagat catgcccagc gtgccgccga cagcaaggcc ggctgcagcg 1261 tctgcgtcag cgaaagcgtc agtgaacgca gcgccgtcga agaagccgcc ggtccagatc 1321 atgccgacaa cgcagcagat gatgagcacg atgacgggga tgagcaggtc cgcgacggaa 1381 gtcttctttc cgctgggcgc ttcgtaatcg tccgcgccgg cgaacggtct gtgctcggtg 1441 gtgaacaggt cgcccttgac ctgcgcgttg tactcatgct tgagcattgg accataatcg 1501 atgttcttca gggagatcgt gatgatcatg accagcgtca ggatgcagta gtagttccag 1561 ggaatctgct tgatgaacag ttcgaagccg ttgacgttgt cgctgttgac atagccggaa 1621 acggcagctg cccaggaaga gatcggggcg atcatgcaga cgggagccgc ggtagcgtcg 1681 atgacgtaag ccagcttggc tctggagatg ttgtgggact cggtgaccgg tctcataaca 1741 gcgcctaccg ttaagcagtt gaagtagtcg tccacgaaga tgagcacgcc cagcagcatg 1801 gtcaagagct gcgcggacgc tctggacttg accttgtcct tagcccagcg gccgaatgcc 1861 tcggaaccgc cgcccttgtt catcaggtcg gagatgatgc ccagttcgac caggaagatg 1921 atgatgccca tatcccagct gtctgccagt acgcagatga gaccgtagtc agcgcctacc 1981 agagaggtga gggtgtccca agggctgaac tgcgtataga gcagcgcgcc tacgatgcag 2041 ccaaagaaca gggaggagta aacttccttg ctgatgagcg ccagaacgat ggcgcagatc 2101 ggcggaagca gagaccagaa cgtgcccgcg aatggagacg cagcgtcctc cacgaggatg 2161 ggggcgttct tgtaggacat ggccaggatc accagcagca cgatgatcgc gcagacggca 2221 accagatagg ctgtccttgt gcttttcttt tccatagaaa ataacctcct aaatgaataa 2281 agataaatag tgcggcaggt attcaaaaga tttgcggcat acctgcacgg atacattata 2341 tcatcgattt ggcatttgtg aacaaaaaaa cgatgtccgc agggcttttt tattggtctg 2401 cggttgaatt aactttttcg ccgaaaaggc atgaactatg gtataattca aataagtatg 2461 aaaacggatg tgtgtagaga tggttaccac tgttccctac gctattttta tatctcgagc 2521 aaggagagtg atgcggatgt cactggaagc catgagaatg gtcgaaaaag cggaatctga 2581 cgccagaaag atgatcgcgg acgccaaagc ggaagccaag gcggctgcgg acaacgcggc 2641 gaagtccggc agagaacgga tggacgcgga agcggaaaag gcgaggaaag ctgcggaaga 2701 tatcctggaa aacgcaaaac tcgtgggaaa agcttcctgc acggatatcg acagggcttc 2761 tgccgacgcc gtggcaagac tgcgcagcgc cgcggaaggg aaacttccgg aggctgcgaa 2821 gttcattgcg gaaaggatca cggaagacct atgagcattc agaagatgaa acggatccgg 2881 ctgatcggcc tgcgcagcga gaaagaggcg ctgctggacg agctgctccg cttcggcaag 2941 gtcgaggtct cggattatcc gcaggcggaa ggcgacgtcg tggtgttcag cacgaacaac 3001 tacgacaaga cggccatccc cgcggacatg ctggcggtga accagcagaa gctgacggcg 3061 gccctggata tcctgcagag gtacttcccg gaaaagaaga aactgctgga tcccaagccg 3121 gaagcgcctc tggagacctt cctgagcaac gcccgtctca acagctgcct gcacagcgct 3181 acccgggtca tacggctgga cggcgagatc aagaactgga cggcaaagat ccaggaactg 3241 aaggaaacgc agaccgctct gcagccctgg atggatctgg acatgccgtt ggataccgaa 3301 ggaacggaac acgtctgcgt gacgctgtgc tccctgcccg cggacgcgcc ggaggcggac 3361 gtgctctccg cgctggaata cgcggcgccg gagagcgaac tcatcccggt ctcctcggat 3421 aaattcatgc gctactgcgt gctgatctgc cacagagacg aattcgccgc ggcggaggac 3481 gcgctgcgca acttcagcta cagccccatg gagggtctga agatgagcgg cacggcgaag 3541 ctcaacgcgg accatatcgc ccacgagatc gaattcaacg aagtcaagat cgaacgggcc 3601 aaggcgaaac tgatg // LOCUS sequence081 3609 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence081 VERSION sequence081 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3609 /mol_type="genomic DNA" /organism="" /note="sequence081" misc_feature <1..714 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000076736.1:polyribonucleotide nucleotidyltransferase" /note="WP_000076736.1 polyribonucleotide nucleotidyltransferase (Bacillus cereus) [pid:63.3%, q_cov:92.0%, s_cov:30.6%, Eval:3.8e-73, partial hit]" /note="MGA_423" /locus_tag="LOCUS_3100" CDS 767..2050 /product="pitrilysin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000592996.1" /transl_table=11 /codon_start=1 /translation="MIEVRQLPCGVRLVMEKLPDRQSASIGIWIGAGSARETAKNNGVS HFLEHMFFKGTKTRDQLQLAKDTDDLGCDMNAFTGKEATCFHIKALSSVFPKAVDILLD MLCNSLFDEEEMEKERGVILEEFNMVCDTPDDYIMDLLDAKVFWRTPLAKSVLGSRANI RNLQRSDILEYIDTWYTRDNIVVSVVGNFDEERLAQQLEEKLSGFGAGSPSRKAASAAR GSRYLSLTKDINQTHLALGIPTIALDSPEYYAQAAVCDVLGGSMSSRLFQNIRERKGLA YSVFSASESYACGGQFYIYAAVKPGTEAKVLQAIGEELSALAEEGISEEQTHVVKQRLK SGFIFSLESTNSRMYRLGKNMLLLGRTYTEEETMAEIDAVSREQVNAFAKRIADIRSYS GAAISPRSLDWEELWNGSQNLNGSAKRG" /locus_tag="LOCUS_3110" /note="WP_000592996.1 pitrilysin family protein (Bacillus cereus) [pid:40.2%, q_cov:92.7%, s_cov:95.4%, Eval:1.6e-77]" /note="MGA_424" CDS 2005..2490 /product="dUTP diphosphatase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000049186.1" /transl_table=11 /codon_start=1 /translation="MERIAKFERVSEARLTEDSAHLKEAPLPIELPVRATAGSAGYDFK TPWDIHLQPGESVRIPTGLRCRIAPGWVLLIAPKSGLGFKYRLQLDNTLGVIDEDYYGA DNEGHIQIQITNDSRSGKVLEIPAGKAFAQGLFVPYGITEDDEAEGKRTGGFGSTNA" /locus_tag="LOCUS_3120" /EC_number="3.6.1.23" /note="WP_000049186.1 dUTP diphosphatase (Streptococcus) [pid:43.1%, q_cov:80.1%, s_cov:86.5%, Eval:2.0e-21]" /note="MGA_425" CDS 2500..3519 /product="deoxyguanosinetriphosphate triphosphohydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392159.1" /transl_table=11 /codon_start=1 /translation="MVFREEQEKREYEMLSAFACKSAESRGRVVPEKPCDLRTEFQRDR DRIIHSKSLRRLMHKTQVFLSPEGDHFRTRLTHTLEVAQIARTISRALGLNEDLTEAIA LGHDLGHTPFGHNGEEFLNEIHPGGFAHNVQSLRVVDVIERNAAGRTMNLTEEVRDGIV NHTGPVWPFTLEGQVVRHSDRIAYINHDIDDAMRGGIIRAEDLPAECTAFLGPDHRSRI NTLVTDIVKHSDGQDKVAMSEDAAFYMNALRDFMFANVYRSPAVKQASELDKIRGLIHS LYGYFLEHSDELPSEYRSILERDGGNEAVKDYIAGMTDRYAINMYNEKFVPSGWKLPK" /locus_tag="LOCUS_3130" /note="WP_011392159.1 deoxyguanosinetriphosphate triphosphohydrolase (Moorella thermoacetica) [pid:58.0%, q_cov:98.8%, s_cov:99.4%, Eval:2.8e-103]" /note="MGA_426" ORIGIN 1 gtcaaggaag acggcaccag cgaatacgcc atcctgtccg atatccaggg catggaagac 61 ttcctgggcg acatggactt caaggtcaca ggcaccgcgg aaggcgtcac cgccatccag 121 atggacatca aagtccacgg tctgtccaga gagatcctcg agaaggctct gaagcaggcg 181 aaggaaggca gaatgtacat catgagccag atgctcgaag agatccccga acccagaaag 241 cagctgtcca agtacgctcc gctcatcacc agcatgcaga tcgatccgga caagatccgc 301 atcgtcatcg gcaagggcgg cgagaccatc aaccgcatca tcgcccagac cggcgcgaag 361 atcgacatcg acgatacggg cctcatcttc atcgcagcgc ccaacaccga atccggcgac 421 gcggcgcgca aggagatcga gtacctcacc aaggacatcg aagtgggcga gacttatacc 481 ggtaaggtcg tccgtctgat gaacttcggc gctttcgtgg aatgcctgcc cggcaaggac 541 ggtctgctgc acatctccaa gatctgcaag gagagagtgg agaaggtgga agacgttctc 601 aatatcggcg atatcgttac cgtcaaggta tccgagatcg attcgcaggg ccgtgtgaac 661 ctcaccagaa gaggtctgga agacacgccc atcatcaaag caagcgagca gtaaacgagt 721 tcgggccggc tttttaagcc ggccctgatg cattttagga taaaacatga tcgaagtaag 781 acaactgccc tgcggcgtgc ggctggtgat ggaaaaactg ccggaccgcc agtccgccag 841 catcggcatc tggatcggcg caggctccgc cagggaaacg gctaagaaca acggcgtctc 901 gcattttctg gagcacatgt tctttaaagg cacgaaaacg cgggatcaat tgcagctggc 961 gaaggatacg gacgatctgg gctgcgacat gaacgcgttc acggggaaag aagccacctg 1021 ttttcacatc aaggcgcttt cttccgtctt tcccaaggct gtcgacatcc tgctggacat 1081 gctctgcaat tccctgttcg acgaagagga gatggaaaaa gagcggggcg ttatcctgga 1141 agagttcaac atggtgtgcg acacaccgga cgactatatc atggatctgc tggacgctaa 1201 ggtgttctgg cgcacgcctc tggcaaagtc tgtcctgggc agccgcgcga acatccggaa 1261 tctgcagaga agcgatatct tagagtatat cgacacctgg tatacccgcg acaacatcgt 1321 agtttccgtc gtggggaatt tcgacgaaga gcgtctggcg cagcagctgg aggaaaaact 1381 gtccggcttt ggtgccggca gcccttcccg caaagcagcc tctgccgcac ggggaagccg 1441 gtatctctct ttaacgaagg atatcaacca gacgcatctc gcgcttggca taccgacgat 1501 cgctctggat tctccggagt attacgccca ggccgccgtc tgcgacgtgc tgggcggcag 1561 catgagctcc cggctctttc agaacatacg ggagagaaaa gggctggcat acagcgtgtt 1621 cagcgcttcg gagagctacg cctgcggcgg tcagttctac atctacgcgg cggtaaagcc 1681 cggcacggaa gcgaaagtgc tgcaggccat cggcgaagag ctgtccgctc tcgcagaaga 1741 aggcatcagc gaggaacaga cgcatgtcgt aaagcagcgg ctgaagagcg gctttatctt 1801 ctcgctggaa tccacgaatt cccgcatgta ccggttgggc aagaacatgc tcctgctggg 1861 acggacctat acggaagaag agaccatggc ggagatcgat gcggtctcgc gggagcaggt 1921 gaacgcattc gcaaagcgta tcgcagacat ccgcagttac agcggggcag ccataagccc 1981 acgcagcctg gattgggagg aactatggaa cggatcgcaa aatttgaacg ggtcagcgaa 2041 gcgaggctga cggaagacag cgcccatctg aaagaagcgc ctcttcccat cgaacttccg 2101 gtccgcgcga cggcgggaag tgccggatac gactttaaga cgccctggga tatccatctg 2161 cagccgggag agagcgtgcg catccccacg ggactgcgct gccgcatcgc accgggatgg 2221 gtgctcctca ttgcgccaaa gagcggtctc ggctttaaat accgcctgca gctcgacaat 2281 acgctcggtg tcatcgacga agattactac ggcgcggaca acgaagggca tatccagatc 2341 cagatcacga acgattcccg gtcgggaaaa gtgttggaga tcccagccgg aaaagccttc 2401 gcgcagggcc tgttcgttcc ctacggcatt acggaggacg acgaggcgga agggaagcgc 2461 acgggcggat ttggttctac gaacgcatag gaggcagcta tggttttcag agaagaacag 2521 gaaaagcggg aatacgagat gctttctgca tttgcctgca agtctgcgga gagcagggga 2581 cgggtcgttc ccgagaagcc ctgcgacctg cgcacggaat ttcagcgcga cagagaccgc 2641 atcatccaca gcaaatccct gcgccgctta atgcataaaa cgcaggtctt cctgagtccg 2701 gaaggcgacc atttccggac gcgtcttacc cataccctgg aggtcgcgca gatcgcgcgg 2761 acgatctctc gcgcgttggg tttgaacgaa gatctgaccg aagccattgc tctgggtcac 2821 gatctgggcc atacgccgtt cggccacaac ggggaggaat ttcttaacga gatccatccc 2881 ggcggcttcg cgcataacgt ccagagtctg cgcgtcgtgg acgtgatcga acgcaatgct 2941 gcaggccgca cgatgaacct cacagaggaa gtccgggacg gcatcgtcaa ccataccggt 3001 ccggtctggc cctttacgct ggaaggtcaa gtggtgcgcc attcggaccg catcgcctac 3061 atcaatcacg atatcgacga cgccatgcga ggcggcatca tccgcgcgga ggatctgccc 3121 gcggaatgca cggcctttct tggccccgac catcgcagcc gcatcaatac gctggtgacg 3181 gacatcgtaa agcacagcga cggtcaggat aaggtcgcca tgtccgaaga cgccgctttt 3241 tacatgaatg cgctgcgcga tttcatgttc gcaaacgtgt accgcagccc ggcggtaaag 3301 caggcgtcgg aactggacaa gatccgggga ctcatccatt ccctgtacgg ctatttcctg 3361 gagcacagcg acgagctgcc ctccgaatac cgcagtattc tggagaggga cggcggaaac 3421 gaagccgtaa aggactacat cgccggcatg acggaccgtt acgccataaa catgtacaac 3481 gagaagttcg tcccttcggg ctggaagctc ccgaaataag acgggcaaaa aaaaggatga 3541 gacgctgttt tcctgtaaac agataacagg aggggaagta tggcagtcac atcgctgatc 3601 tcggcagca // LOCUS sequence082 3607 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence082 VERSION sequence082 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3607 /mol_type="genomic DNA" /organism="" /note="sequence082" CDS 171..3017 /product="molybdopterin-dependent oxidoreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392899.1" /transl_table=11 /codon_start=1 /translation="MAFTNSKTFLYNAHILKSFFEDLDRWREECACFGIRSTIEDQQYD DLFKGTDADVYIPMWASACKGHGDILIDRTTYDCIRFYKAYGYETIHMDGNPADFLGEQ LRFLEYISVCGLKGTGNAGLVIEAFIEQFTLDTVKEFCKSLRAQNAVPISEELGFVCEA LEALVRLQPKALVTEIGCDEFYCWQWSQKPPLPVEEPHIVRSAGVNNCGGNCKLEVWCA EGCVLDISADTTINGVQLRTCPRGRGYRHTFLTSHRLRYPMKRREARGSGKYKRISYEE AAKEIADKIKECGEKYGPGSRYMIYSTGVCAVARPDHLMKRLLCLDGGYLQHYNSYSSA QANYITPYIYGTERTNNHPADVMNSKLIILWGHNTAESIIGPFRNYYFAKAKEAGVRIV VIDPRNSESALTFADEWIPIKPGSDCAMANAMAFVIFQKNLQDQEFMNKFCVGFDEAHM PEGVPVGESYKSYLFGLQDGIVRDPKWAEEICGVPADKIEELAVEYATSKPASIQPGLG VQRTFIGENAIRAISALCAMTGNVGIPGGGAGGTVTPNGHYEAQEMFKPENGCTYSTPV FLWSKIIDKWETMTAEEDGIKGADKLPCGIKLMFSLASNVMMNQHSDLNDTQRILSDTS KCELIVNSDLFYTSSVRWSDIVLPGASLFETEFIPSVWNSDDYVLYANQCTQPLFGSVF EYEWMKLVAKDMGLYEAFTDGCETRQDWSRKIYNEDLLPREPELPDFDTFMERGGHMYS GPCDEPVAFRKQIRDGVPFATPSGKIEIFSKQLFDMHKPDIGGIPKWFDGPEGPTDYAG LNKYPLQLIGYHTKRRCHSIHDQNQWMEELDPPALWIHPKDAAVRGIEDGDMIEVYNDR GTVRIPAFVTDRIVRGAVALSQGGWYTPDKDGVDVRGSINVLTYAYKPSPVAKGNPQHT NLVEVRKYEAAEGQKPAK" /locus_tag="LOCUS_3140" /note="WP_011392899.1 molybdopterin-dependent oxidoreductase (Moorella thermoacetica) [pid:42.7%, q_cov:77.6%, s_cov:93.1%, Eval:2.9e-163]" /note="MGA_428" ORIGIN 1 acaacatgca gccggacctg ttcgcggtca acaagaaatt tatccgttcc tacgaaaagc 61 gcttctactg cggcgaaaag ctggtgggcg ccatcatcat cggcaatctg gcccgcatgc 121 aggaactgaa ggagaagatc ctggggatcg ctccccgtga ggtatagacc atggcattta 181 cgaacagcaa gaccttttta tataacgcgc acatcctgaa gtcgttcttc gaggacctgg 241 accgctggag agaggagtgc gcctgcttcg gcatccgcag caccatcgag gaccagcagt 301 acgacgatct gtttaaaggg actgacgcag acgtgtatat cccgatgtgg gcctcggcct 361 gcaagggtca cggagacatc ctgatcgacc ggacgaccta cgactgcatc cgtttctata 421 aagcctacgg ctacgaaacg atccacatgg acggcaaccc cgcggacttt ctcggagagc 481 agctgcgctt cctggaatac atcagcgtgt gcggactgaa gggcaccggc aatgccggcc 541 tcgtgatcga ggcgtttatc gaacagttca cattagatac cgtaaaagaa ttctgtaaat 601 ccctgcgtgc acagaacgcc gttcccatct cagaggaact gggtttcgtc tgtgaagcgc 661 tggaagcgct ggtccgcctg cagcccaagg cgctggtgac cgagatcggc tgcgacgaat 721 tctactgctg gcagtggagc cagaaaccgc ctcttcccgt cgaggagccg catatcgtgc 781 gctctgccgg ggtcaacaac tgcggcggca actgcaaact ggaagtctgg tgcgcagagg 841 gctgcgtgct ggatatctcc gccgatacaa cgatcaacgg cgtacagctg aggacctgtc 901 ccagaggaag aggctaccgg cacacgttcc ttacgtctca ccggctgcgc tatcccatga 961 agagaaggga agcgagaggc agcggcaaat ataagcgtat ttcctatgag gaagcagcga 1021 aggagatcgc agataagatc aaggaatgtg gcgagaagta cggtcccggc agccggtaca 1081 tgatctattc caccggcgtc tgcgccgtgg cgcggccgga ccatctgatg aagcgcctgc 1141 tgtgcctcga cggcggctat ctgcagcact ataactccta cagcagcgcc caggcaaact 1201 acattacgcc gtacatctac ggtaccgagc gcaccaacaa ccaccccgcg gacgtcatga 1261 actccaaact catcatcctg tggggccaca atacggcgga aagcatcatc ggaccgttcc 1321 gcaactatta cttcgccaag gcgaaggagg cgggcgttcg catcgtggtc attgaccccc 1381 gcaacagcga atccgctctg acgtttgccg acgaatggat ccccatcaag ccgggcagcg 1441 actgcgcgat ggccaatgcc atggccttcg tcatcttcca gaagaacctg caggaccagg 1501 agtttatgaa caagttctgt gtgggcttcg acgaagcgca catgcccgaa ggcgtgcccg 1561 taggggagag ttataagagc tacctgttcg gcctgcagga cggcatcgtg cgtgacccga 1621 aatgggccga agagatctgc ggcgttcctg cggataagat cgaggaattg gccgttgaat 1681 acgccaccag caagcccgcc agcatccagc ccggtctggg cgttcagcgc acgtttatcg 1741 gcgagaacgc gatccgcgcc atctcggcgc tctgcgccat gacgggcaac gtcggcattc 1801 ccggcggcgg ggcaggcggc accgttacac ccaacggcca ttacgaagcc caggagatgt 1861 tcaagcccga gaacggctgc acctattcca cgccggtgtt cctgtggagc aagatcatcg 1921 acaaatggga gaccatgact gccgaagaag acggtatcaa gggcgcggac aagctgccct 1981 gcggcatcaa actgatgttc tccctggcgt ccaacgtgat gatgaaccag cattcggatc 2041 tgaacgacac ccagcgcatt ttaagcgata ccagcaagtg cgagctgatc gtcaactccg 2101 atctgttcta tacctccagc gtccgctggt ccgacatcgt gctgcccggc gcgtcgctgt 2161 tcgagaccga gttcattcct tcggtctgga actccgacga ctacgtgctg tacgccaacc 2221 agtgcacgca gccgctgttc ggctccgtct tcgaatacga atggatgaag ctggtcgcaa 2281 aagacatggg cctgtacgaa gcctttaccg acggctgcga gacacggcag gactggagcc 2341 gcaagatcta caacgaagac ctgctgccga gagagccgga gctacccgac ttcgatacgt 2401 ttatggaaag gggaggccac atgtattccg gcccctgcga cgagccagtg gcgttccgga 2461 agcagatccg ggacggcgtg ccgttcgcaa cgcccagcgg caagatcgag atcttcagca 2521 aacaattgtt cgacatgcat aaacccgaca tcggcggcat acccaagtgg ttcgacggac 2581 cggaaggccc gacggactat gcggggctca acaagtatcc gctgcagctg atcggctacc 2641 acacgaagcg gcgctgccat tccatccacg accagaacca gtggatggag gagctggatc 2701 cgcccgcgct gtggatccat cccaaagatg ctgccgtaag agggatcgag gacggcgaca 2761 tgatcgaggt atacaacgac cgcggcacgg tgcgcattcc ggccttcgtg accgaccgca 2821 tcgtgagggg cgcggtagcg ctgtcccagg gcggctggta tacaccggac aaggacggtg 2881 tagacgtgag aggctccatc aacgtgctca cgtacgccta taaaccgtct ccggtggcga 2941 agggcaatcc gcagcacacc aatctggtgg aggtgcggaa atacgaggcc gcagaaggcc 3001 aaaaaccggc gaaataagaa gagaaaaagc cctagacgat aaatgagtcg tccggggctt 3061 tttacgtata ggaatcctcg atctttaacg acgaccacac catcatggcg atggtggagc 3121 agggactatg cgtaagcatt ctgtcggagc tgatgctgca gcccggcggt ttctggactt 3181 tttccaggag cgcatcgaaa cgctgatcta gaaagaaggc aataaaaaga accgggggag 3241 gtcctcccgg tccttttaac gtctgcagga gagctgcaga gcggccgcaa actgttgtta 3301 tttcagcaag gtgcggatgg tctcgaaagt aatgttgggt acgttcttga aggtctgctt 3361 catgtcgacg cgttcggtca ccatgtggcc gtcgcggccg aaggtgccga tgtttacgac 3421 gggtacgtcg atctcgcgga tctttgagat gtcgtggaaa tacttatact tggaggacgg 3481 catgttgtcg ttcagatcgt ccaccgtgga cgggtcaccg ccgacggcca tgaagctgga 3541 atccgcgatg tacgggtaga acatgcgggt cttgatctgt ctgccggcct cggggcggac 3601 cttctcg // LOCUS sequence083 3561 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence083 VERSION sequence083 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3561 /mol_type="genomic DNA" /organism="" /note="sequence083" CDS 449..1999 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKNIAKFSSLLLAALLLLTNLAMPAAVFAEQAPTKNGITSIEEL NGKDLGVQTGVLYEDHIKDDLEGETWYYYKMPNDMIPALESNKIAAYLIEEVGFYAQRF EHPELVRLEEPVGVSDFAVIVGNNDKQDRLFAELQEFIAQGRENGWLDKLYDYWVINWN PNTCKIENSPETTGENGTVSIAIEGGYEPFSFESNGEFSGYDVEFMMNFCAAYGYNWEF HAMEFDSIAPAVIAGKYDFGMNIVVDEERAEASVLTDPYYSCDIVFVLEGVTEDGVHFM DGIKDSFYKTFIKEDRWKLFAQGIGTTLLITLCSIAFGTLFGFAVYMLCRHGNPLANRV MNVFDGFIHGIPTVVFLMILSFVIFANSSHITAISILGFTLIFGCSMFDMLKVGNNAVH RGQAEAAKALGYSDTQSFFKILLPQAAQHFLPIYKNDVISLIKETSVVGYIAVMDLTKM GDLVRSRTYQAFFSLIAVAIIYFILEWILISIVTRVQISIDPKRRAKSKILEGIREVE" /locus_tag="LOCUS_3150" /note="WP_005903444.1 amino acid ABC transporter permease (Fusobacterium nucleatum) [pid:31.6%, q_cov:42.2%, s_cov:97.0%, Eval:3.6e-26, partial hit]" /note="MGA_431" CDS complement(2296..3033) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEVEIEGELRYRRYPNGSAVPYRISGSRKNRKRVKLDPLADRETI RILRDKTLALQAIPLLKEHIAKLEASLGFEDFNLYSLCRFLGEEFWESADFFMGRINGR IANPAFDALKERQNTYPYDSRKVTTELGIFRSKSESLEAEYIADTGCRFKYEPRIIVGS KSVCPDFAVERIWRLDIGFVEHLGLIDKPDYREKKLEDIKDMADNGIYPGIQLLILGES RKDGFDAAMAKRLIRGFCMPYMF" /locus_tag="LOCUS_3160" /note="MGA_432" ORIGIN 1 agcagatctt cgagaatccg cggcagtaca acaccaagaa attcatccag agactctcca 61 ccctcagcta ccgcatcgag tccgacgagt tcgacttcga gcccgtcatc gacgaactgc 121 aagcctacgc ggagaagctg ctcatcgaga acgagagaac gtccaaactg cagctggcac 181 tggaagagat ctgcgtcaac aacctgttcg agctcaaccg tgagccgaac atctacgccc 241 agatcgacta ctccgaaaag agcgacgtgc tgtccctgga gctcaaatat tccggcgaac 301 acttcgaccc gagagattcg gacaacgagc tgttcaacaa cattctggct gagcccacca 361 ccgagctggt ggacgaagag atcatcaatt cgccgaaatg gtacaacaac cacaccaaga 421 tcagcttcag atgggaggat taggagacat gaaaaagaat atcgcaaagt tttcttccct 481 gctgctggcg gcgctgctcc tgctgacgaa cctggccatg ccggccgccg tgttcgcaga 541 gcaggcgccc accaagaacg gcatcacctc catcgaggag ctgaacggca aggacctggg 601 cgtccagacc ggcgtgctct acgaagacca catcaaggac gacctggagg gcgagacctg 661 gtattactac aagatgccca acgacatgat cccggcgctg gaatccaaca agatcgccgc 721 ctatctgatc gaagaagtgg gcttctacgc ccagcgcttc gagcatccgg aactggtgcg 781 gctggaagag cccgtaggcg tttcggattt cgccgtcatc gtgggcaaca acgacaagca 841 ggacagactg ttcgccgaac tgcaggaatt catcgcccag ggccgggaga acggctggct 901 ggacaagctg tatgactact gggtcatcaa ctggaacccc aacacctgca agatcgagaa 961 cagtcccgag accaccgggg agaacggcac cgtatccatc gccatcgagg gcggctacga 1021 gcccttctcc ttcgagagca acggcgaatt ctccggctac gacgtagaat tcatgatgaa 1081 cttctgcgca gcttatggct acaactggga gttccacgcc atggaattcg actccatcgc 1141 gccggccgtt atcgccggca aatacgactt cggcatgaac atcgtcgtgg atgaagagcg 1201 cgcggaagcc tccgtgctga ccgatccgta ttacagctgc gacatcgtgt tcgtgctgga 1261 gggggtcacc gaggacggcg tccactttat ggacggcatt aaggacagct tctacaagac 1321 cttcattaag gaagaccgct ggaagctttt cgcccagggt atcggcacca cgctgctcat 1381 caccctgtgc tccatcgcct tcggcacgct gttcggcttt gcggtctaca tgctctgccg 1441 ccacggcaac ccgctggcca accgcgtgat gaacgtcttc gacggcttta tccacggcat 1501 tccgacggtc gtgttcctga tgatcctctc gttcgtcatc ttcgcgaact cgtcccacat 1561 taccgccatt tcgatcctgg gcttcaccct catcttcggc tgcagcatgt tcgacatgct 1621 aaaggtgggc aacaacgcgg tgcacagagg ccaggcggag gccgcgaagg cgctgggcta 1681 cagtgacacc cagagcttct tcaagatcct gctgccccag gcagcgcagc acttcctgcc 1741 gatctacaag aacgacgtca tctccctcat caaggagaca tccgtcgtcg gctacatcgc 1801 cgttatggac cttacgaaga tgggcgacct ggtgcgcagc cgcacctatc aggccttctt 1861 ctccctcatc gcggtggcca tcatctactt catcctggag tggatcctga tctcgatcgt 1921 gacccgtgta cagatctcca tcgatccgaa gcggcgcgcc aagtccaaga tcctggaagg 1981 gataagggaa gtggaatagc acagatatcc cagcattaca aaaccgcgca tcgaaaggtg 2041 cgcggttttt ggttgcgtcg gtctattttc agcggctacg gtgacccaaa gatcgatggg 2101 tcactgtaaa accgtgcccc acaggccaaa actgccccat gggtccccgt aatttgccat 2161 tttccgtgcc ccacagccta taagccgctc ttgggtcacg caaaaaccgt gaccccggca 2221 ttctggggtc acggtcgagt attcggagac acgctgaact acagatttca tccgaatccg 2281 gcatggatca tcgtcttaaa acatatacgg catgcagaat ccgcggatca ggcgctttgc 2341 cattgcggcg tcgaacccgt ctttgcggct ttccccgaga atcagcagct gaatgccggg 2401 gtaaataccg ttatccgcca tatctttgat gtcctctagt ttcttttccc gataatccgg 2461 tttgtcgatc aatcccagat gctcgacaaa cccaatgtcc aaacgccaga tccgctcaac 2521 ggcgaagtcc ggacaaacgc tcttggaccc cacgatgatc cggggctcat acttgaatct 2581 gcaccctgta tccgcgatat attccgcctc caaagactcg cttttggatc gaaaaatacc 2641 caattctgtc gttaccttcc tggaatcgta cggatatgta ttctgccttt ctttcagtgc 2701 gtcaaatgcc ggatttgcta tccgcccatt gatccgtccc atgaaaaaat ccgcagactc 2761 ccagaattct tctccaagaa accggcaaag cgaatacaga ttaaagtctt cgaaccctaa 2821 tgaagcttcc agtttcgcaa tatgctcctt cagcagcgga atcgcctgga gcgccagcgt 2881 cttatcccgt aagatccgaa tcgtttccct atctgctaac ggatccagct ttacgcgttt 2941 tcgattcttc cgcgacccgc tgatccgata cggtaccgcc gagccattcg gatacctgcg 3001 gtaacgaagt tcgccctcga tctccacctc cacagctttt tggagcttct gcagaagtgc 3061 cttttgcctt actatcgttt tttcgagatc caccacttgt atcatgacct agttatatca 3121 cagaaggtaa tatttgacaa ccattattta gcataatttc aaataatttt taatttctgc 3181 aggatccgta cggcatatac ccaaatgtaa cgttgggaag atgcctaaag tccatctaca 3241 ttggtgccac ttcgggcttt acggtgaccc aaagatggat gggtcactat aaaaccgtga 3301 cccacaggcc aaaactgccc aatgggtctc cgtaatttgc catttttcgt gacccacagt 3361 ctataaaccg ctccggggtc acgcaaaaac cgtgaccccg gcattctggg gtcacggttc 3421 ggtgcatatg tctgttacat tttatccgcc gtacaagtaa tctgctatct cagtccctgc 3481 cagaccagga tgagaatgag gatcggcagg ataaactgga agtagacctt taagcctctg 3541 gcgaacttga ggcccttgcc g // LOCUS sequence084 3550 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence084 VERSION sequence084 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3550 /mol_type="genomic DNA" /organism="" /note="sequence084" CDS 134..1030 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKFLAILLAALMIFGVTACTSSQEPAAEPEAAEGTETETEGEAA QEQLTIAPGKLSVALSPDFAPMEFVDTSKSGQDQYVGFDVTLAKFIAEEMGCELTIEPM SFDACQAAVQTHSVDMSISGFSYTPERAENFNLSDYYYAGDNETEQTIIVLAENADKWT KAEDYSGLKVGAQSASLQYNLCTAQLPSDTEIVLYADLGTAVEALRSGIVDAVAVAYGN GEAIISNNDAIAMSGFEFEVSEEAENNVIMMTKGNDALLEKVNEILAKAYDAGYYGQWY EEAKALAGIDTAEEVSY" /locus_tag="LOCUS_3170" /note="WP_010989934.1 ABC transporter permease subunit (Listeria monocytogenes) [pid:36.3%, q_cov:78.5%, s_cov:46.5%, Eval:4.0e-31, partial hit]" /note="MGA_434" CDS 1132..1800 /product="amino acid ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003358158.1" /transl_table=11 /codon_start=1 /translation="MSFFSNIVKIMSKYWRVFLIRGVGYTLALTSITVFFGAILGIFIC LARMSKSKVLNSIALNLGEIVRGTPMLLQLYVFYLGLPRLFPGIPTFVSVSIGFILNSA CYVSEVFRSGIQAVDKGQTEAARSLGLSGKQTMTKIVLPQAVKNILPALGNEFITITKD TSLASTFFVGEVMTSYLIVKGNTFLTMECLFIVAVIYYVMTLILNRVVGRMERRMRTSD " /locus_tag="LOCUS_3180" /note="WP_003358158.1 amino acid ABC transporter permease (Clostridium) [pid:45.9%, q_cov:95.5%, s_cov:96.9%, Eval:1.5e-49]" /note="MGA_435" CDS 1793..2536 /product="amino acid ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986547.1" /transl_table=11 /codon_start=1 /translation="MIKPVDLHKSFIIEGQPEPLHVLKGVNEHIEKGEVVSIIGPSGGG KSTFLRCLNLLEVPEKGQIFFEGVDITAKGIDIDVHRQKMGMVFQHFNVFPHLSVAENI TLAPVLTKKKTQAEADEMAKELLARVGLLDKWSEHPGRLSGGQKQRLAIVRALAMEPDV MLFDEPTSALDPEMVGEVLDVIKDLVKSGMTCVIVTHEMGFCREVSDRVLFMDGGNIAE EGTPEQVFNHPQNPRTAEFLSKVLY" /locus_tag="LOCUS_3190" /note="WP_011986547.1 amino acid ABC transporter ATP-binding protein (Clostridium botulinum) [pid:63.0%, q_cov:99.6%, s_cov:100.0%, Eval:1.4e-84]" /note="MGA_436" ORIGIN 1 aaattcccga taaatattta atttatgcaa aaataaccct tgactattca tttttatgca 61 atataatata cacatcagct gaaggaaaac acatcacaat agaaggaaaa cacaattaga 121 aggagacaat acaatgaaaa agtttttagc gatcctgtta gccgccctga tgatcttcgg 181 ggtcaccgca tgcacctcca gccaggaacc cgccgcagag ccggaagcag ccgaaggtac 241 cgagacggag acggaaggtg aagctgccca ggaacagctc accatagctc cgggtaaact 301 ctccgtggca ctgtccccgg acttcgcgcc gatggaattt gtcgatacgt ccaaatccgg 361 tcaggaccag tacgtaggat tcgatgttac gctggcaaag ttcatcgcag aagagatggg 421 ctgcgaactg accatcgagc ccatgagctt cgatgcctgc caggccgctg tccagacgca 481 ttctgtggac atgtccatct caggtttctc ctatacgccg gagcgtgcgg aaaactttaa 541 cctgtccgac tactattacg caggcgacaa cgaaaccgaa cagaccatca tcgttctggc 601 ggagaatgcg gacaagtgga ccaaggcgga agattacagc ggactgaagg tcggtgccca 661 gagcgcatct ctgcagtata acctctgcac ggctcagctg ccttccgata cggagatcgt 721 gctgtatgcg gatctgggaa cggctgtgga agccctgcgc agcggtatcg tagacgctgt 781 agcggtcgcc tacggcaacg gggaagccat catttccaat aacgacgcca tcgccatgag 841 cggcttcgag ttcgaagttt ccgaggaagc ggaaaacaac gtcatcatga tgaccaaggg 901 caacgatgca ctgctggaaa aggtgaacga gatcctggcc aaggcctatg acgccggcta 961 ttacggtcag tggtatgaag aagcgaaggc tcttgccggt attgatacgg cagaagaagt 1021 cagctactag agcggtagag aatcgaaaac agattcggat cagacaggcg ggctgctcct 1081 cctcaggcgg cccgcttctc tgtcacattc atcagtttca ggagggattc cgtgagtttt 1141 ttttctaaca tcgtcaagat catgtcgaaa tactggaggg tgttcctgat ccggggcgta 1201 ggctataccc ttgccctgac ttcgatcacc gtctttttcg gcgcgatcct gggcatcttc 1261 atctgccttg cccgcatgtc gaagagcaag gtgctgaaca gcatcgcctt aaatctgggt 1321 gagatcgtcc gcggcacgcc catgctgctg cagctgtacg tcttttatct gggcctgccc 1381 aggctgtttc cgggcatccc gactttcgtg agcgtcagca tcggctttat cctcaacagt 1441 gcctgctacg tgtcggaagt gttccgttcc ggcatccagg cggtggacaa gggtcagacg 1501 gaggcggcca gaagcctcgg cttaagcgga aaacagacca tgacgaagat cgtgctgccc 1561 caggccgtca agaacatcct gcctgcgctg ggcaacgagt tcatcaccat caccaaggat 1621 acctctctgg catctacctt cttcgtaggc gaggtaatga cctcctatct gatcgtaaag 1681 ggaaatactt tcctcaccat ggaatgcctg tttatcgtgg ccgtgatata ctatgtgatg 1741 accctcatcc tcaaccgggt agtgggccgc atggagagga ggatgcgcac cagtgattaa 1801 accggtagac ctgcataaaa gttttattat agaagggcag ccggagcccc tgcacgtcct 1861 gaaaggggtc aacgagcaca tcgaaaaagg cgaggtcgtc tccatcatcg gcccgtccgg 1921 cggcggcaag agcacgtttc tgcgctgctt aaacctgctg gaggtgccgg agaaaggcca 1981 gatcttcttc gaaggggtgg acattacggc gaagggcatc gacatcgacg tgcaccgtca 2041 gaagatgggc atggtgttcc agcactttaa cgtatttccg cacctgagcg tcgcggagaa 2101 cattacgctg gcgccggtcc tcacgaaaaa gaagactcag gcggaagccg acgagatggc 2161 gaaggaactg ctggccagag tcggtctgct cgacaagtgg agcgagcatc ccggacggct 2221 gtccggtggg cagaagcagc gtcttgcgat cgtgcgggcg ctggcgatgg agcccgacgt 2281 catgctcttc gacgaaccga cttcggcgct tgacccggag atggtcggcg aagttctgga 2341 cgttatcaaa gacctggtga agtccggcat gacctgtgtg atcgtgaccc acgagatggg 2401 tttctgccgg gaagtctccg accgcgtgct gtttatggac ggcggcaata tcgccgaaga 2461 gggaacgccg gaacaggtgt tcaaccatcc gcagaatccc agaacggcgg aattcttaag 2521 caaagtactc tattaaaaaa ttgacacaag gggacaggtc cactgtgttt gcacattgta 2581 cctgtccccc tgtgttatgt ttatgatata atccctgtat gtcctttgca tccgatgtaa 2641 aaaatgaact gaccagaacc gtgccggaga agaaatgctg ccaactggcg gagatcgctg 2701 gctttttgcg ttttgcgggg agcatcacgc tgtcctcggg gcgcatgggc attaaggtga 2761 ccacggacaa tgcatctgcc gcccggctgt tcatccggct tgtaaaggag tatttcggcg 2821 cgaagacggc gctctccctg ggcgaaccca cgccgctggc aaagggccgc gtctacgagc 2881 tcaccgttac cccggagatg aattccgaac agatcctgcg ggaagtgggc atcttaggcg 2941 taaaggaagg cagcaattac attacggatg gtttcgacgc tgcgatcgtg cgcaagcgct 3001 gctgcaaaaa ggcggcactg cggggcgcgt ttctggcatg cgggtcggtg tccgatccgg 3061 tgaaaggcta tcacctggag ctggtctgcg gctcggacta catggcgcag gtcatgcgca 3121 gggtcgtcaa cagcttcggt ctgaaggcaa agacggtaaa gcgccgcaac aagcacgtgg 3181 tctacctgaa ggacagcgaa cagatcgggg atttcctcaa catcatcggc gcgacgtcga 3241 tgtactttca gtatcaggaa gtgcggatga cgaaggaaaa cctgaacaag gccaaccgta 3301 tcgccaattg cgagagcgcc aacgtggata aacaggtgag cgctgcccag aaacaactgg 3361 ccgatatccg ggtcatcgag gagacgaaag ggctgggagc gctgtccgcc gcgctgcagg 3421 aaacggcaca gatgcgaaag gaacatccgg agctctccct ggcagatctg gcggaactgt 3481 tcgatccgcc cctgaaaaag tccggactca accacagatt tgcaaaatta gcagaagaag 3541 caaacaagat // LOCUS sequence085 3550 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence085 VERSION sequence085 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3550 /mol_type="genomic DNA" /organism="" /note="sequence085" misc_feature <1..708 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012583434.1:amidohydrolase" /note="WP_012583434.1 amidohydrolase (Dictyoglomus turgidum) [pid:36.6%, q_cov:90.2%, s_cov:42.2%, Eval:3.4e-34, partial hit]" /note="MGA_438" /locus_tag="LOCUS_3200" CDS complement(705..1442) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEDYKFTRDTYMDAYNTDIARRATAGGVLRQFNETATRNMAHFGP SYDELLDSGRALMVSRMDIEILQPPMMEEPIQASTWPVLPKGAVIHRCYEIAKDGAVLA RGSSDWALVEIESRKILRMTQETFPNYRYGDYVPLFDKKLHIDHDTAEAMENVGSHRVT LRDCDCNGHINNTYYLDILCDLIPELYDYEHHWVRSARIHFAKEAPLGSEITIRRCKED NIYLFQTFLEDGSLNIECQIELA" /locus_tag="LOCUS_3210" /note="MGA_439" CDS 1564..2091 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="METKRLILRPSVFEDCVRFAEMEGTAGVRKGFTMSKDWDYNKIAP DFVKKSLDDTCEQWTIVLKETGKIIGRVIICDINEHYDSLDITRIYIGEDDLRGKGLGR EALEALLAYSFNEKHMERVTLDYVTGNEASDLYRSVGFKDEGNAVHCGKKDGYYVDLHK MAILSGEYYGRE" /locus_tag="LOCUS_3220" /note="MGA_440" CDS 2098..2547 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKTINATVKSREEQVVHGLWVRSTLNSSGTEWENLMRLYSKRSG DMGIRFVIRENTDEKRDCDLFCGGLTGGEDISDFTILAGEYVSVTVTPKFGLFWGSAIE EAEVYLRDEWPKQSGRKLDDFHMEIRDMMGKKPSLEILYRLLPEE" /locus_tag="LOCUS_3230" /note="MGA_441" CDS complement(2619..2807) /product="50S ribosomal protein L28" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003416297.1" /transl_table=11 /codon_start=1 /translation="MSRKCEICGKGQVSGNNVSHSNRHTRRKWNANIQSVRVEENGTVV RKNVCTSCIRSGKVTRA" /locus_tag="LOCUS_3240" /gene="rpmB" /note="WP_003416297.1 50S ribosomal protein L28 (Clostridioides) [pid:56.5%, q_cov:100.0%, s_cov:100.0%, Eval:2.9e-16]" /note="MGA_442" CDS 2979..3410 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLTQIKNNMGTLTVSRQIIDQIIEHAFEPLEGKLWLANYRGAVSD VLVKLGGFDAIAEKKVEMHGDKLFIRLYVVSRLGESITENCVLVMQRIAKDVTQLLELS LENIEIRITGTVSKNNNIAKRDLSVDLHQMLNYRKISYE" /locus_tag="LOCUS_3250" /note="MGA_443" ORIGIN 1 ggcgttctct attacagcga tgaaaaggtg atcgaattct gcaaggcagc caaccgcgca 61 ggactgcaga tcgagatgca cgccatcggc gaccgcgcgt tcgaccaggc ctgccgggcg 121 atcaaggcag cgctggacga cttccccaga gaagatcacc ggcatggcat catccacgcc 181 tgcctgacga cggagtgggg cagacacgtc tgcatggact ataacatcca gctcccgatg 241 caggtcgcct tcgacaactg gcggcaggag ccggcggaat acacggaagc gatcctggga 301 aaagagcggg cggcaagcct caatcccatc cgcaccttta aggatctggg ctgcacggtg 361 tccttcagct ccgacggacc ctgcacggcg cccgatccca tcgtctggct ggataaggcg 421 gtcaactaca gcaatcccga agagcgcgtg agcattcagg atgcgctgcg catgtccacg 481 tataacggat actgggcgac gttcgacgaa aagcagagag gttctctgga aggcggcaag 541 atcgcggata tggtcgtgct gtcggaaaac ccctacgaga tcccggccga acggatccgc 601 gaattaaaag tcgagcgcac catcctggcc ggaaagcctt acgcaaaaca aaaaggcggg 661 tttgtaccca ccattttgaa aggcatcgcc ggaaacggta atttctaggc gagctcgatc 721 tgacattcga tgttcagaga accgtcttcc aggaacgtct ggaagagata gatattgtct 781 tctttgcagc gccgtatggt gatctccgat cccagcggcg cttcttttgc aaaatggatg 841 cgagcggacc gcacccagtg gtgctcataa tcgtagagct ccgggataag gtcgcacagg 901 atgtccagat aataggtgtt attgatgtga ccgttgcagt cgcagtcccg cagggtgacc 961 ctgtgagaac ccacgttttc catggcttcg gcagtgtcgt ggtcgatgtg gagcttcttg 1021 tcgaagaggg ggacataatc cccatatctg taattcggaa aagtttcctg ggtcatgcga 1081 aggatcttgc ggctttcgat ctccaccagc gcccagtcgg aactcccgcg ggcgagaact 1141 gcgccatcct ttgcgatctc gtagcagcgg tggataacgg cgcctttggg gaggacgggc 1201 caggtgctcg cctggatagg ctcctccatc atgggcggct gcaagatctc gatatccatc 1261 cgcgatacca tgagcgctct gccggaatcc agcagttcgt cgtagctggg gccgaagtgc 1321 gccatgttcc ttgttgccgt ttcgttaaac tgtctcagca cgccgccagc cgtcgctctt 1381 ctggcgatat cggtgttgta ggcgtccatg tatgtgtctc ttgtgaattt gtaatcttcc 1441 attggctctc tctttctcgt ttcagacgac ttattatatc ggtttgcaat ggacaactca 1501 accacagact tggtttttta tgaggcagaa ggtataatat tatgcgaaaa ggagatgcgt 1561 gttatggaaa cgaaacgact catcctccgt ccttcggtct tcgaggactg cgtgcggttt 1621 gccgagatgg aaggcaccgc cggcgtccgc aagggtttta ccatgagcaa ggactgggat 1681 tacaataaga tcgcgccgga tttcgtaaag aaaagtctgg acgatacctg cgagcagtgg 1741 accatcgtgc tgaaggagac cggaaagatc atcggccggg tcatcatctg cgatatcaac 1801 gagcactacg attcgctgga tatcaccagg atctacatcg gcgaggacga tctgcgcggc 1861 aaagggctgg gcagggaggc gctcgaagcg ctgcttgcct acagctttaa cgagaagcat 1921 atggaaaggg tcaccttgga ctacgtgacc ggaaacgaag cctcggatct gtaccgcagt 1981 gtcgggttta aagacgaagg caacgccgtg cactgcggta aaaaagacgg ctactacgtg 2041 gatctgcaca agatggcgat cctcagcggc gagtattacg ggagagaata agatagtatg 2101 gcgaaaacga taaacgcgac ggtcaagtcg agagaagaac aagtcgtaca cgggctctgg 2161 gtccggtcca cgctgaattc ctccggtacg gagtgggaaa acctgatgag actctactcc 2221 aagcgttccg gggatatggg gatccgtttc gtcatccggg aaaataccga tgagaagagg 2281 gattgcgacc ttttctgcgg cggtctgacc ggcggagagg acatcagcga ttttacgatc 2341 ctggcaggag aatacgttag cgttaccgta acgccgaaat tcggcctgtt ctggggctcc 2401 gccatcgagg aggcggaagt ctacctccgg gacgaatggc cgaagcagag cggccgcaag 2461 ctggacgatt tccacatgga gatccgggac atgatgggga agaagccctc gctggagatc 2521 ctgtaccgtc tgctgccgga agaatagggc tcgccgcacc ggcaaatgcg cacgaaaaaa 2581 ccgcctgaac gctcaggcgg tttttagatt cgtttttctt acgctctggt aactttgccg 2641 gaacggatgc agctggtgca gacgttcttt ctgacgacag tgccgttttc ctcaactctt 2701 acgctctgga tgttagcgtt ccactttctt ctggtgtgtc tgttggagtg ggaaacgttg 2761 ttgccggata cctggccctt accgcagatc tcgcactttc tggacatgtt ctgaacctcc 2821 tttaataccc cgaaaagggt tgaaattatt gcttttaaac gcctttcgag gcggtgtcta 2881 tgatttcaga caggtgatat tgtaccacag caattcattt gaggcaacaa ttttttgcag 2941 ggctatggta caatattttt gtttacggga ggaaaggcat gctgacccag atcaagaaca 3001 atatgggcac gctcacggtg agccgccaga tcatagacca gatcatcgaa cacgccttcg 3061 aaccgctgga gggaaaactc tggctggcga attaccgggg cgccgtttcg gacgtcctgg 3121 taaagttggg cggattcgac gccatcgcgg agaagaaagt ggagatgcac ggcgataaac 3181 tgtttatccg tctgtatgtc gtatcccgtc ttggcgagag cattacggaa aactgtgtgc 3241 tggtgatgca gcgcatcgcg aaggacgtga cgcagctgct cgagctttcg ctggaaaaca 3301 tcgagatccg gatcacggga acggtgtcta agaataacaa catcgcgaaa cgggatctgt 3361 ccgtggatct ccatcagatg ctcaactacc ggaagatcag ctatgagtaa aggcgttacg 3421 aagatagaac tgaattcccc catggaagac ctgaaaggcg tggggcccaa gaaggcgcag 3481 tgcttcgcga aagcgggtat cctgcgtctt tccgacatgc tctggaactt tcccagggat 3541 tatgaggacc // LOCUS sequence086 3514 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence086 VERSION sequence086 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3514 /mol_type="genomic DNA" /organism="" /note="sequence086" CDS 170..622 /product="arginine repressor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965374.1" /transl_table=11 /codon_start=1 /translation="MRYARHQKILELINAHEIDTQERLAEKLRESGFNVTQATVSRDIK ELQLVKHAGPSGRSCYTQNRSTDAPVSERFRKILRETILSISAAENIIVIKTLSGCANA AAEAIDTTNFPEIIGTLAGDNTIFMVISSKEAVPALMDQFSEMTAK" /locus_tag="LOCUS_3260" /note="WP_010965374.1 arginine repressor (Clostridium) [pid:48.3%, q_cov:98.0%, s_cov:98.0%, Eval:5.5e-33]" /note="MGA_445" CDS 631..2286 /product="DNA repair protein RecN" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583410.1" /transl_table=11 /codon_start=1 /translation="MISHISIKDFAIIKELELDLHPGLNIITGETGAGKSIVIEAVSMA LGSRADTDYIRTGADKASITLTADMDAVSVGNLLEEAGVPADDPLIIRREISSGSKSLC RVNGTIVPLSFLNRLCRHVADIHGQYDNQTLLNTDHHVEVLDLYAGEETQNVRRMVCGF YRDLTKAKADLQALEKKLADSERQKDLTRYELQEIEAAGLTAGEDEALEDEIRLMQNSE EIYNTLSQVYDAVYDSDDSASGRLSSCLSSLESISSYSKDLSDAAQQFSDAYYALDDLG RDLRRLRDSVSFSPEELEEKMERLDLIDRLKRKYGGSLDAVFAYREKAEKELRTIENAD AELEDLKSKCRLYREQYETSAARLSVLRKRAAKDLQQAVDKELAELNFQDAALSVSVEP SEASERGSDNVEFLIRTNKGEAFKPLAKIASGGELSRIMLGLKRILAGLDHIPTLIFDE IDAGISGATAGVVGEKLRSIAADHQIVCITHLPQIAALGDHHYRIEKISDEISTHTTVV PLSEEERVEELARLLSGTQITESARQQARELLKR" /locus_tag="LOCUS_3270" /gene="recN" /note="WP_012583410.1 DNA repair protein RecN (Dictyoglomus turgidum) [pid:36.1%, q_cov:99.6%, s_cov:96.7%, Eval:3.2e-100]" /note="MGA_446" CDS complement(2343..3170) /product="ribosome biogenesis GTPase YlqF" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861161.1" /transl_table=11 /codon_start=1 /translation="MEHINWYPGHMKKTRELIQENLKLVDVCVEVLDARIPVSSRNPIL AELTANKIRVLVLNKSDLADEAKTAEWAEKLRQDGAYVLVTNCNTGAGSAALVKLLEKI RDEKNEGRERKKDLRLMIVGIPNVGKSSLINRLTGKKAAKTGNKPGVTRGKQWISLGEH MMMLDTPGILWPKFEDPKVGLNLAFCGSIKDEIMDLETLGMELIGVLARDYPDLLSVRY KLEEIAETPLENMENISLKRGFILPGKRIDYERTARTVIDEFRAGTIGRITLE" /locus_tag="LOCUS_3280" /gene="ylqF" /note="WP_011861161.1 ribosome biogenesis GTPase YlqF (Clostridioides difficile) [pid:53.6%, q_cov:99.3%, s_cov:95.8%, Eval:9.1e-80]" /note="MGA_447" ORIGIN 1 ggggtctatt cctaatatgc ggatcatccg aaaagcgcct ttcttttgcg attttgcaga 61 attcatttga ttttatcata ttttctatgc tttgtatagt tggcaagacc gccatggtat 121 gttatagtta gtgtgcatta ttgtatattt atgcagtcag gaggagaaga tgcgttacgc 181 aagacaccag aagatccttg agctgatcaa cgctcatgag atcgacactc aggaaaggtt 241 ggctgagaaa ttgcgtgaat cgggcttcaa cgtaacacag gctaccgtat ccagagacat 301 caaagaactg cagctggtaa aacacgccgg tccgtccggc cgcagctgct acacccagaa 361 ccgctccaca gatgctcccg tcagcgaaag attccgcaag atcctgcgcg agacgatcct 421 cagcatcagt gcagcggaga acatcatcgt catcaagact ttgagcggct gcgccaatgc 481 ggctgccgaa gccatcgata cgacgaattt ccccgaaatc atcggcaccc ttgccggaga 541 caacacgatc ttcatggtca tctcctccaa ggaagccgta ccggccctca tggaccagtt 601 tagcgaaatg actgcaaaat aaaggataaa atgatttcac acatctctat caaagatttt 661 gccattatca aagaactgga attggatctg caccccggtc tcaacatcat cacaggcgag 721 accggcgcag gaaaatcgat cgtcatcgaa gccgtctcca tggctctcgg aagccgtgcc 781 gacaccgact atatccgcac aggtgcggac aaagcatcca tcacgctcac ggcggacatg 841 gacgctgttt ctgttggcaa tttactggag gaggcgggcg ttcccgcgga tgaccctctg 901 atcatccgca gagagatctc ttccgggagc aaaagtctgt gccgggtcaa cggtaccatc 961 gttcccctct ccttcctcaa ccgtctttgc cgccacgtgg cggacatcca cggacaatac 1021 gacaatcaga cgctgctcaa tacggatcat cacgtcgaag tgctggatct gtacgcagga 1081 gaagaaacgc agaacgtgcg acgcatggtc tgcggttttt atcgcgacct gacgaaagcg 1141 aaagcggatc tgcaggctct tgagaaaaag ctggcggaca gcgaacggca aaaagatctt 1201 acgcgatacg aactgcagga gatcgaggcg gcaggcctta cggcaggcga agatgaagcg 1261 ctcgaagatg agatccgcct gatgcagaac agcgaagaga tctataacac gctgagccag 1321 gtctacgacg cggtgtatga cagcgacgac agcgcctccg gcaggctgag cagctgtctg 1381 tcttcccttg agagcatctc ctcttattcc aaggatctct ccgatgcggc gcagcagttc 1441 tccgacgcct actacgcatt ggacgatctg ggcagagatc tgcgcagact gcgcgattcc 1501 gtcagtttct ccccggaaga actggaggaa aagatggagc ggctcgatct gatcgaccgg 1561 ttaaagcgca aatacggcgg cagcctggat gcggtcttcg cctaccggga gaaagcagaa 1621 aaggaattgc gcacgatcga gaacgctgac gcggaactgg aagatctaaa gagcaagtgc 1681 agactgtacc gcgaacagta cgagacctcc gcagcgaggc tgtccgtgtt aagaaagcgc 1741 gctgccaagg atctgcagca ggccgtggat aaagaactgg cggaactgaa cttccaggac 1801 gccgccctct ccgtctccgt agagccatcc gaagcttcgg aacgcggcag cgacaatgta 1861 gagtttctta tccgcaccaa caagggagaa gcctttaaac cgctggccaa gatcgcttcg 1921 ggcggcgaac tgtcccgcat catgctggga ctgaagcgga tcctggcagg tctggatcac 1981 attccgacgc ttatcttcga cgagatcgac gccggcatct ccggcgctac ggcgggcgtc 2041 gtaggagaaa aactgcggtc catcgcagcg gaccatcaga tcgtctgcat cacccacctg 2101 ccccagatcg cagcgctggg agaccaccac taccggatcg agaagatctc cgacgagatc 2161 tccacgcata cgacggtcgt tcccctctcg gaggaagagc gggtggaaga gctggcccgc 2221 ctgctttccg gcacgcagat caccgaaagc gcaagacagc aggccagaga gctgttaaag 2281 agatagcaaa tgatcaaacg gggacggttc tttgtcttaa agaaccatcc ccgttttatt 2341 gtctattcca atgtaatgcg tcctatcgtg ccggctcgga actcgtcgat gacggtcctg 2401 gccgttctct cgtagtcgat ccgcttgccg ggcaggataa acccacgctt gagcgagatg 2461 ttctccatgt tttccaacgg cgtttctgcg atctcctcca gcttataccg gacggagagc 2521 aggtccggat agtctcttgc cagcacgccg atgagctcca tgcccagcgt ctccagatcc 2581 atgatctcgt ccttgatgga accgcagaaa gcgagattca gccccacttt cggatcttcg 2641 aacttcggcc acaggatgcc gggggtatcc agcatcatca tgtgctcgcc cagagagatc 2701 cactgctttc cccgggtcac gccgggttta ttgccggtct ttgccgcctt tttccccgtc 2761 agccggttga tgagcgacga tttgcccacg ttgggaatgc cgacgatcat cagccgcaga 2821 tctttcttgc gttccctgcc ctcgttcttt tcgtcccgga tcttctccag cagttttacg 2881 agcgctgcgc tgcctgcgcc ggtattgcag ttcgtcacca gcacataggc gccgtcctgc 2941 ctcagctttt ccgcccattc cgccgtcttc gcctcatccg ccagatcgct cttgttgagc 3001 accagcacgc ggatcttgtt cgcggtcagc tccgccagga tgggattgcg gctcgacacg 3061 gggatgcggg catccagcac ttccacgcag acgtccacca gttttaagtt ttcctggatg 3121 agttcccggg tctttttcat gtgacccgga taccagttga tatgttccat aatcttttct 3181 taaagcacta cgcgtgccag agcagcgtgg acagatacag gataaagggg atcgttacga 3241 tcgaaagcag tgtggagatg atgaccgttt ccaccgcata aggatagtcc ttgccgtgca 3301 gctgcgcgta gaccgccacg tttgagccca ccgggcaggc ggcgacgatc agcagcaccg 3361 ttttcatgac gtacatggag gaaggcagca gcgacaggat gagcagcgac agcacaggga 3421 tcaccagcag gcgaagcgcg gagaccagat acagcgtcct gcgcccgaac atcttcacca 3481 gatccgtttg cgccagatag acgccgacag tgaa // LOCUS sequence087 3496 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence087 VERSION sequence087 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3496 /mol_type="genomic DNA" /organism="" /note="sequence087" CDS 178..1770 /product="peptide chain release factor 3" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003704258.1" /transl_table=11 /codon_start=1 /translation="MDTKELQKQIERRRIFGIISHPDAGKTTLTEKLLLHGGAIREAGT VKARRNSKFATSDWMEIEKQRGISVTSSVMQFEYGGKVISIMDTPGHNDFGEDTYRILT SVDSAVMVIDAAKGIEAQTKKLFAVCRMRGIPVFTFMNKLDREARDPLELIGELEDILG MPATAVTWPIGSGLNFQGVYNILKNEVYLYKEKETLKLDDSGVNDPRLDGIITQFNIKA LREEMELLEGAGYPMDEEAVLAGELTPVFFGSALADFGVTAFLEHFLEMSPAPGPRKLA DGGSVNPTDPEFSGFIFKIQANMNPAHRDRLAFFRICSGEFTRGMTATLARTGKPIKLA QSTQLMANERENVEKAQAGDIIGIYDTGNFQIGDTLYTGKQELFFEPLPTFPPELFALV APRDTMKTKQFHKGVQQLAQEGAIQVYHNEYNEIYIGAVGQLQFEVFQYRLENEYNAQV RMTPQELTVARWVLEADRDKVKSTLDSRSRLVFDRFERPLILFANQFTLSYYQEKHPDI KLTEAMDLKDPGK" /locus_tag="LOCUS_3290" /note="WP_003704258.1 peptide chain release factor 3 (Ligilactobacillus salivarius) [pid:58.0%, q_cov:98.1%, s_cov:99.4%, Eval:5.6e-171]" /note="MGA_449" CDS complement(1830..3221) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNNDYGYNNKYSNKDPKKKRSGKFMEFVVKYNKIGWVLLIVLALY LGRGTLSRTINTFRNWEDIQEAKGDVILMQRLFNADRFYLEDPAEYSDVVVLENGTYSH NLRVGSDITLEQEKFEFENGDVFRHVTLPYVDTLDIMEVETLKMFTRYKYRSGSVYFYD TEKSEWSQINTLRGGTQLPQNTLMYFVFDDAYYVLFDPLYTYEEVDDGVWEAMDELTLL SHTNRQGGGWDIISPYYVREGMVSQNWTLESSQPLVDLESGELLPGMDHTEKELILMGL GLGNGFRWLSDGYYASVPEGYTPYGEGYYYRSDDTEQLDLLLAAEESRTASELAFIQLY KIAQNINENGYFDVPVQDTQLYNEYGIRYGYADLGANAQIGQRLVTAAQRYGKDAFEPA IRALADFYAARLAEGTLPEYWHYKGEIQTVPASADTLKETARFLAAAGELLGESSYAEL ADSLM" /locus_tag="LOCUS_3300" /note="MGA_450" ORIGIN 1 aaatgcattt ctattatacc ttatgaaccc catctgtgct aaaataaatt gttatggtca 61 agaacaaaac gcggaaaaat aaagatttgg gtcgaagact tctccggtta agtccgccct 121 aacggtgcga aaaacgcatc cgttttttct gtgtttattt ataaggaatc gattatcatg 181 gatacgaaag aattacaaaa acagatcgaa agacgccgca tcttcggcat catctcccac 241 ccggacgccg gtaagaccac tcttaccgag aaactgctgc tccatggcgg cgccatccgg 301 gaagcaggca ccgtaaaggc ccgcagaaac agcaagttcg caacctctga ctggatggag 361 atcgaaaagc aaagaggcat ctccgtcacc agctccgtca tgcagttcga atacggcggc 421 aaggtgatct ccatcatgga tacgccgggt cacaacgact tcggcgaaga tacctaccgc 481 atcctcacct ccgtggactc cgcggtgatg gtgatcgacg cagccaaggg tatcgaagcc 541 cagacgaaaa aactgttcgc ggtctgccgc atgcggggca tccccgtgtt caccttcatg 601 aacaagctgg accgggaagc cagagacccg ctggaactca tcggagaact ggaggacatc 661 ttaggcatgc ctgcaacagc cgtcacctgg ccgatcggaa gcggactcaa cttccagggc 721 gtctacaaca tcttaaagaa cgaagtctat ctttataaag aaaaagagac cctcaaactg 781 gacgattccg gcgtaaacga cccccgtttg gacggtatca tcacccagtt caatattaag 841 gctctgcgcg aagaaatgga gcttctggag ggcgccggct accccatgga cgaggaagcg 901 gtgctggctg gagagcttac gcctgtgttc ttcggatctg ctctggcgga tttcggggtc 961 accgcgttcc tggagcattt cctggagatg tcccctgccc ccggcccgag aaagctggcg 1021 gacggcggca gcgtaaaccc gacagatccg gagttttccg gcttcatctt caagatccag 1081 gccaacatga atcctgccca cagagaccgc ctcgccttct tccgcatctg ctccggcgaa 1141 ttcacccggg gcatgacggc aacgctcgcc cgcaccggca aacccatcaa actggcgcag 1201 tccacccagc tgatggccaa cgagcgcgaa aacgtggaga aagcccaggc cggcgacatc 1261 atcgggatct acgataccgg caacttccag atcggcgaca cgctgtacac ggggaaacag 1321 gagctgttct tcgagcccct gcccacgttc ccgccggaac tcttcgcgct ggtcgcgccc 1381 cgcgacacca tgaagaccaa gcagttccac aagggcgtgc agcagctggc ccaggaaggc 1441 gctatccagg tctaccacaa cgagtacaac gagatctaca tcggcgccgt cggacagctg 1501 cagttcgaag tgttccagta ccgtctggag aacgagtaca acgcccaggt ccggatgacc 1561 ccgcaggaac tcaccgtagc ccgctgggtg ctggaagcgg accgggacaa ggtcaagtcc 1621 acgctggact cccgcagcag gctggtgttt gaccgcttcg agcggcccct catcctgttc 1681 gcgaaccagt tcaccctctc ctattatcag gagaagcatc cggacatcaa actcacggaa 1741 gccatggatc tgaaggatcc cggaaaataa agacatacaa gaaagaccgg aggatcatcc 1801 tccggtcttt ttatatcgat tttatcgtat tacatcagcg aatccgccag ttccgcatag 1861 gaactttctc ccagcagttc tcctgctgcc gccaggaaac gcgctgtttc cttcagggtg 1921 tccgcggatg cgggcaccgt ctggatctcg cccttatagt gccagtattc cggcagcgtt 1981 ccttccgcga gacgggccgc atagaagtcc gccagtgcac ggatcgccgg ttcgaacgcg 2041 tccttgccat accgctgcgc tgcggtcacc aggcgctgtc cgatctgtgc gttcgccccc 2101 aggtctgcat atccgtaacg gatgccgtat tcgttataca gctgcgtatc ctggaccgga 2161 acgtcaaaat aaccgttctc gttgatgttc tgtgcgatct tgtacagctg gataaaggcc 2221 agttccgaag cagttctgct ctcttccgcc gcaagcagca gatcgagctg ctccgtatcg 2281 tcgctgcggt aataataccc ttcgccgtag ggcgtgtacc cctccggaac ggaagcgtaa 2341 tagccgtccg acagccaacg gaaaccgttg cccaggccca gccccatcag gatgagttcc 2401 ttttccgtat gatccatgcc ggggagaagt tctccgctct ccagatccac cagaggctgg 2461 gaagattcca gcgtccagtt ctggctcacc atgccctccc gcacgtaata cggcgagatg 2521 atgtcccagc cgccgccctg gcggttcgta tgggacagca gtgtgagttc gtccatcgcc 2581 tcccagacgc cgtcgtccac ttcctcgtag gtataaagcg gatcgaacag aacgtagtag 2641 gcatcgtcga agacgaagta catcagggtg ttctgcggaa gctgtgtacc gccgcgcagg 2701 gtattgatct ggctccattc gctcttttcc gtgtcgtaga aatagaccga gccggatctg 2761 tatttatagc gggtgaacat cttgagcgtc tccacttcca tgatgtccag cgtgtctacg 2821 tacgggagcg taacgtggcg gaacacgtcg ccgttttcga actcgaattt ttcctgttcg 2881 agcgtaatat cgctgccgac gcgcaggtta tggctgtacg tgccgttttc cagaacgacg 2941 acgtccgaat actccgcagg atcttccagg tagaagcggt ccgcgttgaa cagccgctgc 3001 atcaggatga cgtcgccctt tgcctcctgg atatcctccc agttgcggaa ggtattgatc 3061 gtgcggctca gggtgccgcg tccgagatag agggcaagaa cgatcaggag cacccagccg 3121 atcttgttgt atttgacgac aaattccatg aatttgccgc tccttttctt cttgggatcc 3181 ttattgctgt atttgttgtt atatccgtaa tcgttgttca ttccatcctc ttttcgataa 3241 atgccagcat tctcgtgctg tctttacagc gtctgtaaga ccagaacatc tccggttcgc 3301 agcaggtgca atggggcgat atttcgatct tcgtgacccc ttccagcatc agcagttcgg 3361 cgttgatccc tttgagatcc agccgcggcc ttccgccggg atggcagtat acgtagtctt 3421 ccgcccacca gaacgcatcc gtaaactgtt ccgccacgtc cggaccgacc tcgaagcagc 3481 aggcgccgat cccggg // LOCUS sequence088 3491 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence088 VERSION sequence088 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3491 /mol_type="genomic DNA" /organism="" /note="sequence088" CDS complement(397..792) /product="Fe-S cluster assembly scaffold protein NifU" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003391905.1" /transl_table=11 /codon_start=1 /translation="MALYSDKVMDHFRNPRNVGVIEDADGIGEVGNTMCGDIMKIYLKV SDDGIIEDVKFETFGCGSAIASSSMATELIKGKPISEAMELTNKAVAEALDGLPAHKMH CSVLAEEAIQAALEDYQNKKLAGKLQA" /locus_tag="LOCUS_3310" /gene="nifU" /note="WP_003391905.1 Fe-S cluster assembly scaffold protein NifU (Clostridium) [pid:76.5%, q_cov:90.8%, s_cov:83.1%, Eval:1.2e-46]" /note="MGA_453" CDS complement(805..1995) /product="cysteine desulfurase NifS" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986887.1" /transl_table=11 /codon_start=1 /translation="MNIYADNAATTRMSKTAIDAMIPYMGEIYGNPSSLHTVGQKANEA LQSARERVAKIFNCSAREILFTSGGSEADNQAIISAARIGEKKGKKHIISTAFEHHAVL HTLAKLEKEGFEVTLLDVHENGIVTPEEVAAAIRPDTCLVTIMYANNEIGSIQPIPEIG AVCREKGVLFHTDAVQAAGHLHIDVQAQNIDMLSLSAHKFHGPKGVGVLYAKKGIALTN IIEGGAQERGKRGGTENIAGIMSMTAALEEACANIDKNAAHLIPLRDKLIAGLEAIPHS ILNGDRTNRLPSNVNFCFEGIEGESLLLLLDDKGICASSGSACTSGSLDPSHVLLAIGR VHDVAHGSLRLSLGEDITEEEIDYMIEAVTDVVTYLRNMSPVWRDLQEGKREYVLK" /locus_tag="LOCUS_3320" /gene="nifS" /EC_number="2.8.1.7" /note="WP_011986887.1 cysteine desulfurase NifS (Clostridium botulinum) [pid:53.2%, q_cov:98.5%, s_cov:98.7%, Eval:4.5e-111]" /note="MGA_454" CDS complement(2072..3064) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRPVPEHEYPTYPRRFISYRWFKPLLAGLLFAVLYLGSNVAIVLL GALNQGGLESVMKIAGSYDTMDVSSGPGILLNLGSLAVAIPLLALTALIVRDRPFSSYS SARGGWDWSIFGRMMLLALLVCGVPNLVWILLDHGPLNNQFTIATFLLLTVMGPLQCIA EEYMFRGLLMQTFGGWFRIPVIAVILQALIFMSMHPYNLTGKLTILATGCMMGLMAWIS RGIEASSAIHIVNNMVAFYADGLGLGAIGSEVSTLDLVVTLIIDAVYVAVLLVLRKKGF FDRIKRDDAAEFNAKVAPKYAKRDLKNMELHWKPGVAGSAAAQENKPEE" /locus_tag="LOCUS_3330" /note="WP_012803896.1 CPBP family intramembrane metalloprotease (Brachybacterium faecium) [pid:30.7%, q_cov:69.7%, s_cov:72.2%, Eval:3.1e-19, partial hit]" /note="MGA_455" tRNA complement(3352..3427) /product="tRNA-Lys" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0060" /note="Aragorn_6" ORIGIN 1 atagccgttg atcatcagat tgagtttgtc ccagaccggg agcgtcttgc actctcccgc 61 atattcgcag ggggccgcgc cgtgttccag gcaggcgacg ggcgccaggt ctccttcggt 121 gacccggagg atctccccga cggtatattc ctctgccggc ttgttcagcc ggtagccgcc 181 tcccttgccg tggacggcgt cgaccaggcc cgccttcgac aggctggcca tgatggcttc 241 gatgtatttt ttcgagatgc gctgccgctc ggcgacttcc ttcaagggcg tataagtctc 301 tctgccctgc tccgccaggt cgatcatcac ccggagcgcg tatcttcctc ttgtcgagat 361 catagatcct ccttctgccc cctggcaaat tgcgatctac gcctgcagtt tacccgccag 421 ctttttattc tggtaatctt ccagggctgc ctggatggct tcttcggcca gaacgctgca 481 gtgcatcttg tgggcgggca ggccgtccag cgcctctgcc acggctttat tggtaagctc 541 catggcttcg gagatgggtt ttcccttgat gagctccgtc gccatggaac tggaagcaat 601 agcgctgccg cagccgaagg tctcgaactt gacgtcttcg atgatgccgt cgtcgctcac 661 cttcaggtag atcttcatga tgtcgccgca catggtgttg ccgacttccc cgatgccgtc 721 tgcgtcttcg atgacgccca cgtttctggg attgcggaaa tggtccatta ctttgtcgct 781 atagagtgcc atatatgttt cctcctactt gagtacgtat tctctcttgc cttcctgcag 841 gtctctccag acgggagaca tattccgcag gtacgttacc acgtcggtga ccgcctcgat 901 catgtagtcg atctcctctt ccgtgatgtc ttctcccagg ctcagccgca ggcttccgtg 961 ggccacgtcg tgcacccggc cgatggccag cagcacgtga ctgggatcga gagacccgga 1021 cgtgcaggcg gaaccggacg aagcgcagat gcccttgtcg tccagcagga gcagcaggct 1081 ttcgccttcg atgccttcga agcagaagtt gacgttgctg ggaagacggt tcgtgcggtc 1141 cccgttcagg atggaatggg ggatcgcctc cagccccgcg atcagcttat cgcgcagcgg 1201 gatcagatgc gccgcattct tatcgatgtt cgcgcaggct tcttccaggg ccgctgtcat 1261 ggacatgatg cccgcgatgt tctccgtgcc gccgcgcttg cccctttcct gcgcgccgcc 1321 ttcgatgatg ttcgtcaggg cgatgccctt ctttgcgtac agcacgccca cgcctttcgg 1381 cccgtggaac ttgtgcgccg acagcgagag catgtcgatg ttctgcgcct gtacatcgat 1441 gtggagatgg cccgctgcct gtacggcgtc tgtatggaac aatacccctt tttcccggca 1501 gaccgcgccg atctcgggga tgggctggat gctgccgatc tcgttgttgg catacatgat 1561 ggtgacgagg caggtatccg gccggatggc tgccgccact tcctccggcg taacgatgcc 1621 gttttcatgc acgtccaaaa gcgttacttc aaagccttcc ttctccagct tcgccagcgt 1681 atgcagcacc gcgtggtgct cgaaggcggt ggagatgata tgcttcttgc ccttcttttc 1741 gccgattcgg gcggcggata tgatggcctg gttgtccgct tcgctgccgc cggacgtaaa 1801 caggatctcc cgggcgctgc agttgaagat ctttgcgacg cgctcccttg cgctctgcag 1861 ggcttcgttc gccttctgcc caacggtatg caaactggac gggttgccgt agatctcacc 1921 catgtagggg atcatggcgt cgatggccgt cttgctcatc cttgtggtcg ccgcattatc 1981 tgcgtatatg ttcatgtgct ttcctccttt tgcggtccta tgttcttgca aaaggagtat 2041 aagcctattt acccactgtg tcaataggtt attattcttc cggcttattc tcctgcgccg 2101 cagcggaacc cgcaaccccg ggcttccagt gcagttccat attctttaag tcccgtttcg 2161 cgtacttggg cgccactttt gcgttgaatt ccgccgcatc gtcccttttg atccggtcga 2221 agaagccctt ctttctcagg acgagcagca ccgcgacata gaccgcgtcg atgatcaggg 2281 tcacaacgag gtccagggtg ctcacctcgg agccgatggc ccccagtccg agaccgtccg 2341 cgtagaacgc gaccatgttg ttgacgatgt ggatcgcaga cgacgcctcg atgccccggg 2401 agatccaggc catcaggccc atcatgcagc ccgtcgctag aatcgtaagc ttgccggtga 2461 ggttatacgg atgcatggac atgaagatga gggcctgcag gatcaccgcg atcactggga 2521 tgcggaacca gccgccgaag gtctgcatga gcaggccccg gaacatgtac tcctccgcga 2581 tgcactgcag cggccccatc acggtaagca gcaggaaggt ggcgatggta aactggttgt 2641 tcagcggccc gtgatccagc aggatccaga ccagattcgg cacgccgcag acgagcagcg 2701 ccagcagcat catccggccg aatatgctcc agtcccagcc gccccgggcg gaggaatagg 2761 aggagaatgg ccggtcgcgc acgatgaggg cggtgagcgc cagcaggggg atggcgaccg 2821 ccagtgaccc cagattcagc aggatgccgg ggccgctcga cacgtccatg gtgtcgtagc 2881 tgccggcgat cttcatgacg ctctccagtc ctccctggtt cagcgcaccc aggagaacga 2941 tggcgacgtt cgagccaaga tagagcacgg caaacagcag gcccgccagg aggggtttaa 3001 accagcggta ggagatgaac cgccgggggt aggtcggata ttcgtgttcc ggtacaggtc 3061 tcataggttt gtcctttcta agcgttttca tcctattcta acaccggtgg gggcagagcg 3121 gcgagaaatg tgctataata cataggattt aagagttttt tcagccaatc cttttgcttt 3181 ggaagaaagt aaaaagtcat cgaaaagttg cttaaaagtt gttagagagt tgcttaaatt 3241 tagtctcatt tcagacaccc tgattcctca aaatacgtgt gaaaatcagg gtgtctgttt 3301 ttatttcaca gaaaatgaaa aagccttgaa accgttgaga tttcaaggcc ttggtacacc 3361 atcacgggct cgaaccgtgg acaccctgat taagagtcag gtgctctacc aactgagcta 3421 atggtgcatg tcaaacgcaa gtaatatatt aaccgtgcgg cttgcgtttg tcaagaaaga 3481 atttaagcaa t // LOCUS sequence089 3487 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence089 VERSION sequence089 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3487 /mol_type="genomic DNA" /organism="" /note="sequence089" CDS 270..620 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNEYAKAMETAPAMVNESRAGYRNDNEEFLFDIREHIGVLRKSN NGWTRELNVVSWNGSAPKFDIREWDPRHEKMTKGISFTKAEATELCKWLTARNMEPVVP KKEEPAEAAPAF" /locus_tag="LOCUS_3340" /note="WP_002381076.1 YdbC family protein (Enterococcus) [pid:55.4%, q_cov:56.0%, s_cov:90.3%, Eval:2.1e-16, partial hit]" /note="MGA_457" CDS 869..1387 /product="folate family ECF transporter S component" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003641760.1" /transl_table=11 /codon_start=1 /translation="MKKGISVQKLVVLGVLIAMEVVLSRFVSISTWNMKIGFAFIPVAA AAILLGPVEAAVCGGMADFLGATLFPIGAYFPGFTATAALTGLVFGLFFHKEQTFGRVL GAVLINQFILGLLCNTYFISVLYGSEFKVLLATRVVQSLILTVVQTAGILVLAKVLQRV KPSLPAMER" /locus_tag="LOCUS_3350" /note="WP_003641760.1 folate family ECF transporter S component (Lactiplantibacillus) [pid:38.4%, q_cov:92.4%, s_cov:93.5%, Eval:8.6e-24]" /note="MGA_458" CDS 1391..2662 /product="folylpolyglutamate synthase/dihydrofolate synthase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392070.1" /transl_table=11 /codon_start=1 /translation="MNYQQAIEFLEISNWMGSRLGLSRVKQLLHLAGDPQNRMQFVHIA GTNGKGSTAAMLASVLQEAGYKTGLYTSPHLRKYNERIRIDGKDVSDEEMCRAAEILEQ CVEQMDDRPTVFERITALAMVCFERAGCEVVVLEVGMGGRLDATNVVDEPACSVLCHID LDHTEILGDTLEKIAEEKAGIIKPGCPAVAQDQSEEALAVFRRTCEELDSPLTVTDPGL LTVREQSLDGQIFDYRDRRDLRIPLVANYQLVNVMGVLDTVDVLQRSGWHISEEALREG LKKTRWAGRFEILSRDPLMIIDGAHNPDGATQLAECLATYLADRKIVFLMGVMADKDYR RMIRTVAPFAKRFVAVTPNSSRSLPCEDLARVIEEETGLPALPGGDVKSGLSLAVQGLE AGDILCIFGSLYQVGDVQEWLEGV" /locus_tag="LOCUS_3360" /note="WP_011392070.1 folylpolyglutamate synthase/dihydrofolate synthase family protein (Moorella thermoacetica) [pid:38.8%, q_cov:99.5%, s_cov:97.7%, Eval:5.8e-80]" /note="MGA_459" ORIGIN 1 acgcaacatc cattacatca ccatgaaact cgaggagaac gaaaactcca cgaaggtccg 61 cctgatcaag gtgaaagaga tggtgctgca gaaggcgcat aattattcgg tataacacaa 121 agggacaggt acactgtgca gcagcgtgcc tgtctctttt gttttgccta aaaagtgaaa 181 aagtaatata agttattgtt gacatatatt aacatttacg atatactttc cttacttctc 241 cgcagcggga cgcggaaagg aaagaaacga tgaaaaacga atacgcaaag gcaatggaaa 301 cggcccctgc catggtcaac gagagcaggg cgggctatcg caacgacaac gaggaattcc 361 tcttcgacat ccgcgaacac atcggcgtgc tccgcaagag caacaacgga tggacgagag 421 agctcaacgt cgtctcttgg aacggcagcg cgccgaaatt cgacattcgc gaatgggatc 481 cgcgtcacga gaagatgacg aagggcatct cctttacgaa ggcggaggcg accgagctct 541 gcaagtggct caccgcgaga aacatggagc ccgtggtgcc gaagaaggag gaaccggcag 601 aggctgcacc cgctttctag catcagtgga attgatgggc atcagcaaaa actttttggg 661 caaaacccgt tgagaatgga ggccgggtag ggtacaatca acttgttaag agaatacttt 721 ctggtcagag taggagcagc gcgttaagtg tccggaggat gggatgtcgc cccggaacga 781 aggcttgccg cggtgctgcc ccgcgtccgc tgccgaaaaa ggatgtcgat aaactccttt 841 cacggcgacg agaaaggagt tttgcattat gaagaaaggc atcagtgttc agaaactggt 901 cgtcctcggc gtgctcatcg ccatggaggt cgtcctcagc cgtttcgtct ccatcagcac 961 ctggaacatg aagatcgggt ttgcgtttat cccggtggct gccgcagcca tcctgctggg 1021 cccggtcgaa gccgccgtct gcggcggcat ggcagacttc ctcggtgcca ccctctttcc 1081 catcggagcc tatttccccg gtttcacggc gactgccgcg ctcaccgggc tcgtcttcgg 1141 cctgttcttc cacaaagagc agacctttgg ccgcgtgctg ggcgcggtcc tcatcaacca 1201 gttcatcctg ggacttttgt gcaacacgta tttcatctcc gtgctctacg gctcggaatt 1261 caaggtgctg ctggcgaccc gcgtcgtcca gagcctcatc cttaccgtcg tgcagaccgc 1321 gggcatcctc gtgctggcaa aggtcctgca gcgggtcaag ccgtcgctgc ccgccatgga 1381 aaggtgaccc atgaattatc agcaagcgat cgaattttta gagatatcta actggatggg 1441 aagccgcctg ggactgtccc gggtaaagca gctgctgcat ctggcgggtg acccccagaa 1501 caggatgcag ttcgtccata tcgccggtac caacggcaag ggatctacgg ccgccatgct 1561 ggcgtccgtg ctgcaggaag cgggatataa gacgggactg tacacgtcgc cccatctgcg 1621 gaagtataac gagcgcatcc gcatcgacgg gaaagacgtc tccgatgagg agatgtgccg 1681 cgctgcggag atcctggaac agtgcgtcga acagatggac gacagaccca cggtgttcga 1741 acgcattacg gcgctggcca tggtctgctt cgagcgggcc ggctgtgagg tcgtggtgct 1801 cgaagtgggc atgggcggca gactggatgc gacgaacgtc gtcgacgagc ccgcctgcag 1861 cgtgctgtgc cacattgacc tggaccacac ggagatcctg ggcgacaccc tggagaagat 1921 cgcggaggaa aaggccggca tcataaaacc tggctgccct gctgtggcgc aggatcagag 1981 cgaagaggcg ctagccgtgt tccggcgcac ctgcgaagaa ctggacagcc cgcttaccgt 2041 taccgacccg ggtctgctga cggtcagaga acagtctctg gacggacaga tcttcgacta 2101 tagagaccgc agggatctgc ggatccctct cgtcgcgaac tatcagctcg taaacgtgat 2161 gggcgtgctg gatacggtgg acgtgctgca gcgaagcggc tggcacatct ccgaagaggc 2221 actgcgcgaa gggctgaaga agacccgttg ggcaggccgc ttcgagatcc tttcccgcga 2281 tcccctgatg atcatcgacg gcgctcacaa tccggacggc gcaacgcagc tggcagagtg 2341 cctcgccacg taccttgcgg accggaagat cgttttcctg atgggcgtga tggccgacaa 2401 ggactaccgg cggatgatcc gcaccgttgc accgttcgcg aagcggttcg tcgcggtcac 2461 ccccaattcg agccgcagcc ttccctgtga agatctcgca agggtcatcg aagaggagac 2521 cggccttccg gcattgcccg gaggcgatgt gaaaagcggt ctttcccttg ccgtacaagg 2581 cttggaggcg ggcgatatcc tgtgcatttt cgggtctttg taccaagtgg gggatgtgca 2641 ggagtggctc gaaggagtat aataaaaagt agcagaattc gcaggacctg ctccccgaag 2701 catcggaggg caggcccttt tcataaaaac acgaaaagga gtattcagga tggaacaaat 2761 cacgatcaga ctgaaaaaac agcccggcgc gcctgaagaa gagatccgca tcgagaaagg 2821 atccaccatc gagagcatta tcctggaaaa cgatattcag accgaatatc ccgtttacgc 2881 tgccaggatc aacaataccg tcaagacgct tacggagatc ccggaagaag gggacgaagt 2941 cgtcctgctg gacatccgcg acaactgtgc caaggagatc ttccagcgca gcatcatcga 3001 cctgttccgc tgcgccatcg ggaaggcgtt ccccgaggcg aaggtgacca taggcaactc 3061 cctcaaccgc ggtatcttta tggatattaa gcgggagcgg ggcttcggcg tgctcgccgt 3121 ggagaagacc gaatgggtga tgaagcagat ggtgaaggac aaggtgccgt tctccatgat 3181 cgaacacggt ctggatatgg tggtgcccca cgccggctat ctgcagaact tcgatctgcg 3241 caaatgccgc agcggcctcg tcatccgcat tccggaggat acgcatcccg gcggactggc 3301 gcctgccgtg gacaacagaa atctgtacaa agccttccag gtgcagcgca agtgggcgga 3361 gaagctcaac atcctcacct gcgcggatct caaccgcgcc atcgcggcag ggcagatcaa 3421 cgacgtcatt caggtgtccg aagcgcttca ggagaagaag atcgcgcaca tcgccgacga 3481 gatcgta // LOCUS sequence090 3483 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence090 VERSION sequence090 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3483 /mol_type="genomic DNA" /organism="" /note="sequence090" CDS 648..1751 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIEIRHLRKEYEDTTPLKDVNAVINSGDIIAVIGPSGTGKSTLLR CINMLETPTSGQIIVDGQIINDGKCDLNEVRKKMGMVFQSFNLFGHLTVIENIMNPQIT LLGRSRQEAYEKAMDLLSKVGLSSKALAYPDELSGGQQQRIAIARTLAMDPEIILFDEP TSALDPSMIGEVQSIIRMIAKTGRTMMIVTHEMDFAKKISNRVWYMDEGGIYEEGTPKQ IFENPRQYNTRKFIQRLSTLSYRIESSEFDFEPVIDELQAYAEKLLIEIDRTSKLQIAL EEICVNNLFEIHTEPNIYAQIDYSEKNDVLSLELKYSGEHFDPRDSDNELFNSILAEPT TELIDEEIINSPKWYNNRTKISFRWED" /locus_tag="LOCUS_3370" /note="WP_002355616.1 amino acid ABC transporter ATP-binding protein (Enterococcus) [pid:54.6%, q_cov:64.9%, s_cov:97.1%, Eval:2.5e-73, partial hit]" /note="MGA_462" CDS 1757..3307 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKNIAKISSLLLAAVLLLAGLAMPAAAFAEQAPTKNGITTIEEL NGKNLGVQTGVLYEDHIKDDLEGETWYYYKMPNDMIPALESNKIDAYLIEEVGFYAQRF EHPELVRLEEAVGVSDFAVIVGNNDKQDRLFAELQEFIAKGRENGWLDKLYDYWVINWN PNTCTIETIPETTGENGTVHIAIEGGYEPFSFESNGQFSGYDVEFMMNFCAAYGYNWEF HAMEFDSIAPAVIAGKYDFGMNIVVDEERAEASVLTDPYYSCDIVFVLEGVSENGVHFM DGIKDSFYKTFIKEDRWKLFAQGIGTTLLITLCSIAFGTLFGFAVYMLCRHGNPLANKI MNFFDGFIHGIPTVVFLMILSFVIFANSSHITAISILGFTLIFGCSMFDMLQVGNNAVP RGQAEAAKALGYSDTQSFFKILLPQAAQHFLPIYKNDVISLIKETSVVGYIAVMDLTKM GDLVRSRTYQAFFSLIAVAIIYFILEWILVSIVTRVQVSIDPKRRAKSKILEGIREVE" /locus_tag="LOCUS_3380" /note="WP_005903444.1 amino acid ABC transporter permease (Fusobacterium nucleatum) [pid:32.5%, q_cov:42.2%, s_cov:97.0%, Eval:2.8e-26, partial hit]" /note="MGA_463" ORIGIN 1 tagttgatct gcagctgcac gaactcgatc tccgggtgcg cctgcaggat gggttccagc 61 acttccgcct tgtcgtggaa ggaaatgccg atatgtttga tcaggccttc cgccttcttc 121 tccttgacga aggaccacat gtcgaaatcg tcgtagaact tcgtgcggtg ttcgcccagg 181 ttgtgcagca gatagtagtc gaaatagccg gcgccgctgc gttccaggga cgtctcgaac 241 tgcttcatcg cgtcttcgcg ggtctcgcac ttgatccacg cggccagctt cgtagccacg 301 gtgtagttct ctctgggatg ccgctcgatg agggccttgc gcatcgcttc ttcgctgccg 361 ttataggccc aggcggtatc aaaataggtg aatcctgctt cgaggaactt gtccaccata 421 atgcaggtct gttcgatatc gatctcgtcc cccttcttgg gcagacgcat cagaccgaag 481 cccagcttct tctggttgct taccgaaaag ttgtccatct ttcgcctcct taaaaaatgt 541 taaaccgtat tgtaattgta acataaaaat gattgacttt tacccccata tatcgtaccc 601 ttctcttgcc ctttaaatcc cacagaaatc aacggaggag gagacgcatg atcgagatca 661 gacatctgcg caaagaatac gaagacacga cgcctctgaa ggacgtgaac gcggtcatca 721 acagcggcga catcatcgcc gtcatcggac cgtcgggcac gggtaaatcc acccttctgc 781 ggtgcatcaa catgctggag acgcccacgt cggggcagat catcgtggat ggtcagatca 841 tcaacgacgg caaatgcgat ctcaacgaag tccgaaagaa gatgggcatg gtgttccagt 901 ccttcaacct gttcggacat cttaccgtta tcgaaaatat catgaacccg cagatcaccc 961 tgctgggccg cagccgccag gaggcctacg aaaaggccat ggacctgctg tccaaggtcg 1021 gtctgtcctc caaggcgctg gcttatccgg acgagctttc cgggggtcag cagcagcgta 1081 tcgccatcgc ccgcacgctg gccatggatc cggagatcat cctcttcgac gagccgacgt 1141 cggcgcttga cccctccatg atcggcgaag tccagtccat catccgcatg atcgccaaga 1201 ccggccgcac gatgatgatc gtcacccacg agatggattt cgcgaagaag atctccaacc 1261 gggtctggta catggacgaa ggcggcatct acgaagaagg cacgcccaaa cagatcttcg 1321 agaacccgcg gcagtacaac accagaaaat tcatccagag actgtccacc ctcagctacc 1381 gcatcgagag ctccgagttc gacttcgagc ccgtgatcga cgagctgcag gcttacgcgg 1441 agaagctgct catcgagatc gacagaacgt ccaaactgca gatcgccctg gaagagatct 1501 gcgtaaacaa cctgttcgag atccacaccg aacccaacat ctacgcgcag atcgactatt 1561 ccgaaaagaa cgacgtgctg tcgctggaac tcaagtattc cggcgagcat ttcgatccca 1621 gagattcgga caacgaactg ttcaacagca ttttagcgga gcccaccacg gaactcatcg 1681 acgaggagat catcaattcg ccgaaatggt acaacaaccg caccaagatc agcttcagat 1741 gggaggacta ggagacatga aaaagaatat cgcgaaaatt tcttccctgc tgctggcagc 1801 ggtgctcctt ttggcaggtc tggccatgcc ggctgcagcg ttcgcagagc aggcgcccac 1861 caagaacggc atcaccacca tcgaagagct gaacggcaag aacctgggcg ttcagaccgg 1921 cgttctctac gaagaccaca tcaaggacga tctggagggc gagacctggt actactacaa 1981 gatgcccaac gacatgatcc cggcgctgga atccaacaag atcgacgcct acctgatcga 2041 agaggtcggc ttctatgccc agcgcttcga gcatcccgaa ctggtgcggc tggaagaggc 2101 cgtcggcgtc tcggatttcg ccgtcatcgt aggcaacaac gataagcagg accgcctgtt 2161 tgccgagctg caggagttca tcgcaaaagg ccgcgagaac ggctggctgg acaagctcta 2221 cgactattgg gtcatcaact ggaacccgaa cacctgcacc atcgagacca tacccgagac 2281 caccggcgaa aacggcaccg tgcacatcgc catcgaaggc ggctacgagc cgttctcctt 2341 cgaaagcaac ggccagttct ccggctacga cgtggaattc atgatgaatt tctgcgcggc 2401 ctacggctac aactgggaat tccacgccat ggaattcgac tccatcgcac ctgccgttat 2461 cgcgggcaag tacgatttcg gcatgaacat cgtcgtggat gaagagcgcg cggaagcctc 2521 cgtgctcacc gatccgtatt acagctgcga catcgtattc gtgctggaag gggtctccga 2581 gaacggcgtc cacttcatgg acggcattaa ggacagcttc tacaagacct tcatcaagga 2641 agaccgctgg aagctctttg cccagggcat cggcaccacc ctgctcatca ccctgtgctc 2701 catcgccttc ggcacgctgt tcggcttcgc cgtctacatg ctctgccgcc acggcaaccc 2761 gctggccaac aagatcatga acttcttcga cggctttatc cacggcattc cgacggtcgt 2821 gttcctgatg atcctctcct tcgtcatctt cgcgaactcg tcccacataa ccgccatctc 2881 catcctgggc tttacgctca tcttcggatg cagcatgttc gacatgctcc aggtaggcaa 2941 caacgcggtt cccagaggac aggcagaagc ggcgaaggcg ctgggctaca gcgacaccca 3001 gagcttcttc aagatcctgc tgccccaggc agcgcagcac ttcctgccga tctacaagaa 3061 cgacgtcatc tccctcatca aggagacctc cgtcgtcggc tacatcgcag ttatggacct 3121 cacgaagatg ggcgacctgg tgcgcagccg cacctatcag gccttcttct ccctcatcgc 3181 cgtagccatc atctacttca tcctggagtg gatcctggtc tccatcgtca cccgcgttca 3241 ggtctccatc gatccgaaga gacgcgccaa gtccaagatc ctggaaggga tccgggaagt 3301 ggagtaatga tctaaagaga accgtcccca acagtgcaat aacaaaaccg cgcaccgaaa 3361 gtgaactgac ccccaaaagt tagaccaaga atctaactag aggaggtcag ttttgttatg 3421 gcaaagtata gttttgagtt taaaggaaag cttgtaagag agtatctgaa cggaaaaggc 3481 gga // LOCUS sequence091 3454 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence091 VERSION sequence091 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3454 /mol_type="genomic DNA" /organism="" /note="sequence091" CDS complement(774..1571) /product="glutaconate CoA-transferase subunit B" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005902656.1" /transl_table=11 /codon_start=1 /translation="MADYTNYTKQEMQAYAIAKNIKENQIVIVGTGLPLIGASLAKRAV CPSCHPIVESGLMDCAPVEVPRSVGDLRFMAHCAVQWPNVRFVGFETNEWIHDEDRLIA FIGGAQIDPYGNVNSTCIGDYHNPVTRFTGSGGANGIATYCNTIIMMQHQKRRFMDKID YITSCGWMDGPGGREKAGLPGNRGPQMVVTDLGIMKFDDETKRMYLAYYYPFSSPEMVL ENTGFDVDVSRAQLMEGPSPEIIKLIREDIDPGQAFIKVPKAK" /locus_tag="LOCUS_3390" /gene="gctB" /EC_number="2.8.3.12" /note="WP_005902656.1 glutaconate CoA-transferase subunit B (Fusobacterium nucleatum) [pid:73.6%, q_cov:98.1%, s_cov:97.8%, Eval:4.2e-111]" /note="MGA_466" CDS complement(1591..2622) /product="glutaconate CoA-transferase subunit A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005902658.1" /transl_table=11 /codon_start=1 /translation="MNKVMSLHDAVAKYVQSGDTICFGGFTTNRKPYAVMGEILRQGQT DFTVWAGPAGGDWDMMIGEGRVKAYINCYTANSGYTNVSRRFRAAIEGGKLTYEDYSQD VLMLQLHAAALGLPYLPVKLMSGSGLCKFWGISEEQRKTIDSVDNLKFAYVENPFNPGE TVVAVPVPKLDTAVIHVQKASPDGTCIIEGDEFHDVDIAVAAKKVIVTCEELVSDEWIR FDPSKNNIFGECVSAVVHAPFGAWPSQCYNYYDCDDAAMKEYDKASKYQDKEDAEKQIA KEKAKAEKKGLPYNAPVDPETFKDYLDKWVYSVKDNDELLDKIGGARLAKLKVIPGLGY AKR" /locus_tag="LOCUS_3400" /gene="gctA" /EC_number="2.8.3.12" /note="WP_005902658.1 glutaconate CoA-transferase subunit A (Fusobacterium nucleatum) [pid:58.1%, q_cov:100.0%, s_cov:98.1%, Eval:1.9e-107]" /note="MGA_467" misc_feature complement(2710..>3454) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005902660.1:sodium ion-translocating decarboxylase subunit beta" /note="WP_005902660.1 sodium ion-translocating decarboxylase subunit beta (Fusobacterium nucleatum) [pid:75.0%, q_cov:98.8%, s_cov:65.1%, Eval:7.7e-96, partial hit]" /note="MGA_468" /locus_tag="LOCUS_3410" ORIGIN 1 cgatcatgcc ctgagcaccc tcaaggtcaa cgtagggctt ggagtccatg ccgccgacga 61 tgccggcgcc gccgactgcc atgttgccct tctcatgggc gatcaggatg gtcggggaga 121 tggagtgata gccgccgcct gcggggttgg ttccgtagat acctacgatg accggaacgc 181 ccatctggtt cagctcggag ttgcggtaga agggggtgcc gccgcctctg cggttcgggt 241 acaccttctc ctgctcgtcc agcttaacgc cggagcagtt caggacgtag accagcggga 301 tgcccagcat ctttgcggtg tcggagccgc ggagcaggtt gtccgcctgg cccgggaccc 361 atgcgccggc catcttcttg ttatcggaag cgatgatcac cgcccacttg ccgttgatgc 421 ggccaaggcc cttcacgacg ccggtggaga tgataccgat cttctcctcc tggttgtcct 481 gcgggttgta gatggtgttc agcgggcaga aagagcccgg atcgaccagc tggttgattc 541 tctcaagtgc ggtgtactgg cccttctggt ggatcttgtc atcgggcgta ccggcggaga 601 gcatcttctc ggcctgggcg tggatctctt cctcgatctt cttcagctcg gcgacgttgt 661 ccgggttcgg cttgtaagcc ggcgcattca gaacgggcat gttctgaaaa taagtcggca 721 ttgaataatc gttcatgttg gaatctcctc ctgaatacgg gtttaggggt tacttacttc 781 gccttcggaa ccttgatgaa tgcctgtccg gggtcgatgt cctcacggat gagcttgatg 841 atctcggggc tcgggccctc catcagctgt gctctggaaa catcaacgtc gaagccggtg 901 ttctcaagaa ccatctccgg ggaggagaag ggataatagt aagcgagata cattctcttg 961 gtctcatcat cgaacttcat gatgccgaga tcggtaacga ccatctgcgg gcctctgttg 1021 cccggaaggc cggccttctc acgtccgccg gggccgtcca tccagccgca gctggtgatg 1081 tagtcgatct tgtccatgaa gcggcgcttc tggtgctgca tcatgatgat ggtgttgcag 1141 taggtagcga tgccgtttgc gccgccggag ccggtgaaac gggtgactgg gttgtgatag 1201 tcaccgatgc aggtggagtt cacgtttccg taggggtcga tctgagcgcc gccgatgaag 1261 gcgatcagtc tgtcttcgtc atggatccac tcgttggtct cgaagccgac gaagcggacg 1321 ttcggccact gcactgcgca gtgagccatg aagcggaggt caccgacgga acgcgggact 1381 tcgaccggag cgcagtccat aaggccgctc tcgacgatcg ggtggcagga cgggcagacc 1441 gcgcgcttcg cgagggaagc accgatcagc ggaaggcctg taccgacgat gacgatctga 1501 ttctctttga tgttcttagc aatggcatac gcctgcattt cctgttttgt gtagttcgtg 1561 taatcagcca tgtccttctc tccctccttc ttatctcttg gcatatccca ggcccgggat 1621 gactttcagc ttcgcaaggc gggcgccgcc gatcttgtcg aggagctcgt cgttgtcctt 1681 cacgctgtag acccacttgt caagataatc cttgaaggtc tcgggatcca ccggagcatt 1741 gtaaggaagg cccttcttct cagctttcgc cttctccttg gcgatctgct tctcagcgtc 1801 ttccttgtcc tgatacttgg aagccttgtc gtactccttc atggctgcgt cgtcgcagtc 1861 atagtagttg tagcactggg acggccatgc gccgaacgga gcgtggacaa cagcgctgac 1921 gcactcgccg aagatgttgt tcttgctcgg atcgaaacgg atccactcgt cggagacaag 1981 ctcttcgcag gtcacgatga ccttcttcgc agcaacagcg atatcgacgt cgtggaactc 2041 atcgccctcg atgatgcagg tgccgtccgg agaagccttc tggacgtgga tcactgcggt 2101 gtcaagcttc gggaccggaa cagcgacgac agtctcgccc gggttgaagg ggttctcgac 2161 ataggcaaac ttcagattgt cgacggagtc gatggtcttt ctctgctctt cggagatgcc 2221 ccagaatttg cacaggccgg agccgctcat cagcttcacc ggcagatacg gaaggcccag 2281 ggcagcggcg tgaagctgca gcatcaggac gtcctgggaa taatcctcgt aggtaagctt 2341 tccgccttca atagcagcgc ggaagcggcg ggaaacgttg gtgtagccgg agtttgcggt 2401 atagcagttg atataagcct ttacacggcc ttcgccgatc atcatatccc agtcaccgcc 2461 agcggggccc gcccacacgg taaaatcagt ctgtccctga cgaaggatct cgcccatgac 2521 agcatagggc tttctgttgg tagtgaagcc accgaagcag atggtatccc cgctctggac 2581 atatttggcg acggcatcat gtaaactcat tactttattc aaggtaatac cctcctttcc 2641 atagttccaa aaacgtatct ttatttaata cagataaatc tgaaacactt acaccttttg 2701 cactgctggt caatgcttaa agaaggtaag gaagaagccg gctgcaactg cggaaccgat 2761 aacgccagcg acgttcgggc ccatagcgtg catcagaagg aagttggtgc ggtccacttt 2821 cgcgcccacg gtctgggaga cacgggctgc catcggcact gcggaaacgc ccgcggaacc 2881 gatgagcgga ttgatctttc cgccggtgat cacatagagc agcttgccca gcagcaggcc 2941 gccgacggtg gaaagggaga aggcgcagag acccatgaca acgatggcca gagtctgggg 3001 cttcaggaac agttcgcctc ttgccgtcgc gccgacggaa aggccgagga agatggtgca 3061 gatgttgcac agcgcgttct gcgccacgtc ggaaagtctc tcaacgacac cggactctct 3121 gaacaggttg ccgagcatca gcatgccgag cagcggagcg acatccggaa gaaggaggga 3181 aacaaggcag gcgaccatga cggggaagat gatcttctcg gtcttggtga cctttctgag 3241 ctgggtcatc ttgacacggc gctctttgtc cgtggtcagc gccatcatga tgggcggctg 3301 gatcagcggg atcagagcca tgtaggagta ggcggccaca gcgatgggtg ccaccagctc 3361 cggtgccagg ttgttcgcac agtagatggc ggtcgggccg tcagcaccgc cgatgacgcc 3421 gatggctgct gcctgctgcg gagtgaaaag gccg // LOCUS sequence092 3450 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence092 VERSION sequence092 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3450 /mol_type="genomic DNA" /organism="" /note="sequence092" CDS complement(98..958) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MINILSIHYPVSELCRQMNVNRSGYYKWCARKGKKNQYEKNREVL TGLLREAHQKHPSYGYHRLAHMVRTQTGWLFSDNLAHKCCKYVGIRANVRHYNWNRPLL GQEHKKYPNIVQGNWNADRPMKLIASDMTIIRHGGKPYEWTYLLDTFNNEILSSHLSAI PGDRRPYFGCLKDLIAKAKEQADPVILHTDQGSVYSSAAFYDAHKEYTILRSMSRAGTP TDNPVIEAVNGWIKAEIYAEGWHRKYASAEEMIASYVAYYNNDRPAYALQYKTPVQYRI EQGFG" /locus_tag="LOCUS_3420" /note="WP_099835063.1 IS3 family transposase (Staphylococcus) [pid:27.0%, q_cov:97.9%, s_cov:70.5%, Eval:1.8e-25, partial hit]" /note="frameshifted, insertion/deletion at around 957" /note="MGA_469" CDS complement(1433..2326) /product="arginase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012258791.1" /transl_table=11 /codon_start=1 /translation="MKKRIDLIGAKLDQGASKRGVCIGPEAIRFAGICQGIEKLGYELN DKGNLTQLSTGRTSEKLRNYDQVIDMNRRLYEHTKQSLEEGAFPIMLGGDHSAAAGTVS AVAKAHNGNIGIIWVDAHGDWNNDESSETGNMHGMPFSALCGWGPDCMVDFGQGPAFVD PKHCVQIAGRDIDMKERERMKAAGVTVFSIDVIDRLGMREVVRRAIEIASDGTEGFHVS YDIDSVSPEYAPGTGTIVHDGLTAREAFLCMEMFAECDNMLSLDMVEVNPILDEVNRTA TLASELVLSALGKTVF" /locus_tag="LOCUS_3430" /gene="rocF" /EC_number="3.5.3.1" /note="WP_012258791.1 arginase (Chloroflexus aurantiacus) [pid:46.8%, q_cov:98.7%, s_cov:98.0%, Eval:1.3e-69]" /note="MGA_470" ORIGIN 1 aggcagcagc tctggcggac aagttctaag ttccggacaa gcaaaaagga ggcttcggct 61 gaactagtca agcaaaagta gacaaactaa aaaagcatta gccaaacccc tgttcgatcc 121 tgtattggac aggggtcttg tattgcagcg cataggctgg tcggtcgttg ttgtaatacg 181 ccacataaga agcgatcatc tcttcggccg acgcatattt tcggtgccag ccttcagcat 241 atatttcggc tttgatccat ccgtttacag cttcaatgac aggattatct gttggtgttc 301 ctgctcgcga catggatcga agtatggtat actctttatg agcatcgtag aatgccgcgg 361 aggaatagac ggaaccctgg tcggtgtgca aaatgacggg atctgcctgt tcctttgctt 421 ttgctatcag atctttaaga cagccgaagt atggacgtct gtcacccgga atggctgaga 481 ggtgactcga aaggatctcg ttgttgaatg tgtccagcag ataggtccat tcgtatggtt 541 ttccgccgtg cctgattatc gtcatgtcag atgcgatcag tttcatcggt ctgtctgcat 601 tccagtttcc ctgaactatg ttgggatatt ttttatgttc ctgacctaat aacgggcggt 661 tccaattgta gtgccggaca ttagcccgta ttcccacgta tttgcagcat ttgtgcgcca 721 gattatcgga gaaaagccat cctgtttgag ttctcaccat atgtgccagc cgatggtatc 781 cataggaagg gtgcttctga tgggcttcgc gcagcagacc agtaagcacc tcacgattct 841 tctcgtattg attcttcttg cctttacgtg cacaccattt gtagtagccg gaacgattaa 901 cgttcatctg cctgcacaac tcgctcacag gataatgaat acttaaaata ttgatcactt 961 gatattcctg tctcttaaag aaacgaattc cttgtcggca ccagctcctt tcaccatgta 1021 tccttttttt aaccgttcgt tctcgatttg aagtttttcg acaagaagcc gcaatctgtc 1081 ttcttcggaa agagatttgc tggcatgcag ggccgcaaac cggtttcccg tacgcagttt 1141 taccggattg agtgcgtcaa cgccgccatt cctgtaccgt cgcacccaac cgtccagagt 1201 tccgcgcggt attccggctt ctctggcaag tgcttttgca gaaacatgtt cctcttcaca 1261 catcaaaaca tatttcaacc gttcttcatt tgtccaccgt ctgttctttc cgcctttagg 1321 tctacccata gttccacctc cacataaact ttaacatgaa aaaagtagac atgctttttt 1381 acatgtctac tttcatctta ctagttcact ttgcaggctt ctttttattt gcttagaata 1441 ccgtctttcc cagagcggag agcacgagtt cgctggccag cgtggcggtg cggttgactt 1501 cgtccaggat ggggttgacc tccaccatgt ccaggctgag catgttgtcg cattccgcga 1561 acatctccat gcacaggaag gcttcgcggg cggtcaggcc gtcgtgcacg atggtgcctg 1621 tgcctggcgc gtactcaggc gaaacgctgt cgatgtcgta ggacacgtgg aacccttcgg 1681 tgccgtcgct ggcgatctcg atggcgcgcc ggacgacctc gcgcatgccc aggcggtcga 1741 tgacgtcgat ggagaagacc gtgacgccgg cagccttcat gcgctctctc tccttcatgt 1801 cgatgtcgcg gccagcgatc tgcacgcagt gcttcggatc tacgaaagcc ggtccctggc 1861 cgaagtcgac catgcagtcc ggtccccagc cgcacagggc ggagaagggc atgccgtgca 1921 tgttgccggt ctcggaggat tcgtcgttgt tccagtcgcc gtgggcgtcg acccagatga 1981 tgccgatgtt gccgttatgc gccttggcca cggcgctgac cgtgcctgcc gccgcggagt 2041 ggtccccgcc gagcatgatg gggaacgcgc cttcttcgag gctctgcttc gtgtgttcgt 2101 acaggcggcg gttcatgtcg atcacctggt cgtaattgcg cagcttttcg ctggtgcggc 2161 cggtggaaag ctgggtgagg ttgcctttgt cgttcagttc atagccaagc ttttcgatgc 2221 cctggcagat gccggcgaaa cggatggctt cgggaccgat gcagacgccg cgcttggaag 2281 cgccctggtc gagctttgcc ccgatcagat cgatgcgttt tttcatggta aactcctttc 2341 ggtaggggta gttgcttttg tggacctatt atatcgtaaa acgttatatt tatacaagac 2401 tgaataaata tgcaaccaat cacggggacg ggggcttgat cggtatttga aaccttacac 2461 gccccgtccc cgtgattcat gatataatta atataagaac ataaggaggt tttccatgtt 2521 aaagatctcg agagaatttg tgacgggcga ccacagcccg gataataagc cggtcgcgtt 2581 ctgcgagagc ggcgaaacgg tcgagttcga ctgcagaaac tgctacgacg accgtctgca 2641 cgcggacggc tccgtggatc acgaggagct gaccatcgac aatcccgcca ccggcccgct 2701 gtacgtgaac ggcgccgaac ccggcgacgt gctgaaagtg gagatcctga agatccggct 2761 gaacggcaaa ggctatatgc ggcagtccct ggtcggcggc gcgttttacc agcgtcccgg 2821 cgttaaggaa agagtcgtgc gcgagttcga cgtgtctgga gatacggtga aattcaacga 2881 taaattggaa ttccccatcg atacgatgat cggggtcatc ggcacggccc ccgtgcctgg 2941 cagcctgccc ggcgtgtggg agaacgagac cccgggcaaa tggtccacgg aactgcccgg 3001 cgaccacggc ggcaacatgg actgcaacaa gatcgtggaa gggtccacgc tgtatctgcc 3061 ggtgaacgtg cccggcgcgt tgctttccat gggcgacatg cacgcgctga tgggcgatgg 3121 cgaatccatg atctgcggtc tggaatccgc gggcaaggct acggtgcgcg tatccgtcgt 3181 caagggctgg catctgccta cgccctgcct gatccacaag ggcggcaagc gcttctccac 3241 gatccagagc gatccggacc tgatggcctc cgcgaagaaa gccgcgaact gcatgctgga 3301 cttcctgctc gaatacacgg acctgggcga atatgacggc ggcaaactgc tgtcgctgaa 3361 aggcgacctg gcgatctgcc acatcatcaa cgacctgctg accgtgcgca tggagatcga 3421 tacgtatatc ctggatcagt atgggatcaa // LOCUS sequence093 3432 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence093 VERSION sequence093 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3432 /mol_type="genomic DNA" /organism="" /note="sequence093" CDS 165..1088 /product="50S ribosomal protein L11 methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861555.1" /transl_table=11 /codon_start=1 /translation="MKYKEIKIYPKREELDALVEALNAAGRTDLVINDPGELEGIMRAR DEHVWDYVDPEVIEDLQGNPYVCFYLQEGEDDPAAMDIAKGFDFTLTHVDDEDWLHKWE EYFMPTKISKRFVVKPAWRQYEPKEGEDVITIDPGLAFGTGTHATTFLTLRLMEKYLQP GDDVLDVGSGSGILSIGAVKLGAERIWAVDLFDDAVQSTKKNAALNGCEDKIEAFQGDL TKGLDVKADLVCANLMADLVKMLSKDVAKHLKGRGIYISSGILDEKEEDVAGAIKGAGF DILESIHADGWCAICAVWNRSFPPRT" /locus_tag="LOCUS_3440" /gene="prmA" /note="WP_011861555.1 50S ribosomal protein L11 methyltransferase (Clostridioides difficile) [pid:36.9%, q_cov:94.8%, s_cov:96.5%, Eval:1.6e-51]" /note="MGA_473" CDS complement(1045..1341) /product="putative quinol monooxygenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002285944.1" /transl_table=11 /codon_start=1 /translation="MIIVRVKYRTPEGQRDAFLQQLFDEGLPQACRAEEGNICYDYFLN YEDPNEILLLEMWKNGDALAKHGKEPHFTRIGQVRVENDVKSVVESFDSKPRK" /locus_tag="LOCUS_3450" /note="WP_002285944.1 putative quinol monooxygenase (Enterococcus) [pid:35.8%, q_cov:96.9%, s_cov:97.9%, Eval:2.9e-13]" /note="MGA_474" CDS 1452..1958 /product="methylated-DNA--protein-cysteine methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003232502.1" /transl_table=11 /codon_start=1 /translation="MRYTVFMDSPIGKLQLAEEDGKLTHLLFAWHNTLADYGLQAEEKE TPLLKKAKKQLNEYFAGKRKVFDLPLAPSGTAFQQKCWEGLRTIPYGETRTYRDIAAYA GNPKAVRAAGGANHNNPISIIVPCHRVVGSTGSLTGFGGGLEAKAFLLNLEQKGIGGDK VWQAK" /locus_tag="LOCUS_3460" /gene="ogt" /EC_number="2.1.1.63" /note="WP_003232502.1 methylated-DNA--protein-cysteine methyltransferase (Bacillus) [pid:49.7%, q_cov:92.9%, s_cov:96.4%, Eval:5.8e-38]" /note="MGA_475" CDS 1943..3343 /product="tRNA (N(6)-L-threonylcarbamoyladenosine(37)-C(2))-methylthiotran sferase MtaB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004454735.1" /transl_table=11 /codon_start=1 /translation="MAGEIGSLKKKTVSFFTLGCKVNQYESQALAEAFRRAGCEVTDSE DSPADIYVVNTCSVTRLADRKSRQYMRRVKRENPGALVIVMGCYPQTNPKEVGAIEEAD FILGTTEKMRAVELAEEWFSCDPSSRLRHNFVEDPVVHQTAYEQHEGITGMETKTRALI KIQEGCNRFCSYCVIPHARGQVRSRSAAAIKKEAMALVSAGYKEITLTGINTALYGAEK GFTDDLNTGLEGVEIIVKALNDIPGDFLIRLGSMEPTVIDADYIQRLFRYEKLAHHVHL SIQSGSDAVIAGMNRHYTAADYLEIVRRCRAFDPLYGITTDIITGFPGETEADLEASKE IVRQVAYLHVHCFPYSRRMYTPAADMPGQIAPPVKKQRNKELIAVAEEVSKQFRSSMIG SVQRVLAEEIEETEQGRLWKGHCSNYCVVYFRDPAMNDPSRAASLENQWIGVKVESVYR DGVLGNMV" /locus_tag="LOCUS_3470" /gene="mtaB" /note="WP_004454735.1 tRNA (N(6)-L-threonylcarbamoyladenosine(37)-C(2))-methylthiotran sferase MtaB (Clostridioides difficile) [pid:39.1%, q_cov:97.0%, s_cov:99.5%, Eval:6.1e-86]" /note="MGA_476" ORIGIN 1 acaacggcgc caacgtgctg gagatcgacc acgaaagaga agacgccaag accgaggtga 61 attcctgcgt cgtcacccta accctggaaa cgaaggacga agaccatatc cgcaagatcc 121 gcagagatat ggaggagaac ggatatcagc tgttcgatta gaccatgaaa tacaaagaga 181 tcaagatcta tccgaaaaga gaagaactgg atgcgctggt cgaggcgctc aatgcggcgg 241 gaagaacgga cctggtcatc aacgatcccg gggagctgga aggcattatg cgggccagag 301 acgaacacgt ctgggactac gtggatccgg aggtgatcga ggacctgcag ggcaacccct 361 acgtctgctt ctatctgcag gagggggagg atgacccggc agcgatggat atcgccaagg 421 gttttgattt tacgctgacc catgtggacg acgaagactg gctgcacaag tgggaagagt 481 actttatgcc cacgaagatc tcgaagcgct tcgtcgtaaa gcccgcctgg cggcagtacg 541 aaccgaagga gggggaggac gtcatcacga tcgatcccgg cctcgctttc ggcacaggta 601 cccacgccac gacctttctg accctgcggc tgatggaaaa gtatctgcag cccggagacg 661 acgtgctgga cgtgggctcc ggcagcggca tcctgtccat cggggcggtc aagctcggtg 721 cggagcgtat ctgggcagtg gacctgttcg atgacgccgt ccaaagcacg aaaaagaacg 781 ccgccctaaa cggatgcgag gataagatcg aggcgtttca gggcgatctg acgaagggcc 841 tggacgtaaa ggcggatctg gtgtgcgcca atctgatggc ggatctcgtt aagatgctct 901 cgaaagatgt agcgaaacat ctgaagggca gggggatcta tatctccagc ggcattctgg 961 acgaaaaaga agaggatgtc gccggcgcca taaagggcgc gggattcgac atcctcgaaa 1021 gtatccatgc agacggatgg tgtgctattt gcgcggtttg gaatcgaagc tttccaccac 1081 ggacttgacg tcgttttcca cccggacctg accgatgcgg gtaaaatgag gctctttgcc 1141 gtgcttagcc agcgcatcgc cgttcttcca catttccagg agcaggatct cgttgggatc 1201 ttcatagttc aggaaatagt catagcagat gttgccttct tcagcgcggc aggcctgggg 1261 caggccctcg tcgaacagct gctgcaggaa ggcatcgcgc tggccttccg gggtccggta 1321 tttcacgcgt acgatgatca ttttttccct ccgttcttta cagagaacat ttgttctgtt 1381 ataatcaggt tgctgttacg tttattatac aacgtttttt ccgtcgcgga gagcaaagtt 1441 aggaggacaa catgagatat accgtattta tggattctcc catcggcaaa ctgcagctgg 1501 cagaagaaga tggcaagctt acgcaccttc tctttgcgtg gcataatacg ctggcggact 1561 acggtctgca ggcggaagag aaggagacgc ctctcctcaa aaaggcgaag aaacagctga 1621 acgagtattt cgcaggaaag cgcaaggtgt tcgatctgcc cctggcgcct tccggcaccg 1681 cgtttcagca aaaatgctgg gaagggcttc gcaccatccc ctacggcgag acccgcacct 1741 accgcgatat cgctgcttat gcgggcaatc ccaaggcggt aagagcggcg ggcggcgcca 1801 atcacaacaa tcccatcagc atcatcgttc cctgccaccg ggtagtcggc agcaccggct 1861 ccttaacggg cttcggcggg ggactggaag ccaaggcctt cctgctcaac ctggagcaga 1921 agggcatcgg cggagacaag gtatggcagg cgaaatagga tctttaaaaa agaagaccgt 1981 atcgtttttt acgctgggct gcaaagtaaa ccagtacgag tcccaggcgc tggcggaagc 2041 gttccgccgg gccggatgcg aagtaacgga ttccgaagac agcccggcgg atatttacgt 2101 ggtaaacacc tgcagcgtaa cgcggctggc cgatcgcaag tcccggcagt acatgcggcg 2161 ggtcaaacgg gagaatcccg gcgcgctcgt catcgtcatg ggatgctatc cccagacgaa 2221 tcccaaggaa gtgggggcga tcgaagaggc cgacttcatc ctcggcacga cggagaagat 2281 gcgggcggtg gagctggcgg aagaatggtt ctcctgtgac ccttccagcc gcctccggca 2341 caatttcgtc gaagatcccg tcgtgcatca gaccgcatac gagcagcacg agggcattac 2401 cggcatggag accaagacgc gcgctctcat caagatccag gagggctgca accggttctg 2461 ctcctactgc gtcatccccc acgccagagg acaggtgcgc agccgcagcg ccgcagccat 2521 caaaaaagag gcgatggcgc tcgtttccgc aggttataag gaaattaccc ttacgggcat 2581 caatacggcg ctctacgggg cggaaaaggg ctttacagac gatctgaaca cggggctcga 2641 aggcgtggag atcatcgtaa aggcgctcaa cgacatcccc ggcgatttcc tcatccggct 2701 gggctccatg gagccgaccg tcatcgacgc ggactatata cagcggctgt tccgctacga 2761 aaaactggcg catcacgtgc atctgtccat ccagagcgga tccgatgccg tcatcgcggg 2821 gatgaaccgc cattataccg ccgcagacta tctggagatc gtccgccgct gccgtgcgtt 2881 cgatcctctg tacggtatta cgacggatat cataacgggt tttcccgggg agacggaagc 2941 cgatctcgaa gccagcaagg agatcgtaag acaggtggcg tacctgcacg tgcactgttt 3001 cccctacagc cgcaggatgt atacgccggc ggcggacatg cccggacaga tcgctccgcc 3061 tgtcaaaaaa cagcgcaaca aagaactcat cgccgttgcc gaagaggtct cgaaacagtt 3121 ccgttcttcc atgatcggct ccgtgcagcg ggtgctggcg gaggagatcg aagaaacgga 3181 gcagggcagg ctctggaagg gtcactgcag caattactgc gtcgtctact tccgtgaccc 3241 cgccatgaac gatccgtccc gcgccgcttc tctggagaac cagtggatcg gcgttaaggt 3301 ggagtccgtt tacagagacg gcgttttggg aaatatggta taataacttg tttaagaaag 3361 gaggagaccc tatgtccgat tgcttattct gcaagatcgt tgcgggagag atcccatcca 3421 ataaggtcta tg // LOCUS sequence094 3395 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence094 VERSION sequence094 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3395 /mol_type="genomic DNA" /organism="" /note="sequence094" CDS 641..1408 /product="30S ribosomal protein S2" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003424537.1" /transl_table=11 /codon_start=1 /translation="MSVVSMKQLLEAGVHFGHQTRRWNPKMAPYIFTERNGIYIIDLSK TVHKMDDAYEFVKSVAAEGKPVLFVGTKKQAQAAIKDEAERCGMFYVNERWLGGMLTNY KTISTRIKRLAEIKEMEANGTFDLLSKKEVQTLRKEMEKLEKYLNGIKDMKGMPGAMFV VDPKKEKIAVKEARVLGIPIVGMCDTNCDPDDVDYVIPANDDAIRAVKLIAGKMAEAVI EGKQGESFADAPAEEAAPAEETPAEAEEAKVEE" /locus_tag="LOCUS_3480" /gene="rpsB" /note="WP_003424537.1 30S ribosomal protein S2 (Clostridioides) [pid:74.9%, q_cov:89.0%, s_cov:95.8%, Eval:7.2e-97]" /note="MGA_479" CDS 1425..2366 /product="translation elongation factor Ts" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003424535.1" /transl_table=11 /codon_start=1 /translation="MAAVTAALVKELREMTGAGMMDCKKALVATEGDIDKAVDYLRENG LAKAAKKAGRIASEGLVRMAFAADGSAAAAVEVNSETDFVAKNEEFIEFVEKLADISLN AEKVCAECIKDMPYGEEGTVGEVLVAKIAKIGENMNIRRCVKCNTPGVKYVGYSHGGGR IGVIIGLKTDASVEEVTTCGKDVAMQAASMRPQFVDEASVDPEYLAHEKEVILAQAINE NNELPENKRKPHEIIEKMITGRVKKSLKEVCLVDQAFVKDSNMTVAEYVASCAKALGKD IKVVEMVRYEVGEGLAKKEENFAEEVAKQIRG" /locus_tag="LOCUS_3490" /gene="tsf" /note="WP_003424535.1 translation elongation factor Ts (Clostridioides) [pid:54.5%, q_cov:99.7%, s_cov:100.0%, Eval:1.2e-86]" /note="MGA_480" CDS 2531..2917 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNDKERLLQAAFDMALQTKVVKENQTDNADPDIKAAMIDYILTAA VGLNSDQITEFIADQTAMEDKYLKASFEQAAAEIKDIEEMGEIRSHIQDEMEQYFRERQ ANIRKRRIELYIQDQVEAKRNETK" /locus_tag="LOCUS_3500" /note="MGA_481" ORIGIN 1 gcagtcgacg atcgggaaac tgaaggcgga cgtggcggag gcgcgggtga aaaacatcaa 61 cccggacgtg cagctgcgca agtttgcgct gcgcatcgac gaaacgacca tagcggatct 121 ggatatcccg tcctgggact atatcgcgga ctgcatcgac gatgtggatg cgaaagttct 181 cctgatcaaa aaggcgcggg atgcgggcgt tcccatcctg tgttccatgg gaacggggaa 241 caagctcgat gcctctgcat ttaaggtgac caacatcaaa aagactgaac aggacaggct 301 tgccaaggtc atgcggaaac gcctgcggga cgagggaatc gatgaagggg tcaccgtcgt 361 gtattcgccc gagccgcccg taacagagat ccatgatggg gtcatcccca gcatctcttt 421 tatgccggcg acggcaggtc tgcggatagc gggggagatc attcaaaacc ttataaaata 481 acgcttgcaa ggagtgcagc acctgtgtat aatatttgag gttgcgctcc tttttgcgtg 541 acagtatttt atttcgcaca cctgaaggcc tgcatttcgg tgcccgcaag ggttttctgc 601 aggaacaaac aggtggaagt tttaaccggg aggtaaacaa atgtcagtag tttctatgaa 661 acagttgctg gaagccggtg ttcatttcgg acatcagacc agaagatgga accccaagat 721 ggctccgtac atcttcaccg aaagaaacgg catctacatc atcgacctgt ccaagacagt 781 tcacaagatg gacgacgctt atgaattcgt taagagcgtt gcagcagaag gcaagcccgt 841 tctcttcgta ggtacgaaga agcaggcgca ggccgcgatc aaggacgaag ccgaaagatg 901 cggcatgttc tacgtaaacg agagatggct gggcggcatg ctcaccaact acaagaccat 961 ctccaccaga atcaagagac tggccgagat caaggaaatg gaagccaacg gcaccttcga 1021 tctcctctcc aagaaggaag tccagaccct gcgcaaggaa atggaaaagc tggagaagta 1081 tctcaacggc atcaaggata tgaagggtat gcccggcgcc atgttcgtcg tagaccccaa 1141 gaaggaaaag atcgccgtta aggaagccag agttctgggc attcccatcg tcggtatgtg 1201 cgataccaac tgcgacccgg acgacgtgga ttacgttatc cccgctaacg acgacgctat 1261 ccgtgcggtc aagctgatcg ccggcaagat ggcagaagcc gttatcgaag gcaagcaggg 1321 cgaatccttc gcagacgctc ccgctgagga agcagctccc gccgaagaga cccccgcaga 1381 agcagaagaa gctaaagtcg aagagtaatt aaaggagaaa tacaatggca gcagttacag 1441 cagcactcgt aaaagaactc cgtgaaatga ccggcgccgg catgatggac tgcaagaagg 1501 ccctcgttgc taccgaaggc gacatcgata aggcagtcga ctatctgaga gaaaacggac 1561 tcgcgaaggc agccaagaag gccggccgta tcgcttccga aggcctcgta agaatggcgt 1621 tcgcagcaga cggctccgca gccgcagctg tcgaggtcaa ctccgagacc gacttcgtcg 1681 caaagaacga agaattcatc gaattcgtcg aaaagctggc cgatatctct ctgaacgcag 1741 aaaaggtctg cgcagagtgc atcaaggata tgccctacgg cgaagaaggc actgtcggtg 1801 aagtcctcgt cgctaagatc gcaaagatcg gcgaaaacat gaacatccgc agatgcgtca 1861 agtgcaatac gcctggcgtc aagtacgtcg gttattccca cggcggcggc cgtatcggcg 1921 tcatcatcgg tctgaagacc gacgcttccg tcgaggaagt caccacctgc ggcaaggacg 1981 tagccatgca ggctgcttcc atgagacccc agttcgtgga cgaagcaagc gtcgatcccg 2041 aatatctggc tcacgaaaag gaagtcatcc tggctcaggc catcaacgag aacaacgaac 2101 tgcccgagaa caagagaaag cctcatgaga tcatcgagaa gatgatcacc ggccgtgtaa 2161 agaagtccct gaaggaagtc tgcctcgtag atcaggcctt cgtaaaggat tccaacatga 2221 ccgtggccga atatgtcgct tcctgcgcca aggctctcgg caaggacatc aaggtcgtcg 2281 agatggtccg ctacgaagta ggcgaaggcc ttgcgaagaa ggaagagaac ttcgcagagg 2341 aagtcgccaa gcagatccgc ggctaatcag caatactgat cgaaacctca aactcccggc 2401 ttactgccgg gagtttttgc atccttttgg ataaatttta cgcagccctg ttctttttgc 2461 tgaaaaatgg tatataatag cagtacagaa agatgagcgc tgctcatgat cttaaaggaa 2521 ggaacataaa atgaacgata aggaaagact gttgcaggcc gcattcgaca tggcgctgca 2581 gacgaaagta gtcaaagaaa accagaccga taatgcagac cccgatatca aggccgcgat 2641 gatcgattat atcctcaccg cagcggtggg tctcaacagt gaccagatca cggaatttat 2701 cgcagatcag accgcgatgg aagataagta tctgaaggca tccttcgaac aggctgccgc 2761 cgagatcaag gacatcgaag agatgggcga gatccgcagc cacatccagg acgagatgga 2821 gcagtacttc agagaaagac aggccaacat ccgtaagaga agaatcgaac tctacatcca 2881 ggatcaggtc gaagccaaga gaaacgaaac caaataaacc gcaaacagag ctcccggctg 2941 tatgccggga gtttttttat ggtatactga agccatggat acgaaacagg aaaaactcag 3001 aaatctgccc aaggcagatg tcatcatgga tttacccgtc ctgcaaccgt ttctcgcgtc 3061 tgcgggccgg aaaacggcct tagaagcggt gcggaaagcc gtggatgaga tgcgtcagga 3121 tatcctatcc ggcgatgacc cggacatccg cccggaagcg gcggcggccc gcgcctgccg 3181 cattctcgaa aaggaggaca gaccctccct gcgtcccgtc atcaacgcaa cgggcatcat 3241 tctgcacacg aatctgggcc gtgccaggct caactcccag gcggcggaaa aagcggcgca 3301 gatcgcctgc agctactcga cgctggagta cgatccggaa aagggcgtgc ggggcagccg 3361 ccacgaccac gtgggaaagc ttctcgcgca ggtga // LOCUS sequence095 3363 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence095 VERSION sequence095 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3363 /mol_type="genomic DNA" /organism="" /note="sequence095" CDS 443..1564 /product="stage V sporulation protein E" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003426995.1" /transl_table=11 /codon_start=1 /translation="MKTLTGTKKQRPEGDFLMAALVLALSLFGVVMVFSASYYTSLSKF GNAYEYLKQDALWMAVGWVAFIFFAKLDYHFLKLLAWPALGVGIVLLALLFTPLGVTLN NATRWLDFGFATVMPGEIIKFALIIWIATFLGDDPEKIKRVKDGLVPIVAVLAVVLVLI VKQPNMSTAGIIGILVIGMMFVAGLRLYLLVGLGGLGVAGFVGFILSPKGAYMLQRVHT FFDPFEDELGSGYQVVQSLLALGSGGVTGVGLGRSIQKALYLPEPMNDFITAIIGEELG FVGLIVMLLAFLLLIWRCCRIALRAKDYYGMLLASGISILLGTQVILNVAVISASFFPT GVVLPFITLGGNATLIFLSLMGILFNISKNPAE" /locus_tag="LOCUS_3510" /gene="spoVE" /note="WP_003426995.1 stage V sporulation protein E (Clostridioides difficile) [pid:39.2%, q_cov:97.1%, s_cov:95.7%, Eval:1.4e-71]" /note="MGA_484" CDS 1576..2676 /product="undecaprenyldiphospho-muramoylpentapeptide beta-N-acetylglucosaminyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009893705.1" /transl_table=11 /codon_start=1 /translation="MKAILSCAGTGGHIYPAIAIADKIRRMEPDSQILFIGTKTGMENR LVPAAGYEIRGIDASGFNRKNLLKNFKTAVDLARGGHETDAILAEFQPDVVIGTGGYVT GTVVRKAAKKGIPCYIHEQNVVPGMANKMLEKYVKKVFISFEGSRDHFQEPDKLVLTGN PIRKEFLIEDVSDARRQLGLTDSDFMILITGGSLGAEVPNMASLDLIAELAKDTKGAKV FFVTGKRYYEEIAAKVKEIAGAEEFVRVIDYADNMPVLMSASDLIVSRAGAIALSEITA SGKPSILIPSPNVTNNHQYYNAKSVADEGAAVLIEESSLQEGFAPFTAAVMQLLASRDR LNRMAEKAAAIGKTDAVDIIYKNIKM" /locus_tag="LOCUS_3520" /gene="murG" /EC_number="2.4.1.227" /note="WP_009893705.1 undecaprenyldiphospho-muramoylpentapeptide beta-N-acetylglucosaminyltransferase (Clostridioides difficile) [pid:42.9%, q_cov:99.5%, s_cov:88.5%, Eval:3.2e-76]" /note="MGA_485" ORIGIN 1 gggcgtcgaa caccgcatcg aattcgtgaa ggaagtgaag ggcgtgcgct acgtaaacga 61 ctcgaagggc acgaatccgg acgcttccat caaggccatc gaagccacga acaccccgat 121 cctgctgatc gcggggggct acgagaagaa ctccgacttt acggacttca tcaacggttt 181 taatggtaag gtaaaatatc tgctgctgct ggggcagacg gcgcaccgct ttgcggacac 241 cgccagaaaa tgcggcttcc cggaagaccg catgatcttc tgcgacagta tgaaagacgt 301 aatttcccac gcctacagcc tggcagaagt aggagatact gtcctccttt ctcctgcttc 361 tgccagctgg ggcatgtata acaacttcga ggagaggggc gaggacttta aaaacctggt 421 ccgcgcttta ccggaataag atttgaagac gttaacagga acgaaaaaac aaagaccgga 481 aggggatttc ctgatggcag cgctggtatt ggcgctgtct ctgttcggcg tggtcatggt 541 gttctccgcc agctactaca cgtccctcag caagttcggc aacgcctacg agtacctgaa 601 acaggacgcg ctgtggatgg ccgtcggctg ggtggcgttc atctttttcg ccaagctgga 661 ctaccacttc ctgaagctcc tggcctggcc cgctctgggc gtaggcatcg ttttgcttgc 721 ccttttgttt acgcctctcg gcgtgaccct caacaacgcc acccgctggc tcgactttgg 781 tttcgcgacg gtgatgccgg gggagatcat caaattcgcc ctcatcatct ggatcgccac 841 tttcctgggg gatgacccgg agaagatcaa acgggtgaag gacggccttg ttcctatcgt 901 tgccgtgctt gccgttgtcc tcgtcctgat cgtaaagcag cccaacatgt ccacggccgg 961 catcatcggt atcctggtca tcggcatgat gttcgtagct ggacttcgcc tgtacctgct 1021 cgtgggcctc ggcggcctgg gcgtcgcggg attcgtgggg ttcatcctca gcccgaaggg 1081 cgcctacatg ctgcagcgcg tgcacacttt cttcgatccc ttcgaagacg agctggggtc 1141 ggggtatcag gtcgtgcagt ctctgctggc tctcggaagc ggcggcgtga ccggcgtagg 1201 cctcggacgc agcatccaga aggcactgta tctgcccgaa cccatgaacg actttattac 1261 cgcgatcatc ggcgaggagc tcgggtttgt cgggctcatc gttatgctgc tcgccttcct 1321 gctgctgatc tggcgctgct gccgcatcgc gctgcgggca aaggactact acggcatgct 1381 gctcgcgtcc ggcatctcca tcctgctggg cacccaggtg atcctgaacg tggcggtcat 1441 ctccgccagt ttcttcccga cgggcgtcgt gcttccgttt attacgctgg gcggcaacgc 1501 caccctcatc ttcctgtctc tgatggggat ccttttcaat atctccaaga atcctgccga 1561 ataaggagta tttttatgaa agccatctta agctgcgccg gtacgggcgg ccacatttat 1621 cctgccatcg ctatcgcgga taagatccgc cgcatggaac cggattctca gatcctgttt 1681 atcggtacga agaccggcat ggagaaccgt ctggtgccgg ctgcgggata tgagatccgc 1741 ggcatcgatg ccagcggctt taaccgcaaa aacctgctga agaacttcaa gaccgccgtg 1801 gatctggcga gaggcggcca cgagaccgat gcgatcctgg cggaatttca gcccgatgtg 1861 gtgatcggca ccggcggcta cgtgaccggg acggtcgtgc gcaaggctgc gaagaagggg 1921 attccgtgct acatccacga acagaacgtg gtgccgggca tggccaacaa gatgttggag 1981 aaatacgtta agaaggtctt tatctccttc gaagggtcgc gcgaccactt ccaggagccg 2041 gacaaactgg tgctgacggg caaccccatc cgcaaggaat ttttgatcga agacgtgtcc 2101 gacgcgcggc ggcagctagg ccttacggac agcgatttta tgatcctgat caccggcggc 2161 agcctggggg cggaagtgcc caacatggcc agcctggacc tgatcgcgga actggcgaag 2221 gatacgaagg gggcgaaggt cttcttcgtg accggcaaga gatattatga agagatcgcc 2281 gcgaaggtga aggagatcgc cggagcggag gagtttgtgc gggtcatcga ttacgccgac 2341 aacatgccgg tgctgatgag tgcctccgac ctgatcgtga gccgggcagg ggccatcgcc 2401 ctgtcggaga tcacggccag cggcaagcct tccatcctga tcccgtcccc caacgtgacg 2461 aacaatcacc agtattacaa cgccaagtcc gtggcggacg agggcgctgc ggtgctgatc 2521 gaagaatcct ctctgcagga gggattcgcc ccctttacgg cggccgtgat gcagctgctc 2581 gcttcccgtg acaggctcaa ccgcatggcg gagaaggccg cggccatcgg aaagaccgac 2641 gcggttgaca ttatctacaa aaacattaaa atgtaaagga tggacgatta ttcacaggac 2701 tatcctgcgg agtatccgca ggaggaacac gtttataccg gtgaggaact gtccggctac 2761 gaggactatg ccccggaaca gccgaagcat cccgccaaga aaaagaagaa gaggagaaga 2821 aaacactact tcctccgctt ttgtattttt tgcgccttgg tgttcggcct gtatgcgttc 2881 ctgaattccg actttttcgc ggtccgcaat ttcgaggtga ccggcaacca gtactacacg 2941 ccggcgcaga tcatcgagat gtccgggctg cagagcgggg tcaacctgtt cttcgagacc 3001 aagacccgcc ccgcgagaaa cgcgctgctg gaagatccct acatccgcct ggcggagatc 3061 aagcgcaagc ccaaggatac gatccagatc aacatcgagg agcgccggga atacgccggc 3121 gtgccctacg gcgaccagta cgtgctgatc gaccgggagg ggacggtgct gcgggtcgcg 3181 gacgccgagc ccacgctgcc gatcctgggc aacatgacca ttacggagat gaccccgggc 3241 agcgcactgc aggtggagca ggcctacctg ctgacggata ccctcagtct gctgcagctg 3301 gtggaggaga acgacatcta ctttaagcgc atcgactttt ccaccgttat cgtgcgcgcc 3361 tac // LOCUS sequence096 3358 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence096 VERSION sequence096 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3358 /mol_type="genomic DNA" /organism="" /note="sequence096" misc_feature <1..1069 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011860656.1:M20 family metallopeptidase" /note="WP_011860656.1 M20 family metallopeptidase (Clostridioides difficile) [pid:39.6%, q_cov:88.7%, s_cov:77.6%, Eval:6.0e-64]" /note="MGA_487" /locus_tag="LOCUS_3530" CDS 1122..2219 /product="alanine racemase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_071542276.1" /transl_table=11 /codon_start=1 /translation="MEALRDTIVTVDLGRIGRNMDKIRNMVGPDVAVMPVIKANGYGCG AVGIAPTLMEHGAAYLAVATLTEAIELRTAYPDYPVFILGHTPARFLEHVVDGRFTQTV IDYDHAKALSDVALAKGTKATVHLKMDTGFHRLGTSDKEELLKMAKLPGLNVEGIFSHL ALAGEKEDWDQYNMLCDAIDYLEANGCTFKYKHIADSISLGDYPEFRMNMVRPGALVFG LTSFSRAHLDVEQCMGMQTRISQIHEIKAGEGVSYDYLWKAQRDSHIATVPVGYADGYP RNMRDKGYLTVHGVKCPTVGVLCMDQLMIDVTDCPEAKEGDAAIIYGDGSGNTMSIPEA ASLAGTNKNEIIARILSRPPRVYVK" /locus_tag="LOCUS_3540" /gene="alr" /EC_number="5.1.1.1" /note="WP_071542276.1 alanine racemase (Moorella thermoacetica) [pid:38.0%, q_cov:97.0%, s_cov:97.3%, Eval:7.3e-65]" /note="MGA_488" ORIGIN 1 ggagaaactg ggtgtggctt accgggtcac gccggagaaa gcagtggtgg gcaccgtgcc 61 cggcaaaggc cccgcgcctt ccggaaaata tacgggcctg ggtatccggg cggatttcga 121 cgcgcttccc atcacggagg agagcagcgt cacctgggcc agccaaaatc ccggcgtgat 181 gcacgcctgc ggccacgaca tgcatacagc catgctgctg ggcaccgcga tggtgttgca 241 gagcatgccc gaagccttcg gcggaaacgt taagctgctg ttccagccca acgaagaggc 301 ggaaggcggc gcggaaaata tgatcaaggc cggctgcatg gaggatccgg cggtggatgc 361 ggtcatcgca ttccatatcg aaccgggcat tcccagcggc tatatccagc tgtgccccgg 421 taagatgaac gccgccacct gcgacgtgca catcaccgtg gagggcgtcg cctgccacgg 481 cgctcacccc gaccgcggca tcgatgcgat cctggcagcc agccagatcg tcacggcact 541 gcaggcggtc gtcgccagaa atcttgcgcc gacgcagccc ggtgtcgtca ccatcggtca 601 gttccacgcc ggcaacgcca gtaatgtggt ggcaggtacg gctgaactct ccggcaccct 661 gcgggcgctg gacatgaaga ccatggcgca gatcaagtcg ctggtcaagc agacggctga 721 aggcattgca gcaggcttcg gcgccaaatc catcgtgacc ctcacagacg gctatcccag 781 cctggagaac aatatcgaac tcggcaaaac gctggagcag ctggcggtcg agctggtggg 841 caaagaccag atcgactata tggaggcgcc cagcctcggc gcggacgact tcgcgttctt 901 tacccagtac tgcgacggcg tctacatgaa cgtcggcacg acgcccaagg actggagcgg 961 caagccccag gcgctgcaca gcgagttcct gtgcccggac gaagaagcta tgaaaacagg 1021 catcctgatg gaggccatgg cggcgctccg gctgctcgga aacctttaaa ttgcaagccc 1081 ttaggccatt acacaaaaac gacacaaacg ggagttataa tatggaagca ttaagagata 1141 cgatcgtaac ggtcgatctg ggacggatcg gccgcaatat ggataagatc cggaatatgg 1201 ttggaccgga cgtggccgtt atgcccgtca tcaaggccaa cggttacggc tgcggcgcgg 1261 tgggcatcgc acccacgctc atggaacacg gcgccgctta tctggcggtg gcgaccctca 1321 cggaagccat cgaactgaga accgcctacc cggactatcc tgtttttatt ttgggtcaca 1381 cgcctgcgcg gttcctcgaa cacgtggtgg acggccgctt tacgcagacc gttatcgatt 1441 atgaccacgc caaggcgctg tcggatgttg cgctcgccaa gggaacaaag gcgacggtcc 1501 atctgaagat ggatacgggc ttccaccgtc tgggtacctc cgataaagaa gaactgctga 1561 agatggcgaa gctgccgggc ctcaatgtgg aaggcatctt ctcgcacctg gcgctggccg 1621 gagagaagga agactgggac cagtataaca tgctctgcga cgccatcgac tatctggaag 1681 cgaacggctg tacctttaag tacaagcaca tcgcggacag tatctccctc ggcgactatc 1741 ccgaattccg catgaacatg gtgcgccccg gcgccctggt gttcggcctc acgagctttt 1801 cccgggctca cctggacgtg gaacagtgca tgggcatgca gacccgcatc tcccagatcc 1861 acgagatcaa agcgggggag ggcgtgtcct acgactatct gtggaaagcc cagcgggatt 1921 cccacatcgc aacggtgccc gtgggctatg ccgacggcta tccccggaac atgcgcgata 1981 aaggctattt aacggtgcat ggggtcaaat gccccacggt cggcgtcctg tgcatggatc 2041 agctgatgat cgacgtcacc gattgcccag aggcaaagga aggggacgcg gccatcatct 2101 acggggacgg ctccggcaac accatgagca ttcccgaggc tgcaagcctg gccggcacca 2161 ataaaaacga gatcatcgca cgcatcctga gcagaccgcc cagagtatac gtgaaatgaa 2221 atagataaca aattgcaaag gagatgaaga tgcgaagagg aaagagaact cttattttca 2281 tctgtacctt cgccatgctg ctcgcatccg ccggcatggc gtacgcggac gaatccggcg 2341 ctgcccccgc actcgacgag gccggcagta tggagaactt cgtccgcagc ctggtctacg 2401 aagaccagtt cgccgatgtg gcggatacag cctggtacag ccagcacgta aaagacgctt 2461 atgaatacgg gttcgtgtcc ggaaattctg aaacaacata taacccggac agcgagatca 2521 cggtggcgga agcgatcgtc atcgcctgcc agctccacag catctactac gacgaggcgt 2581 tcgaccgcta cgacgtagag gagggtgacc cctggtatca gccttatgtg gactatgcca 2641 tcgaacacgg catcatctgg gcaaactatc cctatgctct tacggcaaag gccacccgct 2701 ccatctttgc cgggatcatg gccaacgcct tgcccgacga cgaactggat gccatcggta 2761 cggtcacgaa catccccgat gtgaccgatc aggtccattt ctccgcttcg atctaccagc 2821 tgtacaacgc aggtgttctg agcggcaagg acgaatatgg atatttccac ccctacgaca 2881 ccatcaagcg cagcgaagtg gcggtggtgg tgctgaacct ggcggacgaa gcgagacgga 2941 aggctcccgt gctgaaggag atcccggaca tcaccctgta ctccgactac ggcacgagca 3001 ttacggtcaa gaaggatctg gccccgaact atcagaaact gggctggtcc acggctcccg 3061 tgtccgttcc tgcgggcagc aacgcagaga ctatcctcaa cgccgcgacc ctcactccca 3121 tgaagaccaa caacgcggag ctggacggca tcatcgacgg cattttcgcc cagatcatta 3181 cggacgacat gtccacctac cagaagacca aggccatcta cgactatctg atggataact 3241 gctactacgg caacggctgg gcttcctgga gcggcaagta cgtaaagcac gacgacgatt 3301 acgtggtcgt catgggcaag acgatcctca agacaggtca cggcacctgc gacaacta // LOCUS sequence097 3356 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence097 VERSION sequence097 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3356 /mol_type="genomic DNA" /organism="" /note="sequence097" CDS complement(668..1588) /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011016361.1" /transl_table=11 /codon_start=1 /translation="MVKYIVNRVLVTIPIIIAIILIVFLLLQVLPGNPIQVMMKEKVNQ QVIDRVTEQMGLNDPLMIRFGRYLWNMLHGDLGQSYKLKRPVTQLIMTAFPNTVKLAIT SALVAWIIGIPTGIISAIKKDSLLDRILMGFSLVGISLPVFWAAMLLQYFLGFKLKLLP ISGYSTIRHMIMPAIVLGWASSGSIARLTRSSLLGVMKNDYIRTARSKGLVESAVVIRH GLKNSMIPVVTMMAMQFASLLSGAVITESVFGIGGIGQLMVSAISQRDMPLLQSSVIFS TMIIIVGNLVADILYSFLDPKIRTQ" /locus_tag="LOCUS_3550" /note="WP_011016361.1 ABC transporter permease (Fusobacterium nucleatum) [pid:42.5%, q_cov:100.0%, s_cov:99.4%, Eval:1.8e-71]" /note="MGA_491" misc_feature complement(1692..>3356) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012868765.1:ABC transporter substrate-binding protein" /note="WP_012868765.1 ABC transporter substrate-binding protein (Thermanaerovibrio acidaminovorans) [pid:30.0%, q_cov:88.1%, s_cov:89.5%, Eval:2.1e-51]" /note="MGA_492" /locus_tag="LOCUS_3560" ORIGIN 1 cttccacgta ttccttctct cttaaggaca gcacttcgga gcggacgact ctggcagtgc 61 cggcccagtt gacaaaactc agagccagga agatcgtcag gaagcccggt ccgatggtgt 121 aggaaacgac catcgccaga agcagcgagg ggaatgccat gcagatgtct gcaagacgca 181 tgatgatcat gtcgactttc ccgccgacga agcccgccgt gatgcccagg atggtgccca 241 gggtcatgga gaccagcgtc gggaaaaggc cgatcatcag ggagatgcgt ccgccgtaga 301 tcatgcggga caatacgtcg cggcccagct tatcgcagcc cagcagatgc tctgcggagg 361 gctttgcgag accctgcgaa agatcctgcg ccaaaggatc gtagggagcg aacagcggag 421 cgccgacgca caccacgata tacaggatga tgacgatcag ggagatgagg gccaccttat 481 tatgcttgaa gatgctccag aactgctccc agagggtctg gttcggagcg atctccgcct 541 ccgcggattc ctctacgtgg acaggcgtaa ggccgtcctc agggatccat gcggttcctt 601 ccgccggagc cggattcgtc gtgaccgcag cagcggccag tttcttttta ccgaacatag 661 gcacctccta ctgcgtacgg atcttcggat ccaggaagga atacaggata tccgccacca 721 ggttgcccac gatgatgatc atcgtggaaa agatgacgga gctttgcagc agcggcatgt 781 ctctttggga gatggcgctt accatcagct ggccgatacc gccgatgccg aatacggatt 841 cggtgatgac ggcgccggac agaaggctgg caaactgcat ggccatcatg gtgaccaccg 901 ggatcatgga gttctttaag ccgtggcgga taacgaccgc gctctccaca aggcccttgg 961 accgtgcggt gcggatgtag tcgttcttca tgacgccgag caggctggaa cgggtgagac 1021 gggcgatgga gccggaagaa gcccagccca gaacgatggc cggcatgatc atgtggcgta 1081 tggtggaata gcccgagatc ggcagcaatt tcagtttaaa tcccaggaag tactgcagca 1141 gcatcgccgc ccagaagacc ggcagagaga tgccgaccag agagaatccc atcaggatgc 1201 ggtccagcag ggagtctttt ttaatggcag agatgatgcc ggtcggtatg cctatgatcc 1261 aggctaccaa cgcggacgtg atcgccagct taacagtatt cgggaatgct gtcatgatca 1321 gctgggtgac gggccgtttc aacttgtatg attgccccag gtctccgtga agcatattcc 1381 acaggtatcg cccgaatcgt atcatcagcg ggtcattcag gcccatttgc tcggttactc 1441 tgtcgattac ttgctgattt actttttctt tcatcatgac ctggatcgga ttgcccggaa 1501 gcacctgcag gagcaggaac acgatcagga tgatggcgat aatgatggga atcgtcacga 1561 ggacacggtt aacgatatat ttaaccattc ctctaaatcc tttttaacca taatggggag 1621 tgcccccgaa gaggcggcac tccccaaaat tttaagagtc gtttgtttca gtttccgtta 1681 cggaaccgca attagttttc cagataggtc tcgtagtaac cgcagtcacc gtagccggcc 1741 cacatgggaa cgaagccctt tacacgatcc tgcaggactc tgaccttctg cttgtgccac 1801 agaacgatca tggctgcatc gtcgcgggtg atcagcttat ccagagctgc gtattcagct 1861 tctctggctt ccggatcggt catgtgtctg gcagcttcga gtcttgcgat agcatcggtg 1921 ttgtagtagt tccaggatct tctcacgttg gaggaagaac catacatctg atacaggaag 1981 ttatcggggt cgttgaagtc agcagtccag gacgttctgt acatcgggga accgccggtc 2041 gctctcagat cgtaccagga agcggaatcc atctgcttga tggtgcagcg gacgccgatc 2101 gcttcgaagt aggactggat cgcttcgttg acttcgatat cgctctggct ggagtcggtg 2161 gtctgaacga tctcaagatc gaaaccgtct tcataaccgg cttccttcag cagctctctg 2221 gcctggtcgg gatcataggg gatcgcacca atctcggggt catagcccgg gacgccggga 2281 gcgaggaagg tacctgcggg agtcgcagcg ccgtagtact gggtgtcgat cagggtctgt 2341 ctgtcgatcg ccagctgcag agcctttctg actctgacgt cgttgagggg ctcgatggac 2401 tcgttgatgt gcaggtagct ggtgcccaga acggtcttga tgttgatgtt gtccgcataa 2461 gcggggtcgt ctctgtagac ggggatctgg tcgagcgcgt ggtccatatc gaagatatcg 2521 atctggccgg cgtcgaacag catcttttca gtctgtgcat cggggatgat gcggatgagg 2581 ataccatcca tcttgttggc gcctctccag taatccgggt tggtcttcag gaagacgtgg 2641 tcgttcagga cccattcgga gagttcgaac ggaccggagc cgcagaagta ctcgggatcg 2701 gagccgtaca gggaggtcat cgggccgccg ccggcttcgt cagctgcttc gcccgcttct 2761 ctgttgcaca gagaccatgc gggggtagac aggcaagcca ggaacggggc ataggcagac 2821 tcgaggacga tgtccacgtc gtagtcgccg ttgatgatga tgccggtgcc ttcgaccgtg 2881 tcgatcttgc cgtccagcat atcctgagcg cccttgatca tatccatcca ggaggtgtta 2941 acagcagctc tttccggctg cagcatgcgg tcgacggtgt acagaacgtc gtcggcagtc 3001 agcatctcac cgttgtggaa cttgacgtcg tctctcagat ggaagctgta ggtgagaccg 3061 tcatcgctga cttcccagct ttcagcaacg ctgggaacgg taacgttttc accggcttca 3121 ttcgtctcgg tgcggaccaa ggtgtccatg cagttcatca tcaggatgta gtctgcggtg 3181 gtgcaggccg ggtctgcgga ttcgggctct gcctgatagg tgattctcag gacgttttcg 3241 gggaatccgt cttcgtaaac aacagcagag gtttcgcctt cgccgccttc agcaggctcg 3301 gcaggttccg tctctccgcc gccgctggtg caagccgcca tagaaaatac catggc // LOCUS sequence098 3352 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence098 VERSION sequence098 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3352 /mol_type="genomic DNA" /organism="" /note="sequence098" misc_feature <1..919 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003723559.1:alpha/beta hydrolase" /note="WP_003723559.1 alpha/beta hydrolase (Listeria) [pid:40.3%, q_cov:88.2%, s_cov:86.9%, Eval:4.8e-48]" /note="MGA_493" /locus_tag="LOCUS_3570" CDS 929..1591 /product="uracil-DNA glycosylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003416528.1" /transl_table=11 /codon_start=1 /translation="MVHIGNSWDEKLKSEFEKEYYLKLREFLKQEYSTRVIYPDMHDIF NALKATAYEDVKVVILGQDPYHEPGQAHGMCFSVKPGVPVPPSLQNMYKEIAAEYPGWP IPQDGYLQKWADQGVLLLNAVLTVREHAANSHRGKGWEILTDRVIELLNEREDPVVFLL WGRNAREKKALITNPKHVVMEAAHPSPLSAYNGFFGCGHFRAANDKLREFGKTPIRW" /locus_tag="LOCUS_3580" /EC_number="3.2.2.27" /note="WP_003416528.1 uracil-DNA glycosylase (Clostridioides difficile) [pid:63.6%, q_cov:100.0%, s_cov:97.8%, Eval:1.3e-80]" /note="MGA_494" ORIGIN 1 cctgcagatc atccacggca tgagcgaata cgtcggccgt tatggcagtt ttgcgcagtg 61 gctcgcggag cagggcatcc tagtcgtcgg cgacgaccat atcggccacg gtacgtccgc 121 ggatcctgcc gattacggct atttcggcca caccgacggc tggaagcacc tggtggacga 181 cgaggaaaag ctcagaaaca tcatgcgccg cgactatccg aacacaccct acgtcattct 241 gggtcacagc atgggttcct ttatcctgcg ggcctggctc gccatgtacg cgaaggctgc 301 ggatgtggac ggctgcatca tcatgggcac ctgcggcacc aacaaggcgc tgggcgcagg 361 cgctgccctt acgacgctgc tgctgggcct gaagggcgaa aagaagacca gcaacctcat 421 cacgggtctc gccatgggac cctacgcaaa gcctttcgct tccgaaaaga gccccgtcgc 481 ctggctgtcc cgcgacaagg aactgtacca ggcctacgaa aaagatccca tgtgcggctt 541 cccctttaag ctgggcggct acatggatct gttcgcgctc atccgctaca ttacggcgga 601 cagttggtac gaaaaggtcc ccaagaatct cacgatgctc atcacgtccg gttcgaacga 661 ccccgtgggc gatatgggca agggcccggc ggagacctac gacaagctgc aggctgcggg 721 ctgcaaagac gtcaacctgc tgctgtacga agacatgcgg cacgagatcc tcaacgagat 781 cggcaaagag aaagtctggg aggatatgag agacttcgtc ctggatatgg cggaggaaca 841 cggactgccg caggacaaac gcggcgtgcc cgacgcgccg gagacggtca cttccttcac 901 ggaaggcggc gcctggtagg agagatccat ggtccatatc ggcaattcct gggacgaaaa 961 actgaaaagt gagtttgaga aggagtatta tctcaaactg cgggaattcc tcaagcagga 1021 gtattccacc cgggtcatct atccggacat gcacgacatc tttaacgccc tgaaggcgac 1081 cgcttacgag gatgtaaagg tcgtcatcct gggtcaggat ccgtatcatg aaccgggtca 1141 ggcgcacggc atgtgctttt ccgtaaagcc tggtgtgccc gtgcctcctt cgctgcagaa 1201 catgtacaag gagatcgcgg cggaatatcc cggctggccc atcccccagg acggctatct 1261 gcagaagtgg gcggatcagg gggtgctgct gctcaacgcg gtgctcaccg tgcgggagca 1321 tgcggcgaat tcccaccggg gcaagggctg ggagatcctc acggaccggg tcatcgaact 1381 gctgaacgaa cgggaagacc ctgtcgtctt cctgctctgg gggcgcaatg ccagagagaa 1441 gaaggcgctg atcacgaacc caaagcacgt ggtgatggag gcggctcacc ccagtccgct 1501 gtctgcctat aacgggttct tcgggtgcgg ccacttccgc gcggcgaacg acaaactgcg 1561 cgagttcgga aagacgccca tccggtggta ggagaaacag atgctgcgtt atgcaaaaga 1621 tcttaagaaa aaccgtacac taaggcacgt ttttgcgtgc cttttttgtt tgctgctcat 1681 cgccctgcag acggtgccgg cgctcgcggt cgactatacg acggagagct tccacacgac 1741 gctggacgtg aaagagaatt cctcgatgca tgtgacggag atcatcaccg tggattttga 1801 atccccggcc cacggcatct accgcgatat ctggacttac ggaaccgtct ggtttatgaa 1861 ggacgacgag ctggtctgga cggagatgct gtataagctg aagaacttcg agtgcgaagg 1921 cgaggagatc aaaaagagta cggatacgga ttacgtttcg atccggatcg gttctgccga 1981 taaaacggtc accggccggc acacgtacac gctggaatac gacgtgctca tgtacaaaga 2041 cgatctggac gacatggatc agctgtactg gaacatcatt cctatgtact gggagacgcc 2101 cgtagagaag gccagcttta cgatcaacat gccgaaggca ttcgacgaga gcaagctgga 2161 gatcattgca ggacccatcg gagacaacga tacgtcccgg tcggtctata cggtaaacgg 2221 cacgacggtc gagggacata tgaccggacc catcgattcc cgggaaggcg ttacagcccg 2281 catcgtgctg cccgaaggat actggagagg cgcgagaagc gatgcgccct gggtctatgg 2341 catcatggcg gcgatcggcg ccgcgacgtt tgccgtcgtt acgctgttcg tgcgctacgg 2401 caaagaccgc cggcctgtaa agaccgtgga attctatccg ccggacgaca tctcttccgc 2461 agaggcgggc tacctgtacg acaagaaact ccagagaaaa gatatggtat ccctggtgat 2521 gtggtttgct tcgaagggct atctgaagat ccacgcagtc gaaaacgacg atccgaaaga 2581 aaagcggaaa gtcccatata aaataacgct caccaagctg caggacatac cccacagcgc 2641 gccgcgctat caggagacgt tttttaacgg attgttcaaa ggcggcgaca aggtgcgtct 2701 ggaaaaaatg cccggttcgt tcgcgcgtgc gtattcgcgt gcggagagcg agctgcagga 2761 agtgtttaca gacgacagag actttatcga tcctgccagc aggaccgcga aaaataccgg 2821 ctgcctcctc ggcatccttg ttatcctcgc gacgatcatc ggcgctgccg cgtttacgat 2881 cacggaggat ctcatttcca gcctgctcgg ggagtgcacg ctctgtaccc tcatcatcct 2941 tgtctgcgtc aaattcatgc tgcggccttc ggattaccgc accggcatgc tgggacgcct 3001 gaagggattc cgcacgttca tcaaaagggc ggagctggac cgcatcaaac tgctggtgca 3061 cgacgatccg gagtatttct accggatcct gccctatgcc tatgtattcg gattgacgga 3121 ccgttgggcg aaaaactttg aagcgatcgt gcccgagatg ccggtttggt acgacggtcc 3181 ggcggatctt ttcgaaacgc cgcagacgtt ctgctcgaac tttgcccgtt ccgtcgatac 3241 aggcatctcg catgccatgc cgaaacccac gcattccagt ttctccggcg gaggtggcgg 3301 ccgcagcagt tcttccggcg gaggcggcgg atcatccggg ggcgggttct cc // LOCUS sequence099 3346 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence099 VERSION sequence099 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3346 /mol_type="genomic DNA" /organism="" /note="sequence099" misc_feature <1..1277 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_004399059.1:bis(5'-nucleosyl)-tetraphosphatase (symmetrical) YqeK" /note="WP_004399059.1 bis(5'-nucleosyl)-tetraphosphatase (symmetrical) YqeK (Bacillus) [pid:40.8%, q_cov:29.5%, s_cov:79.0%, Eval:5.0e-23, partial hit]" /note="MGA_496" /locus_tag="LOCUS_3590" ORIGIN 1 ccggagacca tcccttcttc ggcatcagcg acatcgaact gaagagggaa ggcccttcct 61 atacgtacga tacgctggca gcactgaagg agcgggatta tccggacgac gagctgttct 121 tcatcatggg aacggattcg ttctatcagc tggagcattg gcataaggca gaggagctca 181 ttgagaactt cggttttctc atcggcatgc gcaaaggcta cgacgaggac gaactgaaac 241 agaccatttc ccgcctgcag cagaagtatc cgctgcgggc ggagtacatc cgcatcccgg 301 agctggagat cagctctacg gacatcaagc agcgcatccg ggccggcaag tccgtgcgct 361 tcctgctgcc ggacgcctgc atctcctaca tccgggagca cgagctctat ctggatctcg 421 tcggcaaggt gagggaatac gcccgcaccc acgagaagac cagccggttt gctcacacct 481 gcggcgtcgt caagatggcg aagcaactgg cgcggcaata tggcgcagat cccgaaaaag 541 cggagatcgc ggcctggttc cacgacgtgc ggcggcctgc gggcaacctg gaacacggcc 601 ctgcggcggc ggacctgctg cagcagctgt acggggtcac cgacgaggat atcctgaatg 661 ccatccgctt ccataccacc ggccgccccg gcatgagcct gctggaaaag gtcatcaaga 721 tcgcggacca gctggaggaa ggaagggatt atccgggtgt ggagcacatg cggtccttta 781 cgaaactccc ggtggacgaa tgcgtctacc ggctgatgac ccacaccaga gaatacgtac 841 acagcatcgg cggcaccttc gacccgctgt ccgatgaagc catagagtgg ctgagaaaaa 901 gattgaacaa ggaggaaatc atggacaata aggaacttgc tctgctggcg gcgaagctgc 961 tggacagcaa gaaggccaaa gacatcagca ttatcgacat cgcagagaaa tccggttttg 1021 ccgattactt cgtgatcgcg accgccggtt ctgcccgtca gatctccgcc ctgtgcgatg 1081 aggtggagga tggcctggcg aaggacaaca tcctgataaa ccacaaagaa ggaaaaggcg 1141 agaccggctg ggtgctcctg gattacggcg acgtcatcgt caacgtcttt tccgcagaac 1201 agagagatca ttaccagatc gagaaggtct ggatcgactg cccgcaggtg gaattcgagc 1261 ccgcggctga gaaatagaag caagaaacgg tacagaaagg cagatctatg gaacgtcagt 1321 ataatttcaa aaagatcgaa cccagatggc agaagatctg ggcagaaaag gacgcatttc 1381 acgtaacgga ggatccggac aaggagaagt tctattgtct ggagatgttc ccgtatccat 1441 ccggtaaact gcacatgggt cacgtgagaa actattccat cggcgacgtg ctggccagat 1501 acctgcacat gaacggcaag aacgtgctgc atcccatcgg attcgactcc ttcggtctgc 1561 ccgcggaaaa cgccgctatc aagaaccaga cccatcccgc cgtatggacc agctccaaca 1621 tcgcggagat ggagaaccag ctccgccggc tgggcttctc ctacgattgg gacagagaag 1681 tgtgcaccta taaagaggat tattaccgct ggatgcagtg gatcttcatc cagttctaca 1741 agcacggcct cgcttataag aaagagaacc ccgtcaactg gtgcccgtcc tgccagaccg 1801 tactggccaa cgagcaggtc gtggaaggcc gctgcgaacg ctgcggaacg gaggtcacga 1861 agaagagcct gtcccagtgg tacttaaaga tcacggatta cgccgaccgc ctgctggaag 1921 gtctcgatac gctgcccggc tggcccgaac acgtcaagac catgcagcgc aactggatcg 1981 gccgttccga aggtacggag gtcgtttata agctgaaggg ttccgatact ccgatgcccg 2041 tgttcacgac ccgtgtggac actatcttcg gcgccacctt tatggtcatc tctccggagc 2101 atcccatggt ggaagagctc atcgccggca gccccgaaga ggagaactgc cgcgcctata 2161 tcgaacaggc caagaagcag agcgacatcg aaagaacctc caccgtcaag gaaaagaccg 2221 gcgcctttac cggccgctat gccatcaacc cggctacggg cgaagacatc cccatctatc 2281 tggcggacta cgttttgatg ggctacggta ccggtatcgt tatgggcgta ccttacggcg 2341 accagagaga cttcgagttc gcgaagaaat acgatctgcc catcattcct gtggttgacc 2401 cccacaggga cgacatcgac atcaacgatc tgaaggaagc cttttccgat gacggtacgg 2461 tcatcaactc cggcaaatac aacggcatgg acaaccggga agccatcaag gccatgcaga 2521 aggacttcga ggaagcaggc ttcgccgttc ccaaggtcaa cttcaagctg cgcgactggc 2581 tcatctcccg tcagcgctat tggggcacgc cgatccccat gatcaactgc ccggactgcg 2641 gctgggtgcc cgagaaggaa gataatctgc cggtcatcct gcccacggac gtcgaattta 2701 ccggcaaggg cgaatctccg atcgtaacct ccaagacctt cgtcgacacc gtatgcccct 2761 gctgcggcaa gccggctaag agggaagtgg acaccatgga tacgttcctg gattcctcct 2821 ggtacgagct gcgctactgc gacaataaga acgacaaggc ggtctgggac agagagaaag 2881 cggattactg gatgaacgta gaccagtaca tcggcggtgt ggaacatgcg atcctgcacc 2941 tgatgtacgc gcgcttcttc tgcaagttcc tgcacgacat cggactcacc aaggcggagg 3001 aaccgttcca gaacctgctc acccagggca tggtcttaaa ggacggaaag aagatgtcca 3061 agtccatcgg caacgtggtc tccccggaag agatcatcga aaaatacggc gcggataccg 3121 ccagactgtt catcctgttc gcggcgccgc ccgagaagga actggaatgg tccgacaccg 3181 gcgtcgaagg ttcctataag ttcttgggcc gcgtctaccg tctggtcgcc gacatggcgg 3241 aactgacggc aggcattccc aagcgctaca ttccggaagg caaggacgac aaacagcttg 3301 cctatatttt aaacaacacc atcaagagag tttccgagga catcca // LOCUS sequence100 3344 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence100 VERSION sequence100 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3344 /mol_type="genomic DNA" /organism="" /note="sequence100" misc_feature <1..1128 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005810412.1:ferrous iron transport protein B" /note="WP_005810412.1 ferrous iron transport protein B (Desulfitobacterium hafniense) [pid:61.7%, q_cov:98.7%, s_cov:47.3%, Eval:1.1e-132, partial hit]" /note="MGA_498" /locus_tag="LOCUS_3600" CDS 1252..2100 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKIYPEYVAKDRVMQPGQEGSAVDALDFVWKGSRILGQIYVPVHT PGEKHPLAITLHGFPGYTNNQDLDHALRRTGFVTVHPFAPGAWGSEGYYSFDGLVECAM ALLDYCKTDEFAEKYHICRDNIFFVGHSMGGMTSINVLRRRDDVKAGVFLAPFDVAQFY YEGHTPDELRPLFEEGVILRTPGNYMDFLLQNGADTAKDLLFIDAAEGIKEKNFLFVGG ELDPLAPPATMCAPLYEKAKALSSGKAKQEYVLIHSDHGFNDQRIYLAQKVAEYLADLV E" /locus_tag="LOCUS_3610" /note="MGA_499" ORIGIN 1 cccggcttta tcgccatcat gggcgtcgtg ttctacctga cgtttttcct gatcggtccg 61 tatttacagg acctgctgga tgccggaatt accagaattg cggattctgt cgaccaatgg 121 atgaccgccg caggcgtctc ggacgtcctg cacggcctgg tggtagaagg catctttgcc 181 ggagtgggaa gcgtcctgag ctttattccc atcatcgtca tcctgttttt cttcctgtcc 241 ctgctggaag atacgggata catggcgcgc atcgccttcg tcatggataa accgctgcgc 301 aaagtcggcc tttccggccg ttccatcgtg ccgctgctga tcggattcgg ctgcacggtg 361 ccgggcgtta tggcgtcccg gaccatgcct tcggagcgtg accgcaagat gaccatcatg 421 ctgacgcctt tcatgagctg cacggcgaaa ctgccgatct acggcttcct ggctgccgca 481 tttttcccgg cccataagcg gctggtgatc gtcggcatct atgtgctggg cgtgctggta 541 gggatcatcg cggcgatcat attgcggcgc acgatgttcc gcggcgaagc ggttcccttc 601 gtgatggaac tgccgaacta ccgcctgccc ggcgcgaaga acgtgctgcg gctgctgtgg 661 gaaaaggcca aggacttcct gcagagggcc tttacgatca ttttcctggc gagcatcatc 721 atttggttcc tgcagcactt cgacttcggt ctcaacatgg tggatgacgc ggaaagcagc 781 atcctggccg cagtcggcgg cgcattggcg cctgttctgg caccgctggg cctgggaagc 841 tggaagtatg ccacggctct catcaccggc ttcctggcca aagagagcgt cgttgcgacc 901 cttaccgtgc tctttggaga gggaacagcc atcgcgtcca cattgtcgac ccccgcagct 961 tcggcgctgc tggtgttctc cctgctctac acgccttgcg ttgcggcgat ctcctccatc 1021 aagagagagc taggacacaa gtgggcgttg ggcattgtcg tcggacagtg tgccgtggct 1081 tgggtttgtg ccctgatcat gaagttcatc gttggactca tcctttagat aaaaatgcaa 1141 acagcggaca aattcctcgg aatgcgtccg ctgttttatt gtataataat cgtatacata 1201 taagtcttca ttccgtaacg tatcggtcgt cttattttaa ggaggcaatc tatgaagatc 1261 tatcctgaat acgtcgcaaa agaccgtgtg atgcagccgg gccaggaagg ctccgcggtg 1321 gacgccctgg acttcgtctg gaagggcagc cgcatcctcg gtcagatcta tgttccggtt 1381 cacacccccg gcgagaagca tccgctggcc attacgctgc acggcttccc gggatatacc 1441 aataatcagg acctggacca cgccctgcgc agaaccggct tcgtaacggt acatccgttc 1501 gcgcccggtg cctggggcag cgaaggctat tattccttcg acggcctcgt ggaatgcgcc 1561 atggcgctgc tggattactg caagaccgat gagttcgcgg aaaaatatca tatctgccgc 1621 gacaacatct tcttcgtggg tcattccatg ggcggcatga cctccatcaa cgtcctgaga 1681 agaagagacg acgtcaaagc cggtgtgttc ctggctccct tcgacgtggc ccagttctac 1741 tatgagggtc acaccccgga cgagctccgg cccctgttcg aggaaggcgt catcctgcgc 1801 actccgggca actacatgga tttcctgctg cagaacggtg cggataccgc caaggatctg 1861 ctgttcatcg atgcggcgga gggcatcaag gagaagaact tcctgttcgt cggcggcgaa 1921 ctggatccgc tggctccgcc tgccaccatg tgcgccccgc tgtacgagaa ggcgaaagcc 1981 ctcagctccg gcaaggcgaa gcaggaatac gtcctgatcc attccgacca cggctttaac 2041 gatcagcgca tttatctggc acagaaggtc gcagaatatc tggcggacct tgtggaataa 2101 tgcacttata gttatctaaa ggaggacaaa aatgcgtaac agcaaattca ttgcgcttct 2161 gctggcgctg gcattggtcc tgggttcctt cggctttgct ttcgcagacg aagacgcagc 2221 tgcccctgcg gacgcgcccg agatcaccgc agcaccggcg gatgaccctg ccgaatcagg 2281 ggacatcgtg atcctgcaca cgaacgacgt gcactgcacc aattacgaga attatgccaa 2341 gctcgttgaa ctggctaaga gcgcagattt cgtcgttgac gccggtgatg ccatccaggg 2401 cggcccgatc ggcgctctgt ccaagggcga atacatcacc gagatcatga actatgtcaa 2461 atatgacgta gttgctcccg gcaaccacga atttgactac ggtatggagc agttcaagaa 2521 gatcacaggc gaagtggcag aattcccgta cgtctgctgc aacctcgtgg atctgaagac 2581 cggcaaaccc atgttcgacg cttacaagat cttagaagcc aagggcaaaa agatcgcgtt 2641 cgtcggtgtg gatacaccgg agacgttcca taaatccacc cctgcttatt tccaggatga 2701 gaacggcaag tacatctaca gcttctgcga aggcaatgaa ggcaaggatc tgtacgacgc 2761 tgttcagaag gctgccgacg cagccagagc tgaaggtgcg gactatgtta tcgtgctcgg 2821 ccatctgggc attgacaaag aatcttcccc ttggtgctcc accgaagtcg ctgccaacac 2881 cagcggtatc gatgtcttta tcgacggtca ttcccataac gatttcacta tgaccgtcgc 2941 taataaagaa ggcaaggatg tcgttatcca gcagaccggt acaaaactgg tgaacattgg 3001 caaactcgtg attgcggaag acggcaccat ttccggtgaa cttgttccga ccgaaggcct 3061 cgaagctgac gcagatgctg cagcgtttat cgatagtgtt actgccagat ttaaagcgct 3121 gacggatgag gtcgtagcta agacggaagt caacctcacg atccttaatg cggatggtac 3181 cagagctgtc cgctccaagg agaccaacct gggcgacctg tgcgcagatg cttataaaac 3241 cattctggaa gcagacgtcg ctttcgtcaa cggcggcggt gtccgtgata atctgcccct 3301 cggagacatc acttatggtg atatcatcaa ggtccatccg ttcg // LOCUS sequence101 3326 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence101 VERSION sequence101 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3326 /mol_type="genomic DNA" /organism="" /note="sequence101" CDS complement(344..1078) /product="amino acid ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860947.1" /transl_table=11 /codon_start=1 /translation="MIEPIIRVKDLYKNFGDVHVLKGISTDIAPGEVVSIIGPSGSGKS TFLRCLNRLEEPTSGQIFFKGEDIMKAGKKLPQYRQKIGMVFQNFNVFPHMTVLENITL TPVLEKGVPEKEAAAQAEALLARVGLLDKRDVYPRQLSGGQKQRLAIVRALAMEPDVML FDEPTSALDPEMVKEVLTVIEDLAKEGMTILNVTHEMGFARQVSDRILFIDEGIIQEQG DPESFFSSPTSPRAKEFLSKVL" /locus_tag="LOCUS_3620" /note="WP_011860947.1 amino acid ABC transporter ATP-binding protein (Clostridioides difficile) [pid:61.7%, q_cov:98.4%, s_cov:100.0%, Eval:4.0e-81]" /note="MGA_502" CDS complement(1071..1730) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDKIIKILAKYYPVFLKGLGGTMWLAGVTLLAGTVLGLLVAFLRM SKFKPLSGLTAIYIQILRGTPILLQLYFFWILLPKVLPFEMSDTACIIVALIINASAYI AEIVRAGIAAVDPGQWEAGRSIGLTEIHLMQKIIMPQAIKNILPALVNQFIACIKETSL ASVFFIRELTTAYKTVQASTFLTIQPLLISGLIYLVVTTVLSFAAGRIEGRLKASD" /locus_tag="LOCUS_3630" /note="WP_000649908.1 ABC transporter permease subunit (Staphylococcus) [pid:45.8%, q_cov:96.8%, s_cov:43.7%, Eval:1.0e-45, partial hit]" /note="MGA_503" CDS complement(1816..2673) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKVFAILLALAMVFSMAACSSGGGDSSGDAAEPANRLEAIKARG YIEMATEPYFAPYEFIDSSKSGDEQYQGLDIELGKYIAEKLGVELRIVPLEFSAVLASI TEGKYDFAASALAYSPGRAENMNMSKGYRFSDEVASYGFLVREDMIDSIKTADDTADLV LVTQSGSVQEGFVNDQISKYKDFKLVSSMTDGFLMVAEGKADACACDINNGQLYADANG GLAIAPFRFVVDESTQGTRVGIPKGEDELTAFIDQCIDELRAEGTIDKWYDEYSDYART LGVD" /locus_tag="LOCUS_3640" /note="WP_011674478.1 ABC transporter substrate-binding protein/permease (Lacticaseibacillus paracasei) [pid:26.0%, q_cov:98.6%, s_cov:55.5%, Eval:1.3e-20, partial hit]" /note="MGA_504" CDS complement(2870..3175) /product="MGMT family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011837349.1" /transl_table=11 /codon_start=1 /translation="MARLTDDLAYEILSVVEEIPEGCVATYGQIARLIGREKNSRLVGK VLSNAEYYGRYPCHRVVSHNGRLAPGWTEQARLLAMEGVTLKEDGHVDLKKYQWDC" /locus_tag="LOCUS_3650" /note="WP_011837349.1 MGMT family protein (Streptococcus sanguinis) [pid:58.4%, q_cov:99.0%, s_cov:99.0%, Eval:7.8e-27]" /note="MGA_505" ORIGIN 1 agccgtgacc cggggcaccg gcgcacagcg cctgccgttc ggtggtcccc gctgcctggc 61 tcagctccgc cagcgcatcg tattcgccga ggatggccgc caccggtttg ccgctgccgg 121 acacgaaggt agccgtaaag gccgtcggaa tgtccgcgat gcccttttcg atcgtaaaac 181 cttcggaagc cagcgcctgt tccagcgccg cagcagactt ttcctcttcg taagccagtt 241 ccgcgtagcc ccagatctct cttgccagag atttgatgcg gtccgccttt gcgtcgatca 301 cctgggataa aaattgcagt tcactcatat cgatactctc ctgttacagc actttgctca 361 agaactcttt ggcacggggg ctggtggggc tggagaagaa gctctccggg tctccctgct 421 cctggataat gccttcgtct ataaacagta tacggtccga gacctgccgt gcaaagccca 481 tttcgtgggt cacgttcagg atcgtcatgc cctccttcgc caggtcttcg atgaccgtca 541 acacctcctt caccatttcc gggtccagcg cgctggtggg ttcatcgaac agcatgacgt 601 cgggttccat ggccagcgcc cgcacgatgg cgagcctctg cttctgaccg ccggacagct 661 gccgcggata gacatcgcgc ttatccagca ggccgaccct tgccagcagc gcttccgcct 721 gggcagccgc ttctttttcc ggcacgccct tttccagcac cggggtaagg gtgatgttct 781 ccagcaccgt catgtggggg aatacgttga aattctggaa caccataccg attttctgac 841 ggtattgcgg cagcttttta ccggccttca taatgtcctc gcccttgaag aagatctgtc 901 cggatgtagg ctcttccagc cggttgaggc agcggaggaa cgtgctcttg ccgctgccgg 961 agggtccgat gatggacacg acttcgccgg gggcgatatc cgtggagatg cccttcagca 1021 cgtggacgtc cccgaaattt ttatagagat cttttacccg gatgataggc tcaatcactt 1081 gccttcagcc tcccttcgat gcggcctgcc gcaaaggaca gcaccgtggt gaccacgaga 1141 tagatcagcc ctgagatgag cagcggctgg atcgtgagga acgtcgatgc ctgcacagtc 1201 ttgtaggcgg tcgtcagctc ccggataaag aagacggaag ccagggacgt ttccttgatg 1261 caggcgataa actggttgac cagcgccggc aggatgttct tgatcgcctg gggcatgatg 1321 atcttctgca tcaggtggat ctcggtaagg ccgatgctgc ggcccgcctc ccactgaccc 1381 gggtcaacgg ccgcgatgcc tgcccggacg atctcggcga tataggccga ggcgttgatg 1441 atgagggcca cgatgatgca ggccgtgtcg gacatctcga agggcagcac cttgggcagc 1501 aggatccaga agaaatacag ctgcagcaaa atcggcgtgc cccgcaggat ctggatgtag 1561 atggccgtga ggccgctcag aggcttaaac ttgctcatgc gcagaaaggc gacgagcagt 1621 cccaggaccg tgcctgccag cagcgtgacg cctgccagcc acatggtgcc ccccagacct 1681 ttgaggaaca ccggataata ttttgccagt atcttgatga tcttatccat aggttttctc 1741 tacaagttac ggattcggga gcagcgcttg cccccgaatc cggttgcttt catatttgtt 1801 tgatttcagc cgtctctagt ctacgccgag ggtgcgggcg taatcggagt attcgtcgta 1861 ccacttgtcg atggtgcctt ccgctctcag ttcgtcgatg cattggtcga tgaaggccgt 1921 cagttcgtct tcgcccttgg ggatgcccac ccgggtgccc tgggtgctct cgtctacgac 1981 gaaacggaag ggagcgatcg cgagaccgcc gttggcgtcc gcatagagct gaccgttgtt 2041 gatatcgcag gcgcaggcat ccgccttgcc ttccgcgacc atcaggaagc cgtccgtcat 2101 ggaggagacc agcttaaagt ccttgtactt ggagatctga tcgtttacaa agccttcctg 2161 cacgctgccg ctctgggtga ccagcaccag atccgcggta tcgtccgccg tcttgatgct 2221 gtcgatcatg tcttcgcgga ccaggaagcc gtaggatgcg acctcatcgc taaagcggta 2281 gcccttggac atgttcatgt tttcggcgcg gcccggggaa taggccaggg cggatgcagc 2341 gaagtcgtac ttgccttccg tgatggacgc cagcaccgcg gagaattcca gaggaacgat 2401 gcgaagctct acgcccagct tttcggcgat gtacttgccc agttcgatgt ccaggccctg 2461 atactgctcg tcgccgctct tggaggagtc gatgaattca tagggggcga aataaggttc 2521 cgtcgccatt tcgatgtagc ctctcgcctt gatggcttcc agtctgttgg cgggttctgc 2581 cgcatcgccg ctgctgtcgc cgccgccgga gctgcaggcc gccatcgaga ataccattgc 2641 cagtgccagt aagatcgcga atactttctt cattgctttg tccttgcctt tctatacaga 2701 gatcttttca tccttacgcc cctgaaaacg ggccgtgttt tcctttgatg gtttgtattg 2761 tagcactgcc gctttagtgt gtcaacactt tagtgcggtg tagtgataaa ttatttttat 2821 atttttcata aagaaacgtg acccggacat cctgtccggg tcaacgcatc taacaatccc 2881 attgatactt tttcagatcc acgtgtccgt cttctttcag ggtcacgccc tccatggcca 2941 ataaccgggc ctgttccgtc cagcccggcg ccagcctccc gttgtgggag accaccctgt 3001 ggcagggata gcggccgtag tattcggcgt tgctgagcac tttccccacc agacgggagt 3061 ttttctcccg cccgatgagc cttgcgatct gtccataggt cgcgacgcag ccttccggga 3121 tctcttccac cacggagagg atctcgtagg ccagatcatc tgtgagcctt gccatggatc 3181 actgcgccag gatggcgaaa tagacgtcca ccatcgtccc gatcagctcg tccataaaat 3241 cgaaggccgc ggtgtggatg gcgggtctgt cccctgcaga gacggtaaat tccgcgccgg 3301 ggcactgctt taagaaccag ccgaag // LOCUS sequence102 3310 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence102 VERSION sequence102 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3310 /mol_type="genomic DNA" /organism="" /note="sequence102" CDS complement(76..954) /product="DMT family transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005902565.1" /transl_table=11 /codon_start=1 /translation="MTNNRLAKAIFFMVASAFCSAMMSTCTKLVPGVPAMEKTFFTAFV CMAAAWIVQIHRHHEPPHFLKKDIKDLTLRAVYGIISMYLTFWCASAMDIGDATALFNL SPTFTMIYAHFAMGERFDRRQGLLVVLAFVGGLFVVKPSFHNVNLVPALAAVLCGMIGG LAHAYVRKLNAYNKVEGNAVILYNYTFSAIVELLLCLKIFVFPDARQLFWMLAAGGFCF LTQVCMNVAFSLASASEVSVYKYTQIIISSIIGMVIFAEFPDALSVAGYVVIIGSAVIM WRYNASLEKAQ" /locus_tag="LOCUS_3660" /note="WP_005902565.1 DMT family transporter (Fusobacterium nucleatum) [pid:26.9%, q_cov:96.6%, s_cov:97.6%, Eval:2.0e-27]" /note="MGA_507" CDS complement(944..1663) /product="purine-nucleoside phosphorylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_001829961.1" /transl_table=11 /codon_start=1 /translation="MSTPHNSAEKGAFAKTVLMPGDPLRAKFIAETYLEEPKLVNNVRS IQGYTGTYKGVPVSVMASGMGMPSMAIYSYELFNMYGVENILRVGSAGAVSMELKLRDI VLGQGACTSSSMQDNFGVHGHFAPIADFDLLRCAAQICEERKLRYKAGNLISSDIFYND DPAFNQPFLNLGALAVEMEAAALYMNAARAGKRALAICTISDHVLTGEATSAEERQTTF NEMMELALEVAVRMNDK" /locus_tag="LOCUS_3670" /gene="deoD" /EC_number="2.4.2.1" /note="WP_001829961.1 purine-nucleoside phosphorylase (Staphylococcus) [pid:54.3%, q_cov:97.1%, s_cov:98.3%, Eval:1.1e-67]" /note="MGA_508" CDS complement(1667..2938) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKIKVAAKPLAEVRRIPKPPRQKPVRPARFWRWVMKTAGAGDLKD AQFSYAFEGMDRMPEEPCLVVMNHSSFIDLEIAARILYPHPFNIICTSDGFVGKEGLMR RIGCIPTDKFVTDLGLIAQMSYALHDLGDHVLLYPEASYTFDGCATPLLARMGVLLKKL KVPVVLIKTEGAFLRDPLYNCLQKRHVKVSAKVSLLASAEEIRTLPAAELTRRLEEAFT FDNFRDQQENQIRVDEPFRADGLHRILYKCPECGKEGEMEGKGTQLICSACGASWTLDE TGLLRANAGEGDAHIPDWYAWERQFVRSELENGTYRLDTPVRILVFRDFKAIYDVGHGR LTHDNTGFTLTDGDDALIYRQDPGKSYSLYADYYWYEIGDIICIGDSEFQYYCLPEGNV PVAKARLATEELFRIVKKKRKEGE" /locus_tag="LOCUS_3680" /note="MGA_509" CDS complement(2979..3107) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNYEELKQQAFAKIDVLQCIRIFTDPEKHAAMKVDFEKTRG" /locus_tag="LOCUS_3690" /note="MGA_510" tRNA complement(3213..3288) /product="tRNA-Thr" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0070" /note="Aragorn_7" ORIGIN 1 cgatcccatc gcacaaccag aaaaaggccg ggcagcacat gcccggcctt tattgaatac 61 aaaattttct gaggctcact gcgccttctc cagcgacgcg ttataccgcc acatgatcac 121 ggccgatccg atgatcacca cataccccgc cacgctgagc gcatccggga actccgcgaa 181 gatcaccatg ccgatgatgg acgaaatgat gatctgcgta tacttgtaca ccgacacctc 241 gctggcggac gccagggaaa aggcgacgtt catgcagacc tgggtgagga agcagaaacc 301 gcctgccgcc agcatccaga agagctgtct cgcatcggga aagacaaaga tcttcaggca 361 gagcaacagc tccacgatcg ccgaaaacgt gtagttgtac aggatgacgg cattaccctc 421 caccttgttg taggcgttga gctttcttac gtaggcatgg gccaggccgc cgatcatgcc 481 gcagagcacg gcagccagcg ccggcaccag gttgacgtta tgaaagctgg gcttgaccac 541 gaacagcccg ccgacgaagg ccagcaccac cagaaggccc tgtctgcggt caaaccgctc 601 ccccatggca aagtgggcgt agatcatcgt aaaagtcggg ctcaggttga acagcgccgt 661 cgcgtcgccg atgtccatgg ccgacgcgca ccagaacgtc agatacatgc tgatgatgcc 721 atagacggcc cgcagcgtaa ggtccttgat gtctttcttc agaaaatggg gcggttcgtg 781 atgccggtgg atctggacga tccaggcggc cgccatgcag acaaaggcgg taaagaacgt 841 cttctccatg gcgggcacgc ccggcaccag tttcgtgcag gtggacatca tcgcgctgca 901 gaacgcggat gccaccataa agaatatggc ttttgctaaa cggttatttg tcattcatcc 961 tcacggcgac ttccagagcc agctccatca tctcgttgaa ggtcgtctgc cgctcttcag 1021 cggaggtcgc ttcgcccgtc agcacgtggt cggagatcgt gcagatcgcc agcgctctct 1081 tgcccgctct cgcggcgttc atgtacagcg ctgccgcctc catctccaca gccagcgcgc 1141 cgaggttgag gaagggctgg ttgaaggcgg gatcgtcgtt atagaagatg tcggaggaga 1201 tgagattgcc ggccttgtag cgcagttttc tctcctcgca gatctgggct gcgcagcgca 1261 gcagatcgaa atcggcgatc ggtgcgaaat gaccgtgcac gccgaagttg tcctgcatgg 1321 aggaagacgt gcaggcgccc tggcccagca cgatgtctct cagcttcagt tccatggaaa 1381 cggcaccggc ggagccgacc cgcaggatgt tctccacgcc gtacatgtta aacagttcgt 1441 agctgtagat cgccatggag ggcatgccca tgccgctggc catcacgctc acgggcacgc 1501 ctttgtaagt gccggtgtag ccctggatgc tccgcacgtt gttcacgagc ttaggctctt 1561 ccagataagt ctccgcgatg aactttgccc gcagagggtc gccgggcatc agaacggtct 1621 ttgcaaatgc gcctttttcc gcgctgttat gaggggtaga catgggtcac tctccttcct 1681 ttctcttctt cttaacgatc cggaacagct cctccgttgc cagtctcgcc ttcgccacgg 1741 ggacgttccc ctccggcagg cagtagtact ggaactcgct gtctccgata catattatat 1801 ccccaatctc gtaccaataa tagtccgcat agagactgta ggatttgccg gggtcctggc 1861 ggtagatcaa ggcatcgtct ccgtccgtca gcgtaaagcc ggtattgtcg tgcgtgagcc 1921 gcccatggcc gacgtcgtag atggccttaa aatcccggaa gacgaggatc cgcaccggcg 1981 tatccagccg gtacgtgccg ttttccagtt cggagcgcac gaactgccgc tcccaggcgt 2041 accagtcggg gatgtgggca tccccctccc ccgcattcgc gcgcagcagg ccggtctcgt 2101 ccagggtcca ggaagcgccg caggcgctgc agataagctg tgtgcctttg ccttccatct 2161 ccccttcctt gccgcactcc ggacatttgt acaggatgcg gtgcaggccg tccgcacgga 2221 agggttcgtc cacccggatc tgattttcct gctgatcccg gaagttgtcg aaagtaaacg 2281 cctcttccag gcgcctcgtc agttcggcag ccggcagcgt gcggatctcc tccgcggacg 2341 ccagcaagct taccttcgca ctcaccttta cgtgccgctt ctgcaggcag ttgtagagcg 2401 ggtcacggag gaacgcgcct tccgttttga tgagcaccac cggtaccttc agcttcttca 2461 gcagcacgcc catgcgggcg agcagcggcg tcgcgcagcc atcgaaggta tagctggcct 2521 ccggatagag cagcacgtgg tcgccgaggt cgtgcagcgc gtaggacatc tgggcgatga 2581 gccccagatc cgtcacgaac ttatccgtcg ggatgcagcc gatgcggcgc attaaacctt 2641 cttttccgac gaagccgtcg gaagtgcaga tgatattgaa ggggtgcgga tatagaatgc 2701 gggctgcgat ctccaggtcg ataaaactgg agtggttcat cacaacgagg cagggctcct 2761 ccggcatgcg gtccatacct tcgaacgcat aagaaaactg cgcgtccttc aggtctcccg 2821 cccccgcggt cttcatcacc cagcgccaaa agcgcgccgg gcgcacgggt ttttgccggg 2881 gaggcttcgg gatgcgccgg acctctgcca gcggttttgc tgcgactttt atcttcatat 2941 ccaacctctt tttccgggcg ccccgacccg tgttggggtc accctctcgt cttctcgaaa 3001 tccaccttca tggccgcatg cttttccggg tccgtaaaga tgcggatgca ctgcagcacg 3061 tcgatctttg cgaatgcttg ctgtttcagt tcttcgtagt ttttcatatg ccggcctccc 3121 ttttgctgcc cattatgctt tttttctatt ttaccatagg gcgttttttc gcgcatagca 3181 aaacagacgt cctttcggac gtctgtttgc actggagctg atggccggac ttgaaccggc 3241 gacctgctga ttacgaatca gctgctctac cgactgagcc acatcagcat acgcacggat 3301 tatattacca // LOCUS sequence103 3305 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence103 VERSION sequence103 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3305 /mol_type="genomic DNA" /organism="" /note="sequence103" CDS complement(328..1779) /product="methylaspartate mutase subunit E" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011460941.1" /transl_table=11 /codon_start=1 /translation="MDIKNKKISDDEFYRIRAEVLTQWPTGKDVDFQEAVEYQKSIPED RRFGAKLIKAKNEGRTLTQPRAGVALINEHIELLQHLQDAGEADLLPTTIDSYTRQNRY EDCENGIRVSQQEGRSMLNGFPAVNHGVQGCRRVIESLKTPVQVRHGTPDARLLAEITF AGGFTSYEGGGISYNLPYTKNVPMERTIRDWQYVDRLTGIYEEAGVSINREPYGPLTGT LVPPCISHAVAVIEALLAAEQGVKNVTVGYGQGGNLLQDIAAIRSLEELTNEYLEKYGY KDVIVTTVFHQWMGGFPQDEAKAFGVISWGSVAAALSRATKVIVKTPHEAAGIPTKEAN AAGLRCTKQAISMLADQSFGDTHLADEKEIIKRETRCIVDKCFELGDGDLAVGVCRAVE AGALDVPFAPCRVNAGKMLPARDNQGAIRILEPGNLPFPQDIKDFHRAKIEERAKFEKR DASFQMVIDDVYAISKGRLVGRPRK" /locus_tag="LOCUS_3700" /EC_number="5.4.99.1" /note="WP_011460941.1 methylaspartate mutase subunit E (Desulfitobacterium hafniense) [pid:66.3%, q_cov:99.8%, s_cov:99.8%, Eval:2.6e-188]" /note="MGA_512" CDS complement(1763..3154) /product="methylaspartate mutase accessory protein GlmL" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_015945203.1" /transl_table=11 /codon_start=1 /translation="MIDFGSTYTKVTAVDLETEELLGTSQSWTTIQTDIGEGLADAVRK LEEKTGPLNFEARYACSSAAGGLRMITSGLVPELTAEAAKQASLGAGAKIRGVYSFELT EDDIEDIDAEHPDIFLLTGGTDGGNKECILHNADMLATCKTDFPIVIAGNRSVARTCAR KLEGREIHIVENVMPKFGTLNIKPAQDKIREIFLKRIVEAKGYTKAQSLIDNIAMPTPS AMMQAMQLLAEGCENPDGSKETGIGDLLAVDVGGATTDIYSVCDGMPRAGMDTIFKGLP EPYIKRTVEGDIGMRYSIHGIEEAVGTGYISQLSGLPEERCREMIDYLGKNTEVVPTDA ESEALDFALASGAIKTAVTRHAGRLEEFYTMNGIAYMQTGKDLREIRQIIVTGGSLIHT KRTGKIASAAFWDPQDPFSLKPKQADIWVDRSYILAAMGLLSGYYPGTALRIMKKELKK DGYQE" /locus_tag="LOCUS_3710" /gene="glmL" /note="WP_015945203.1 methylaspartate mutase accessory protein GlmL (Desulfitobacterium) [pid:45.2%, q_cov:98.1%, s_cov:97.6%, Eval:6.9e-106]" /note="MGA_513" ORIGIN 1 cgagcatggg cttgatgtac ttgtcgatga cggggatgaa gtcctttgcc aggaacagag 61 gatctctgcc gcctgcaccg gagtactgaa cagccgcgca gtcgccgaat gcgacctggc 121 cgtcttccag aatgatctgc acggagatgg attcgccggg cattctgacg gaggtgaagc 181 cttccgttac gggagctccc tgatagaaca cgccgtcgtg ggcagcgccc ttcttgatgg 241 cgcgctgatc gtcgaagtag aagccggtac ggcccttgga acaaactacg tctaagattt 301 tcatggtttt gtttctcctt tataaaacta ctttctgggg cggcctacga gtctgccctt 361 cgaaattgca taaacgtcgt cgatgaccat ctggaaggaa gcgtctctct tttcgaactt 421 cgctctttcc tcgatcttgg ctctgtggaa atccttgatg tcctggggga acggcaggtt 481 gcccggttcc aggatacgga tggcgccctg gttgtctctg gcgggaagca tcttgcccgc 541 gttgacccgg cagggagcga agggaacgtc cagcgcaccg gcttcgaccg ctctgcagac 601 accgaccgcc aggtcgccgt cgcccagttc gaagcacttg tctacgatgc agcgggtctc 661 gcgcttgatg atctcttttt catccgccag atgcgtgtcg ccgaagctct gatctgccag 721 catggagatg gcctgcttgg tgcagcgcag tcctgctgcg ttggcttcct tggtggggat 781 gcctgccgct tcgtgcgggg tcttgacgat gaccttggta gcgcgggaga gtgccgctgc 841 tacgctgccc caggaaataa cgccgaaggc ctttgcctcg tcctggggga aaccgcccat 901 ccactggtgg aaaacggtgg tgacgatcac gtctttgtat ccgtactttt cgagatattc 961 gttggtgagc tcttccaggg agcggatggc tgcgatatcc tgcagcaggt tgccgccctg 1021 gccgtagccg acggtgacgt tcttaacgcc ctgttccgca gccagcagcg cttcgatgac 1081 ggctaccgcg tgggagatgc agggaggaac gagggtgccg gtgagggggc cgtaaggctc 1141 tctgttgatg gagacgcccg cttcttcgta gatgccggtg aggcggtcta catactgcca 1201 gtcgcggata gtgcgttcca tgggcacgtt cttggtgtag ggcaggttat aggagatgcc 1261 gccgccttcg taggaggtaa agccgccggc gaaggtgatc tctgccagaa gtctggcgtc 1321 gggggtgccg tggcggacct gcaccggggt cttcagggat tcgatgaccc gtctgcagcc 1381 ctgtacgccg tggttgaccg ccgggaagcc gttgagcatg gaacggcctt cctgctggga 1441 aacgcggatg ccgttctcgc agtcttcata gcggttctgt ctggtatagc tgtcgatggt 1501 ggtggggagc aggtctgctt cgcctgcatc ctgcaggtgc tgcagcagtt cgatgtgctc 1561 gttgatgagc gcaacgcccg ctctgggctg ggtgagggtg cggccttcgt tcttggcctt 1621 gatcagctta gcgccgaacc gtctgtcctc ggggatagac ttctgatatt cgacggcttc 1681 ctggaaatcc acgtccttgc cggtgggcca ctgggtgagg acttccgctc tgatgcggta 1741 aaattcgtcg tctgagatct tcttattctt gatatccatc ctttttaagc tcctttttca 1801 tgatcctgag ggctgttccc gggtaataac cgctcagcag tcccatggct gccaggatat 1861 agctcctgtc cacccagatg tctgcctgtt tcggttttaa tgagaaggga tcctggggat 1921 cccagaaagc ggcggaagcg atcttcccgg tccgcttggt gtggatgagt gatcctcccg 1981 taacgatgat ctgacggatc tctctgaggt ccttgccggt ctgcatgtag gcgatgccgt 2041 tcatggtgta gaactcttcc agcctgcctg cgtgtctggt gacggccgtc ttgatggcgc 2101 cgctcgccag ggcgaaatcc agggcctcgc tctccgcgtc cgtgggtacg acttcggtgt 2161 tcttaccgag atagtcgatc atctcgcggc agcgttcttc cggaagaccg gacagctggg 2221 agatgtagcc tgtccccacc gcttcttcga tgccgtggat gctgtagcgc atgccgatgt 2281 cgccttccac ggtccgtttg atgtagggtt caggcagtcc cttgaagatc gtatccatgc 2341 cggctctggg cataccgtcg cacacggagt agatgtccgt cgtggcgccg cctacgtcca 2401 ccgccagcag atcgccgatg ccggtttcct tggaaccgtc cggattttcg cacccttccg 2461 ccagcagctg catggcctgc atcatggccg acggcgtcgg catcgcaatg ttgtcgatga 2521 gggattgagc cttggtgtag ccctttgcct ctacgatgcg ctttaaaaag atctcccgga 2581 tcttatcctg agccggcttg atgttgagtg tgccgaactt gggcattacg ttttctacga 2641 tgtggatctc ccgaccttcc agctttctgg cgcacgtgcg ggcaacactc cggtttcctg 2701 cgatcacgat aggaaagtct gttttacagg tcgccagcat gtctgcgttg tgcaggatgc 2761 attccttgtt gccgccgtcc gtgccgccgg taagaaggaa gatgtcggga tgttccgcat 2821 cgatatcctc tatgtcatcc tccgtgagtt cgaaggagta cacgccccgg atcttggcgc 2881 ctgcgccaag cgatgcctgt tttgccgctt ctgcggtgag ttcgggaacc agaccgctgg 2941 tgatcatccg aaggcctccg gctgcggaag aacaggcgta gcgcgcttcg aagttcagcg 3001 ggccggtctt ttcctccagc ttgcggaccg catcggctag gccttcgccg atgtccgtct 3061 ggatcgtggt ccaggactgg gaggtgccca gcagttcttc agtttccaga tctacggcgg 3121 tcaccttcgt ataggtgctg ccgaagtcga tcaaaagtac gggtctcata gtttagttca 3181 gatgaaagtc ttctttcagg cagtcgatgg tggtctgggg atccgttccg ggcgggaagg 3241 ctctgtcgaa gcccatgtcc ttgaatctct tttccacttc cgaaaattcg tgcttgccga 3301 tgacg // LOCUS sequence104 3283 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence104 VERSION sequence104 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3283 /mol_type="genomic DNA" /organism="" /note="sequence104" CDS 1338..1664 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MITISIQQLLIYILLVVAIVAIAVLIVVFTKLLPTLKSLAKTMEN VEALSTTAREDLDSVQGIITNVSRSVTDVTGVIANNKSNLKAATNLVNAAAGLAKLTRS KTKK" /locus_tag="LOCUS_3720" /note="MGA_516" CDS 1807..2049 /product="AbrB/MazE/SpoVT family DNA-binding domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003388120.1" /transl_table=11 /codon_start=1 /translation="MKATGIVRKLDQLGRIVIPKELRNTFDLAEGDPIEIFVEGHDIIL RKYQPACIFCNDATDVVQFEGKNVCRKCLGKLKDL" /locus_tag="LOCUS_3730" /note="WP_003388120.1 AbrB/MazE/SpoVT family DNA-binding domain-containing protein (Clostridium) [pid:62.0%, q_cov:98.8%, s_cov:97.5%, Eval:1.7e-26]" /note="MGA_517" misc_feature complement(2143..>3283) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005903692.1:uracil-xanthine permease family protein" /note="WP_005903692.1 uracil-xanthine permease family protein (Fusobacterium nucleatum) [pid:43.9%, q_cov:94.5%, s_cov:85.0%, Eval:1.3e-75]" /note="MGA_518" /locus_tag="LOCUS_3740" ORIGIN 1 aatttctcgt agcctctttc gatatgatag atctctgaga cctcggtctt tccctttgca 61 accaggcctg ccagcaccag cgctgcgccc gcgcgcaggt ccgtggagat gacgtgcgct 121 ccgaccagct gatgcttgtt gccgggtacg atcgccgttc ttccttcgac gcggatgttc 181 gcgcccatgc gcgacagctc tgcagcgtgc atgaagcggt tctcgaacac cgtctcgatg 241 acggcgctcg ttccgtctac cgtcgtgagc agcgccatga ataaagcctg catgtccgtg 301 gggaaaccgg ggtagggcag cgtcttgata tccgtcgcta ccagctggtt gagatcgccc 361 cgcacccgca gcccgtcgac ttcgtcgttg accgctgcac cgcattccag cagctttgcg 421 atgacgggtc ttacgtggtc gggcacgctg ttcttgatga ggacgtcgcc ccgggtgatc 481 gctgcagcga tcataaacgt gccggtctcg atccggtccg gaatgacggc gtgccgcgta 541 ccgtgcagcg tttccacacc ttcgatgcgg atggtatccg tgccggcgcc cttgatcttc 601 gcgcccatct tgttgaggaa gttcgccagg tcgacgatct ccggttcttc cgccgcgttt 661 tcgatggtgg tcgtgcctct tgccagcgtc gcggccatca tgatgttctc tgtcgcgccg 721 acgctgggga agtccagata gaccagcgcg cctttcagtc catagcgggc ggacgcctct 781 acgacgccgt ctcccgtgag gatctttgcg cccagaaggc ggagcccttt attatgcagg 841 tcgatgggac ggttgccgat ggaacatccg ccggggagcg cgatgctcgc gaaaccggtc 901 tttgccagaa gcggtcccat tacgaaaatg gatgcgcgca tctttttgac cagttcgtgg 961 ggcacctcgg atatgttgcc tctgccgggc tgcacaacga tcgtgtggtt ctgccagtct 1021 tccgtaacgg tggctcccag cgatctgagg atctcgcaca tgacgtccac gtccagaaga 1081 tggggcacgt cgttgatctc gcatacgccg tccgacagga tcgtcgccgc cataatgggc 1141 aaaacagcgt tcttgctgcc ggaaatggtg acttcgccgc ggagtggacc gctttgttct 1201 acgatatatt tagccaaagt tataaacctc cgaaattttc cactcttatt atacttgcaa 1261 acccccgtaa aaacaacact tgcaaaggat gcccaaaaat tacataatta cagataaaga 1321 aaagaggtgg aaaaacgatg atcacgatta gtattcagca gctccttatc tatatcctgt 1381 tggtggtggc gatcgtagcc atcgctgtcc tgatcgtagt ttttacgaag cttctgccta 1441 cgctgaagtc ccttgcgaag acgatggaga acgttgaggc gctttctacg acggcaagag 1501 aggacctgga cagcgtgcag ggcatcatta cgaacgtttc ccgctctgta acggacgtta 1561 ccggggtgat cgcgaacaac aagagcaatc tgaaggctgc taccaacctg gtaaatgcag 1621 ctgccggcct tgcaaaactt acccggagca agacgaaaaa ataaacatct gtgcataaac 1681 tctgcaaaaa atattcagat ttccgtataa tattggttga caaaaattgc tattttgcta 1741 taatggtatt tgagttaaaa gcaaaactta aatcttgtgc gtaatcaaaa agggagcaaa 1801 ggtactatga aagcaacggg aatcgtaaga aagttggatc aacttggaag aattgtcatc 1861 cccaaggaac tgagaaatac attcgacctg gccgagggcg atcccatcga gatctttgta 1921 gaaggtcacg atatcattct tcgcaagtat cagcctgcct gtatattctg caatgacgca 1981 acagacgttg tccagttcga agggaagaac gtctgcagaa agtgcctcgg aaagctgaag 2041 gatctgtaga gtagacaaaa taaacgaaca acaaagccgt gtttgaagat ccaaacacgg 2101 cttttgcttt tgtgtatttt cttttcagaa cggtccaaag gatcagtact tgcctaagct 2161 gctggccagg gtcttgtccg ggtcatcgcc gaaggcttcg tccttgccgg gcaggatggc 2221 gttgagcacg atgccgacga tggacgctac cgcgatgcca gagagagata cgcttccgat 2281 gtggatggcg ccggcttcgc tgtaggagat gccgacggcc aggcccagga tgagcgccgc 2341 gatgatgacg tttctgctct cctggaagtt cgtcttgttc tcgacgacgt tgcggatgcc 2401 gatggcggag atcatgccgt acaggatgag ggagacgccg ccgatggtgg ctgcgggcat 2461 gacccggatg agggccgcga acttcgggaa gaaggaaagc acgatggcgt agaaggctgc 2521 caggcggatg acgaaggggt catagacctt ggttagggcc agaacgccgg tattttcacc 2581 gtaggtggtg ttggccggag cgccgaacag agctgcgatg gtggtgccga cgccgtcgcc 2641 cagcagggtg cggtgcaggc cgggatcttc gatgaagttc tttccgaccg tgccgccgat 2701 ggcggagatg tcgccgacgt gctccatcat ggttgcgaaa gcgatgggta cgatggtaat 2761 gatggaagag atcatgaagg aagtgttgac gtttccgctg gccagcagac cgaagaccgt 2821 atcctgcatt tcgaagggaa ctccgaagat gctcgcttcc ttaaacatcg tccaatccac 2881 gttgccggtt gcagctgcga cgacatagga agcgacgacg cccagcagga tggggatgat 2941 cttgatcatg cccttgcccc agatgttgca tacgatgacc acgacgatcg cgaccagagc 3001 gatgggccag ttggcggagc agttgttgat agcggaaggc gccaggttga gtccgatggc 3061 gatgatgatg gggcctgtga ccacaggggg gaagaaccgc atcactttct tggagccgta 3121 ggctttgcag atgccggaca gcaccaggta cagaaggcct gcgcaggcga cgccgatgca 3181 ggcgtaggga agggcttctc tctgggagag cccgatgttt tctcccgctg ccacgacggc 3241 tgcataaccg cccaggtagg cgaaggagga tcccaggaag acg // LOCUS sequence105 3265 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence105 VERSION sequence105 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3265 /mol_type="genomic DNA" /organism="" /note="sequence105" CDS complement(545..1165) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSERNTVAVKIYGQEYNISGEASREHIMRVADYVDNKMQEIGDAI NASNSGVAVLAAVNIADEYFARENDIAELQEKNDQLVSDTQRYSLLWEEAKQSLAQYKE EMAGTRAQQEENLRTLTEKNDRIAELTRQLQEVNGHNEVLRARCEELTRRAESAEAAPE EAQRTIRELEAKSRDIESSFFDIQMENIHLKNELENLRKQMNR" /locus_tag="LOCUS_3750" /note="WP_000082701.1 cell division protein ZapA (Bacillus) [pid:39.5%, q_cov:35.9%, s_cov:84.3%, Eval:4.8e-07, partial hit]" /note="MGA_520" misc_feature complement(1181..>3265) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011860925.1:phenylalanine--tRNA ligase subunit beta" /note="WP_011860925.1 phenylalanine--tRNA ligase subunit beta (Clostridioides difficile) [pid:47.6%, q_cov:99.6%, s_cov:86.3%, Eval:1.5e-182]" /note="MGA_521" /locus_tag="LOCUS_3760" ORIGIN 1 ccttgttgtc cgcagagttt acgatctggt tgatcttgct gcggatatcc tcgttcttct 61 tgaggatggc ccggcggatg cggcgcagtt cggagctggc gccatcggcg atctcgtcct 121 ccgacaggat gcagcgctcg atctcgtcct ccaggtgctt cagcaccgtg atggcggaga 181 ccagaccctg gatcgtctgc atcggctgca gttcctcggt gtgcagaaac gcctcggtgc 241 gtctcgccga ctgcaggtta tatgccacct ccagcagctg cttcggggtc aggctgccct 301 ccttcgccgc caggtgcacg acgcctttga tgtcgtagaa cccgcccaga ggcggcgtgc 361 ctttcttgag caccacctgc atggcttcgt ccgtcgcctg cagctcgtcc tcgatccacc 421 gcgctttgcg ggagggcttt aagctgcgga cggcgtcccg ggtcatgccc gagcagcact 481 gctctgccag catctctatg atcttttcgt attccagcac gcgcagcgct ttttcgttca 541 tgggttatcg gttcatctgc ttgcgcaggt tttccagttc gttctttaag tgaatgtttt 601 ccatctggat gtcgaagaag ctgctctcga tgtcgcggct cttggcttcc agttcgcgga 661 tggtccgctg ggcctcttcc ggagcggctt cggcggattc cgctcttctt gtcagttctt 721 cgcagcgggc gcggagcact tcgttgtgtc cgttgacctc ctgcagctga cgggtgagtt 781 ctgcgatccg gtcgttcttc tccgttaagg tgcgcaggtt ctcctcctgc tgggcgcggg 841 tgcccgccat ctcctcctta tactgggcca ggctctgctt tgcctcttcc cagagcaggg 901 agtagcgctg ggtgtcgctc accagctggt cgttcttttc ctgcagctcg gcgatgtcgt 961 tctcccgggc gaaatattcg tccgcgatgt tgaccgccgc cagcaccgcc acgccgctgt 1021 tgctggcgtt gatggcgtcg ccgatctcct gcatcttgtt gtccacatag tcggcgactc 1081 tcatgatgtg ttctctggag gcttctccgg agatgttgta ctcctggccg tagatcttta 1141 cggcgactgt gttccgttcg ctcatggcag ttcctttccg ctacatttca cgtaagaccg 1201 cgttgtaagc atccttcagg gcgatcagca ccttctggtt gatctcgttt acctcgtttt 1261 ccttcagggt gcggtctgcc gccctgtagg tgagggaata cgctacgctc ttgaagcccg 1321 gcagcaccgg agctcctctg tatacgtcga acagcttgac gctctccagc agcggacctg 1381 cgttggcctt gatggccttt tccagttcgc ctgccgctac ctcgtccttt acgaccatgg 1441 agaagtctct caccatggcg ggatatttgg gcagcgggct gtatttgatc tccgtctttg 1501 cgaggctgta cagcagatcg aaatcgatct ccgccgcata gacctcagcg tcgatgttat 1561 aaacttccgt tacggccggg tgcacctggc ccatgatggc aacgggcttg ccgtccaccg 1621 tgacccgcgc acatctgccc gggtggaacg tcggatcgtt cttcacggct tcgtattccg 1681 caccgtggat gcccagggaa gccagcagtt cttccacata gcccttcagg gtgaagaacg 1741 tctcgccttc cgcgtacatg gcgatgcaca gagcgtcttt ttcctcgggc aggatgccct 1801 cttcgccctt gccgttgttg aagaacgtat tgcccagctc gaagcctctc acgttcgcgt 1861 tgcttctcgc atagttgagc gccagcacgt ccagcaggtt gggcaggatc atggtgcgca 1921 tgacggaagt atcttcgccc agcgggttga tgagctttac gaagtttctt ctgtagctgt 1981 ctgccgggat gcggacctta tcgcttgcct tcggagagac gaagctgtag gtctggaact 2041 cggagatgcc catgcctctc agagcagcct tcgccaggtt gcgaagctcc tgcttttcgg 2101 agatgcggct ctccgtcgcg ctcttgggca gcgtggtggg cagcttgtcg tagccgtaca 2161 ttctggccac ttcttcgacg tagtcttcct cgatctccag atcctggcgg atcgtgggcg 2221 gggtcaccgt gatgatgtcg ccgttgaggg aagcctccat ctccagcgcc ttgaagtagt 2281 ccaccatctg ttcgccggga atgtcgatgc ccagcacctt gttgatgcgg ctcacgcgca 2341 cgtccatggt cttcgccttc tcgggcacgg gatagacgtc cacgtcgccc gttaagacgg 2401 tgccggcacc cagcagttcg ataaggtagc agactctgtc gcaggcatcc ttggccaggt 2461 tggggtcgat gcccttctcg aagcggccgg aagcctcggt gcgcagcgtc agcttcttgg 2521 aagtctggcg cacggaatcg ccgaggaagt tggcggattc gatcaggacc atgttcgtat 2581 cgggcttgat gtcggagttc agaccgccca tgacaccggc gatcgccagc gcttcttcgg 2641 tatcgcggat cgtcagcatg ccttcggaga gttttctctc ggtgccgtcc agcgtaacga 2701 aggtatcgcc gtccttcgct gcatccacga tgatcttacc gcccttgacg gtgttgatgt 2761 cgaaggcgtg gatgggctgg ccgtattcca gcatgacgaa gttcgtgatg tctacgatgt 2821 tgttgatggg gcgcatgccg gccatcatca gatatttctg catccaccag ggagactgtt 2881 ccaccttgat gtccttgacg acgcggcagc agtagcgctt gcacaggtcg gggcgcttga 2941 tctccacctg gatgtagtct tcgctcttct ccggggcaat ctttttgcat tcagtctcgg 3001 gataggtgag cttcgtaccg aacgtcgccg cagcttctct ggccatgccg atcatggaca 3061 ggccgtccgg gcggttcggg gtgatctcga aatcgatggc ggggtcgttc agctgcagtg 3121 cctcgaggat atccatgccc ggcgtatatt cgccgtccag gatccagatg ccgtccttat 3181 cgcgataggg aacgatcttg tcggggaaac cgagttcgga gcagttgcac atcatgccgt 3241 tgctagcaac gccgcgcagc tcgcc // LOCUS sequence106 3249 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence106 VERSION sequence106 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3249 /mol_type="genomic DNA" /organism="" /note="sequence106" misc_feature <1..1747 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012048014.1:selenocysteine-specific translation elongation factor" /note="WP_012048014.1 selenocysteine-specific translation elongation factor (Clostridium botulinum) [pid:39.2%, q_cov:99.7%, s_cov:91.2%, Eval:1.8e-122]" /note="MGA_522" /locus_tag="LOCUS_3770" CDS 2084..2458 /product="GrdX family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009897539.1" /transl_table=11 /codon_start=1 /translation="MIILTNNPDVMETMTERDVRFVDGSYRDVLIKARDLVHQGHRLLS HPLMGSLKPNETPYRTIALSDSGGPLDTDSLLLIENAIETFDKFARVTRPDRGINTPQE MLADFRLIDLSLIQSMEVNE" /locus_tag="LOCUS_3780" /note="WP_009897539.1 GrdX family protein (Clostridioides difficile) [pid:49.1%, q_cov:93.5%, s_cov:91.1%, Eval:1.2e-22]" /note="MGA_523" ORIGIN 1 ggatatcggt atcatcgatg tgccgggcca tgaaaaattc atacgcaaca tgcttgcagg 61 catcggaggc atcgacctgg tgctgctggt ggtcgctgcg gacgagggtg tcatgcccca 121 gaccgtggag cacctggaca tcatgcgtct gctgaacatc cgccggggca tcctcgtcat 181 cacgaaggcc gacatggtag atgacgactg gatggatatg gtcgaatccg acgtgcgcga 241 cgccgtaaag gggacattcc tggagaacgc gccctgtctt cgcgtgtcgt cccaaacggg 301 ggagggcatc gaggaactgc ggcagctcat cttcgcggaa gttgccaagg tcggcgaaaa 361 gaacaacaat cccgcgctgc tgcgcatccc catggaccgg gtgtttacga tccagggttt 421 cggcacggtg gtcacgggca cgcttaccca gggcatgatc cgcacaggag acgaggtaac 481 gatttatccg gaaggcctga acgccaaggt gcgcggcctg caggtgcatg ggaagtccgt 541 ggatgcggca tacgctggcc agcggacggc ggtcaacctg acgggggtca agaaagaaga 601 catcgcccgg ggcaacgtgc tggcggcgaa ggacagtctt acgccatcct ccatgatcga 661 tgtaaaactg caggtgctgg gagattccaa gcgcacggtt ctgaacggat cgcggctgca 721 tctgcactac ggatcggcgc aggtgctgtg caaggcggtc ctgctggaca aagatgcgct 781 tgaccccggc gagagcggct atgcccagct tcgcacggag gaacccgtgg tcttaaagca 841 gggcgatccc ttcgtggtgc gctattattc cccggtggag acggtgggcg gcggcattgt 901 gctcaatccc aatgcgccca agcataagag gggagacgcg gcggtcgtaa aggccctttc 961 cgtgcgggag agcggcgatg acagcgcgca gatggaacag atcctgcggg acgagagcaa 1021 gaccttcccg acggcggaaa agctggcaaa acagctggga ctgagcacgg aagaagggtt 1081 gcagcagctg cagagccttg ctttgcaggg gaaagcggtc tcaattgcgg atgggattta 1141 cgtacatcaa gattatgtta actacataaa agacgctgcc tttgccattc tggatgccta 1201 ttatgccaag aatccgctgc ttgccgccat gccaagggaa gagctgcgca gcaagctggg 1261 cggtgccgtc aaggtgaccg acacgagaag tctcgaccgg gtgctgcagt atttgggaga 1321 gaccggcgtt ctggccttga cgccctctac ggcaggaaaa cagggctatt ccgtgcagtt 1381 cacgaaagcg cagctgcgtc tgatcgacga actattaaag ctttataagc aagcaggctg 1441 cgagagcccc gatcccgatg aagtttttgc cggacgaaag gataaagaag aatgcaaacg 1501 gctggtcgca gcgctgtgcg ccgatggccg gctcacccgc gtaagcggca agttctgcct 1561 ggacagtgca tttctgcagc agaccatcgc ctggatccgc gagaccattc agaccaacgg 1621 ttccataact cttgccgaac tgcgcgacca cctgaacacc tcccgcaaat atgccctcat 1681 gatcctcgaa tactgcgaca atgcgaagat caccaggctg caggacgata gaagggtgtt 1741 ctattagaat tatttataaa tttataaggc gctttgcatt gtccgataaa tcggaaaatg 1801 gtagaattat ttgaaaggta aagaacattc ggttgatgat tgcgggagag cgcggtaggc 1861 gcaccgaagg cgtaagttct ctgtccccgg ccagggcgga gggcgattat ctcaggtaaa 1921 cggaccgcag tcggacgaaa ctctggagag cgtaagcacc gaaggggcaa tttccggaca 1981 caatttccaa cgcagatttg tggaaagaaa ctctcaggtt agtgtacaga gcaggaaggc 2041 agtttgtttt cctgttcttt ttatttgccg aaaggaaacc gctttgatca tcctcacgaa 2101 caacccggac gtaatggaaa ccatgacaga acgcgacgtt cgcttcgtcg acggctccta 2161 ccgggacgtg ctcatcaagg cgagggatct ggtgcaccag ggtcaccggc tgctctccca 2221 tccgctgatg gggagcctga agcccaacga gaccccgtac cgcaccatcg ccctcagcga 2281 ctccggggga cccctggata cggacagcct gctgctgatc gaaaacgcca tcgaaacgtt 2341 cgacaagttt gcaagggtca cccgtccgga ccggggcatc aacaccccgc aggagatgct 2401 ggcggatttc cggctcatcg acctgagtct catacagagt atggaggtaa atgaatgaag 2461 ttagaattgg gtatcatcaa gatctcggat attcagttcg gcagcgaaag caaggtggaa 2521 ggctccactt tgtacgtcaa caaagacgag gtaaaggccc tcatcctgga ggacgagacc 2581 tttgcgagct gcgaactgga catcgcgaga cccggtgaat ccgtgcgcat cgctccggtg 2641 aaggacgtca tcgagccccg ggtcaaggta tccggcgaag gcggcgtgtt ccccggctgg 2701 atggcgaagg tgaagaccgt gggaagcggc cgcaccaacg ttctgaaagg cgctgccgtg 2761 gtcaccaccg gtaagatcgt cggattccag gaagggatca tcgacatgtg cggagagggc 2821 gcccagtata cgccgttctc ccagctgaac aacctggtgc tgtgtctgga gcctgtcgaa 2881 ggcaccctgc agcacgccta cgagaaggct gtccgcctgg ccggtctgaa gaccgccacc 2941 tacctgggca agctggcaaa ggacatcgaa gcggaggaga tccgcaccta cgagactccg 3001 agcatcacgg aaggcatcaa gctctatccg gatctgccca gagtgggcta cgtcctgatg 3061 ctgcagtccc agggcctgct gcacgacacc tacgtctatg gcgtggacgc caagcagtcc 3121 ctcaccacga tgatctatcc gaccgagacc atggacggtg ccatcatcag cggcaactgc 3181 gtatccgctt gcgacaagaa caccacgtat catcacctga acaaccccgt catcgaagat 3241 ctgtacgcc // LOCUS sequence107 3249 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence107 VERSION sequence107 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3249 /mol_type="genomic DNA" /organism="" /note="sequence107" CDS complement(1252..2037) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAVRTEQLDRDHERLNEAIRFAVEAHAGQLRKGTQLPYIVHPMEV LAILAAMGVDFDVMIAGVLHDCIEDAEVGREEIAAKFGEKVADMVAAHSEKKDLPWEER KAIALDELEAADPDFQKMVLADKLSNMRAIARDLKKVGDELWNRFHAPKEKQSWYYSES IDVLEPLQFDDMAEEYFWELNDLYKDVFVEYFFDPQEQRVYQQALHEDYCHVFERGDCI WYEGDKLPSDLIPVDKLFAERMEANWTEEMMDVSLGPVS" /locus_tag="LOCUS_3790" /note="WP_003730082.1 HD domain-containing protein (Listeria monocytogenes) [pid:39.9%, q_cov:54.8%, s_cov:79.4%, Eval:9.7e-28, partial hit]" /note="MGA_526" CDS complement(2050..2784) /product="LamB/YcsF family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002851457.1" /transl_table=11 /codon_start=1 /translation="MKNIDINSDLGESFGAYTMGNDAEVLRYVTSANIACGFHASDPLT MQKAVRLAKEAGAKIGAHPGYPDLVGFGRRELKVSPAELKAMVIYQVGALQAVCKAEGT KLHHVKPHGAMYNMAAKDEKLADAIAEAVAAVDGSLVLVGLSGSCMKAAAEKHGLAFAA EVFADRAYEDDGSLVSRTKPGAMIEDEDLAIRRMLHLLETGTIESSNGKEIRLEADTIC VHGDSPKAVLFAKKLREALTAK" /locus_tag="LOCUS_3800" /note="WP_002851457.1 LamB/YcsF family protein (Bacteria) [pid:56.0%, q_cov:98.8%, s_cov:94.5%, Eval:2.5e-75]" /note="MGA_527" ORIGIN 1 atttccagga acgcttccag tctcgtggcc agctggccgc tgtccgaaag cgagtaatcc 61 gtttcgatcg ccatataggg catgcccagg ctttccatct tgcggcggat cgtcgtactc 121 tccaccgtgt aggccgtaca ggcctgcagg tcgatctcca cgacgccgtc caccttgtat 181 tcgtccacca gcttctccag aagcgccaga cggcggctgt ccggggtcat gacggcgcag 241 ccgatcttta aatacttttc cgcaactgcc tgcacgatat ccggggcatc cacgtccacg 301 tcgtccagcg tcgccttaat accggagcag ttctcgaagc ataccacaac gccgcctgcg 361 gcttcgatgg cttttacggt cttctccagc acgccgccga tggggcagcc cgttacgaga 421 atgcgcttgg catccgcagg aaccgggcgt tttccggccg cataatcggc ttccagcccg 481 tccgccagac gggtgagctc cttgcagacc tcgttaacat cgaagtagaa accagcgcct 541 tccagggctt tatagatcgc gtaacccgtg cttgcggggg gctgcagttt ctgcagttcc 601 atcaggcgtc tgcggcaagc tctctctttg ttgcgcgctc tggccgcatc gcggatcgct 661 tcgtccggaa tggcctcgcc gaacttctgc tccagaaatt cgcggaaccg ctgcacctcc 721 tgcgtccact gctccagcgc gtgctcgcgg tcaccctggg gaagatgcag cagatagacg 781 tccttcatgt cgcccagcag ctcgtacatc ttcttcttgc catcgcaggt cgtctctccc 841 acgataatgt ccgagaagta cgtgtacgga catttatcgg acacggcaaa accgtagctc 901 gacttgatga gcgggcacag attcttcggc aggtgcactt ccgccgcggg gatcgtctct 961 tcgctcatgc cgcacaaaga taccgggctg accccggcag catccaggat ctcctggggc 1021 gtaaacgtac agaacgtgcc ggcgactctg ccgccgtttt ccttaatgct tttgacccgc 1081 agaaacccgt tttttcgggc atctccgaac tgcgcaaatt gctccggaag ttcgtaattc 1141 ataggtcttt cctccctctt ccaacctatt ccattataaa tcggatatgc aaattgattc 1201 atttacatat ccgatagaac ttcccgtttt atctgtttgt cagattctgc actagcttac 1261 cggtccgagg ctcacatcca tcatctcttc cgtccagttc gcctccatgc gctcggcgaa 1321 cagcttgtcc accgggataa ggtctgacgg gagcttgtcc ccttcgtacc agatgcagtc 1381 gccccgttca aacacgtggc agtagtcctc gtgcagagcc tgctgataga cgcgctgctc 1441 ctgggggtcg aaaaagtact cgacaaagac gtccttgtac agatcgttca gctcccagaa 1501 atactcctcc gccatgtcgt cgaactgcag cggctccagg acgtcgatgc tctcggaata 1561 gtaccaggac tgcttctcct tcggagcgtg gaagcgattc caaagctcat cccccacctt 1621 cttcagatcc cttgcgatcg cccgcatgtt ggacagtttg tccgccagga ccatcttctg 1681 aaagtccgga tcggccgcct ccagctcgtc cagcgcgatg gctttgcgct cttcccaggg 1741 aagatccttc ttctcggaat gcgccgccac catgtccgcc accttctcgc cgaacttcgc 1801 tgcgatctcc tcccggccga cctctgcgtc ttcgatgcag tcgtgcagca cgcctgcgat 1861 cattacgtcg aagtccacgc ccatggcagc gaggatcgcc agcacctcca tgggatgcac 1921 gatatagggc agctgcgtgc ctttgcgcag ctgacccgca tgggcctcca ccgcgaagcg 1981 gatcgcctcg ttcagccgtt catgatctct gtctaactgt tctgttctta ctgccatact 2041 gttctccgtc tattttgccg taagcgcctc gcgcagtttc ttcgcaaaca ggacagcctt 2101 ggggctgtcg ccgtgcacac agatcgtgtc tgcctccagc cggatctctt tgccgttact 2161 gctctcgatc gtaccggtct ctaaaagatg cagcatgcgc cggatcgcca gatcctcgtc 2221 ctcgatcatg gctccgggtt ttgttcggct cacgaggctg ccgtcgtcct cgtaagcccg 2281 gtccgcaaag acctccgcag caaaggccag gccgtgcttt tccgccgcgg ccttcataca 2341 gctgccggat agacccacca ggaccagtga cccatccacc gccgccacgg cttccgcgat 2401 ggcgtccgcc agtttctcgt cttttgccgc catgttatac atggcgccgt ggggctttac 2461 gtgatgcagc ttcgtccctt ccgctttgca gaccgcctgc agcgcaccga cctggtagat 2521 caccatagcc ttcagttctg ccggggacac cttcagttcc cggcggccga atcccacgag 2581 atccggatat ccgggatgcg cgccgatctt tgcaccggct tccttcgcca gacgaaccgc 2641 cttctgcatc gtcagcggat cggatgcatg aaatccgcag gcgatgttgg cggacgtgac 2701 gtagcgcagc acttccgcgt cgtttcccat ggtataggcg ccgaaggatt ctcccaggtc 2761 gctgttgata tcgatgttct tcataaggat tcacccaatt cttccaatgt gaccggcaca 2821 aaatggatcc ttttcccggg tcccagctgt gccagcagcg gcagatcttc cgagaggacc 2881 gtcccgatct tcgcatagcc gccggtggtc tggtggtcgg ccatcatcac gatgggctgc 2941 ccgtttgcag gcacctggat cgacccgaag cagatgccct ccgagaggat atccgtgccg 3001 ttcagggacg ggaccgccgc gccttccaac cggtatccca tgcggtcgca ggcggcgctg 3061 agggtataga tactgtccgt aaacgttttt ttcgcatctt ctgcaaacat ggcatcctgg 3121 gggccgaaca gaaagcggat ccgcgttacg ccctccggat ctgtggcctt cgcaagacgc 3181 tgcaggacgg gttcgcaggg cgttccctgt acttcggcaa gctcagcagc cgcttgtggg 3241 cgggacccg // LOCUS sequence108 3236 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence108 VERSION sequence108 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3236 /mol_type="genomic DNA" /organism="" /note="sequence108" CDS 404..919 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKLLSILLALAMIFSMAACSSKEEAPAEEPTPTEETGEETAEES AEETGEEGQNPVMNLVGDYASDRCTITVEAGEGNVANITIDWASSAAERSEWTMSGEFD EETTSVYYQDCIKKNLVFAEDGSISSEETVYEGGHGTFTFNADEQTLTWTDDIENIADG AVFTYIPR" /locus_tag="LOCUS_3810" /note="MGA_530" CDS 1108..1323 /product="helix-turn-helix transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002262994.1" /transl_table=11 /codon_start=1 /translation="MKNLKLKAARAAKDLSQADLAQMCGVSRQTINAIEKGDYNPTINL CIAICKALGRTLDELFWEEENEDAEK" /locus_tag="LOCUS_3820" /note="WP_002262994.1 helix-turn-helix transcriptional regulator (Streptococcus) [pid:75.0%, q_cov:90.1%, s_cov:100.0%, Eval:1.1e-20]" /note="MGA_531" CDS 1304..1774 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKTQKNNLDERQEQILLKIEHIGCWLAFWGLLAAILVQEVMYPGE LRAIAGEWIVFMVLCIYIMAGCLKNGIWDRRLKPNFRTNLLASFVAAAVVALISVAIGL RRIEDLDPKIILLICAIAAGVTFVACFLLLSAAAAATKRKQKQLEEEPEDEV" /locus_tag="LOCUS_3830" /note="MGA_532" CDS 1816..3009 /product="aminotransferase class I/II-fold pyridoxal phosphate-dependent enzyme" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011015808.1" /transl_table=11 /codon_start=1 /translation="MAHIQTDVLYTREYRDDAINMGKAESFPYYPATAFGATAFEEIKT AYQQGYTYIRTNNPDRDVLAGLMTKLEAPGMDAASTILSSGMAAITATAAALLQSGDHI LSNRCLYGETIELFDFLFGKFGVETTYVDMSDLDAVRAAVKPNTKMIYTEICANPTIDL VDLPELVTIAKDAGALLVVDNTFCSPLSIRPLEWGADIVINSLTKFLSGHSDILLGCVT ARPELVEKIYEFSLFMGSPADPFPAFQMIRALESAPMRIERQMSNAAKLAAYFETDPRI VKVNHPSVESFRQRALAKKLWKDDEKITGMMSVEFCTEDDAKIDAFMKRLKYVHYAPTL GGMRTTMSHPVTSSHNTTPDDVRRAMGITPALMRISIGIENIDDLIEDFRQAFVELE" /locus_tag="LOCUS_3840" /note="WP_011015808.1 aminotransferase class I/II-fold pyridoxal phosphate-dependent enzyme (Fusobacterium nucleatum) [pid:48.6%, q_cov:97.5%, s_cov:96.5%, Eval:2.4e-104]" /note="MGA_533" ORIGIN 1 cctgtggatc ccgatcccgt cgatccgacg gacattccgg acgatcccac accgcaggcc 61 ggtccgaccg gcggtgtcga cgacggctcg gatgagtacg gcggaaaaga tccggattcc 121 ggtctggaag acatggaaga cgaggacacg ccgaagatgg aatactctcc gctcaccggc 181 gatgaacgcc atacggcggt ctggatgggc gtgagcctgg catccctcgc cgcgatcctg 241 tggctggcat cccgccgcag aagagaagaa taggcgttct tgacgatttt tcaaaaaccg 301 gcgctccaat ttgcttcttt cgcaagttgg ggcgcttttt tcttttcatt tccaggcgat 361 tgtgctataa caacagggtg tgttaaaaag gaggaaatta gagatgaaaa agttactcag 421 cattttactc gcacttgcga tgatcttcag catggcagcc tgctcttcca aggaagaagc 481 acctgcagaa gaacccactc ccacagagga gaccggtgag gagactgcgg aagaatccgc 541 agaagagacc ggcgaagaag gtcagaaccc cgtgatgaac ctcgtaggcg actacgcttc 601 cgacagatgc accattactg tcgaagcggg cgaaggcaat gttgcgaaca tcaccatcga 661 ctgggcttcc agcgctgcgg aaagatccga atggaccatg tccggtgaat tcgatgaaga 721 aaccacttcc gtttattatc aggactgcat caagaagaac ctggtcttcg cagaagacgg 781 cagcatttct tctgaagaga ccgtttatga aggcggtcac ggcaccttca ccttcaacgc 841 agacgaacag acgctcacct ggaccgacga tatcgaaaac atcgcggacg gtgcggtctt 901 cacttacatt cccagataat tcagtttgag acacatgcgt gaccctgcca atggcagggt 961 cactttttta tgctcaaaac accgtagatt acattttgtc gtttttatca aattaattgt 1021 aaaatatact tgacaatatg tcgtgcaagt cgtatagtta tcccagaaca agaccgcagg 1081 atgcggccag gaggaaagta cggatagatg aaaaacctga aattgaaagc agcccgggcg 1141 gcaaaggatc tgtcgcaggc agacctggca cagatgtgcg gggtgtcgcg gcagacgatc 1201 aacgccatcg agaagggcga ttacaatccg acgatcaatt tgtgcattgc tatctgcaag 1261 gctttgggaa gaacgttaga cgaactgttc tgggaggaag aaaatgaaga cgcagaaaaa 1321 taatctggat gaaagacagg agcagatcct gctgaagatc gaacacatcg gctgctggct 1381 cgcattctgg ggactgctgg cagccatcct cgtccaggaa gtgatgtatc ccggcgagct 1441 gcgcgctatc gcaggtgagt ggatcgtctt tatggtcctc tgcatctaca tcatggccgg 1501 atgcctgaaa aacggtatct gggaccgccg cttaaagccg aatttccgca cgaatctact 1561 ggcatccttc gtggcagccg ccgtagtcgc gctcatctcc gtcgccatcg gcctgcgcag 1621 gattgaggat ctggatccga agatcatcct tctgatctgc gccatcgccg ccggcgttac 1681 cttcgttgcc tgctttctcc tgctctccgc tgccgctgct gccaccaagc gcaagcagaa 1741 gcagctggaa gaagagccgg aggatgaggt ataataaaca aggcaacata ccgctttgca 1801 gcaaggaggc actctatggc acacatccag accgatgttt tatacaccag agaataccgc 1861 gacgacgcga tcaacatggg aaaggcggaa tcgttcccgt attacccggc cacggcgttc 1921 ggcgctacgg cttttgagga gatcaaaacg gcctatcagc agggctacac ctacatccgg 1981 accaacaacc cggaccgcga cgtgctggca ggcctgatga cgaaactgga agcgccgggc 2041 atggatgcgg caagcacgat cctttcctcc ggcatggctg cgatcactgc gacggcggca 2101 gctttgctcc aaagcggcga ccacatcctc agcaaccgct gcctgtacgg cgagaccatc 2161 gaactgttcg acttcctgtt cggcaagttt ggtgtggaga cgacctatgt ggacatgtcc 2221 gacctggatg cggtccgcgc ggcagtcaag ccgaacacga agatgatcta taccgagatc 2281 tgcgccaacc cgaccatcga tctggtggat ctgccggagc tggtaacgat cgcgaaggac 2341 gccggtgcgc tgctggtcgt ggacaacacg ttctgttcgc ctctgtccat ccgcccgctg 2401 gagtggggcg cggacatcgt catcaactcg cttacgaaat tcctgtccgg ccattcggac 2461 atcctgctgg gctgcgttac ggcgcggccg gagctggtcg agaagatcta tgaattctcg 2521 ctgttcatgg ggtcaccggc ggatccgttc ccggcattcc agatgatccg ggccctggag 2581 agcgccccca tgcgcatcga gcggcagatg tccaacgcgg caaagctggc tgcctatttc 2641 gagaccgatc cccgcatcgt aaaggtgaac cacccatcgg tggagagctt ccgtcagcgg 2701 gcactcgcga agaaactctg gaaggacgac gaaaagatca cgggcatgat gagcgtggag 2761 ttctgcacgg aggacgatgc caagatcgac gcctttatga agcggctgaa gtacgtccat 2821 tacgcgccta ctctgggcgg catgcgcacc accatgagcc accccgtaac atcctcccac 2881 aacacgacgc cggacgacgt gagaagggcc atggggatca cgccggcact gatgcgcatc 2941 tccatcggca tcgagaatat cgacgacctg atcgaggatt tcagacaggc atttgtagaa 3001 ctggaataat gtgcatcgcg gcataaaaaa ataattcagg agcggagcga tccgctcctt 3061 ttttgttgga catttgttgg acttaccctg ttaaactggt agtcggttaa gtttgggacc 3121 ggcttatgac cttcatgtgt ccggtagtta tattgggaaa ggggaaggaa actatgaagc 3181 actctttcag aaagttattg tctgtactgc ttgcggcagt catggtattc ggcggc // LOCUS sequence109 3226 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence109 VERSION sequence109 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3226 /mol_type="genomic DNA" /organism="" /note="sequence109" CDS 404..2209 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDQDKGKYSERIGKVKFSILQQVALLFVLGVLVTGFFTYFAQYDA ADESIKQRTASLADEIGNEVTMAVKEYPAYPWLIRYWYENSDSLDIEYDVRFTKATQTA GKCMQLLLRHPGFRLQYADEGDLEALPEKDQKLYAEIIYSWLITRVNEIKQAHGVDYLF CVVSDDPYSEQFFLFSAADPGSIRGTNYEEVYPIGVTVTVAESQQKAMRDARQNSRYLA DAGDYVDYYELLDTVDGHAVLIGMTYNLSDIRASIESQTDRSTALAVAYQLFLSAICLV LILLTVLKPVQMIQQSIRKYEQSKDSEVVRQDLAQVRSTNEIGQLKNDIIVMTEEIDEH LHQIESITAERERVGAELAVASRIQSRSLPGVFPPFPDRSEFDVYATMTPAKEVGGDFY NFFMIDDDHLALMIADVSGKGIPASLFMMITMVLLKTETKAGVSPAEVLRQVNEQICSN NPEEMFVSVWMGILEISTGRLTAVNAGHEYPVVKHGNGKYELLKDVHGFVVGGFDDMTY DDYELQLEPGSRLFVYTDGLPEAMAAERSMFGMARIVETLNEGPDGTPKEVVEHMRDAV NRFVKDEEQFDDLTMLCLSYEGPAK" /locus_tag="LOCUS_3850" /note="WP_011203082.1 SpoIIE family protein phosphatase (Bacteroides fragilis) [pid:39.8%, q_cov:44.3%, s_cov:70.4%, Eval:6.3e-49, partial hit]" /note="MGA_535" CDS 2237..2854 /product="trimeric intracellular cation channel family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004254956.1" /transl_table=11 /codon_start=1 /translation="MIYTLELIGTIAFAVSGASVGIKKKMDILGVAVLAMTTAVGGGIL RDLIINVVPPAAFRDPAFTVTAIAVGLIAFLPPVREDYRRKAEFYEKVLLVTDALGLGI FTAIGIQAAYSAIPWCNGFLAGFVGVLTGVGGGVMRDVMAGEQPYIFVKHFYASASILG AVYCVLTWDHMSQAASLLSCTALVVLLRILAAKFRWKLPKAE" /locus_tag="LOCUS_3860" /note="WP_004254956.1 trimeric intracellular cation channel family protein (Lactococcus) [pid:40.9%, q_cov:98.0%, s_cov:95.0%, Eval:1.2e-37]" /note="MGA_536" ORIGIN 1 cagcattctg gaacggatcg gcatcgaagg cctggcggag ctggaagaga cgctcgcctc 61 ggtcttccac gtgagcaacc tgatcgtggc cggggtcggc cttctggcgg tcctgatgct 121 ttacgcctat ctgccgatca cacggcactc gctgaagagc cgcctgccgg gagcggtctt 181 taccggggtc atctggttcc tgtttacgaa gatcttttcc ttcgcgatcc cccggtttta 241 ccgcgcatcc agcctgtacg gctcgctggc atccctcttc ctggttctgc tgtgggtgcg 301 gatcatcatg atgatcctgt ttgccggcgg agctctgaac aaggcgctgg aggcggaagg 361 gatcgatacg gagcggctgc tccgccggag aaaatagaag acgatggatc aggacaaggg 421 caagtattcc gaacggatcg gaaaggtaaa attcagcatc ctgcagcaag tcgccctcct 481 cttcgtgctg ggcgtccttg tgacgggctt ttttacgtat tttgcccagt acgatgccgc 541 agatgagagc atcaaacagc ggacggcgtc gctggcggac gagatcggca acgaagtgac 601 catggcggtg aaggaatatc ctgcctatcc gtggctcatc cgctattggt acgaaaacag 661 cgattccctg gacatcgaat acgacgtgcg ctttaccaag gcgacccaga ccgccggaaa 721 gtgcatgcag ctgctgctgc gccaccccgg attccgtctg cagtatgcgg acgaagggga 781 tctggaggcc ctgccggaaa aggatcagaa actctacgcg gagatcatct actcctggct 841 catcacgcgg gtcaacgaga tcaaacaggc ccacggcgtg gattatctgt tctgcgttgt 901 ctcggatgac ccctacagcg aacagttctt cctgttcagc gcggcggacc ccggttcgat 961 ccgcggcacg aactacgagg aagtttaccc gatcggggtc accgttacgg tggcggagag 1021 ccagcagaag gccatgcgcg acgccaggca gaactccaga tatctggcgg atgccggcga 1081 ttacgtggac tactatgaac tgctggatac ggtcgacggc cacgctgtcc tcatcggcat 1141 gacctacaac ctgtcggata tccgggccag catcgagtcg cagaccgacc ggagcacagc 1201 cctggcggtg gcttaccagc tcttcctttc ggcgatctgc ctggtgctca tcctgctgac 1261 ggtgctcaaa ccggtgcaga tgatccagca gagcatccgc aaatacgaac agagcaagga 1321 cagcgaagtc gtgcggcagg atctggcgca ggtccgcagc accaacgaga tcggccagct 1381 gaagaacgat attatcgtta tgacggagga gatcgacgaa catctgcacc agatcgagtc 1441 catcacggcg gagcgggagc gtgtcggcgc ggagctggcg gtggcttccc gcatccagtc 1501 ccggtctctg ccgggggtgt tcccaccgtt cccggaccgc agcgaattcg acgtttacgc 1561 cacgatgacc ccggcaaagg aggtcggcgg cgatttctat aacttcttca tgatcgacga 1621 cgatcatctg gctctgatga tcgcggacgt ttccggcaag ggcattccgg catcgctgtt 1681 catgatgatc accatggtgc ttctgaagac cgagacgaag gccggcgtaa gccccgccga 1741 agtgctgcgg caggtgaacg aacagatctg ctcgaacaat ccggaggaga tgttcgtcag 1801 cgtctggatg ggcatcctgg agatctccac gggccggctg accgctgtaa acgcgggcca 1861 cgaatacccg gtggtaaagc acgggaacgg gaagtacgaa ttgctgaagg acgtccacgg 1921 cttcgtggtg ggcggcttcg acgatatgac ctacgacgac tacgagctgc agctggagcc 1981 cggctcccgc ctgttcgtct acacggacgg cctgccggaa gccatggcgg cggagcgcag 2041 catgttcggt atggcccgga tcgtggaaac gctgaacgag gggccggacg gcacgccgaa 2101 ggaagtcgtg gagcacatga gagatgcggt caaccgcttc gtgaaagacg aggagcagtt 2161 cgacgatctc accatgctgt gtctgtccta cgagggcccg gcaaaataat acgaaactca 2221 gaaaggttgg aattctttga tctatacgtt ggaactcatc ggcaccatcg cgtttgcggt 2281 ctccggtgcc tctgtgggca ttaaaaagaa aatggatatt ctcggcgtcg ctgtcctggc 2341 catgaccact gccgtgggcg gcggcatttt gcgtgacctc atcatcaacg tcgtgccgcc 2401 ggccgcgttc cgcgatccgg cgtttacggt cacggcgatc gctgtagggc tcatcgcctt 2461 ccttcctccc gtgcgggaag attaccggcg caaagcggag ttttacgaga aggtcctcct 2521 ggtgacggat gcgctgggcc tgggcatctt taccgccatc ggcatccagg ctgcctacag 2581 cgccatcccc tggtgcaacg gctttctggc gggcttcgtc ggcgtgctga cgggcgtggg 2641 cggcggcgtg atgcgcgacg tgatggccgg cgagcagccc tacatcttcg taaagcattt 2701 ctatgccagc gcctccattc tgggcgctgt ttactgcgtc ctcacctggg accacatgag 2761 ccaggcagcg tcgctgcttt cctgcacggc gcttgtcgtg ctgctgcgca tcctggcggc 2821 caaattccgc tggaagctgc ccaaggcgga gtagggggaa acaggcgcct tttttggctc 2881 tttacgaggt gcatgttctt ttcccgccgt gtttttgtta taatcatctt aactagaaat 2941 cccataacca aggaggacag ttaaatgtgt aaaaaggtgt attcaatcgt gctgtgccta 3001 tgcctgctgc ttacgctgct gccggcacag gtgtttgctg ccaatgtgca agaaggctta 3061 tattggcgct gggcaaaacg ggtcagccat gatcctgctt cgtgggagca aatgccgaac 3121 gaacagttgg aaacaaagat aaatggcagc tatcccggtt cgcaggggat agagttcatt 3181 tatgtggaca gcgccggaac ggaaaatccc gttgctgtca gcgaac // LOCUS sequence110 3226 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence110 VERSION sequence110 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3226 /mol_type="genomic DNA" /organism="" /note="sequence110" CDS 214..876 /product="(d)CMP kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010943242.1" /transl_table=11 /codon_start=1 /translation="MRTKTIVAIDGPAGAGKSTIAKRLAQRIGADYIDTGAMYRAVALK LLRTGTDYNDPEALQTMLDAMDVDFSQGKTILDGEDVSGLIRTPEISALASPSSGVPAV RYKLTALQQAMGKRKSIVMDGRDIGTVVFPDADFKFFLTASADERARRRTEEMRAKGQE ADFETIRADIIQRDYQDSHRAFRPLQKAEDAVEIDSTDMSIDSVVDTMMAFIEARDR" /locus_tag="LOCUS_3870" /gene="cmk" /EC_number="2.7.4.25" /note="WP_010943242.1 (d)CMP kinase (Geobacter sulfurreducens) [pid:46.6%, q_cov:99.5%, s_cov:95.7%, Eval:4.1e-47]" /note="MGA_539" CDS 895..1881 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAGSENQKYKLLYLYKILMEETDEDHVLTTPQLIEKLAAKGIRAE RKSIYADLEALRNEFGVDIVDVGRGGHYVGERTFEFPEVKLLADSVLSSRFITDRKTVE LVEKLKTLASTHQARQLTGRMFVADRVKSMNSSVYYSVDTIASAIDSGCKVSFRYFTFN AAKEKQYHHEGQAVSVSPYDLVWDNEYYYLIAYDGADRKIKHYRIDRMERIKVLGNEKR EGADLYDKADVRSYSKRMFSMFAGEETAVTLRFADKLAAVFIDRFGKDVIVSPDGEGHS RVNVRVFVSPQFYGWLFGLGPDVQILAPEAVRTEYTKRLKEVQAQYE" /locus_tag="LOCUS_3880" /note="MGA_540" CDS 1878..2801 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MIYHSIFNEVLGPITTGPSSSHTAGCGRIGLVARSLYGKDVCRAD IVFDKNGSYPSTYQGQGSDYGFTGGLLGIPIDDPRFRDSLRLAKAQGVDICFKTEDLGS EHPNQAEIRFYESKDAQRPSMRLMTYSIGGGMIEIRAMDDFPVYIDGSSKEAFILCSEA CEDAVEEVIRKNRFFYDRTDGKGDRFFEVDIEADQDSAPLLELRGWEGVQYVRIADPVM AVPKRRASLMPFGTAAQALEYGEAHGLNAAQLACVYESAYGFVSEEGAYALAARTEEVM RASSVPPDPETTAVNGFLPYFGKKMA" /locus_tag="LOCUS_3890" /note="WP_164922193.1 L-serine ammonia-lyase, iron-sulfur-dependent, subunit alpha (Rhodopirellula baltica) [pid:30.5%, q_cov:91.2%, s_cov:51.9%, Eval:2.8e-27, partial hit]" /note="MGA_541" ORIGIN 1 gatcagcagt tccttcatcg gcgaggtcgt catggagaaa ctgaaggatc tggacgaggt 61 cgcctacgtg cgctttgcct cggtctaccg tcagtttaag gacgtcaaca cctttatcgc 121 agagatcgaa aaactgctgg gaagcggcgc aggaacaaag ctcaagaagg ctgccaaggc 181 tccgaaggcc gctcccgggg aggaataagc cctatgcgga ccaagaccat cgtcgccatc 241 gacggaccgg caggcgcagg gaaaagcacc atcgccaagc ggctggcgca gcgcatcggt 301 gcggattaca tcgatacggg tgctatgtac cgggcggtag cgttaaaact gctccgcacc 361 ggcacggatt ataacgaccc ggaagcgctg cagactatgc tggacgccat ggatgtggat 421 ttctcgcagg gaaagaccat cctggacggg gaagacgtga gcgggctcat ccgcaccccc 481 gagatctcgg cactggcttc gccttcgtcg ggcgttcctg ccgtgcggta taagcttacg 541 gcgctgcagc aggccatggg aaagcggaag agcatcgtca tggacggcag ggacatcggc 601 accgtcgtgt tccccgacgc ggattttaaa tttttcctga cggcctccgc ggacgagcgg 661 gcccgccgcc gcaccgaaga gatgcgcgcg aaaggacagg aagcggactt cgagacgatc 721 cgggcggata tcatccagcg cgactaccag gattcccacc gggcattccg gccgctgcag 781 aaggcggaag acgcggtgga gatcgactcg acggacatga gtatcgacag cgtcgtggat 841 accatgatgg cctttatcga ggcgagagac cgctagcgat ccgggaggca gaccatggca 901 gggagcgaaa atcaaaagta taaacttttg tatctgtaca agatcctgat ggaggaaacg 961 gacgaagacc atgtcctgac gacgccccag ctgatcgaaa aactggcggc gaagggcatc 1021 cgggcggagc gcaagagcat ctacgcggat ctggaagcgc tgcgaaacga gttcggcgtg 1081 gacatcgtcg acgtgggccg gggcggtcat tacgtagggg agcgcacgtt cgagtttccc 1141 gaggtaaaac tgctggcaga cagcgtgctc tcttcgcggt tcatcacgga tcgcaagacc 1201 gtggaactcg tggagaagct caaaacgctg gcgagcactc atcaggcacg gcagctcacc 1261 gggcgcatgt tcgtcgcgga ccgggtaaaa tccatgaaca gcagcgtcta ctacagcgtg 1321 gacaccatcg catctgccat cgattccggc tgcaaggtgt cgttccgtta tttcaccttt 1381 aacgcagcca aggaaaagca gtatcaccac gagggccaag ccgtctccgt cagcccctac 1441 gatctcgtat gggacaacga atactattac ctgatcgcct acgacggcgc ggacagaaag 1501 ataaagcact accgcatcga ccgcatggag cgcatcaaag tcctcgggaa cgagaaacgg 1561 gagggtgccg atctgtacga caaagcggac gtgcgttcct attccaagcg catgttttcc 1621 atgtttgcgg gggaagagac cgcagtgacc ctccgatttg ccgataagct ggcggctgtc 1681 tttatcgacc gcttcggcaa ggacgtgatc gtctcgccgg acggcgaagg acattcccgg 1741 gtaaacgtcc gggtgtttgt gagcccgcag ttctacggct ggctgttcgg tctcggaccg 1801 gacgtgcaga tccttgcgcc cgaagccgtg cggacggagt atacgaagcg tctgaaggaa 1861 gtgcaggcgc aatacgaatg atctatcaca gcatattcaa cgaagtgctc ggccccatca 1921 ccacagggcc ttcgagctct catacggcag gctgcgggcg cattgggctc gtagccaggt 1981 ctttatatgg aaaagatgtg tgccgggcgg acatcgtgtt cgacaagaac ggttcctatc 2041 ccagcaccta tcagggccag ggttcggact acggttttac cggaggactg ctgggcatcc 2101 ccatcgacga cccgcgtttt cgggacagcc tccggctggc aaaagcgcag ggcgtcgata 2161 tttgttttaa gacggaagat ctcggaagcg agcaccccaa tcaggcggag atccgcttct 2221 acgagagcaa agacgcgcaa agaccgtcta tgcgccttat gacgtactcc atcggcggcg 2281 gcatgatcga gatccgcgcc atggatgact ttcccgtcta tatcgacggc agcagcaaag 2341 aggcctttat cctctgcagc gaagcgtgcg aagacgcggt ggaggaggtc atccgcaaaa 2401 accgcttctt ctacgaccgc acggacggca aaggcgatcg ctttttcgag gtagatatcg 2461 aagcggatca ggacagtgcg ccgctgctgg aactgcgtgg ctgggagggc gtacagtacg 2521 tacgcatcgc agaccctgtg atggccgtac cgaagagaag ggcttcgctt atgccattcg 2581 gcaccgcagc gcaggcgctg gaatacggcg aggcgcacgg tctgaacgcg gcgcagctgg 2641 cctgcgtcta cgagagcgct tacggatttg tctccgaaga aggggcatac gcgctggctg 2701 cccgcacgga agaagtgatg cgcgcgtctt ctgtaccgcc ggatccggag acgacagccg 2761 taaacggatt tttgccctat ttcggaaaaa agatggcgta aaaagcgccg gcaaccgttc 2821 tgttcggcgg agacgtcttc cgcagtgcca tgcttgccag cgtggccgtc atggaaaaca 2881 acaacgccca caacgtggtg gcggctgcac cgacggcagg cgccagcggc gtgctgcccg 2941 gggcgatcgt cgccatggga tctgccatgg gcttttcttc ggagaagata caggaaggcc 3001 tgctggccgc aggactcgtg ggcgcgttca tcggcaacca ggcgaccttc ggcgcggagg 3061 tggcgggttg tcaggcggaa aacggcgccg catccgccat ggctgcggca ggcatcgcgc 3121 acatgctggg gtgtcctctg aaggacgtat tcggcgcagc ggggctggcg cttcagaaca 3181 tgctgggact ggtctgtgac cccgtagcag gccttacgga gctgcc // LOCUS sequence111 3160 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence111 VERSION sequence111 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3160 /mol_type="genomic DNA" /organism="" /note="sequence111" CDS 336..1601 /product="phosphoribosylamine--glycine ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393539.1" /transl_table=11 /codon_start=1 /translation="MNVMVIGGGGREHAIIKKIKENPEVTAIYALPGNGGIAMDAYCVD IKATDLEGIKEFVKGHPVDYAVVAPDDPLVLGCVDMLQDMGIPCFGPEAKAAIIEGSKV FSKDLMKKYGIPTAKYETFDDMEDALAYLDSAPIPTVIKADGLALGKGVIIAQSTGEAK QAVISMMQDKQFGKSGERIVIEEFLEGPEVSVLSFTDGKTVVPMISSMDHKRIGDGDTG LNTGGMGTIAPNPYYTEDVAKRCMEEIFLPTIAAMNAEGRTFKGCLYFGLMLCADGPKV IEYNCRFGDPETQVVLPLLESDLLTVMQAVTNGTLAETEVKFSDKHACCVILASEGYPV SYKKGFPISIPADVLPCTYIAGAKKEMGQLVTSGGRVLGVTAVADSLKEAIDASYAMAE QIRFEGAYKRSDIGARALKAVR" /locus_tag="LOCUS_3900" /gene="purD" /EC_number="6.3.4.13" /note="WP_011393539.1 phosphoribosylamine--glycine ligase (Moorella thermoacetica) [pid:50.1%, q_cov:99.5%, s_cov:99.8%, Eval:9.7e-112]" /note="MGA_544" ORIGIN 1 tgacagagac aacgccatcg acggctacat caaccagaac gagctggacg tctgcgccga 61 aggcaactgg cagagatatt tcagcagaca gcccgaaccc ttcaccaagg aaaagcagaa 121 ggcctacctg gcgacgatcg acggcatcgc cctgggttcc gacgctttct tccccttcga 181 cgacaacatc gagagagcca agctctccgg cgtcaaatac atcgcggagc ccggcggatc 241 cgtccgcgac gacctcgtca tcggcgcctg cgacaagtac ggcatggtca tggcctttac 301 cggcatgcgc ctgttccatc actaggaggc aaactatgaa cgtaatggtc atcggaggag 361 gcgggcgcga gcacgccatc atcaagaaga tcaaggaaaa cccggaagtg accgccatct 421 acgccctgcc cggcaacggc ggcatcgcca tggacgcata ctgcgtagac atcaaggcga 481 cggatctgga aggcatcaaa gaatttgtaa agggtcaccc ggtggattac gccgtggtcg 541 ccccggacga tcctctggtc ctgggctgcg tcgacatgct gcaggacatg ggcatcccct 601 gctttgggcc cgaggcgaag gcagccatca tcgaaggcag caaggtcttt tcgaaggacc 661 tgatgaagaa atacggcatt cccaccgcga aatacgagac gttcgacgat atggaagatg 721 ccctcgctta tctggacagc gcccccattc ccaccgtcat caaggcggac ggactggctc 781 tgggcaaggg cgtcatcatc gcacagagca ccggagaagc caagcaggcc gtcatctcca 841 tgatgcagga taagcagttc ggcaagagcg gcgagcgcat cgtcatcgaa gagttcctgg 901 aggggccgga agtgtccgtc ctgtccttta cggacggcaa gacggtcgta cccatgatct 961 cctccatgga tcacaagcgc atcggagacg gcgacaccgg cctgaatacc ggcggcatgg 1021 gcaccatcgc ccccaacccc tattacacgg aagacgtggc caagcgctgc atggaagaga 1081 tcttcctgcc caccatcgcc gccatgaacg ccgaaggccg cacctttaag ggctgcctgt 1141 acttcggcct catgctctgc gccgacgggc cgaaagtcat cgagtacaat tgccgcttcg 1201 gtgacccgga gacccaggtg gtgctccccc tgctggaaag cgacctcctc accgtgatgc 1261 aggccgttac gaacggcacg ctggcggaga cggaagtcaa gttcagcgat aagcacgcct 1321 gctgcgtcat cctggcatcc gaaggatatc ccgtctccta caagaagggc ttccccatca 1381 gcattcccgc ggacgtgctg ccctgcacgt atatcgcggg cgcgaagaag gagatgggcc 1441 agctcgtaac gtccggcggc agagttctgg gggtcaccgc ggtagcggac agcctgaagg 1501 aagccatcga cgcctcctat gccatggcgg agcagatccg cttcgaaggc gcctacaaac 1561 gctcggatat cggggcaaga gccctgaagg cagtcagata aagccagttg ttttcacgga 1621 aaggacaaga aaagaaacat ggtttacaga gtatacgtag aaaagaaacc cggattcgat 1681 ctggaagcga agagcatgct ggcggatctg aaatccagtc tggggatcga aggtctgaag 1741 gacgtccgga tgttcaaccg ctacgacgcg gagaacatgt cgaaggaaca gttcgactac 1801 gccgtaaagt atgtcttctc cgaaccgcag atggataccg cctgcgagct gcctgacttc 1861 ggcgatgcta aggtcttcgc cgtggagttc ctgcccggcc agttcgacca gagagccgac 1921 tccgctgccc agtgcatcca gctgatcttc cagggcgaac gtcccctcac ccgctccgcc 1981 agagtctatg ctctttatgg cgatctgagc aatgcggacg tggaagcggt caagaagtac 2041 gtcatcaacc ccgtggaagc cagagaagcc gcggcggaag tccccgagac cctggtcgtc 2101 aactacgaca ttcccacgga agttgccacc ctgacgggct ttaccgccat gaccgacgcg 2161 gatctggaca agttcatcgc agacaacggt ctggcgatgg acgaggcgga cctggcaatg 2221 gtccgggact acttcgcttc cgagcaccgt gaccccacca tcaccgagat caagatgatc 2281 gacacctact ggtccgatca ctgcagacat accaccttca acaccgtgat cgacggcgtt 2341 acgttcgagg acgagctgct ccagaacgcc tggaacgact acctcaagac ccgcgaggat 2401 ctgggccaca cgaagcccat ctgcctgatg gacctgggca ccatcgcagc caaagagctc 2461 aagaagcagg gcaagatgga caagctggac gaatccgacg agatcaacgc ctgcaccatc 2521 aagatgaccg tgaatatcga tggcaaggaa gaaccctggc tgcttctctt caagaacgag 2581 acccacaatc atccgaccga gatcgagccc ttcggcggcg cagccacctg caccggcggc 2641 atcatccgcg atccgctttc cggcagagcg tacgtctatg cagcgatgcg cgtgagcggc 2701 gcggcggacc cgacgcggcc cctgagcgaa gcgcttcccg gcaagattcc ccagaagaag 2761 ctcacccaga ccgcagcagc gggcaactct tcctacggca accagatcgg tcttcccgcc 2821 ggcgtcgtgg aagagatcta ccaccccggc tacgtagcga agagaatgga gctcggcgca 2881 gtcgtagcgg cagcgcccgc ggagaacgtg cgcagagaag ttccggctcc cggcgacgtg 2941 gtcatcctgc tgggcggcgg cacgggccgt gacggcatcg gcggcgccac cggcgcttcc 3001 aaagcccacg acgtgcactc cgtcgagacc tgcggcgcgg aagtccagaa gggcaacgca 3061 cccgaagaga gaaagatgca gagactgttc cgcaacggcg aagcgacccg cctcatcaag 3121 cgctgcaacg acttcggcgc aggcggcgta tccgtcgcca // LOCUS sequence112 3155 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence112 VERSION sequence112 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3155 /mol_type="genomic DNA" /organism="" /note="sequence112" CDS 1391..1600 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNVKKYTIVSEVFVCEEEPCLCYGIRREDDAIRYISTDRVFVEM VTEVVNRLDLDPQRARDLIESLLP" /locus_tag="LOCUS_3910" /note="MGA_547" CDS complement(1665..1877) /product="PTS ascorbate transporter subunit IIC" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000796544.1" /transl_table=11 /codon_start=1 /translation="MTEDLKSTKKQVPLRLSPKLYAAIAAWAEDDFRSVNGQIEYLLTE CVKQRKKNGKYVGEEIDAPIELDIE" /locus_tag="LOCUS_3920" /note="WP_000796544.1 PTS ascorbate transporter subunit IIC (Bacteria) [pid:79.7%, q_cov:91.4%, s_cov:97.0%, Eval:2.8e-24]" /note="MGA_548" CDS complement(1893..2924) /product="SPFH domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000136824.1" /transl_table=11 /codon_start=1 /translation="MNEIILNKRKNGMGMLLLLLILYVGAVILLIGSASYALPIHGALR GIVIAVCILWLAIGWILFLGLKVIRPQEALVLTLFGNYVGTLREEGFYWVNPFCVAVNP AANTKLSQSGDVDSGDKTSLLTTLATSGKQTGEISSKKISLKVMTLSNSRQKINDCLGN PVEIGIAVMWRVTDTAKAVFNVDNYKEYLSLQCDSALREIVRIYPYDVAPGVDTTGDGI ADEGSLRGSSELVASRIRDEIQHKVTEAGLEILEARITYLAYAPEIAAVMLQRQQASAI IDARKMIVDGAVGMVEMALDRLAENNTVELDEERKAAMVSNLLVVLCGNKDAQPIVHSG SLY" /locus_tag="LOCUS_3930" /note="WP_000136824.1 SPFH domain-containing protein (Streptococcus pneumoniae) [pid:69.3%, q_cov:100.0%, s_cov:100.0%, Eval:2.3e-121]" /note="MGA_549" ORIGIN 1 atgatgtatt cttcttccag gttccagatc gaccgtccgg ggtcggactg gatgccgaag 61 cgctttctgg ggttgtccga gagcaatttg accagctgat cgagggtgag cgttccggac 121 tttaccagat aggtgtagag cagcgggaat gccgtttcga tccccacgat gccgaacgcg 181 ctcttctcta gacccttcgc cttttcttcg gcgctgtggg gcgcgtggtc ggtggctacg 241 atctcgatcg tgccgtcgca gatgccctcc agcagcgctt cccggtcggt tttatcccgc 301 accggcggat tcatcttgaa ccatccgtct tcggtcagct gggagtcgtc catcagcagg 361 taatggggcg ccgtctcgca ggatacgtcg atgccgtcct tcttgccctg gcggacgagc 421 tctgcgctct cttttgttga gatgtggcac acgtggtagc cgcagccggt ctgatacgcc 481 aggtcgatat cgcgttccac ctgccgccat tcgctctcgc tacagatgcc tcgatgtccg 541 tgctccttgg cgtagcggcc gtcgtggatg tagccgccgc gcagcagctc gttgacttcg 601 cagtgggcga cgacgagttt gcctaaggct ttggcccggg tcatcgcctc tttcatgagc 661 cccgcatcct gcacgccttt gccgtcgtcg gaaaaggcgc agacgtaggg cgccatggct 721 tcgagatccg cgatctcttt gccctgttcc ccgacggaga tgctgccgta gggatggaca 781 gcgatcacag ccgtcttttc gatgatctcg agctgttgct cgagatggga cagactgtcg 841 ggcacgggcg ccaggttcgg catggtgcag acggcagtat agccgccgtg cgccgccgca 901 gccgatccgg atgcgatcgt ctccttatat gaaaaacccg gctcgcggaa gtgcacgtgc 961 acgtcgcaaa agccgggaag gacagtgctg ccgctgtccg tctgtccgaa agttctgccg 1021 ttgttttttg cgttgaaaga catagtttct ccggattttt gcagaaaacc ctgccggaaa 1081 gccggcaggg tgaacgaaca tagcaggaga ggggcctgtg ctgcagcacc tgcccaaaac 1141 tttctatgac tcgatcttgc cgacctcacg ggatcgttct taaagatcaa ttatcttaag 1201 tattatgcgc ctgcacaggg aggagtgtca aggaaaagca gcgaagtttt ttgctgaaaa 1261 aattttttgg aaaattttca aaaaagtgcg tgataatttg ctaaaaaatt actcatttat 1321 tatagaaggg gtttttggga tctgccgtag gcaaatctga aaataaagga tgcgtttagg 1381 aggagaagcg atgaagaatg taaaaaagta cacgatcgta agcgaagtat tcgtctgtga 1441 agaagaaccc tgtttgtgtt acgggatccg gcgcgaagac gacgccatcc gttatatctc 1501 gacagaccga gtctttgtgg aaatggtcac agaggtggta aatcgcctgg atctggatcc 1561 gcagcgcgcc agagatttga tcgaaagcct gctgccctaa acgacctccg caaaaaaagg 1621 ccggccgggt ctcgatgaga ccggccggct tttttttgta ccgtctattc gatgtccagc 1681 tcgatcggcg cgtcgatctc ttcgccgacg tacttgccgt ttttcttgcg ctgcttgacg 1741 cactcggtaa gcagatactc gatctgcccg ttgaccgagc ggaaatcgtc ctccgcccag 1801 gccgcgatgg cggcatagag cttcggcgac aggcgcagcg gcacctgttt tttggtgctt 1861 ttcagatctt cggtcatttc ctcacccgtg gactaataca ggctgccgga gtggacgatg 1921 ggctgtgcat ccttgttgcc gcacagtacg accagcaggt tgctcaccat ggcggctttg 1981 cgctcttcgt ccagttcgac ggtgttgttt tccgccagac ggtccagcgc catctccacc 2041 atgccgactg cgccgtccac gatcatcttg cgggcatcga tgatggccga tgcctgctga 2101 cgttgcagca taacggctgc gatctccggc gcgtaggcca gataggtgat gcgggcttcc 2161 aggatctcga ggcctgcttc ggtcaccttg tgctggatct cgtcccggat acggctcgcc 2221 accagctcgg aagaaccgcg caggctgcct tcgtccgcga tgccgtcgcc ggtcgtatcc 2281 acgccgggcg ccacgtcgta ggggtagatg cgcacgatct cgcgcagggc gctgtcgcac 2341 tgcagggaca ggtattcctt gtagttgtcg acgttaaaga cggccttcgc cgtgtccgtg 2401 acccgccaca tgaccgcaat gccgatctcc accgggttgc ccaggcagtc gttgatcttc 2461 tggcgggagt tggagagggt catcaccttg agggagatct tcttgctgct gatctctccc 2521 gtctgcttgc cgctggtcgc cagggtcgtc agaagcgagg tcttgtcgcc gctatccacg 2581 tcgccgctct gggagagctt cgtgttcgct gcggggttca ccgcgacgca gaacgggttg 2641 acccagtaga aaccttcctc ccggagggtc cccacgtagt tgccgaacag ggtgagcacc 2701 agcgcttcct ggggccggat gaccttaagt cccaggaaaa ggatccagcc aatagcgagc 2761 cagaggatgc agacggcgat gacgatgccg cgcagggcac cgtggatggg cagagcatag 2821 gaggcgctgc cgatgagcag gatgaccgct cccacgtaca gaatgagcag aagaagcagc 2881 atccccatgc cgttctttct tttgtttaag atgatttcgt tcatatgatc agataccttc 2941 cttttgaaaa ccacgatatg tgatatcaaa ataatatcac ttcgatagca gacgtcaaga 3001 ggtttttgaa aaatgttata atggaaagca gacaggaggg caggatccat gaagaccata 3061 ggactgatcg gcggcatgag ctgggaaagc acggtgccgt attaccagat cataaacgag 3121 accgtaaagc agactctggg cgggctgcat tccgc // LOCUS sequence113 3155 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence113 VERSION sequence113 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3155 /mol_type="genomic DNA" /organism="" /note="sequence113" CDS complement(875..1399) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTTALLLSCIKIFCCRILDVTCGTIRTILTVKENGKAAALVGFCE VFLWYVIVKDAMTSDGPVIAIAIAYAAGYATGTYVGGQIARRVISGNVTVQVVTSRRDD AMLSAIRDAGFAITVLNANESEFAEGKYLIIATVDKKQLKVFEDLVKEKDEKAFIMVSD TKSYVGGYFGK" /locus_tag="LOCUS_3940" /note="MGA_552" CDS 1531..1950 /product="CBS domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009889129.1" /transl_table=11 /codon_start=1 /translation="MNIAFLLQPKSDTAFLYDDFTLRQGLEKMRHHGYTAIPVIDREGK YITTISEGDFLWFILRDSEDGDLQEVPLQNLEKTQIKDIIHTDKNPPVPITATTDELVE RGMEQNFIPVVDDWGSFIGIITRRNLLERFAKYKD" /locus_tag="LOCUS_3950" /note="WP_009889129.1 CBS domain-containing protein (Clostridioides) [pid:48.1%, q_cov:94.2%, s_cov:88.0%, Eval:7.1e-31]" /note="MGA_553" CDS 2001..2903 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MHRPYKTRQGGCTVTVFVPYDCNNHCPFCVNKGEYADMTGFSLEK ICESIEVMDSITPACDFVFTGGEPFANLESLQVMLDKVPSTHHVYINTTLPVSKTVTEE DILAFTEKNKDKISCINVSRHMQHYVVESNDELLAKLPVPFRINCVLYKDYPVEGLIPF IERFKKIPGANIQFRFDYTATTPENLYDSEHDKIVHDLNKIGRYTGLDGCRMRCGFHYD YHGMEMVYHKTLPYSCIVEEDPKNRITYNILYDILIKQTGEIHADWSDAVLDDVRLDVP AYRHVVFEPYDMHWIEKID" /locus_tag="LOCUS_3960" /note="MGA_554" ORIGIN 1 acgcccagtt gatggcctgc tgcagcaccc aggtattcag ccggtgggcg ccatggccgt 61 attcgccgtt gatgtcgtgg tcgatcacga cttccggctt aaaccgccgc agcagcatta 121 cttcgtaagc ctcgacctcg tcgagatccc acaaagtctt cgcgtgctcc aggttatcgg 181 aatagtaatc cgtaaaagtc gaaataacgg gatagtgggt catgccaacg gtccaaaggc 241 cgtccagcag ttcgtggggc cgcatgggct gctcccaatg atgcgtcaga taggcgatct 301 gcaccttgta gcccagttcg cccgcgtagg tcggcatggt gccgccgaag aacaggtgct 361 cgtcgtccgc atgcgtggag atgagcagca tgtccgcatc gtcgtaaaaa ggctgccaaa 421 cctgcacgtc cgccggcaca tccccttccc cgtagcacag cacgtcgcag aggatggcgc 481 ctgcctgggg catgtggagg gtcacatgcg tggacggcgc gtccagcgcc acgtactcgt 541 ggagataatt cccctggccg cagagctgcc ccagggtgtg accctgggca tcttccgtca 601 gcagccagtt tccggggatg cggtcccaga cgatataaag gaaatggatg tcctggtcgg 661 aggagatctc caccaggccc gtttcgttaa aggtgagttt ggaataccag ttgtcgtcct 721 gcagtttggc ggcgctccag acttgcccgt cctcgatggc atccatctgc acggacagcc 781 gcggcgcgtc tgcggcaaag acgaggcagg cgcacagaag cacaagcaga acgctgaaaa 841 cggagattcg gatggtccgg gtcatgcgct tcgcctactt tccgaaatag ccgcccacat 901 agctcttggt gtcggagacc atgatgaagg ccttttcgtc cttctccttg acgaggtcct 961 cgaaaacctt caattgcttc ttgtccacgg tggcgatgat caggtacttg ccttccgcaa 1021 attcggattc gttggcgttg agcacggtga tggcaaagcc ggcgtcgcgg atggcggaca 1081 gcatggcgtc gtcccggcgg ctcgtgacca cctgcaccgt tacgtttccg ctgatgaccc 1141 tgcgggcgat ctgaccgccc acataggtgc ccgtcgcgta gcctgccgca tacgcgatgg 1201 cgatggcgat cacgggaccg tcgctggtca tggcgtcttt tacgataaca taccacagga 1261 aaacctcgca aaagcccacc aaagcggcag ctttgccgtt ctcctttacg gtaaggatcg 1321 tacggatagt gccgcacgta acgtccaaga tacggcagca gaagatcttg atgcagctga 1381 gcagcagcgc ggtcgtcata ggtttcgcct cccccaaagc acattatgtt gcgaatcgat 1441 atcgatgtat tataccatat gcagaaattt ttgtgtataa ttaaggtgta ggtatgcgcc 1501 ccgacgcgtg ccgcagaaag gaaagaacgc atgaatatcg catttctctt gcagcccaag 1561 agcgatacgg catttttata tgacgatttt accctccggc aggggctgga aaagatgaga 1621 catcacggtt acacggcgat ccccgttatc gaccgggagg gaaaatacat cacgaccatc 1681 agcgaaggag actttctctg gttcatcctc cgcgacagcg aggacggcga cctgcaggaa 1741 gtgccactgc agaatctgga gaagacgcag atcaaggaca tcatccacac ggacaagaat 1801 ccgccggtgc ccatcaccgc gacgaccgac gagctggtgg aacggggtat ggagcagaac 1861 tttatccccg tcgtggacga ctggggctct tttatcggca tcataaccag aagaaatctt 1921 ctcgaaaggt ttgcaaaata caaggattga gtgtatactt ttgaagttaa ttatatctct 1981 ggcacagtaa ggaaacattg atgcacagac catacaagac cagacagggc ggatgtaccg 2041 taaccgtatt cgtaccctac gactgtaata atcattgccc gttttgcgta aacaagggtg 2101 aatacgccga catgaccggc ttttctctgg agaagatctg cgagagcatc gaggtgatgg 2161 actccattac cccggcctgc gacttcgtct ttaccggcgg cgaacccttc gccaacctgg 2221 aatccctgca ggtgatgctg gacaaagtcc ccagcaccca ccacgtgtat atcaacacga 2281 ccctccccgt ttcgaagacc gttacggaag aggacattct cgcgttcacc gagaaaaaca 2341 aggacaagat cagctgcatc aacgtgtcgc gccacatgca gcactatgtc gtagaatcca 2401 acgacgagct gctggccaaa ctgccggtgc ccttccgcat caactgcgtg ctgtacaagg 2461 attatcccgt tgaagggctc atccccttta tcgaacgctt caagaagatc cccggcgcca 2521 acatccagtt ccgtttcgac tacacggcga ccaccccgga aaatctctac gacagcgaac 2581 acgacaagat cgtgcacgac ctgaataaga tcggccgcta caccggtctg gacggctgcc 2641 gcatgcgctg cggattccac tacgattacc acggcatgga gatggtctat cacaagactc 2701 tcccctattc ctgcatcgtg gaggaagatc cgaagaaccg catcacgtac aacatcctgt 2761 acgatatcct catcaagcag accggcgaga tccacgccga ctggagcgat gccgtgctgg 2821 acgacgtccg tctggacgtg ccggcctacc gccacgtggt gttcgagccc tacgacatgc 2881 actggatcga aaagatcgac tagaaaatac cgccgccccg cttttccggg gcggtttttg 2941 tgtgacccca tgaatatcat cctcggaaaa cttatcctgc tctttgttct gctcatcgtt 3001 ctgatgaagt gcagactcaa tttgtcctgg tccatgggga tcacgatcct ggccggtttt 3061 gtcctgtacg gcttcggatg gagcggttcc ctcgaccttc tgaagaccgc cacgtttacc 3121 tgggatacgt tctctctggt ggccacggtc tacgc // LOCUS sequence114 3148 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence114 VERSION sequence114 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3148 /mol_type="genomic DNA" /organism="" /note="sequence114" misc_feature <1..1060 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005808893.1:APC family permease" /note="WP_005808893.1 APC family permease (Desulfitobacterium hafniense) [pid:49.4%, q_cov:96.6%, s_cov:73.0%, Eval:1.5e-83, partial hit]" /note="MGA_556" /locus_tag="LOCUS_3970" CDS 1102..1914 /product="carbon-nitrogen hydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011860835.1" /transl_table=11 /codon_start=1 /translation="MKIALIQMKVGMDKDKNLEKARRMVLQAGREGARIAVLPEMFCCP YANEYFPKFAEPVGGHIYTALSEMARDAGVTLVGGSFPEEEDGKLYNASFVFARDGSQR ARHCKAHLFDIDVEGGQHFHESEVFTPGDSITTFRTAGHTFGLAVCFDIRFPELFRAMA LKGAEAVFVPAAFNMTTGPMHWELSFRMRAVDNQLFTIGASPAQDKYGVYHAYGHSIVC DPWGKVLVDAGENESVTLVDIDLSENERVRQQLPLLSARRPSLYGMKE" /locus_tag="LOCUS_3980" /note="WP_011860835.1 carbon-nitrogen hydrolase family protein (Clostridioides difficile) [pid:52.5%, q_cov:98.1%, s_cov:96.4%, Eval:1.9e-74]" /note="MGA_557" CDS 2019..2390 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MANNDFEMGSTSVDSVIVETAIGVDTVFKGSITTNKPIRIDGHYE GEINSDNLIIITETGYFNGDMKCRELQLQGKGEGTVICTSLMQLSATGSFKGNIATKDI ILVTGSQLDGQIDMASLRK" /locus_tag="LOCUS_3990" /note="MGA_558" misc_feature complement(2438..>3148) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011016645.1:SAM-dependent methyltransferase" /note="WP_011016645.1 SAM-dependent methyltransferase (Fusobacterium nucleatum) [pid:45.9%, q_cov:88.1%, s_cov:53.9%, Eval:3.7e-52, partial hit]" /note="MGA_559" /locus_tag="LOCUS_4000" ORIGIN 1 ctggccgaat tttccgctgg tgatcccggc agagcagggc ggctgcatca tcggaccgga 61 atgcatgtgt ctgatgatgt tcttcctggt ctgcgcctat ctcgtaaacg cgctgtcgcc 121 gacgcttgcc ggtaaattcc agaccaccac gacggtcatc aagctcatcc cgctgttcct 181 aatggccatt gttggggtca tcgtcgggat cgtcggaccc aatcatatgc tgatcagcaa 241 tttcgccacg gcatccgtca atgccggcgg aacggctgcg ccgctgctgg cttctgtctg 301 cgcgacatct ttcgcctacg aaggctggat catcgcgacg tccatcaatg cggaactgaa 361 ggatgccaag cgcaacctgc ccagagcgct gatcatcggc ggggtcatca ttatcgttac 421 gtatatctgc tactatatcg gcgtcgcagg cggcgcatcc gtcgacgtgc tgatgcagga 481 aggcgctacc aaggcgttcg tcaacatctt cggcggcgtg ctgggcaaca tcctcaacct 541 cttcgtcgcc atctcctgcg cgggcaccat gaacggcctg atgctgggct gctgccgcgg 601 catctactcg ctggccgccc ggggcgacgg gccgcatccc aggctcttct cccacatcga 661 ccgtgtgtcc aatctgccga acaactccgc ggcgttcggc ctgctgctct gtgcgttctg 721 gggctgctac ttcgtgatgg ccagcctgct ggagacctgg ggcagcgtaa aggcctttgc 781 cggtacaccg ttcgagagcg tgccgttcag tttcgacgct tcggagctgc cgatcatcac 841 tatctatgcc atgtacatcc cgatcttcat caactggatg cgcaaggcga aggacgaatc 901 aacggtacgg cgcttcgtca tccctgtgct cgccatcgca ggttcgctct ttatggtcta 961 cgcttcgatc gtcggccacg ggatggaaaa cttctggtat ctgatcgtat tcgcggccgt 1021 catgctggtc ggacggctgt ttatcggaaa gaagcgctga tgacgagaga tgagtctgaa 1081 gaagaaagga tgtagatcga tatgaagatc gcactcatac agatgaaggt cggcatggac 1141 aaggataaga acctggaaaa ggccaggcgt atggtgctgc aggcagggcg ggaaggcgcc 1201 cgcatcgcgg tgctgccgga gatgttctgc tgtccctatg ccaacgagta tttcccgaag 1261 tttgcagagc ccgtcggcgg gcacatctat acagcgctat ccgagatggc gcgggatgct 1321 ggggtcaccc tggtgggcgg atcgttcccg gaagaggagg acggcaagct ttacaacgcc 1381 tccttcgtgt tcgcgcggga cggcagccag agagcccggc actgcaaggc tcacctgttc 1441 gacatcgacg tggaaggcgg ccagcatttc cacgaatccg aggtgtttac cccgggagat 1501 tcgatcacga cgtttcgtac ggcggggcat accttcggac tggcggtctg cttcgacatc 1561 cgtttcccgg aactgttccg ggctatggcg ctcaaagggg cggaggcggt cttcgtgccg 1621 gcagccttta acatgaccac gggacccatg cactgggagc tttccttccg catgcgggcc 1681 gtggataacc agctgtttac catcggcgca tcgccggcgc aggacaaata cggcgtgtac 1741 cacgcctacg gccattccat cgtctgcgat ccctggggga aggtgctggt ggacgccggg 1801 gaaaacgaga gcgtgaccct ggtcgatatc gacctctccg aaaacgaacg ggtgcggcag 1861 cagctgcctc tgctttctgc gagaagaccc tcgctgtacg gcatgaagga ataaacgaca 1921 gctgttcata aacgcccgaa aacccttgca ggggttgaaa tctgagcaca ggtgtgttaa 1981 gataatcggg cattctacaa aggaggctgt tgttttacat ggctaataac gatttcgaaa 2041 tgggaagcac gtccgtggat tccgtcatcg tggaaaccgc gatcggcgtc gataccgttt 2101 tcaaaggatc tatcaccacc aataagccca tccgcatcga cggacattac gagggcgaga 2161 tcaattccga taatctgatc atcatcacgg agaccggtta ttttaacggc gacatgaagt 2221 gccgcgaact gcagctgcag ggcaagggcg agggcaccgt tatctgcacc tccctgatgc 2281 agctttccgc gaccggttcc tttaagggca acatcgccac gaaggatatc atcctggtta 2341 ccggatccca gctggacggc cagatcgaca tggcttccct gcgcaaatag aaaaaacaga 2401 atatcagaaa accggtccat ggagaccggt tttttcttta ctcttttccg atggtggggg 2461 agacgtgcca gtactcgcat tgcctgcgga aatccgcctg agctttgcgc ctgtccgctg 2521 gacccgcctt gcccgcgatg caccgcagca tgatgttctt cgcggtgtgc tccagactgg 2581 tgaattcgat catgtctacc ttatagcccc actctgtgag ctttaaagcc cgcagggcgt 2641 cggtgaggat ggcggagaag cgctctctta agatcccgtg acccaggatc gcttccatgt 2701 ccggccgccg gatctggcgg ttgagctcgt gctggcagca ggggaccgac aggatgactt 2761 tcgcattcca ggcatgggct ttctgcaggg cgaaatccgt agcggtgtcg caggcgtgca 2821 gcgtgacgac catgtccgcc ttggcggtct cgtcgtagtc ggcgatgtcg cccacgagga 2881 actgcaggtc ttcgtagccc agatcctgcg ctacgccgct gcagaaggcg atgacgtctt 2941 cctttaagtc cagacccacc agcttcgctt tgtaatcgtt tttaacgttt agataccaat 3001 acagggcgaa ggtgaggtag gatttgccgc agccgaaatc gatgatgacc ggctctttgg 3061 gcagatattc caggcagtcc tccgcgatct cgagaaagcg gttgatctgc cggaacttgt 3121 tgcggtgttt gggcacgatc tggccgtc // LOCUS sequence115 3130 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence115 VERSION sequence115 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3130 /mol_type="genomic DNA" /organism="" /note="sequence115" CDS 1187..1513 /product="cysteine-rich small domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003437519.1" /transl_table=11 /codon_start=1 /translation="MDNERPFWEGKHYAFTQNKECEFFPCHKTNKPEDFNCLFCYCPLY ALGTKCGGNFVITEKGIKDCSGCLVPHARNGYGYVIGKYSEISDLVSEQIRLQREEAQK GEEK" /locus_tag="LOCUS_4010" /note="WP_003437519.1 cysteine-rich small domain-containing protein (Clostridioides difficile) [pid:60.0%, q_cov:78.7%, s_cov:98.8%, Eval:8.1e-32]" /note="MGA_561" CDS 1513..2508 /product="DUF4428 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459959.1" /transl_table=11 /codon_start=1 /translation="MGIFSNDKKGCPICGNPTPRLFPTKVEGLPLCKECAAKINMESSM LKDLTINELWDHLDYRKANSETFGTFTDNETHGMGNFVLHVDSDKKLFYIADGRPSNPA LFKFEELVSFNLMEDGRTVIQCNSSGYTEGVSSIENYKLPPLKPLVKPGVTKAAPASAQ PGRTSMAASSSSSQTAEEKPKAPDKPIDSLKLNVTLNNPYWKSKVYSISLPSIESEEEI REWVNDYKNTFAAAVDTCEAMAGIMGVKTGKQMMAAIKEKAEAILAVQEAEAAAKEAEA ANQVAEAAAKIAKTADDNAAIEMLKKWKELLDMGAINQEEFDAKKKELLG" /locus_tag="LOCUS_4020" /note="WP_011459959.1 DUF4428 domain-containing protein (Desulfitobacterium hafniense) [pid:21.9%, q_cov:100.0%, s_cov:99.7%, Eval:4.6e-15]" /note="MGA_562" ORIGIN 1 aagagcaatc tgtacaagaa agtcgatgaa aaatgggtca tcgaccagga gatcgcccac 61 cgccagatgt ccaacaactc catctactat ctgcacaagc ccacccgcga acagctgcat 121 tggcacctca cccagatgcg ctattccggc gaaccgggct acgtaaacgc ggaagaaggg 181 cagagaagac gcccgaactt taacggggtc aacccctgcg ccgagatcct gctggattcc 241 aagggcctgt gcaatcttac gaccgtcaac tgcatgggat tcgtggacga aaacggcgcg 301 ctggataagg cggggctgct ggaggcgcag cggctgtccg ccagagccgg ttaccgcatg 361 acctgcacag agctggagat cccggaatgg aacaccgtcc agcagagaga caagctcatc 421 ggctgctccc tcaccggctg gcaggacatg gtgaacgcca cccgcatgac gaaggacgag 481 caggctgcgc tgctgtccga gctgcgcgct gccgcaagag aagccgcaag aaagtatgcg 541 gaagaactgg gtatgccggc gccgctgctc gtgaccacgg tcaagcccga aggcacgctg 601 tcgctgctgc cggtcgtatc ctccggcgta cacttcagcc atgccccgta ctacgtgcgc 661 cgcgtgcgca tctccgcaga cgatccgctg acgaaggtct gcgaggaact gggctatcca 721 gtctatccgg aagtgggcca ggaccccgcc acctgcgcca ccaaggtcgt agaattcccg 781 gtaaaggcgc cggaaggccg ctgcaaggca gacgtttccg ccgtcgaaca gctggagatc 841 tacaagatgt ttatggagca ctacgtggat cacaactgct ccattaccgt gcacgtccgc 901 gacaacgaat gggacgccgt ggaagaatgg gtgtgggaga actgggactg cgccgtagcg 961 ctctcgttcc tgtcctacaa cgagtccttc tacgaactga tgccctacga ggagatctcc 1021 gaggcggaat acaacgaccg catggcgaag atggcgccgt tcgtgccgtc cctgatctcc 1081 aagtacgaga aggaagaagt tgcgtacgat atcggcaatg acggttgcga aaacggcatc 1141 tgccctgtaa gataataata gaaaactgtt tcggggggtg tttccaatgg acaacgaaag 1201 accgttctgg gaaggaaagc attacgcgtt tacgcagaat aaagaatgcg agttcttccc 1261 ctgccacaag acgaacaagc cggaagattt caactgcctg ttctgttact gcccgcttta 1321 cgcgttgggc acgaagtgcg gcggcaattt cgtcattacg gagaagggca tcaaggattg 1381 cagcggatgc ctggttcccc atgccagaaa cggttacgga tatgtgatcg gtaaatacag 1441 tgaaatcagc gacctcgttt ccgagcagat ccgtctgcag cgggaagaag cgcagaaagg 1501 tgaggaaaag tagtgggtat tttttcgaat gacaaaaaag gctgccccat ctgcggcaac 1561 ccgacgccaa gactgttccc gaccaaggtc gagggactgc cgctgtgcaa ggaatgtgca 1621 gcgaagatca acatggaaag ctccatgctg aaggatctta ccatcaacga actgtgggac 1681 cacctggatt accgcaaggc gaattcggaa acattcggta cgtttaccga caacgagacc 1741 cacggcatgg gcaatttcgt tctgcacgta gactccgaca agaagctgtt ctacatcgcg 1801 gacggacgtc cctccaaccc ggcgctgttc aagttcgagg agctggtaag ctttaacctg 1861 atggaggacg gccgcaccgt catccagtgc aacagcagcg gctacaccga aggcgtaagc 1921 tccatcgaga attataagct cccgccgctc aagccgctcg taaagcccgg cgtaacgaag 1981 gcggctcctg cttcggctca gcccggcaga acgtccatgg cggcgagctc ttcttcctcg 2041 cagactgcgg aagagaagcc caaggcaccg gataagccca tcgacagctt aaagctcaac 2101 gtcaccctca acaacccgta ctggaagagc aaggtctaca gcatctccct gccctccatc 2161 gagagcgaag aggagatccg tgaatgggtc aacgattaca agaacacttt tgcggcagcg 2221 gtagacacct gcgaagccat ggcaggcatc atgggcgtca agaccggcaa gcagatgatg 2281 gcggcgatca aggaaaaggc tgaagccatc ctggccgttc aggaagcgga agcggcggcg 2341 aaggaagccg aagcggccaa ccaggtcgca gaagctgctg cgaagatcgc gaagaccgca 2401 gatgacaacg cggcgatcga gatgctcaag aagtggaagg aactcctgga catgggcgcc 2461 atcaaccagg aagaattcga cgccaagaag aaagaactgc tcggataaga cagcaaagag 2521 gtaaatatga agagaactga gatcggtgtc gcgctgcttg gtttcggcaa cgtgggcagc 2581 ggcacctaca aagctctcga agagaatttt gcgctgatcg aaaagaaggt cggcgcaaaa 2641 gtcgttataa aaaagattct ggtgcggaac ctgaacgctc cccgcagagt ggaagctccc 2701 gcagaacttt ttacgacgga cttcgaggag atcctgagag atcccaagat cgacatcgtg 2761 gcggaactgc tgggcggcat caacccggcg acaggctata tccgggcggc gcttaccgca 2821 ggcaagcatg tcgtgaccgc caacaaagca gccctggccg tgcacctgcc cgacctgaac 2881 aaggcagcgg cgttccacaa gtgcatgctg cgctacgagg cgtccgtatg cggtgcgatc 2941 cccgtcatcg gctgcatttc ccgggcactt acggccaacc gcatcaccgc agtgaagggc 3001 atcgtaaacg gcacgacgaa ctatatcctc acccgtatgg cggcagaagg cgcatcctat 3061 gaggacgtgc tgaaggacgc ccaggctctg ggctttgcgg aagccgaccc cacgggcgac 3121 gtggaaggct // LOCUS sequence116 3123 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence116 VERSION sequence116 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3123 /mol_type="genomic DNA" /organism="" /note="sequence116" ORIGIN 1 cgacgatctc agccgcacat ccatctaccg gaaagacacg ttccagccca ccccggcgca 61 ggactttttc cataacaacg acatcagcac cgatctgagc gaattcgaga agatgctgat 121 ggaaagcacg aaggacgcgg aaggggacga gaccctggcg atcaaccgtg accgcatcaa 181 gggcgcagcc ctgtccgcgg aagagctgat cgatccgctg cccacgaagg ccggcgatac 241 gcatccctta ggtgaagcgc ccgcacccgc gcctgccgcg gaaccggaac ccgaaccggt 301 gccgcagacg ccggaagagg ccgccaagag cgagcacagg aagcgcatgg aggccatggc 361 gaaggccaga gaagcctatt ttgcaagcct ccgcaccatg acagccgaga tgaaggccgt 421 aaaggacgcg gaattcaagg cacagctgga gaaggaagcc cgcatctccc acgagccgtt 481 cgtaagagaa gctgttcccg aaaagacggc ggagcagatc gccgccgaaa aggcggaaga 541 ggcgaagaag gccgcagaga gggaagccgc ggaacgcgcc gccgccatcg agcaggcgaa 601 agccgagatg aaggccgcgc aggaagccca ggagaaggaa ctgggtctgg acgcgctgga 661 cgaagtggtc tcccgccagc cggaaaccgc cgaagagccg gaagaaaaac cggaaaaaac 721 acctgtggaa agtccggcag aagaacccaa ggaagatacg aaggaaattc ccgtcaaggc 781 gcagcccgaa cgggataaga ccgaagtcct cggagagatc ctggacgacg tggaagagga 841 gactgaaaag aaggagaagc gcgaacacag tcactggttc ctgaagttcc tgctggcgct 901 cctcatcgta gccggtgctg cggagggcgg cacgatcgcc ctgcgccact atgcgcccga 961 ttcgccggca tccatcatta cgacgggcat cgagcagaac gtcatccagt tcgtacagag 1021 cagcttcgat cagatcaagg cgaagttcca gaaggacgag ccggaagaga ccgtgccgga 1081 aggcgaaccg cagggcgaag aaggtcccgc tttcgtgctt tccgacctga tcgcggagaa 1141 caacaagaac atcgaggaag tcgtggagaa cctggccatc ggctacgatt cccagcgctc 1201 ctacgacgtg cccggacttg ctgcctccca gctcgtaacg gatacggcgg agaagaccgc 1261 ggtctgcaag accctcatcg gatacaacag cgcctggatc gacttcatca acggaacgag 1321 ccaggactgc ctcaacttcc tgaaagccga cggcaccgcc taccgcagcg ccgttacgtt 1381 cgacaagatc ggacagatca cggaagtgtt caagaagctg gagatcggtg agatccgcaa 1441 gaccgaagac gcgtactttg ccttcgccgg agagaccatc gaggtcaccc aggacgaagc 1501 gacagcccag tcctccggtt ttatggtcta cgagctcgtg cccgtaggcg aagaactcaa 1561 gatcaaggac tactacaaca tcacgaacta aacatttaga aaggaccccg catggagaag 1621 gaaaaacaca ggagaggcgc aaagctacgc atcgcgctcg gcgtactggt cttgctggcc 1681 gtactcatct acgcccttac gggttttctg acggacctgc tgtggttccg ggagaccggc 1741 tacgtgtcgg tgttctttac agagctgctt acgaagatca aggtgggtat tcccgtggtc 1801 atcgtcgtgg cgctcctcat gtgggctttc ctttccgccc tgaagaaagc gtttctgagc 1861 aagggcggct ataagctgga ggacgcggac gcgaaaaaac tgcgcaaagc aggcatcctg 1921 ctgagcgtcc tcttcagcgt catctcttcc gcaggcatca tctcccgcct ctggtggcag 1981 atcctgcagt tcctgcacgc aacggaattc aacgtcgcag acccgctgtt cggcaacgac 2041 gtcggttttt acgtgtttaa actcgaattc ctcgaatccc tgagcgcctc cgccctcagc 2101 atcgtgggct tcctgctcct ggccaccgtc atctactacg tgatgctcat caacctggtg 2161 gagccggacg gcacggcgca ggagaccgag gcggatacct acgattacga cattcccggc 2221 gaggacagcc ccggccggga tgaccccgcc aaaaagatca tcgatctgtt tacgaagcgg 2281 ggcttttcca gggaggaaca gcccagagaa ggcaagaatt taaagcagac cggacacgcc 2341 atcctgcggg tcgccggcac ccagatcgcg attctgggat ttctcggctt cctgctgctg 2401 gctgcccgct ttgccctcgc ccgctacgac ctgctgtatt ccggcacggg cgtggcctac 2461 ggcgccgggt acaccgacat caatgtgacc ctgaacgtct accgggcctg catgatcctt 2521 tctctggtct ccgcggtgct gttcgtggtc gccctgaaga agcgcagcat taagctcggc 2581 gtggctgccc ccatcctaat ggcggtcgtg ttcggcgcag gcacgcttgc cggcaccgct 2641 gtgcagaacc tcgtcgtggc gccggacgag atcaacaaag agcgcaccta tctgcagaac 2701 aacatcgatt acacccgcat ggcctacgat ctgcaggaca tcgcggtgcg ggatttcgtg 2761 ccccagaaca acctgtccat gaaggacgtg ctgctcaaca tgggcacgtt ctccaacatc 2821 cggatcaacg acttcgaacc tgcccagcag ttctataatc agacccagtc catccgtacg 2881 tactacgaat tcaacgacgt ggacgtggac cgttacaacg tgaacggcga atacacccag 2941 gtcttcttgt ccgccagaga gatcaaccag gcccggatcg aagatcagtg gctcatccgc 3001 cacctgaagt acacccacgg ctacggcatt acgctgtcgc gtgttgacaa ggtgacggcc 3061 tccggccagc cggacatgct catcgacagc attccgccgg tgtccgaagt gcccgagatc 3121 tcg // LOCUS sequence117 3116 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence117 VERSION sequence117 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3116 /mol_type="genomic DNA" /organism="" /note="sequence117" CDS complement(1291..2298) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKLYLIKKKKGRKYTSEACAKAVAGVTLEHDASGRPVAIDGPFVS VSDTKNWWSLLTADSPCGLDLEEGSRTLSAVTAKKLHAAEQQYLAGLEPLSSEWRQEFL SIWVRKEAYMKYCGEGLRMGLSKFSVLDADLEYAKTVQAKNYPAAHMTSLEPGHGLYAA AALGSPEDLESIEICAYEGETEKEILDEAADLLAGRAYMSGDLQKKLRAKGYGAEETED AVTRLQELGYLDDEAYAKSFASDAARKGKGKLRIARELAQKGADSATAKAAIEAAAEEE DLLSERERAMEAAQKMLRGSQDIDEKMLARIGRRLSSLGYEPSVIWDVLGKLKS" /locus_tag="LOCUS_4030" /note="WP_011404862.1 RecX family transcriptional regulator (Salinibacter ruber) [pid:29.8%, q_cov:52.8%, s_cov:77.5%, Eval:1.3e-09, partial hit]" /note="MGA_567" CDS 2406..2696 /product="YerC/YecD family TrpR-related protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965963.1" /transl_table=11 /codon_start=1 /translation="MYDSKFKCEANDDLFKAILALETEEDCYRFFEDLLTIKELQSMAQ RWQVVRMLKEKMTYIDIAAETGASATTISRVNKCLNYGAGGYAAVLKKLEK" /locus_tag="LOCUS_4040" /note="WP_010965963.1 YerC/YecD family TrpR-related protein (Clostridium) [pid:58.9%, q_cov:99.0%, s_cov:96.9%, Eval:1.8e-26]" /note="MGA_568" CDS 2715..2846 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAIKVVSIAGTPVEGPSPAAEPVELPLIDPADEMYELLLKGAL" /locus_tag="LOCUS_4050" /note="MGA_569" ORIGIN 1 accaggacgg cttcgcgtaa tagacgagcg gcgtgtcgca gcgccagcag tgcggatagt 61 tgtggacgat cttcttcttg tcgtacagct tgccctcgga ggccagccac ttgatgatct 121 ccacgtccag gccttcctcc atgatgaagt gacccttcca gggcgtcgcg gtgtatttgc 181 cttccggatc gacggggttg gcgacggcca gaccgtattt cttacctgcc tggtagtcgt 241 cttcaccgaa cgccggcgcg cagtgaacga tgccggtacc gtcttccgtg gagacgtagt 301 cggcggtgcc tacgaagaag gccttgccgg gaacgtccac gaagggcatc agctgttcgt 361 attccatgta ttccaggtcc ttacccttca tttcggcaac gaccgtgtat ttgccttcgc 421 cgagaacggc gtccgctctg gccttggcca gatagtagaa cttgccgtcc tgctcggcct 481 tgatgtagtc gatctcaggg ccgaccgcca ggaattcgtt ggctgccagg gtccacgcgg 541 tggtggtcca ggccaggaaa taggtattct cttcggtctt ggacttaaag ggcaccgtca 601 gggtgatgac ggcgacttcc ttgtagccct gtgcgacttc gtgggaagcg aggcccgttc 661 cgcagcgcgg gcagtaagga agcaccttgt gaccctcgta gatcatgccc ttcttgaaga 721 actgatccag gatccaccag acggattcga tatagtcgtt gttcagggtg atgtacggat 781 gatccagatc taccaggtag cccatgcggt ggctcatctt gcgccacagg ccctcgtagg 841 tgaagacgga ttccttgcac ttctcgttga attcgcggat gccgtatttt tcgatatcct 901 gcttgccgga gaagccgagc tgcttttcca cttcgatctc tacgggcagg ccgtgggtgt 961 cccagccggc tttgcgcgcc acgcggtagc cctgcatggt cttgtagcgg cagatggagt 1021 ccttcagcgt acgggcgatc acgtggtgga tgcccggctt gccgtttgcg gtaggcggtc 1081 cctcatagaa aataaagtta ggctggcctt ctcttgcggt gacgcatttt tccagcagtt 1141 tttcctcgtc ccatttgtcg gcctgggcaa gctgcacctc tgcgatgggt gcgtcagaca 1201 ggtttttgta catcgttttt cctctattgt gatatggaat taaaaattga cgcgttaact 1261 tatttagtat attgaaaaat caaggtcgcg tcaagacttc agcttgccca aaacatccca 1321 gatgacggag ggttcgtagc ccagggacga aagcctgcgg ccgatgcggg cgagcatctt 1381 ttcgtcgata tcctgtgacc ctctcagcat cttctgcgcc gcttccatgg cgcgttcccg 1441 ctcggacagc aggtcctcct cttccgcggc cgcttcgatc gctgccttcg ccgtcgcgct 1501 gtctgcgcct ttctgcgcca gttctcttgc gatgcgcagt tttcccttgc cctttcgcgc 1561 tgcgtcggaa gcgaaactct ttgcgtacgc ttcgtcgtcc aggtagccca attcctgcag 1621 acgggtcaca gcatcttccg tttcctccgc accgtagccc ttcgctcgca gtttcttctg 1681 cagatcgccg ctcatatacg ctctgccggc cagcagatcc gccgcctcat ccaggatctc 1741 tttctccgtt tcgccttcat aagcgcagat ttcgatggat tccagatctt ccggcgatcc 1801 cagcgccgcc gcagcgtaca gaccgtgtcc gggttcgagg ctcgtcatgt gcgcagccgg 1861 gtagttcttc gcctgcacgg tctttgcgta ttccagatcc gcatccagca cggaaaactt 1921 cgaaagcccc atgcgaagcc cttcgccgca gtatttcata taggcctctt tgcgcaccca 1981 gatggacagg aattcctgcc gccattcgct gctcaggggc tccagacccg ccagatactg 2041 ctgttccgcc gcgtgcagct ttttcgcggt gaccgcggac agcgtgcggc tgccctcctc 2101 caggtccagt ccgcaggggc tgtctgcggt caaaagcgac caccagttct tcgtgtcgct 2161 cacggaaaca aaaggtccgt cgatagcgac cggccggccg gaagcgtcgt gttccagcgt 2221 gacccccgca accgctttcg cgcaggcctc gctcgtgtat tttctgcctt ttttcttttt 2281 gatcaaatac agtttcatag tacgtattat acaaatatta ccaacccttg tcaaaggggg 2341 ccatatatta tataatacta tatcacacta aagcaccgta gtctcaaaga cacaaaggac 2401 ctcccatgta cgattcgaaa tttaaatgtg aagccaacga cgatctgttc aaagctatcc 2461 tcgcgctcga gacggaagaa gactgctacc gcttcttcga agatctgctc acgatcaagg 2521 aactgcagtc catggcccag cgctggcagg tcgtccgcat gctgaaggaa aagatgactt 2581 acatcgatat cgcagcagag accggcgcgt ctgccacgac gatcagccgg gtcaacaaat 2641 gcctgaatta cggcgccggc ggctacgctg ccgtcttaaa aaagctcgaa aagtagacac 2701 aaaaaggagg cactatggcg atcaaagtcg tttccatcgc aggaacgcct gtcgaagggc 2761 catcgccggc tgcagaacct gtcgaactgc ccctcatcga cccggcggac gagatgtacg 2821 aactgttgct gaaaggcgcg ctgtaaacgg cgggatatcc gcaatgcaaa aggacggccc 2881 ctccggaccg tccttctttt tacgcttttc ccagcaggat ctgcagagac ttcagcaggt 2941 tctgatgcac cacgtccgcg gcgttgaaat gggtcatgtt gcagatcagc tgcaggatgg 3001 ggcccgccag ggctacgctc aggatggtgc cgatgccgag ctgaccatcc agcagccacc 3061 ctatgagggt cacgatgccc cacatgatca tcgtcatggc cccgatgggg atcttc // LOCUS sequence118 3113 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence118 VERSION sequence118 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3113 /mol_type="genomic DNA" /organism="" /note="sequence118" misc_feature <1..1159 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003435270.1:methionine gamma-lyase family protein" /note="WP_003435270.1 methionine gamma-lyase family protein (Clostridioides difficile) [pid:56.7%, q_cov:99.5%, s_cov:89.7%, Eval:8.9e-133]" /note="MGA_571" /locus_tag="LOCUS_4060" CDS 1495..1803 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRNHRKYRVANKARFTAFVAVTLVLMAFIVSTALGYNTASGASTK EFVQVKVESGDTLWALAQEYGPADMDVRSVVFQICRLNGISAGDLQPGQYITIPTEL" /locus_tag="LOCUS_4070" /note="WP_012804685.1 LysM peptidoglycan-binding domain-containing protein (Brachybacterium faecium) [pid:35.2%, q_cov:89.2%, s_cov:65.6%, Eval:6.4e-08, partial hit]" /note="MGA_572" CDS 1926..2723 /product="M55 family metallopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009889182.1" /transl_table=11 /codon_start=1 /translation="MRVFISADIEGTAFTTIWPETDHGEEEYPAAARQMTMEVKAACEG AIAAGADYIVVKDAHDGGRNIDLNEMPKCVEVIRASNGSPRTMVEGIEAGFDAALFIGY HSAAGKIGNPLSHTFTTKTTRVLLNGEDCSEFMIYSWCAAYYGVPTVFLSGDKMLTEDS LHLHPMLKTVWAKDGYGGYTRCRQPQLVCDLIRAGVEESLKQDLSKAMCELPKHFDLQI SYKEHRDAAPYVNYPGFEMVDSHTIRMQTDDYYEFLRCVPFVF" /locus_tag="LOCUS_4080" /note="WP_009889182.1 M55 family metallopeptidase (Clostridioides) [pid:41.7%, q_cov:99.6%, s_cov:100.0%, Eval:3.1e-53]" /note="MGA_573" ORIGIN 1 caaccagtac aagcttttgc actgctttca ggaggcccgc ataaacgacc agcacttcgc 61 ctggaacacc ggctacggct acgacgacgt aggccggacg gccctggaac agctctacgc 121 cgatgtgttc ggcgcggagg ccggtctggt gcgtcccacg atcgtcaacg gcactcatgc 181 gctggcaagc gtctacctgg ggctgctgcg tcccggcgac gagctcatct actgcaacgg 241 cgatccctac gataccatgc agaccgtcat cggcctgaag ggcgacgcct acggcaatct 301 gaaggaattc ggcgtcacct ataagcaggt ggacctgctg ccgggcaatc agatcgacct 361 ggaaggcgtt aagaaggcga tcggtcccaa cacgaagatc tgcgcgctgc agcgctcccg 421 gggctacgtg ttccgcaatg ccatgaccat tccccagatc gaagcctggg cagcggcctg 481 caagtccgtc aagcccgacg tcatctgcat ggtggacaac tgctacggcg agtttacgga 541 tacgaaagaa ccggtgcagg tcggcgcgga catcatggca ggctctctca tcaagaaccc 601 cggcggcggc cttgcggtct ccggcggcta cgtggtgggg cgcaaggatc tggtggataa 661 agtggctacc cgggtcacca gccccggcat cggcggcgaa tgcggcctta ccttcggcca 721 gacccgcagc atgttccagg ggctgtttat cgccccccgg gtgaccatcg gagcggtgaa 781 gggcgctgcg ctgtgcgccc aggtatttgc agatctcggc tacgaagtct gcccgggtcc 841 ggaggatccg agaaacgata tcgtggaagc ggtcaagctg ggcaccccgg aggcggtctg 901 cgccttctgc gaaggcgtgc aggcggcggc gcccatcgat tcctacgtta cgccggtgcc 961 ctgggacatg cccggataca ccgaccagat catcatggcg gccggagcct ttgtgggagg 1021 cagttccatc gagctgtcgg cagatgcgcc catgcgtgaa ccatacatcg tctacttcca 1081 gggcggtatt acctatgagc acgcgaaatt cggcgtcatc aaggcgctgc agaccttaaa 1141 agataagaaa atcgtataat atgcagctgt ctgttggaca tctgttggac agcaggctgc 1201 cgagctgatg gaagacatgg cggaaaaagg gcagggcgag tttatgggag acctgatgca 1261 gcggaaagtc cgcagtgact tgcaggacta gaacctgccg aagaagaagg aagaggcgga 1321 aaaagctttg gaaaaggacg tggagcagaa cgctccgcag ttgaaataac aagcctggaa 1381 gcggtgcaaa ggcaccgctt ctttttttat gaaaaattga aaaaagttct tgcaaaagaa 1441 caaatgttct gctattatgg tcttgcgaac aaatgttctt ggaggagaac gaccatgaga 1501 aaccacagaa agtacagagt tgccaataag gccagattca ccgcattcgt agccgtcacg 1561 ctcgtcctga tggcgtttat cgtaagcact gcgcttggtt ataacacggc gtccggcgcc 1621 agcaccaaag aattcgttca ggtcaaagtc gaatccggcg atacgctctg ggcgctggct 1681 caggaatacg gtccggcgga tatggacgtg cgcagcgtcg tattccagat ctgcagactc 1741 aacgggatct ccgcgggcga tctgcagccg ggtcagtata tcaccatccc gacggaactg 1801 tagcgtttgg ctttcagttg tatacattaa gcgataagcg gcagactttt ctgtcgcttt 1861 tcctgtatcg ggattataat ggtcttggaa actgttttcg ggaaaacagg ttaggaggaa 1921 gatccatgag agtatttatc agcgcagaca tcgaaggcac cgcttttacg accatatggc 1981 cggaaacgga ccacggcgaa gaggaatatc cggcagcagc cagacagatg accatggagg 2041 tcaaggcagc ctgtgaaggc gccatcgcag ccggtgcgga ttatatcgtg gtcaaggacg 2101 cccacgacgg cggccgcaac atcgatctga atgaaatgcc gaaatgcgtg gaagtcatcc 2161 gcgccagcaa cggcagtccc aggaccatgg tcgaaggcat cgaagccgga ttcgacgcgg 2221 cgctgtttat cggctatcat tcggcggcgg gaaaaattgg taatccgctg tcccatacgt 2281 ttacgaccaa aacgacccgc gtactgctga acggcgaaga ttgttccgag tttatgatct 2341 acagctggtg tgcggcatat tacggcgtgc ccacggtatt cctgtccggc gacaagatgc 2401 tcaccgaaga cagtctgcat ctgcatccga tgctcaagac cgtctgggcc aaggacggct 2461 acggcggata cacgcgctgc cgtcagccgc agctggtgtg cgatctcatc cgggccggcg 2521 tcgaagaatc cttaaagcaa gatctgtcca aggccatgtg cgaactgccg aagcatttcg 2581 atctgcagat ctcttataag gaacacagag atgcagcgcc ctatgtaaac tatccgggat 2641 tcgagatggt ggattcccac acgatccgga tgcagacgga tgactattac gaattcctgc 2701 gctgcgtacc gttcgtgttt taaaacggta aaatcgtcgg aaaacgcccg cagagaaaaa 2761 cagaaacgtt ttttaaggta taacttatcg acgaatcaaa aaaaatcgct taaatcggcg 2821 atttttggcc tcgtgtcctg aaagcattga aatttcaacg gtttgtggga ttgcggcacg 2881 atcataaggg attggagacg gaaaattggc aaaattggag cagcatctga cgggagactt 2941 cggtcagatc gtggaattcg ttcatggcga actgcataag caaagcgtgt cgctgagcct 3001 ggaagaagtt tcgaagaata cggtatgcgg caagcgtatc gaactgagag tctatgagag 3061 gttcagctat gcgggcggca accgggcaag tctgacggtg cagtttatag aaa // LOCUS sequence119 3088 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence119 VERSION sequence119 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3088 /mol_type="genomic DNA" /organism="" /note="sequence119" CDS complement(457..1098) /product="CBS and ACT domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005815172.1" /transl_table=11 /codon_start=1 /translation="MFVKDRMTKDPYTIQVSASINTLIGLMRDKKLRKVPVLDGEKLVG IVTDRDIERVSPSKATSLSVYEINYLLSKITVADAMVAEVITCSPDDYIEDAALVMREH RINSLLVTENDKLIGIVTDSDLFDALIDMMGGRTKGNKFVMRVPNQPGVMTKIGAITAS EGTNITHFTMTQSGEDAMLYVITDPNDDVEKTREALESEGFKIENLLIRK" /locus_tag="LOCUS_4090" /note="WP_005815172.1 CBS and ACT domain-containing protein (Desulfitobacterium) [pid:41.8%, q_cov:97.7%, s_cov:97.2%, Eval:8.8e-44]" /note="MGA_576" CDS 1217..2398 /product="aminotransferase class I/II-fold pyridoxal phosphate-dependent enzyme" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011015808.1" /transl_table=11 /codon_start=1 /translation="MSEFKRASEILYAGESVRGMDLKKPETLPIFETTAFTMNSLSELA EVTADKGWTYSRTRNPNRAALAEAISYLEGGEASLIFASGMGAITVPLITLLQPGDRVL CNANIYGETFSTLRDILSKMGVETDFVDYLDMDAVKAAVRPETKLIYSEVVSNPTVKIA DIPALAELAHNNGALLMVDNTFTSPFAIRPMDFGADIVINSLTKFLNGHADAMGGSMTT TQALVDRIRPVSMLVGTPGDAFSAWLILRGLKTAELRIPRQIKTAEKLARFFADDPHIT AVNHPSLATGKQKELADKLFGENGSTPMMSFVLPEDIEKIDAFMKALRFTRYAPTLGGL RTTMSHPVTSSHFSMPDEERRKIGITPGMIRLSVGLEDPDDLIADFKNALKVF" /locus_tag="LOCUS_4100" /note="WP_011015808.1 aminotransferase class I/II-fold pyridoxal phosphate-dependent enzyme (Fusobacterium nucleatum) [pid:57.9%, q_cov:99.5%, s_cov:98.7%, Eval:1.2e-129]" /note="MGA_577" misc_feature complement(2395..>3088) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002680943.1:potassium transporter TrkG" /note="WP_002680943.1 potassium transporter TrkG (Treponema denticola) [pid:36.6%, q_cov:98.7%, s_cov:46.7%, Eval:8.6e-35, partial hit]" /note="MGA_578" /locus_tag="LOCUS_4110" ORIGIN 1 aggcgcgggt cggcaaagaa ctgacgcaga ccagctacaa ctggaagacg ctgcacgaca 61 gcggcgtgtg catcgccggc ggttccgaca gcccggtgat cgacttttcc gtcatgaacg 121 gcatctactg cgcggtgacc cgcaagagat tgaacggcga gccggagggc ggctggctgc 181 ctgatcagaa actgacggtg gaagaggcgg tgcgtgctta cactatgggc ggcgcctatg 241 cctcctatga cgaaagagtg cggggcacga tccgcaacgg caagtacgcg gacctggtgg 301 tgttggaccg cgatatcttc gagatccctg cggaagagat aaaagatgcc aaagtggaga 361 tgaccgtgct gaacggcgag atcgtgttta cgagataatc ggaacagaat aaaacccctg 421 catcgcacag atgcaggggt ttagtttttt tggggcttat tttctgatca gcagattttc 481 gatcttgaag ccttcggact ccagggcttc tctggtcttc tccacgtcgt cgttcgggtc 541 ggtgatgacg tacagcatgg cgtcttcgcc ggactgggtc atggtgaagt gggtgatgtt 601 cgtgccttcg gaagcggtga tggcgccgat cttcgtcatg acgccgggct ggttgggcac 661 tctcatgacg aacttgttgc ccttggtgcg gccgcccatc atgtcgatga gggcgtcgaa 721 caggtcgctg tccgtaacga tgccgatcag cttatcgttt tccgtgacaa gcagcgagtt 781 gatgcggtgt tctctcatga cgagcgcagc gtcctcgatg tagtcgtcgg gggagcaggt 841 gatgacttcc gccaccatgg catcggctac ggtgatcttg gacagaaggt agttgatctc 901 gtagacgctc agagaagtcg ctttgctggg agagactctt tcgatgtctc tgtccgtgac 961 gattccgacc agcttttcgc cgtcgagcac gggcaccttg cggagttttt tatctctcat 1021 caggccgatg agggtattga tggacgcgct cacctggatg gtgtaggggt ctttcgtcat 1081 tctatcttta acaaacatgg tgtactcctt tctgttctca aatttatttt agcattcccg 1141 ccgtcatttt caacagaaaa tgatggtaca ataggaagag gaaaacgaaa aactgtccat 1201 tggacgagga ggcattatga gcgaattcaa gagagcaagc gagatccttt acgcgggaga 1261 atccgtaaga ggcatggacc tgaagaaacc ggagaccctt cccatcttcg agacgacagc 1321 gttcacgatg aacagcctgt cggaactggc ggaggtgacc gcagacaagg gctggaccta 1381 ttcccgcacc cgcaatccta accgggcggc gctggcggag gccatcagct atctggaagg 1441 gggagaggcg agcctcatct ttgcttccgg catgggtgcc atcaccgtgc cccttatcac 1501 gctgctgcag ccaggcgacc gggtgctgtg caatgccaac atttacggcg agaccttctc 1561 tacgctgcgc gacatcctca gcaagatggg ggtagagacg gacttcgtgg attacctcga 1621 catggacgct gtaaaagccg ccgtaagacc tgagacgaag ctcatctatt ccgaagtcgt 1681 aagcaatccg acggtaaaga tcgcggacat tcctgccttg gcggaactcg cccacaacaa 1741 cggcgcgctg ctgatggtgg acaacacctt tacgtcgccc tttgccatcc gtcccatgga 1801 cttcggtgcc gatatcgtca tcaacagcct tacgaaattc ctgaacggtc acgcggatgc 1861 catgggaggc tccatgacca cgacacaggc gctggtcgac cggatccgcc ccgtttccat 1921 gctggtcgga acgcccggcg acgccttcag cgcctggctc atcctgcggg gtttaaagac 1981 tgcggaactg cgcattccca gacagatcaa gacggcggaa aaactggccc gtttcttcgc 2041 ggatgacccc cacatcaccg cggtcaacca tccgagcctg gcgacgggca aacagaagga 2101 actggcggac aaactgttcg gggaaaacgg ctccacgccc atgatgagct ttgtgctgcc 2161 cgaagatatc gaaaagatcg acgccttcat gaaggctctg cggttcacgc gctacgcccc 2221 gactttaggc ggcctgcgca ccaccatgag ccatcccgtt acgtcgtctc atttctccat 2281 gccggacgag gaacgccgca agatcggcat tacgccgggc atgataagac tgtccgtcgg 2341 tctcgaggac ccggacgacc tgatcgccga ttttaaaaat gcactgaagg tattctagag 2401 cttttcccgc cagaaaccgc gggaaagggg aaggatgacc gcatagatct ccagtctgcc 2461 cgccagcatt aaaaagctga ggaacaggtg ggtgagggga tggaacatgt agtactgccc 2521 aagcatgccc atctggccgc agccggcgcc cgtgttgcag agcatggccg cggtagcggt 2581 aaacgcggtc tggaaatcgg acgtatcaaa cgtcaatacg aaagctcctg ccaggaacaa 2641 caggaagaac gtgagcgtat aggaaacgac cccgttcgcg atggaggaag gcaggggctt 2701 tttgtttgtc ttgatggtaa cgacggcgtt gggatggatg cgcgtcgtaa agctgcgcca 2761 gatcatcttg gacaggatga cgatgcggat gaccttgaga gccccgcccg tggaagagga 2821 acagccgccg aagaatccca gcagcgtgag catcatcctg gagaaggcgg gccaggtgtt 2881 gaaatccgcg ttggcatagc cggtggtcgt gaggaaggag accgcctgga atccgccgta 2941 gcgcagggct tctccggccg ttgcatacgt tctcgtaacg tacagatccg ctgcgatcag 3001 cagtatggcg cctgccgcga tccccaggta ggccttcagc tccgtattgc gtcgtatggt 3061 gtctttatcg cgcttgatga tcgcaaaa // LOCUS sequence120 3073 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence120 VERSION sequence120 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3073 /mol_type="genomic DNA" /organism="" /note="sequence120" CDS complement(488..1006) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKTRRSWIILLTAALLLAASCFAAVFADDVVPGTAADPVVSKSYM DAQVAILQTQIKTLQEQIDKLAAGQSGSETPSTPATPAEVPKFVVVKVDAGKSLIGSAS AEIILRSGTATAIAGASGGVSDLTGGTDLSTGTDVSKNHLLIIPADDGRGIRCTTTCYV MVKGDYKLQ" /locus_tag="LOCUS_4120" /note="MGA_580" CDS complement(1210..1800) /product="DUF1836 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964199.1" /transl_table=11 /codon_start=1 /translation="MRYEQFAEKTAQEYQKKGLAEGRSIPEIELYIDQMVSCLNSELSL YAKDGDGPITKGMISNYTKHKMIPGPEGKRYTKDHCIFMLLVYYLKGCFSMDQIQRLMK PLLSNYSSEWDDSLDIQAYYGKIIEEVRKAEENFAGELLGDMNGIKKFLADRGSDDDIS EIVLLITMLIMRSNEERFLAEKLLDEYFPDKKK" /locus_tag="LOCUS_4130" /note="WP_010964199.1 DUF1836 domain-containing protein (Clostridium) [pid:30.7%, q_cov:88.3%, s_cov:87.9%, Eval:1.4e-18]" /note="MGA_581" misc_feature complement(1893..>3073) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011459544.1:ABC transporter ATP-binding protein" /note="WP_011459544.1 ABC transporter ATP-binding protein (Desulfitobacterium hafniense) [pid:64.9%, q_cov:98.2%, s_cov:60.0%, Eval:2.8e-142, partial hit]" /note="MGA_582" /locus_tag="LOCUS_4140" ORIGIN 1 aaatagacgc tgccgtcgtc cccgaaagcg atgacggatt cgctgtagcc tccggtgcgc 61 acgatgccgt cccggatgac aggtccgaga gagacgcccg tagccatgac gaaaaagtcc 121 gcgttcgtaa ggccggcgag cggattgtcc gcttcccctt ccgtgcggaa gatcgtcttt 181 gcagaggaga cgccgtagat tccgggaccg tagcagacca ggggctttac gtttcctccg 241 ggtgtatatt cgaaatagtg ttcgacggca ttcttgccgt taacggtgtt gtagttcgtg 301 gtggtgacca gcgtaagctg atcgttgagt tctatgcttt tcgaccgtag ctctacgagt 361 ccggaagctg cccaaatgcc tgcggccggc tgcagcataa gacaggccag gagcaggcac 421 ataatgcgaa acagtgtaag tctcttcccc ttcatgtaag ttcaataccc tttctgaaaa 481 tatcctgcta ctgcagtttg taatcccctt ttaccatgac gtagcaggtg gtggtgcagc 541 ggatgcctct gccgtcatcc gcagggatga tgagcagatg gttcttcgac acgtcggtgc 601 cggtggacag gtccgtgccg ccggtgaggt cggatacgcc gccggatgcg ccggcgatgg 661 ccgtggctgt gccgctccgc aggatgatct ccgcgctggc ggacccgatg aggctcttgc 721 ctgcatcgac ctttacgacg acgaacttgg gcacttcggc aggcgttgcc ggggtactcg 781 gcgtttcgga accgctctgg cctgcagcca gcttgtcgat ctgttcctgc agcgtcttga 841 tctgcgtctg caggatcgcg acctgagcgt ccatgtagct cttgctgacg acggggtccg 901 cggcagtgcc gggcacgacg tcgtccgcga agacggcggc gaagcagctg gctgccagaa 961 gcagcgctgc ggtgagaagt atgatccaag atcttctggt cttcatagtg atcctccggt 1021 tgttaaaaca gctgatctct tatcccctgc ccacaagatt ttgtgcgggc agaccctcaa 1081 aaatgcatat atagtaagta tatcatctgt tgcgggcata gaaaagtgca agcggtggaa 1141 attcaccgct tgcacacaat ttatcggggt ttggagctgc ctgccgggtc ttaagactgc 1201 gccgggccgc tattttttct tgtccgggaa gtattcgtcc agcagttttt ccgcaaggaa 1261 ccgctcctcg ttggaccgca tgatgagcat cgtgatgagc agcacgatct cggagatatc 1321 gtcgtcgctg ccgcggtcag ccaggaactt cttaatgccg ttcatgtcgc cgagcagttc 1381 gccggcaaag ttctcctccg ccttgcgaac ctcttcgatg atcttgccgt aatacgcctg 1441 gatatccaga ctgtcgtccc actcggagct gtagttcgag agcagcggtt tcatcaggcg 1501 ctggatctgg tccatggaga agcagccctt cagatagtag accagcagca taaagatgca 1561 gtggtccttc gtatagcgct tgccttccgg tcctgggatc atcttatgct tcgtgtagtt 1621 ggagatcatg cccttggtga tgggtccgtc tccatccttg gcgtacagcg aaagttcgct 1681 gttgaggcag ctcaccatct gatcgatgta cagttcgatc tccggaatgc tcctgccctc 1741 cgcaagtccc tttttctgat attcctgcgc tgttttctcc gcaaactgtt cgtaccgcat 1801 cgtcgctcct ccggggatgg taaaagatat cttttatctt attatagggc gggcggaacg 1861 agttggcaag ggaaaatgac gggcggagga aattacgcct ccgcgatctg gttgccggta 1921 tacagttgat aataccggcc cttcagggcc atcagctcgt cgtggtcacc gcgctcgatg 1981 atgcggccgt gctccatgac catgatggca ttggagttct ggatggtgga cagccgatgg 2041 gcgatgacga acaccgtgcg gccctccatc agctggtcca tgcccttctg gatgaggctc 2101 tcggtacggg tatcgacgct gctggtcgct tcgtccagga tcatcaccgg gggatcggct 2161 accgcgcagc gggcgatgga cagcagctgg cactgaccct gggacagctg gcttcccgta 2221 cccgaaatga cggtctggta cccttccggc agacgggaga tgaagtagtc cgcgttagcc 2281 agcttcgccg ccgcgtagac ttcctcgtcc gtggcatcgg ggcggccata gcggatgttc 2341 tccatgatgg tgcctgtaaa cagattggtc tcctgcagca ccatgcccag agatctgcgc 2401 aggtcgtcct tctttatatg gttgatgttg atgccgtcgt agcggatctt gccgtcttcg 2461 atgtcgtaga agcggttgat gaggttcgta atggtggtct tgcctgcgcc ggtggagccg 2521 acgaaagcga tcttctgtcc gggtttcgca aacagggaaa tgtcgtgcag caccgtcttc 2581 ccctccacgt agccgaaatc cacgccgctc atgcgcacgt cgcccgccag ttttacatag 2641 cggggcttgc cggccgcgtc ttccgaaggc agcttccatg cccagtgccc cgtgcgttct 2701 tccgtttcct ccatcgaacc gtcctccgcg atgcggacgt tcaccagggt caccttgccc 2761 tcgtccacct ccggcttttc gtccatcaga tcgaacaccc gctgcgcgcc tgccagcgcc 2821 atgacgacgg agttgatctg ctgcgaaatc atggagacag gccgcgcgaa gttcttggac 2881 agcgtaagga acgctgccaa atctcccagg gtcagcccgg aggttccccg gatggcgatg 2941 gcgccgccga cgatggcgat caccacgtac tgcaggttgc cgatgttgtt catgatcggg 3001 cccagaatat tggaatagct gttggcccgg gtggtctgca cccgcaggtc ctcgttcttg 3061 acgtcgaagc cgg // LOCUS sequence121 3069 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence121 VERSION sequence121 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3069 /mol_type="genomic DNA" /organism="" /note="sequence121" CDS 486..875 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKKICLLLICALLLATTGCKAKTPEEISAEKYEAMANACLTLVE TYNDVAQTAIDNGWEADFETLKLMDQIADQAEEITNAVNAPENVEDARRDQLAALAKQL TDQLTNEVLPKVSEPCPKTGVETGE" /locus_tag="LOCUS_4150" /note="MGA_584" CDS complement(944..1969) /product="type I glyceraldehyde-3-phosphate dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003025408.1" /transl_table=11 /codon_start=1 /translation="MLRIAINGFGRIGRLAFRKMFGDPRFDVVAINDLTSPEMLAYLLK YDSVQKAYEGHVIDCGEDHISVDGTKIPVFAQADAKNLPWKEYDVDIVLECTGFYTSKA KSQAHIDAGAKKVLISAPAGNDLPTIVYGTNHDTLTKEDNIVSGASCTTNCLAPMAKAL NEYRELRTGFMTTIHAYTGDQMILDGPHRKGDFRRARAGALNIVPASSGAAKAIGLVIP ELDGKLIGSAQRVPVGTGSVTILDATLKDMTDTVSVEGINEKMRASTNKSFGYNEEPIV STDIIGSTYGSVFDATQTLAQKCGTHIYEVRVVAWYDNEMGYTSQLLRTMAHMGRLMGR I" /locus_tag="LOCUS_4160" /gene="gap" /note="WP_003025408.1 type I glyceraldehyde-3-phosphate dehydrogenase (Francisella) [pid:63.8%, q_cov:98.5%, s_cov:100.0%, Eval:4.0e-118]" /note="MGA_585" misc_feature complement(2025..>3069) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011107748.1:MATE family efflux transporter" /note="WP_011107748.1 MATE family efflux transporter (Bacteroides thetaiotaomicron) [pid:40.7%, q_cov:95.7%, s_cov:72.9%, Eval:1.6e-69, partial hit]" /note="MGA_586" /locus_tag="LOCUS_4170" ORIGIN 1 agcacaaact tgccctgatg gaagatgata tccttgacgg gtgtcccctc ctgcatcttg 61 agcgaagtgc ccagatcgcc tttgagatag ttgaccacgt agttcttgag ctggacgatc 121 agaggtttgt ccagaccata ctttgcattg gccagagcga tctgctgggg cgtggatttt 181 tccgtgagga acgggctgcc ggggatcgcg ttcatcaaga agaacgtgat cgccatgata 241 agcagcagcg tgagcagcgc ggcccccaca cgcttcagcg tataactaac catactccac 301 ttcctgtttc ttagttctac gggaacgctt taatgcgtta aacgcaataa aactactccc 361 gcggcttagg gatttaataa ttatagcaga acgcataaat acacgcaagc aatttgcatt 421 tttcttccag ttgcaattat tcgcagattc tctataattg ttaaggtaag acaacggagg 481 tatccatgaa gaaaaaaatc tgtcttttac tgatatgcgc cctattgctc gcgacgaccg 541 gatgcaaagc caagacgccg gaggagatct cagcggaaaa atacgaagcc atggcgaacg 601 cctgcctgac tttggtagaa acgtataacg acgtggcgca gaccgccatc gacaacggct 661 gggaggcgga tttcgaaacg cttaagctga tggatcagat cgcagaccag gcggaggaga 721 tcacaaacgc cgtcaacgcg ccagaaaacg tggaagacgc cagaagagat cagctggccg 781 ccctcgccaa gcagctgacg gaccagctta cgaacgaggt gctccccaag gtgagcgaac 841 cctgcccgaa gacaggcgtc gagaccgggg aataagaaat gaccgatcga gaaaagcaaa 901 agcgctgcgg aaagccgcag cgcttttatt gtgcgttaaa agatcagatc cttcccatca 961 gccggcccat gtgcgccatg gtgcgcagca gctggctggt gtagcccatt tcgttgtcgt 1021 accaggcgac gacgcggact tcgtagatgt gggtgccgca cttctgcgcc agggtctggg 1081 tggcgtcaaa cacggagccg taggtgctgc cgatgatgtc ggtggacacg atgggctctt 1141 cgttgtagcc gaaggacttg ttggtggaag cgcgcatctt ttcgttgatg ccctccacgg 1201 aaacggtgtc cgtcatatcc ttcagcgtgg cgtccaggat cgtcacggaa ccggtgccca 1261 cgggaactct ctgggcggat ccgatcagct tgccgtccag ttcgggaatg acgagaccga 1321 tggccttcgc cgcgccgctg ctggcgggaa cgatgttgag cgcgcccgct cttgctctgc 1381 ggaagtcgcc ctttctgtgg ggaccgtcca ggatcatctg gtcgccggtg taggcgtgga 1441 tggtggtcat gaagcccgtg cgcagctctc tgtattcgtt gagggccttc gccatgggag 1501 ccaggcagtt cgtggtgcag ctggcgccgg agacgatgtt gtcctccttc gtaagggtat 1561 cgtggttggt gccgtagacg atggtgggca ggtcgttgcc cgcgggtgcg gagatgagca 1621 ccttcttggc gccggcgtcg atgtgcgcct gggatttcgc cttgctggta tagaaaccgg 1681 tgcactccag cacgatatcc acgtcgtatt ccttccaggg caggttcttg gcatccgcct 1741 gggcaaatac ggggatcttg gtgccgtcca cggaaatatg atcctcgccg cagtcgatca 1801 cgtgaccctc ataagccttc tgcacggagt cgtacttcag cagatacgcc agcatttccg 1861 ggctggtgag gtcgttgatg gcaacgacgt cgaatctggg gtctccgaac atcttgcgga 1921 aagcgagtct gccgatgcgg ccgaaaccat tgatcgcgat tctaagcatg tatatcctcc 1981 ttcattgact gaaatagttt tgtcaaaaag cgcttaataa tttattatag catattttcc 2041 tgcgcagttt ttcgcttcag caggaaaaag tacacaaaac acagcacgat ctgcacaaaa 2101 gtgctgcagg gcgtggccag ccccacatga aacagcgaca ccggcacctc tttgctcatc 2161 aggtacgaca cggggatgcg cacgccaaac gctccgatga tgctctgggt catgacgaaa 2221 cgggtgcggc ccaggccgtt gaaatagccg ttgaagcaga acaggaagct cgtcagcaga 2281 cagtcgatgg cataggcctt cagataatct gctgcggctg ccaccacgtc ggccttcccg 2341 gccgcgaacc aggacgccgg gatatcgccc cggaagaaga taaacaggaa cataaagacg 2401 ccaacgccca gcgaaaggcc gatgccgtag gcaagcgccc tctccgcccg gtccatcttc 2461 ctcgcgccgt aattctgcgc cacgaaagcg gacatggcca tggaaaatgt ggagggcacg 2521 agcatcacga acgagcagat cctctccgca acgcccacgc cggcggaggg caccagtccc 2581 aggccgttta cgatggccgc gatcacaata aaggacaggg tgaccagtac atcctgcgcg 2641 gaagtcggga ttccgatgtg aagcagttcc gtcgcgatga ttccatccag ccgcagattc 2701 tttctcccga acgtgaacgg catgccccgc ttcttcatga tgagcagcga cgccagcacg 2761 ctgacgccct gggcgaatac cgtggcaatg gcgactccct ttacgcccat gcggaagacg 2821 ccggccagca gcaggtcgcc gccgatgttg aacgcgcagg cgatggcgac ggtcaccaga 2881 ggcatggcgg aatcgcccat tccccggaac atgctgccga tcacatggta cgccgtaatg 2941 aaggccaggc cgcccgcgca gatccggatg taggtgaccg ttccggcaaa cgctgcctcc 3001 ggggctttca tcagagccgc cagctgcggc gcaaagacga tgagcgcggt catgatggcg 3061 aggcagaaa // LOCUS sequence122 3049 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence122 VERSION sequence122 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3049 /mol_type="genomic DNA" /organism="" /note="sequence122" CDS complement(605..1747) /product="DUF362 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004082494.1" /transl_table=11 /codon_start=1 /translation="MEKAPVYFTNLRTNGEESLLQKLERLMKKAGFENIDFEDKFVAVK IHFGEPGNLAYLRPNWARTVCDYIKRLGGKPFLTDCNTLYVGGRKNALDHLDSAYINGY NPIATGVQTIIADGLKGLDERDLPVPNGEYCKTAKIGSALADADIIISMSHVKGHGSAG FGGVLKNIGMGGGSRSGKQIMHSEGTPAIYEDRCIGCRTCEKNCAHDAIHVVNRKAAID EEKCLGCGRCIAVCPKDALQTKWDAGNDVLSCKIAEYTYAIINGKPNFHIAFVLDVSPD CDCDGHNDLPIIPDIGIFCGFDPVAVDQACADAVNAQTYVESSVLGDIMRDSRKKASRK EAIEKNDVFKMVHPNTKWEAGLAHGEKMGMGTRTYELITL" /locus_tag="LOCUS_4180" /note="WP_004082494.1 DUF362 domain-containing protein (Thermotoga) [pid:48.5%, q_cov:98.7%, s_cov:97.5%, Eval:7.4e-100]" /note="MGA_588" CDS complement(1780..2961) /product="M20 family metallopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_066054433.1" /transl_table=11 /codon_start=1 /translation="MKQKITQIAKEIRADIEALSDAIYKNPELGNVEYESSKLHAELLK KYGFKVEKPYMGLATGYRAEYRSSKPGPHICYMAEYDALPGLGPTGGPGHGCGHNMLGA TSVAAGIILSRFVDETGGWVVVLGTPAEETDGAKVAYANKGVFRDLDAAMICHPTSVDY FESGKSLAMDTIEFEFFGRAAHAASEPEMGINALDAVIQTFNNINALRQQTRPDARIHG IITEGGVACNVIPEHCVCRFYVRAGKKAYLKHLYQQVVNCGKAAALATGCELKMRPFEL AYDDLATNETLNDLFEQSMKELGVEGIQPPGEDYGSVDAGNVSYVCPTIHPYFPITTEA IPGHTREFAAATQTVYAKDRMMETAGGMALAGYHILTEPDTLKAIRKEFKALK" /locus_tag="LOCUS_4190" /note="WP_066054433.1 M20 family metallopeptidase (Robertmurraya korlensis) [pid:46.3%, q_cov:100.0%, s_cov:99.0%, Eval:1.7e-99]" /note="MGA_589" ORIGIN 1 acaggttgga gatgggatag atgccggtga tgcgcttggc cgcccagtgg cggtccacgg 61 tctccagcag ccaaatggct tcggagtcgg cgatcataaa ggtgttgtgg tagttatcgt 121 cgggattctg ataggcgcat ccgccgccct ggccgtactt ttccaggtga tcgatgatga 181 cgtgcatcgc ctgatatgcc gtgcggcctc tctccaggcc cagacgcagc agatccatgc 241 ccagcagcgc ttcctctttc tgcgccggga tctcggacca gtccgcctcg ttgccgatgc 301 agacgccgtg ctcgttgatg cccatctcga atccccagat ccaccagggc tgggacccga 361 tcatggcgta ggtgtgctcg acctggggca cttcgatata cgtgcacttg accgtctctc 421 ccttggcgtg gtcttccgcc gggaagaatt tcaggttctg gcattcatcg gtctcccggt 481 cggaattttt ggccaggatg ttgaacccgc tcacggatgc gctcttctcc accgcgacgg 541 tatcgcagga gggggtgcat ccgcagatct gcttgtgtct gttcatttgg aactcctttg 601 gtttttacag ggtaataagt tcgtatgttc tcgtgcccat gcccatcttt tcgccgtggg 661 ccaggcccgc ttcccacttg gtgttgggat ggaccatctt gaaaacgtcg ttcttttcga 721 tggcttcctt gcggctcgcc ttcttgcggc tgtctctcat gatgtcgccg aggacggagc 781 tttccacgta ggtctgggcg ttgaccgcat ccgcgcaggc ctggtccacc gccacgggat 841 cgaagccgca gaagatgccg atgtccggga tgatgggcag gtcgttgtga ccgtcgcagt 901 cgcagtcagg agacacgtcc agcacgaaag cgatgtggaa attgggcttg ccgttgatga 961 tggcgtaggt gtactccgcg atcttgcagg acagcacgtc gttgccggcg tcccacttgg 1021 tctgaagagc atccttaggg cagactgcga tgcagcgtcc gcagccaagg cacttctctt 1081 cgtcgatggc ggctttccgg tttacgacgt ggatcgcatc gtgggcacag ttcttttcgc 1141 aggtgcggca gccgatgcag cggtcttcgt agatggccgg cgttccttcg gagtgcatga 1201 tctgcttgcc ggagcggctt ccgccgccca tgccgatgtt cttcagcacg ccgccgaaac 1261 cggcgcttcc gtgacccttt acatggctca tggagatgat gatgtcggcg tccgccagag 1321 cggaaccgat ctttgcagtc ttacaatatt cgccgttggg aacgggtagg tctctttcgt 1381 ccaggccctt aagaccgtcc gcgatgatgg tctgcacgcc ggtcgcgatg ggattgtagc 1441 cattgatgta ggcggaatcc aggtggtcca gggcgttctt tctgccgccg acgtacagcg 1501 tgttgcagtc cgtcaggaag ggcttgccgc ccagtctctt gatgtaatcg cagaccgttc 1561 tcgcccagtt gggacgaaga tacgccaggt tgcccggctc accgaagtgg atcttgacgg 1621 ccacgaattt gtcttcgaaa tcgatgttct cgaagccggc cttcttcatg aggcgctcga 1681 gtttctgcag caggctctct tcgccgttgg tgcgcaggtt ggtgaagtat acgggtgctt 1741 tttccatggg tctctcctta tttttctatg aatgttgcct tacttgagtg ccttgaattc 1801 tttgcggatc gccttcagcg tatccggttc cgtcaggata tgatagcccg ccagcgccat 1861 gccgcctgcc gtttccatca tgcggtcctt ggcgtagacg gtctgggtcg ctgccgcaaa 1921 ttcccgggtg tgacccggga tcgcttccgt cgtgatgggg aaatacggat ggatcgtcgg 1981 gcagacgtag gagacgttgc cggcatccac ggagccgtag tcctctccgg gaggctggat 2041 gccctccacg cccagttcct tcatgctctg ttcgaacaga tcgttgaggg tctcgttcgt 2101 ggccagatcg tcgtaggcca gctcgaaagg ccgcatcttg agctcgcagc cggtggcgag 2161 ggccgccgcc ttgccgcagt tgacgacctg ctggtagaga tgctttaagt acgccttctt 2221 gcctgctctt acgtagaacc ggcacacgca gtgctcggga atgacgttgc aggcgacgcc 2281 gccctccgta atgatgccgt ggatgcgggc atcgggacgg gtctgttggc gcagcgcgtt 2341 gatgttgttg aaagtctgga tgaccgcatc cagcgcgttg atgcccatct ccggttcact 2401 ggccgcatgg gctgcccggc cgaagaattc gaactcgatg gtatccatag cgagggactt 2461 gccactctcg aaatagtcca cgctggtggg atggcagatc atggccgcat ccagatcgcg 2521 gaacacgccc ttgttggcgt aggccacctt ggcgccgtcc gtctcctctg caggggtgcc 2581 cagcaccacg acccagccgc cggtctcgtc gacgaaacgg ctcaggatga tgccggctgc 2641 tacggatgtc gcgcccagca tgttgtgacc gcatccatgg ccaggtccgc cggtcgggcc 2701 gaggccgggc agcgcatcgt attccgccat gtagcagatg tgggggccgg gtttggagga 2761 gcggtattcc gcccggtagc ccgtcgccag gcccatgtag ggcttctcca ccttaaagcc 2821 gtatttcttc agcaattcgg cgtggagctt cgaggattcg tactccacgt ttcccaattc 2881 cgggttttta tagatcgcgt ccgagagcgc ttcgatgtcg gcgcggatct ctttcgcgat 2941 ctgtgtaatc ttctgtttca tggccgggcc tcctgttctg tgtctacttt aagaatccgt 3001 cgatgatggc tttttccgcc tcttcttccg tcaggccgag ggtgcgcag // LOCUS sequence123 3042 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence123 VERSION sequence123 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3042 /mol_type="genomic DNA" /organism="" /note="sequence123" misc_feature <1..698 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003438277.1:tRNA 2-thiouridine(34) synthase MnmA" /note="WP_003438277.1 tRNA 2-thiouridine(34) synthase MnmA (Clostridioides difficile) [pid:52.3%, q_cov:95.2%, s_cov:61.0%, Eval:2.3e-59, partial hit]" /note="MGA_591" /locus_tag="LOCUS_4200" CDS 913..1788 /product="methylenetetrahydrofolate reductase [NAD(P)H]" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011949153.1" /transl_table=11 /codon_start=1 /translation="MKISQILQQDGYRLSFEVFPPKKSTGLENVRKATEEIAKLEPSFV SVTYGAGGGTSDFTLDIAKNIKEQTGVPVLAHITCVSSSREKVASYIDALKASGIENVM ALRGDLTPEMESQDRSGWDYRNAYQLVEELKAAGDFCIGGACYPEVHPESSCRNEDILH LKEKVKAGCDFLTTQMFFDNDLFYSFLYRVRDIGIDVPVIPGIMPITNANQVEKALKLS GCHMPIRFTSLVDRFGSNAAAMQQAGIIYATEQIIDLYANGIRNVHVYTMNKPEVASGI LNNVSAILNA" /locus_tag="LOCUS_4210" /gene="metF" /EC_number="1.5.1.20" /note="WP_011949153.1 methylenetetrahydrofolate reductase [NAD(P)H] (Clostridium botulinum) [pid:39.7%, q_cov:100.0%, s_cov:97.6%, Eval:4.1e-65]" /note="MGA_592" CDS 1785..2396 /product="methionine synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986274.1" /transl_table=11 /codon_start=1 /translation="MMDLISLKTYNDLQPDLSEVMRYAGAPKTAEPDAQILSCLAELGE IRGRLCWRRFPIERQGAWLDLGFCRTPSASLSINLKGCSSLVLFAGTLGIGIDRFLAKY GRLSPARALWFQAIGAAGIEALCDAFCEELPQLLAEDGQPARIRPRYSPGFGDFGLEYQ PFIFSALDCQKNLGLTLTNSLLMSPTKSVTALVGICDEER" /locus_tag="LOCUS_4220" /note="WP_011986274.1 methionine synthase (Clostridium botulinum) [pid:28.3%, q_cov:94.6%, s_cov:86.3%, Eval:3.5e-15]" /note="MGA_593" ORIGIN 1 agggtccgga cggaaaatat ctgctgaaga aggggctcga tccctccaag gatcagagct 61 acgtactgca ttgccttacc caggagcagc tggcgcatac gctgtttccc ctgggggaat 121 atacgaagga gcaggcgagg agcatcgcgg cggagcacgg cttcgtaaac gcgaataagc 181 ccgacagcca ggatatctgc ttcgtaccgg acggcgatta tgcgaaagtt gtacagcgct 241 atggaagcgg ggagggtaca agacccggcg cttttgtgga tctgcagggc gatcctatcg 301 gcacccataa gggcctgatc cactatacca ttggacagcg caagggtctg ggcaacacct 361 ggggaaaacc tgtatttgtc tgcgccatcg acgcggcggc caataccgtg accctcggag 421 acagcgaaga cctgtttgag acccgggtgg aagtgaagga cttcaactgg atcgcaggcg 481 aagcgcccaa agagtccatc cgctgcacgg cgaagctgcg ctaccggcag aaagagaagc 541 cggccactgc aacggtgcag gaggatggca gggtcatcct gacgttcgac gaaccccagc 601 gggcgcccac ccccggccaa tacgccgtgc tctacgatgg cgacatcgtg cttggcggcg 661 gcacgatcga gaccggcaaa cggcatgttg acttatagga tgaaagggaa tacaatattc 721 tggtaatcat acaaaccaag gagaaagcat gatccacatt tgcggaaaca acatgatgat 781 gcggcgcagc cgggtacggg aagatctacc ggaccttgtt ttgtgacgca aacgaggttt 841 ggagcccatt acccggataa cccacgagac cgtgcgttat ccggttttta ttttgcagga 901 gagatagaac ccatgaagat cagtcagatt ttgcagcagg acggatatag gctctcgttc 961 gaggtctttc caccgaaaaa gagcacggga ctcgaaaacg tgcgcaaagc taccgaggag 1021 atcgccaaac tggaaccttc cttcgtgagc gtcacttacg gcgcaggagg cggcaccagc 1081 gacttcactc tggacatcgc caaaaatatc aaggaacaga caggcgtgcc cgtactggcg 1141 cacatcacct gtgtgagctc ttcccgggag aaggtggcgt cctacatcga cgccctcaag 1201 gccagcggca tcgagaacgt gatggcgctg cggggagacc tgacgccgga gatggaaagc 1261 caggacagaa gcggctggga ttaccggaac gcgtatcagc tggtggagga attgaaggcg 1321 gcgggagatt tctgcatcgg cggtgcctgc tatccggaag tgcaccccga aagcagctgc 1381 cggaacgagg atatccttca cctgaaagaa aaagtgaaag ccggctgcga ttttttgacc 1441 acacagatgt tctttgacaa cgatctgttc tatagttttc tatatagggt gagggatatc 1501 ggcatcgatg tgccggtcat cccgggcatc atgcccatta cgaatgccaa ccaggtggag 1561 aaggccttaa agctgtccgg ctgccatatg ccgatccgct ttacctctct cgtcgaccgc 1621 ttcggaagca atgcggctgc gatgcagcag gcgggcatca tctatgccac ggagcagatc 1681 atcgacctgt atgccaacgg catccgcaac gtgcacgtct acaccatgaa caagccggag 1741 gtcgcatcgg gtatcctgaa taacgtctcc gccattttaa acgcatgatg gatctgatct 1801 ctttaaaaac atacaacgat ctgcagccgg acctgtctga agtaatgcgc tatgccggcg 1861 cgccgaagac ggcggaaccg gatgcccaga tcctctcctg tcttgcagag ctgggggaga 1921 tccggggcag gctgtgctgg cggcgctttc ccatcgaaag gcagggcgca tggctggacc 1981 tgggcttctg ccggacaccg tctgccagtc tttcgatcaa tttgaagggt tgttcctccc 2041 tggtgctgtt cgcagggact cttggcatcg ggatcgaccg ttttctcgcg aagtacggcc 2101 ggctgtctcc cgccagagct ctgtggtttc aggcaatcgg ggcagccggg atcgaagcgc 2161 tgtgcgacgc tttctgcgaa gaactgccgc agctgctggc ggaagacggg caaccggcaa 2221 ggataagacc ccggtacagt cccggtttcg gagattttgg actggaatat cagccattca 2281 ttttttcggc cctggattgt cagaagaatc ttgggctcac cctgacgaac agccttctga 2341 tgagccccac aaaatccgta acggccctgg tgggcatctg cgacgaggaa cggtaacatg 2401 aagatcttag actatctgaa agacaatatc ctgatcctgg acggcggcat gggcagcttt 2461 ctgcaggaga aaggcctgca gcccggggaa cggccggaac cttggaatct cagccatccc 2521 gaggtcataa caggcataca taagtcgtat tacgacgcag gcagcaacgc tgtcatcacc 2581 aatacgttcg gcgcctgcgg gctgcggttc tccaaggaag aactggagga gatcgcagcg 2641 gctgccgtag cgaacgcccg gcgggctgcg gaagaaagcg atgcgcccca gccgaagtgg 2701 gtgggtctgg atgtgggacc ctgcggcaag ctgctgaagc ccttcggcga tctggagttt 2761 gaggatgccg tagagacctt taagctcttt ttacgggcag gcgcagcgca gcatccggac 2821 tttatcttta tcgagaccat gagcgactgc tacgagacga aggcggcggt actggcagcg 2881 aaagagtgct gcgatctgcc catcttcgcc tccaacgcct acagcgacaa cggccgtctt 2941 ttgaccggcg cagatcctgc cgccatgacc gccatgctgg aagggctggg cgtcgctgcc 3001 ctgggtatga actgctcttt ggggccggat acgctgcttc cc // LOCUS sequence124 3033 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence124 VERSION sequence124 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..3033 /mol_type="genomic DNA" /organism="" /note="sequence124" CDS complement(1282..1746) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKDIMLKITGKTVRQDEGREKHEDIMEFVTAGQLFHRGSTTFIKY PESELSGLEGCTTSLIITKDKVKMRRSGNALAADTEMEFKKGERFYGMYETPYGPIGME LLTNDVTGLEDAGDGRQKLSIDYHISLKGFMESRNKLELEITHSGEGVKQ" /locus_tag="LOCUS_4230" /note="MGA_596" CDS complement(1715..2695) /product="D-alanine--D-alanine ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459778.1" /transl_table=11 /codon_start=1 /translation="MDKIRLGVIYGGKSGEHEVSIMSADSVIAAVDPEKYEVVRIFISK EGWWTIAGQPLNPWDLRSYIDFALPILHGPNGEDGTVQGLLKLANIPYGGCGVLGCSVT MDKIVAKKVFASEGLKQAPYIAFSDADDVEAVMDEACRTMTFPMFVKPSNMGSSVGITK AHDREELRAAIELAERYDSRLLIEQGIDAREIESAVMGNNVLVCGKVGEIIPGAEFYDY DDKYFNGTSQLLIPAPISPEQEAEVLDMAKRAYKACGCCSFARVDFLMDKATGEIYINE INAIPGFTKISMFPMLMQAAGMKYPEIIDRIVELGYERYHAENHR" /locus_tag="LOCUS_4240" /EC_number="6.3.2.4" /note="WP_011459778.1 D-alanine--D-alanine ligase (Desulfitobacterium hafniense) [pid:43.9%, q_cov:100.0%, s_cov:98.9%, Eval:4.2e-77]" /note="MGA_597" ORIGIN 1 ctttataacc gaggatgttc agccgctgct gggctgccag cacgttcaat ccgcgctggc 61 ccttgaaata cttcttgcct tcatccatgg gaagcacgga ttccaggtat ttcgcgatct 121 gctcctgcgt cagggcagag ccgttggaga tcgcgatgtc cggcgcgatg ccgaccttgt 181 cgatgcgctg cttgttcggg gtgaggaaat ggcagaacgt cagcttaaag ctgtcgccgt 241 tgtccatggt caccagctcc tgcgccacgc ccttgccgta ggtcgtgacc cccaccagcg 301 tgccggcgcc gttgtccttg acggctgccg ccaggcattc ggaggcactg gccgtatgat 361 cgttgatgag gacgaccaga ggcacgtctt tgtaggtgcc gccggcggaa tactcctcgt 421 cgatgatctc gccctgctgc tcgtagaaga ccagcggctt tccctggggg atgagcatgc 481 cggcgatgtt cagggcgtcg cccatcacgc cgccgccgtt gtcccggacg tcgacgatca 541 gtttttccat gccgtccgcg atcaggttga gcttggcagt gcgaaattcc agccaggtct 601 cgccggagaa ctgggaaatg gcgatgtagc cgatcttatt gtccagcatc tggtaggtga 661 cggtctgcgc tttgatgttc ttgcgctcga tctccatggt ctgcagcgcg ccattgcttt 721 ccagctgcag cacggccttc gtgcccggtt cgccgcgcac gagagaggag atctgatcca 781 gggtcatccc ggagacgctt ttaccgtcca cgctccggat gatcatcccc gccgtaacgc 841 ccgcttcgta ggccggcccc agcgtgttca cctgggtgat gacgcagttt ccgctgccgt 901 ccagggtcat cgtgaccccg atcccggcgt aattgcccgt cacctggctg atgaaggcgt 961 ccttttcctc cttggtcttg tagaacacgg accactggtc cagcgcgtcg aacacgccgt 1021 tgtaagccgc gtccgtcaga tcttccacgt tgacgtcgtc tgcgtaattc tcgtcgatgt 1081 actgcacgac gtcccgcagc tgatccaact tgctgaggtt cttgtcgatg gtctcctggc 1141 tctccgccgc atagacgtag agcgttccgg tctcgccaga gaaagccgcc agcagcgtga 1201 acccggtcat catcagcatc gagatgacga cgacgatggc caggatgcgc gccagtttct 1261 tgtttcgttc ctgtttgcgg ttcattgttt taccccttcc cccgaatggg tgatctccaa 1321 ttccagtttg tttctggatt ccataaagcc cttcaggctg atgtgatagt cgatggacag 1381 cttctgcctg ccgtcgccgg cgtcttccag ccccgtcacg tcgttcgtca gcagttccat 1441 gccgatgggg ccgtaaggcg tctcatacat gccgtagaag cgctcgccct tcttgaactc 1501 catctccgta tccgcagcca gcgcattgcc gctgcgccgc atcttcacct tgtccttcgt 1561 gatgatgagg gacgtggtgc agccttccag cccggaaagc tcgctctccg ggtatttgat 1621 gaaggtcgtc gaaccgcggt ggaacagctg tcctgcggtc acgaattcca tgatgtcttc 1681 gtgtttctcg cggccttcgt cctgtcttac cgtcttaccg gtgattttca gcatgatatc 1741 tttcataacc caactccacg atccggtcga tgatctccgg atacttcatg cctgccgcct 1801 gcatcagcat ggggaacatg ctgatcttcg taaagcccgg gatggcgttg atctcgttga 1861 tgtagatctc gcctgtggcc ttgtccatca ggaagtccac ccgcgcaaaa ctgcagcagc 1921 cgcaggcttt atacgccctt ttggccatat ccagcacctc cgcctcctgc tcgggcgaga 1981 taggcgccgg aatgagcagc tggctggtgc cgttgaaata tttatcgtcg taatcgtaaa 2041 attccgcgcc ggggatgatc tctcccacct tgccgcagac gagcacgttg ttgcccatca 2101 cggcgctttc gatctcccgg gcgtcgatgc cctgttcgat cagcaggcgg ctgtcgtagc 2161 gctccgccag ttcgatggcg gccctcagct cttcccggtc gtgggctttg gtgatgccta 2221 cggaagagcc catgttggag ggcttgacga acatggggaa cgtcatcgtg cggcaggcct 2281 catccatcac cgcctccacg tcgtccgcgt cggaaaatgc gatatagggg gcttgtttta 2341 agccctcgga tgcgaagacc ttcttcgcta cgatcttgtc catggtcacc gaacagccca 2401 gcacgccgca gccgccgtag gggatattcg ccagcttcaa caggccctgc accgtgccgt 2461 cctcgccgtt ggggccgtgc aggatgggca gggcgaaatc gatgtagctg cgcaaatccc 2521 agggattcag gggctgaccc gcgatcgtcc accagccttc cttgctgatg aagatgcgca 2581 cgacttcgta tttttccggg tcgacggccg cgatgacgga atccgccgac atgatggaaa 2641 cttcgtgctc gccggatttg cctccgtaaa ttacgcctaa tctaatcttg tccatgggat 2701 gcctcctcga gcagcgtccg cagctcccgt tcgtcgaaat aatatttttt caggcagaac 2761 tggcaagtga gctccgcgcc gtggtcttct tcgatgatct ctgtcagatc cttcttgccg 2821 atggagacga gcgctttcgc catgcgctcc cggctgcagt cgcagagcca agagacgctg 2881 cgttcctcca gcacgtgggg gcggaattcc tccggcagct tgccgaagat gatgtccaga 2941 agcttgtagg ggtcaccctc cgcgtcctgg atgagcagcg taaggtcgtc cagcaggaaa 3001 agcgtctcct ccagggcatc cagcgcctct tcc // LOCUS sequence125 2996 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence125 VERSION sequence125 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2996 /mol_type="genomic DNA" /organism="" /note="sequence125" CDS complement(236..1036) /product="MBL fold metallo-hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011389564.1" /transl_table=11 /codon_start=1 /translation="MAEFDGMRVTVLGARGSVPACGRQFTGFGGSTSCYMVQAGEQTVF LDAGSGLVSAPADFSVPPVILLSHLHLDHILGLGMYPRLSQKGKRTGIYVPAAPGEDPQ ALLNGVYEPPYWPLTLKNYAGDVHISPLQAHLEAGGIAVDTLEGYHPGGCKVFRLRFDG RTLVYATDQEPDEDGFAKLAAFAKDADLLLFDGQYAEAEYESRKGFGHSTAQKGMALME RCGAKQLLLIHHDPHSTDAELTARETALGRTDVRYAREGETIVL" /locus_tag="LOCUS_4250" /note="WP_011389564.1 MBL fold metallo-hydrolase (Rhodospirillum rubrum) [pid:33.6%, q_cov:97.0%, s_cov:95.0%, Eval:2.8e-30]" /note="MGA_600" CDS complement(1041..1508) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNTKTFKKDEVIVRQGEYASTMYDIVSGKVKVVADLGTPDEKDVA EIAAGEVFGEMGLIECLPRSASVVALEDGTTVQEISAAEFSDYFKSSPDKVLGVMRQLS ARLRETNEKYAEACRTVYDTVETEKKGEKKSGGLLSRLNFFHKEYGKIRTK" /locus_tag="LOCUS_4260" /note="WP_012584159.1 Crp/Fnr family transcriptional regulator (Dictyoglomus turgidum) [pid:31.6%, q_cov:96.1%, s_cov:68.9%, Eval:7.5e-12, partial hit]" /note="MGA_601" CDS complement(1530..2015) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRGASYKKGEIIFREGDPGNCMYDIFWGRVGVYTGYGTPQEKKLA ELKTEDFFGEMGLLDRAPRSATVVSLSDDTYLGVITESDFHEYFQEKPAKVFLIMQQLS QKLRKTTQDYVEVCRTVHDVVEEEKEKGEGTPHSEDLEKSLLEIYNSYLSYPFLDMY" /locus_tag="LOCUS_4270" /note="WP_175285932.1 Crp/Fnr family transcriptional regulator (Brachybacterium squillarum) [pid:32.5%, q_cov:72.7%, s_cov:47.5%, Eval:6.5e-12, partial hit]" /note="MGA_602" CDS complement(2034..2969) /product="LD-carboxypeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392232.1" /transl_table=11 /codon_start=1 /translation="MIKPRKLNPGDTIAIISPSSPTKDPTAVPRGKEYLESLGYKVVLG KHVDEWRANYIAASEEARAEDLNEMFARKDVDMILCARGGYGALQFIDKIDFDNIKANP KIFCGYSDITSLHLAIGKFAGLVTIHGEVLTAVNPGISGYTKDHWLRCLTTTEDHRAIT LADPNKYLTTIAPGKAEGEVIGGNLCLIASSCGTFYQPDFKDKILFFEEVGEEPYGIDR FLAQMRNCGMLEGLKGVVIGECANCKDASGYYPDVIDTFKYYFSDLGVPCLYGLPMGHT RDQAALPLGVKVRLDADAKTFEILESGVTE" /locus_tag="LOCUS_4280" /note="WP_011392232.1 LD-carboxypeptidase (Moorella thermoacetica) [pid:42.0%, q_cov:98.7%, s_cov:96.5%, Eval:2.7e-62]" /note="MGA_603" ORIGIN 1 gccatccgtt cggacagatc cgtggactgg cggagatccg taaacatgat cgtcaccacc 61 cgccgttctc cgccgatctt caggtcggcg ctgtgggaga ggatctcctc ggcgacttcg 121 tccgtcagat agcggccgaa ggtctgccgg atcagatcgt cccgctggcg gagctgttcc 181 ttcagccggg cgatctccgc ccgggcttcc tgcagttctc tgctttcctg tccgctcata 241 aaacgatcgt ctctccttct ctggcatagc ggacgtccgt gcgtccgagc gcagtttctc 301 tggcggtcag ttccgcatcc gtgctgtggg ggtcatgatg gatcagcagc agctgcttcg 361 ccccgcagcg ctccatcagt gccatgccct tttgcgccgt ggaatggccg aaccccttcc 421 ggctttcgta ttccgcttcc gcgtactggc cgtcgaacag cagcagatcc gcatcctttg 481 cgaatgcggc cagttttgcg aagccgtctt catccggttc ctgatccgtg gcatagacca 541 gtgtccggcc atcaaaccgc agccggaaga ctttgcagcc gccgggatgg tatccttcca 601 gcgtgtcgac cgcgataccg cctgcctcca gatgagcttg cagcggcgag atgtgcacgt 661 ctcccgcgta gttcttcagg gtcagcggcc agtagggcgg ctcgtacacg ccgttcagca 721 gcgcctgggg atcttcaccc ggggcagccg gaacatagat gcccgtgcgc ttccctttct 781 gggacagtct gggatacatg cccagtccca agatgtgatc cagatgcaga tggctaagca 841 ggatgaccgg aggcacagaa aagtccgccg gtgcggagac gagtccgctg ccggcgtcca 901 gaaatacggt ctgttctccc gcctgcacca tatagcagga cgtggacccg ccgaatcccg 961 taaattgtct gccgcatgcg gggacagagc ctcttgcgcc gaggaccgtc acccgcatgc 1021 cgtcgaattc cgccatatgc ctactttgtc cggatttttc cgtattcctt gtggaagaag 1081 tttaagcgcg acagcagtcc gccgctcttc ttctcgccct tcttctccgt ttctacggtg 1141 tcgtagacgg tgcggcaggc ttccgcgtac ttctcgttcg tctcccgcag gcgggcgctc 1201 agctggcgca tcacgcccag caccttatcc gggctgctct taaaatagtc ggagaattcc 1261 gccgcagaga tctcctgcac cgtcgtgccg tcttcgagcg caacgacgct ggcactgcgg 1321 ggcaggcatt cgatcaggcc catctcgccg aacacttcgc cggcggcgat ctccgcgacg 1381 tccttttcgt ccggcgtgcc gagatctgcg acgactttca ccttgccgct cacgatatcg 1441 tacatcgtag aagcgtattc tccctgacgg acgatgactt cgtccttttt aaatgtcttc 1501 gtattcattt cggtctccct cgcttcgctc taatacatat ccaggaacgg ataggacaga 1561 taggagttgt agatctccag cagagacttc tccagatctt cggagtgggg cgtgccttca 1621 cccttttcct tctcttcttc cacgacgtcg tgcaccgtgc ggcagacttc cacgtaatcc 1681 tgggtcgtct tgcgcagctt ctggctcagc tgctgcatga tcaggaagac cttcgcgggc 1741 ttttcctgga aatattcgtg gaaatcgctc tccgtgatga cccccagata ggtgtcgtcc 1801 gacagggaaa cgacggtggc agaacggggc gctctgtcca gcagacccat ctcgccgaag 1861 aaatcctcgg tcttgagttc ggccagtttc ttctcctgcg gcgtgccgta gcccgtatag 1921 acgcctacgc gtccccagaa gatgtcgtac atgcaattgc ccgggtcacc ttcccggaag 1981 atgatctcgc cttttttgta agatgctcct ctcatagttc ctccttctga taattattcc 2041 gttacgccgc tctccaggat ctcgaacgtt ttcgcatctg cgtccagccg gacctttacg 2101 cccagcggca gcgccgcctg gtcgcgggtg tgacccatgg gcagcccgta caggcagggg 2161 acgccgagat cggagaagta atatttgaac gtatcgatga cgtccggata gtaaccggat 2221 gcgtccttgc agttggcgca ctcgccgatg acgacgccct ttaagccttc cagcatgccg 2281 cagttgcgca tctgcgccag gaaacggtcg atgccgtagg gctcttcgcc cacctcttcg 2341 aagaacagga tcttatcctt gaaatccggc tggtagaacg tgccgcagct ggaagcgatc 2401 aggcagaggt tgccgccgat gacttcgcct tcggccttgc ccggcgcgat ggtcgtcaga 2461 tacttgttgg gatctgccag cgttatcgcg cggtggtctt ccgtcgtcgt aaggcagcgc 2521 agccagtgat ccttcgtgta cccgctgatg ccggggttga cggcggtaag cacttcgccg 2581 tggatcgtca cgaggcctgc aaacttgccg atggccaggt gcagggacgt gatgtccgaa 2641 tagccgcaga agatcttggg attggccttg atgttgtcga agtcgatctt atcgatgaac 2701 tgcagcgcgc catagccgcc tctggcgcag aggatcatgt ctacatcctt gcgcgcgaac 2761 atctcgttca ggtcttcggc tctggcttct tcggaggcag cgatgtagtt cgcccgccat 2821 tcgtccacat gcttacccag cacgaccttg tagcccaggc tctccagata ttcttttcct 2881 ctggggaccg ccgtcgggtc cttcgtggga ctggatgggg agatgatggc gatggtatcg 2941 ccggggttga gttttcttgg tttgatcatt ttttaaagtc ctcccagacc tttgcc // LOCUS sequence126 2993 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence126 VERSION sequence126 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2993 /mol_type="genomic DNA" /organism="" /note="sequence126" CDS 278..964 /product="zinc metallopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583790.1" /transl_table=11 /codon_start=1 /translation="MFGYYTSMILLLPAILLSVYAQGKVQSAYRTYANVRNGRNITGAE AAQRILQFNDLQIPIYETQGTLTDNYNPQKGTLNLSPAVYEQPSVASMAIAAHECGHAL QHAAGYSLLSIRNSIVPVANIGSMLSWPMLILGLMLGAQGDFLFNLGIFLFLGVVLFHL VTLPVELDASKRALIQLEALNCFVSDEEHAAAKRVLDAAALTYLAALATAVANLLRMFA IRGNRR" /locus_tag="LOCUS_4290" /note="WP_012583790.1 zinc metallopeptidase (Dictyoglomus turgidum) [pid:42.8%, q_cov:100.0%, s_cov:98.7%, Eval:2.5e-42]" /note="MGA_605" CDS 961..2172 /product="16S rRNA (cytosine(967)-C(5))-methyltransferase RsmB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_206580826.1" /transl_table=11 /codon_start=1 /translation="MTDPSRRIAFDILKAVESEGAFSNILLNRKLQTAEGADAAFVRRL VHGVLKNRTLLDSQIDRYLRKGGIKVPARILLRMGFYQLALCEDVPDHAAVSETVALAK QAFRGGEGFINAVLRSFVRDGKRLELPEDLTVRYSMPSWIVRLWTESYGEEKTRQLLEA SLEEAPLCLRINPLKAQENYVPDVSGGIAASAGYRSGLFSVQDASSQEAIRILDPRPGE RVLDVCSAPGGKTCAMAERMENRGSIKACDLHENKLPLIENEAKRLGISIVTTCVRDGC EPPDPQEIEAFDAVLCDAPCSGLGVLRRKPEIKWRLTEEELRSLPGTQLRILKNAAACV RKGGRLLYSTCTVDPLENERVTEAFLSDGSFDKVCERQIFTGETINNSKGDGFYVCLMR KKDL" /locus_tag="LOCUS_4300" /gene="rsmB" /EC_number="2.1.1.176" /note="WP_206580826.1 16S rRNA (cytosine(967)-C(5))-methyltransferase RsmB (Clostridium aminobutyricum) [pid:41.3%, q_cov:99.3%, s_cov:99.1%, Eval:2.1e-79]" /note="MGA_606" CDS 2169..2903 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MISVGFKTDKGNLRSGNEDSLFLLPDQQLYIVADGVGGHNSGELA SRMAVGYMAQYVAMNPIAAVASKKDLRKYFLECFQGANALIYSKSKEEEGNNGMATTTV LCYLDATDCYVVNVGDSRAYLVREGVMRQLTEDHTLVQDMLRSGLLTKEEAMMHPDRNM ITRAIGGEETIEPDFYRFETCPGDVILLCTDGLYGEVSANRILQLSTEYSSMHELAKKL VDEANEAGGKDNISVVCIRIGG" /locus_tag="LOCUS_4310" /note="WP_012257018.1 protein phosphatase 2C domain-containing protein (Chloroflexus aurantiacus) [pid:40.7%, q_cov:97.5%, s_cov:70.4%, Eval:1.3e-39, partial hit]" /note="MGA_607" ORIGIN 1 gcatttactt ccctgaacgg agaagtcttt aagatccacg ccgccaaggc ggcggaacgc 61 aggacgaaag cggctccggg caccgtggtg tcttccggca aggaaggcat cggcgtcgcc 121 tgtggagatg gcggtgttct gctgctgaca aaagtgcagc tgcccggcaa aaaggctatg 181 gatgccggcg cgttcctgct gggtcacaca gttgaaaccg gaaccgttct gggataaaat 241 aaagtgttat gaaatccgca tttcaaggag gctttgcatg tttggatatt atacttcgat 301 gatccttctg ctcccggcga tcctgctgtc ggtctacgcg caggggaagg tccagagcgc 361 gtaccggacc tatgccaacg tacgcaacgg acggaacatc accggcgcgg aagccgcaca 421 acgcatcctg cagttcaacg acctgcagat ccccatctac gagacgcagg gaacgctgac 481 ggataactac aatccgcaga aggggacgct caatctttct ccggcggtct acgaacagcc 541 cagcgtcgcc agcatggcca tcgcggctca tgagtgcggt catgcgctgc agcacgcagc 601 gggctattcg ctgctgagca tccgcaacag catcgtaccg gttgccaaca tcggctccat 661 gctgtcctgg cccatgctca tcctcggcct gatgctcggc gcgcagggcg atttcctgtt 721 caatctgggc atcttcctgt tcctgggcgt cgtgctgttc catctcgtta cgctgcctgt 781 ggagctggac gccagcaagc gggcgctcat tcagctggaa gccctgaact gcttcgtaag 841 cgatgaagaa cacgcagctg ccaagcgtgt gctggatgct gccgcgctca cgtatctcgc 901 agcgctggca acggctgtgg ccaacctgct gcgtatgttt gccataagag gaaaccgcag 961 atgacggatc cctcccgccg catcgcgttc gacatcctga aagcggtcga aagcgaaggg 1021 gcgttttcca atatcctcct caaccggaaa ctgcagactg cggaaggggc ggacgccgcc 1081 ttcgtacgcc gtctggtgca cggcgtgctg aagaacagga cgctgctgga cagccagatc 1141 gaccggtatc ttcgcaaagg cggcataaaa gtgccggcga ggatactcct gcgaatgggc 1201 ttctaccagc tggcgctctg cgaagacgtg ccggaccacg ctgctgtttc cgagacggtc 1261 gccctggcga aacaggcgtt tcgcggcggt gaagggttta tcaacgccgt gttgcgcagt 1321 tttgtgcggg acggcaagag gctagaactt ccggaggatc ttaccgtccg ctattccatg 1381 ccgtcctgga tcgtccgtct ctggacggaa agctacggcg aagagaagac gcggcagctt 1441 ctggaggcaa gcctggaaga ggcaccgctt tgcctgcgga taaatccgct taaagcacag 1501 gaaaactatg ttcctgatgt ttccggcggt attgccgcat ctgccggcta ccgcagcggg 1561 ctgttttccg tacaggacgc atcgtcgcag gaggcgatcc gcatcctgga tccaagaccc 1621 ggcgaacggg tgctggacgt ctgcagcgcg ccgggcggca agacctgcgc tatggcagag 1681 cggatggaaa acagaggaag cataaaggcc tgcgatctgc acgaaaacaa gcttccgctc 1741 atcgaaaatg aggcgaagcg gcttgggatc tccatcgtaa cgacctgcgt gcgcgacggc 1801 tgcgagccgc cggatccgca ggagatcgag gcgttcgacg cggtgctgtg cgatgcgccc 1861 tgcagcgggc tcggcgtgct gcgcagaaag ccggagatca aatggcggct gacggaagaa 1921 gaactgcgat cgcttcccgg aacgcagctg cgcatcctga agaacgccgc tgcctgcgtc 1981 agaaaaggcg gcaggctgct gtacagcacc tgcacggtag atccgctgga aaatgagcgg 2041 gtcacggaag cgtttttaag cgacggatcc ttcgataagg tctgcgaacg gcagatcttt 2101 accggagaga cgataaacaa cagcaaagga gacgggtttt acgtctgcct tatgaggaaa 2161 aaagatttat gatcagcgtt ggattcaaga ccgataaggg caatttaaga tccggcaacg 2221 aagactcgct cttcctgctg ccggatcagc agctctacat cgtggcggac ggcgtcggcg 2281 ggcacaattc cggcgaattg gcttcccgca tggcggtggg atacatggcg cagtatgtgg 2341 ctatgaaccc gatcgcagcc gtcgcgagca aaaaagatct gagaaagtac ttcctggagt 2401 gcttccaggg cgcgaacgct ctcatctaca gcaaatcgaa ggaagaagaa ggcaacaacg 2461 gcatggcgac cacgacggtg ctgtgctatc tggatgctac ggactgctat gtcgtaaacg 2521 tgggcgattc cagagcctat ctcgtccggg aaggcgttat gcggcagctg acggaagacc 2581 atacgctggt gcaggacatg ctgcgctccg gccttctgac gaaggaagaa gccatgatgc 2641 acccggaccg caatatgatc acccgggcca tcggcgggga agagacgatc gaaccggact 2701 tctaccgctt cgagacctgc cccggggacg tcatcctgct gtgcaccgac ggtctgtacg 2761 gcgaagtgag cgcgaacagg atccttcagc tgtcgacgga atacagttcc atgcatgagc 2821 tggcgaagaa actcgtggac gaagccaatg aggcgggcgg caaggacaac atctccgtcg 2881 tctgcatccg gataggggga tagcgtatgg gcagcagaat tttagcagga agatacgagc 2941 tgcaggacaa gatcggcgaa ggcggcatgg ccgtcgtctt caaggcaaga gac // LOCUS sequence127 2985 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence127 VERSION sequence127 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2985 /mol_type="genomic DNA" /organism="" /note="sequence127" CDS 795..2978 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKKSSKVISLLLVLSLLLSACGGGGGSAKATTLSPENTSAVSNG VTVDVGDFVLDGEAELSVAKGQTEDHSDEGYKIDVYDIKLGDMHELGDYITIRIPYDTS YCKEGQDPAKCVGAKYMNGETGEWEDVLFEVDAEKQELVIYTDHLSYYGALYVEDEGRR NALVTDVLNSPLTMDKTTAMDFASRIAANDASVKKDLSDYAEKATDMFFDYADRLDNAI NIATLGDGEAIPKWLDTSIPDTNQTLFSALGYIATATNLLRVARDEMRGGADKGAVLNL IRDVGSKVTTYWADAFTSVGSGALSVGMGGVLIIDKMLTAFAEEAQATKLEDIAYVYHH YNEGFSATWAHKVMRPKDWREKVIQVLENNPDDPEIAITALEAGFRKYASEFFDLSADQ MAEVASDVPNVTVKRIPAFTEAEKEQMIDEYVAYMKDKTMPAVLTSAENYMIRKAEETQ LQAIEAIKDYYNSRISITMQENLPEGEKSSYAGYKFRFAPLSDAATENKANWTGKWPES GNIKTSSTLIGIMTAGFPHTVEFFKPDADMDNDKPEFTVPFVISVPSITITVGQLYPTL EEICGTYSDAVITILDIGPPEVVEALKKGGEEGEEGCDIDLEALIGQSQGLPFTLTQTG ANTAIFESADMEEEGEVISGKDLVYDPATGILQWSEPLVTEEASITLNFSCTYKDEAKT AVLVDGNLTETMGGSEMAGLYIKAALKGEKPLE" /locus_tag="LOCUS_4320" /note="MGA_610" ORIGIN 1 gatgatgcgg atccggccgc cgttctgcac gagctgcagc agcaatcctg cccagacttt 61 cgcgaaagct gcgtcttcgg tgagccagtc catgttctcg tcggagtgga gcagcagggt 121 gcagggtttg ccgctttgca ccagatcttc caggaggatc cgcacgcctt cccgtttgcc 181 ttcgttgccg aaaaacagca gcgcctcgga tttttccctt gcgttttccg ccttccgggc 241 gtcctttttg gcgccgcgca gcgacgcggt gaccctagcc agcggatctt ccttgatcgc 301 ttcgcccttc agccaggctt cgatctgttt tgccgccttt ttctcgtctt ccggccactc 361 cgtctgcagc tgcatggcgt tcgcggcaga ttctttctga tgttccttct tgatcgcttt 421 tgcgaaatac tggcttgcgg gttcgaggaa gggctgatgc gtgggaatgc cgcgcttgcc 481 ggagcggatg cggctgatgt aggacgggtc gtagttgagc gcccgggcca gcgtgctgct 541 gcgagtggct gtgagggtca tgagaaaatc gatcttttcc gagagggtgg acagcatggg 601 agcctccttt acgcagaaat ccatttccaa tttcagtata gtacgtgctg ggtttgttgt 661 aaacgatttc cggcacgatt cgtgcctgaa attggcattg ccaatgcccc atcttgcggg 721 aaataatccg cgaagctgtt ttacaataga atcgggagtg caattgtgta cagggaaggg 781 ggaaatgcaa tcatatgaat aaaaaatctt caaaagtgat ctcgctgctg ctggttcttt 841 ccctgctgct ttccgcctgc ggcggaggcg gcggctcggc caaggcaacg acactttcgc 901 cggagaatac cagcgcggtg tcgaacggtg ttacggtcga cgtcggcgat tttgtgctgg 961 atggagaagc agagctgtcc gtcgcaaaag ggcagacgga agaccattcg gatgagggct 1021 acaagatcga cgtgtacgac attaagctcg gcgacatgca cgagctggga gactacatca 1081 cgatccgtat cccgtacgac acgagctact gcaaagaggg gcaggacccg gccaaatgcg 1141 tcggcgcgaa atacatgaat ggagagaccg gcgagtggga agacgttctg ttcgaagtcg 1201 acgccgagaa gcaggagctc gtcatctata cggatcacct gtcttattac ggcgcattgt 1261 atgtcgagga cgagggcaga agaaatgcgc tggtgacgga tgtgctgaat tcgcctctga 1321 ccatggataa gacgaccgcc atggactttg cttccaggat cgccgctaat gacgcaagcg 1381 ttaagaagga cctgtctgat tatgcggaaa aagcgaccga catgttcttc gattatgccg 1441 accgtctgga caatgccatt aatattgcga cgctcggaga tggggaggcg atccccaagt 1501 ggctcgatac ttcgatcccg gatacgaatc agaccctgtt ctccgctctt ggatacatcg 1561 cgactgcgac gaaccttctg cgggtcgccc gggatgagat gcgcggcgga gcggataaag 1621 gcgccgtcct aaatctgatc cgcgacgtcg gcagcaaagt gacgacctac tgggcggatg 1681 cctttacgtc cgtcggcagc ggtgcgcttt ccgtcggcat gggaggcgtt ctgatcatcg 1741 acaagatgct caccgcattt gcggaagaag cgcaggccac caagctggaa gacattgcct 1801 acgtctacca ccactacaac gaaggctttt ccgcgacctg ggcgcacaag gtgatgaggc 1861 cgaaggattg gcgcgaaaaa gtgatccagg tcctggagaa caatccggat gaccccgaga 1921 tcgccattac cgctctggaa gcgggcttcc gcaagtatgc gtctgaattt tttgatctgt 1981 ctgcggacca gatggcagag gtcgcatccg atgtccccaa tgttacggta aagcgcattc 2041 ctgcctttac cgaggcggaa aaagagcaga tgatcgatga gtatgtcgcc tacatgaagg 2101 acaagaccat gccggcggtg ctgacgagcg ctgagaatta catgatccga aaagcagagg 2161 agacccagct gcaagcgatc gaggcgatca aggactacta caactcgagg atctcgatca 2221 cgatgcagga gaatctgcct gaaggcgaaa aatcctctta cgcaggctat aaattccgct 2281 ttgcgccgtt gagcgatgcc gccacggaga acaaggcaaa ctggacaggc aagtggcccg 2341 aatccggaaa catcaagact tcttccacgc tgatcgggat catgacggca gggttcccgc 2401 atacggtgga gttctttaag ccggatgccg acatggataa cgataagccg gagtttaccg 2461 ttcccttcgt gatctccgtg ccgagcatca cgattaccgt aggccagctc tatccgacac 2521 tagaagagat ctgcggaacg tacagcgatg ccgtgatcac gatcctggat atcggcccgc 2581 cggaggtcgt agaggccctg aagaagggcg gcgaagaagg ggaggaaggc tgcgacatcg 2641 acctggaagc tctgatcgga cagagccagg gcctgccctt tacgctgacg cagaccggcg 2701 caaatacggc catctttgag agtgcggata tggaagaaga gggtgaggtc atctccggca 2761 aggatcttgt ctacgatccc gcgacaggca tcctgcagtg gtccgaacct ctcgtaacgg 2821 aagaagcctc cattacgttg aacttcagct gcacgtacaa ggatgaagcg aagaccgccg 2881 ttctggtcga cggcaatctg accgaaacga tgggaggttc cgagatggcc ggactctaca 2941 taaaggctgc tttaaaaggt gagaaaccgc tcgagtaatg catcc // LOCUS sequence128 2983 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence128 VERSION sequence128 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2983 /mol_type="genomic DNA" /organism="" /note="sequence128" misc_feature <1..657 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_130435197.1:ATP-binding protein" /note="WP_130435197.1 ATP-binding protein (Cuneatibacter caecimuris) [pid:46.2%, q_cov:93.6%, s_cov:28.5%, Eval:6.6e-42, partial hit]" /note="MGA_611" /locus_tag="LOCUS_4330" CDS 684..2429 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKRILTLCLALLLCLSLIPAQSFAVSAPKQAVIKEAPVAGEMAF NRGGLGLIEAKDGTRYLIDRDGGIYRSGKAWMDYMAGSGSYTVDGEGYYEYPLGKKMFT MAEMEKNVKAFLEENYPMGEVVSVQSEITYPFSGPYATCSFSAAMKSDDQLEKYEFYAL IDQSGLVHYVTPLIALTAGGGFPIEMTLGSGSEGLVRFTKEYNDREGEHYLYETGYLDL DGNEVLVFSNNDGRDPEGPAIVIDASDVAFIGDFNNGVAVICNNRQKESLIDRSGKVLL PFTHDSIYNDCGRYPVVYDEGKGYGYMDTAGLIVIPQQYEDAKGNWDDLFTVQKNGKWG VVDTDNKPVVPFEYDFMSSPELGIVYACKGNKAYIIRFEDAAPEEELTPWGTPRVSSIF KDVPAGAWYETYLQAAYENGIVGGKGSGRYDPSGNLKHGEIMVMVTQLHALAKGEKFQP APNPTDHWARAYCDYCKAEGIIDSRFDNKLDAKVTRAEMAYYFAHALRDDYYLEEEDVS LMDIATEEYGGDILKLAKAGIVTGYDVKGQTAKEFRPHNLVTRAEAAVFVTNLLGAIGP TGGVY" /locus_tag="LOCUS_4340" /note="WP_011108325.1 WG repeat-containing protein (Bacteroides thetaiotaomicron) [pid:30.9%, q_cov:19.4%, s_cov:60.9%, Eval:7.4e-07, partial hit]" /note="MGA_612" ORIGIN 1 accggcatcg gcatgagcga ggaattcgca gcccggatct tcgaaccctt cgagcgggag 61 cgcacgtcca cggtgagcgg catccagggc acgggtctgg gcatggccat cacgaaggct 121 atcgtggaca gcatggacgg ctgcatcgac gtgcagagca aacagggcga gggcagccgg 181 tttacggtgc tgctcacgtt cccggtgttg accggcgaaa cggacggctg ccattgcgaa 241 gagaagccgg aagaaccgaa aaaaagagat tataccggcc gcagactgct gctggcggaa 301 gataacgaga tcaaccggga gatcgcctgc gccatcctga ccgacgccgg ctttgccgtg 361 gacacggcgg agaacggcca ggtagcggtg gggatgctgg aggggtcaac ccccggcacc 421 tacgacgccg tcctgatgga catccagatg ccggtgatgg acggattcga ggcatccaaa 481 gccatccgca gcctgcccga tgcggcgctg gctgcggtgc ccatcatcgc catgacggcc 541 aacgcgttcg cggaggacgt ggcggcggag caggccgcag ggatggacgg ccatatttcc 601 aagcccttga accagcagga catgttccgc acgctggatg agatcttatt tggctaacgt 661 tgtatttcga aggagggagg accatgaaca aacgcatttt gaccctttgc ctggcactgc 721 ttctgtgcct gagtcttatt cctgcacaga gcttcgcggt gtccgctccg aagcaggcgg 781 tcatcaaaga ggctcctgtt gcgggagaaa tggccttcaa cagaggcggg ctgggcctga 841 tcgaggccaa ggacggcacc cgttatctga tcgaccggga cggcggcatc taccgttcgg 901 gaaaagcctg gatggactat atggcaggat ccgggagcta caccgtcgac ggtgagggtt 961 actacgaata tccgctcggc aaaaagatgt ttacgatggc cgaaatggag aaaaacgtaa 1021 aggcgttcct ggaagaaaac tatccgatgg gcgaagttgt aagcgtgcag tcggagatca 1081 cctatccgtt ctccggcccc tatgccacct gttcgttctc cgcagccatg aagagcgatg 1141 accagctgga gaaatacgag ttctatgcgc tcatcgacca aagcgggctt gtgcattacg 1201 tgaccccgct gatcgcgctc accgccggcg gcggctttcc gatcgagatg accctcggca 1261 gcggcagcga agggctggtc cggttcacga aggaatacaa cgaccgggaa ggcgagcatt 1321 atctctacga gaccggctat ctggatctcg acggaaacga ggtgctcgtg ttctccaaca 1381 acgacggacg cgatccggaa ggtccggcga tcgtgatcga tgcaagcgac gttgctttta 1441 tcggggattt caataacggc gtcgccgtga tctgcaacaa caggcagaaa gagtccctga 1501 tcgaccgcag cggcaaagtg ctgctgccct ttacgcacga cagcatctat aacgattgcg 1561 gccgctatcc cgtcgtttac gacgaaggca agggctatgg ctatatggac acggcaggtc 1621 tgatcgtgat cccgcagcag tatgaagacg ccaagggcaa ctgggatgac ctctttaccg 1681 tacagaaaaa cggcaaatgg ggtgtcgtcg atacggacaa taagcccgtc gttcccttcg 1741 aatacgactt tatgagcagc ccggagctgg gcatcgtcta tgcctgcaag ggaaacaagg 1801 catacatcat ccggttcgaa gacgcggcgc cggaagaaga gcttacgccc tggggcacgc 1861 cgagagtatc ttctatcttt aaggacgttc ccgcgggcgc ctggtacgag acctatctgc 1921 aggccgctta tgagaacggc atcgtcggcg gcaagggcag cggtcgctac gatccgtccg 1981 gcaatctgaa gcacggcgag atcatggtga tggtgacgca gctgcacgcc ctcgcgaagg 2041 gtgaaaaatt ccagcccgcg ccgaatccca cggaccactg ggcaagagcg tactgcgatt 2101 actgcaaggc ggaaggcatc atcgacagcc gtttcgacaa caagctggac gcgaaggtga 2161 cccgcgcaga gatggcgtac tacttcgccc atgcgctgcg ggacgattat tatctcgaag 2221 aggaagacgt atccctgatg gatatcgcga ccgaggagta cggcggcgac atcctgaagc 2281 tggcgaaggc cggcatcgtc accggttacg atgtgaaggg ccagacggcc aaggaattcc 2341 gtccgcacaa tctcgtgacc cgcgcagaag ctgctgtgtt cgtcacgaat ctgctcggcg 2401 ccatcggacc taccggcggc gtgtactgat ccttatcgca tagaaaaagg gagatccccc 2461 gcgggatctc cttttctatt gcttttcatt atctcagatg cttttcgatc agatccataa 2521 acagttcggc atcggccttc ttggagaaga tggcacgggc aagagtcttg ctgccgccgc 2581 ccttgccgcc gtacatgccg gcgtaatcct tcaccagctg gccggctgcg ggcgttcccg 2641 gggtggccag caccactgtc ttgtcttttt cgctgaacag cgcggagggc tttgtaaaga 2701 tgtcctccgc ttttctcgcc atggactgca gatcgtctgc gctcatcagc gggtagcgga 2761 agaccgccaa gctcccttcc gctttcggca gcgcttctct cagcttttct tcttcccgtt 2821 tagacagagc gctcttcagc tccgacagct cccggcgcac ctcgtcgttt ttggcgtcgt 2881 tggccgcttc tctgtccagt agggtaatta cctcacagga gtacttttgg gccaatgcag 2941 aggcgatttt cgacctcgta cgggcttcct cgaaggcggg tct // LOCUS sequence129 2976 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence129 VERSION sequence129 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2976 /mol_type="genomic DNA" /organism="" /note="sequence129" CDS complement(739..1497) /product="lysophospholipid acyltransferase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000616577.1" /transl_table=11 /codon_start=1 /translation="MLTAALAAIVNIPSCIYWHFKHEKDQQGAYRKATAICHTWIRPLM RIAGVRLHKCGEENLIDDRPVLYVGNHQGDMDILLIMRELENLYSIIAKIETKKIPIVS QWMANANCIFMDRGNPRHTLESIKQAQTLLENGRTVVVFPEGTRSQKAEMNEFKPGAFR CAVKAGVPIVPFVIDGSYKIFEQQRRLRPADVYFHILPAIEPEEIEGMKTPDVSALVQQ KIQDELYRIRQEAGEPVPEEKKVWNAPQNS" /locus_tag="LOCUS_4350" /note="WP_000616577.1 lysophospholipid acyltransferase family protein (Bacillus cereus) [pid:38.7%, q_cov:84.5%, s_cov:90.8%, Eval:2.3e-39]" /note="MGA_615" ORIGIN 1 cgtgcagcgt gacgaccatg tccgccttgg cggtctcgtc gtagtcggcg atgtcgccca 61 cgaggaactg caggtcttca tagcctagat cctgcgccac gccgctgcag aaggcgatga 121 cgtcttcttt caggtccagt cccaccagct tcgctttgta atcgttttta acgtttagat 181 accagtacag ggcgaaggtg agataggact tgccgcagcc gaaatcgatg atgacaggct 241 ctttgggcag gtattccaga caatcctccg cgatctccag aaagcggttg atctgccgga 301 acttgttgcg gtgtttgggc acgatctgtc cgtctctcgt ctgaacgccc aggcgcacca 361 ggaaatccac tggcatgccg tcggggatgg cgtagttctt ctctctgttg tgagcgagag 421 gccccatggt cttcgtgggc ttctttttca ggatcttttc gtggtcgggc ttgttggcca 481 gcacggtgta atccgcttcg gtggagaaaa tatccgcctg cttaaagccg ctctgcagct 541 gccgctcggc gaaggcttcc acctcctccg gcaggaggtt ttcgtgggtc accttttttt 601 cgtaggtgta ttccgcctgg tagtgcaggg catccttgag cagtaccggc cgcagggata 661 ccttgcgcac gggctggctt ttctttctgg gaccgccgaa gaccgccagg atgaggcttt 721 cctccgccgc cagttttcct aggagttctg aggcgcgttc catacttttt tctcctcggg 781 gacgggttca cccgcttcct gacggatgcg gtacagttcg tcctggatct tctgctggac 841 gagagcgctc acgtccgggg tcttcattcc ttcgatctcc tccggctcga tggcgggcag 901 gatgtggaaa tacacgtccg ccggtctcag ccgtctctgc tgctcaaaga tcttatagga 961 tccgtcgatg acgaagggga cgatgggcac accggccttg acggcgcaac gaaaggcacc 1021 gggcttgaac tcgttcatct ccgctttctg gctgcgggtg ccttcgggga atacgacgac 1081 ggtgcggccg ttctccagca gcgtctgggc ctgcttgatg gattccaggg tatggcgggg 1141 attgccgcgg tccatgaaga tgcagttggc gttggccatc cattgggata cgatggggat 1201 ctttttcgtc tcgatcttcg cgatgatgga gtacaggttc tccagttccc gcatgatgag 1261 caggatatcc atgtcgccct gatggttgcc cacgtagagc accgggcggt cgtcgatcag 1321 gttttcttcg ccgcacttgt gcagtctgac ccccgcgatc cgcatgaggg gccggatcca 1381 ggtgtggcag atggcggtcg ctttgcggta ggcgccttgc tggtcttttt cgtgcttaaa 1441 gtgccagtag atgcagctgg gaatattgac gatggcggca agggctgccg tcagcaaaaa 1501 cagaatactt ctcataaaaa attttacctc gccgttgatt ttatcataaa tgtgagggat 1561 tttgtgataa tatataaaag ttaaagttac agacagagga acacacaata tgagcaagaa 1621 gaaaatcatc aatatcgcgg tcatcgccca cgtagacgcc ggaaaatcca ccctggtgga 1681 cgcattcctg gcccagagcg gcgtgttccg cgaaaacgaa gagatggtag cccagaccat 1741 ggactccaac gatctggagc gggagagagg catcaccatc tattccaaga actgttccgt 1801 catgcacgac ggttacaaga tcaatatcgt cgacaccccg ggccatgcgg acttctcctc 1861 ggaagtggag cgcatcatca agaccgtgga tacggtcatc ctgctggtgg actcctccga 1921 aggccccatg ccccagaccc gtttcgtgct ccagaagtcc ctggagcaga acctcaatcc 1981 gatcctgctg atcaacaaga tcgacaagcg cgacgcgcgg atcgacgagg tggtggacga 2041 ggtctacgag ctgttcatgg atctggaagc caacgacaga cagctggatt tccccatcct 2101 gtacggcatc gcccgccagg gcatcgtcgt gagagatccg gcggatgctg cgggggtcac 2161 cgtggaaggc gagagcggca ccaaggtgag aaagagagcg gctgggcagg acggcctcaa 2221 cattacgccg ctgtttgaga ccattatcga gcaggtgggc ggctatgagg atgcggacga 2281 ggagccgctg cagttccaga tctccacgct ggcttacgac gactatatcg gacgtctggg 2341 catcggccgc gtgacccgcg gcaagatccg tccgggtcag caggtcgccg tctgcaagcc 2401 cgacggcacg tataagatgg ggaagatcaa ccagaccttc gtgtacagag gcctgaagag 2461 aacggctgtg gacgaagtcg gaagcggcga catctgcgtc atctccggca tttccgacat 2521 tacgatcggc gacacgctct gcgaggaaga gcatatcgat ccgctgcccc acatcgagat 2581 cgaggaaccg acgctgtcca tgaatttcat ggtcaattcc tctccgttcg cgggcaagga 2641 aggcaagtac gttacgaccc gccacatcaa ggagaggctg gagaaggaac tggaggtcaa 2701 cgtcggcctg ctggtggagc ccaccgacag cacggattcc ttcaaggtgt ccggcagagg 2761 cgagctgcat ctgcccatcc tcatcgagaa catgcgccgc gaaggctacg agctggcggt 2821 gtccaagccg gaagtcatct taaagcgggg tgaccacggt cagaagcagg agcctgtgga 2881 agaggtcgtc atcgaagtgc ccgaccagta ttccggtggg gtcatctctg acctcaacct 2941 gcgcaagggc atgatggtct ccatggacgg tcgcaa // LOCUS sequence130 2973 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence130 VERSION sequence130 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2973 /mol_type="genomic DNA" /organism="" /note="sequence130" CDS complement(548..1324) /product="arginine ABC transporter substrate-binding protein ArtP" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004398706.1" /transl_table=11 /codon_start=1 /translation="MAKKLTALLLALCMIVGLAACSGSSSDTATWEDELGTKGKLRVGM AADYPPYESYDAQGNVVGLDADIAAMIAEQLGVELEIVPMEFDTIISAVTAGTVDMGIS CFSYTEERAKSVLFTETYMTSAQCCFASTDFGITKLEDLKGGLVGAGNGTTGMEVAEAM APEYGFSTQAGEIAVMSESLKNGAMQAIITEQCVADSYIAANPGKFQMVAEDLTVEEIK AITNLNNTKLQEKVNEIIKSFVASDAYSELVVKWFD" /locus_tag="LOCUS_4360" /gene="artP" /note="WP_004398706.1 arginine ABC transporter substrate-binding protein ArtP (Bacillus) [pid:33.7%, q_cov:96.9%, s_cov:96.1%, Eval:3.2e-31]" /note="MGA_618" CDS 1738..2526 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MHSPFIEWVIHQVRVEHWTFDTCVGRARRKGLFPREQIVCAKTLY NELWAGNLPLTPFDLPEALSRKRKNNRPRQNKRILGKSIDERPEEASLRTVCGHWEIDT VVGHRSGRESVVLTLVEKKTDHYLAIKIPGKDSDSVMAAMEVLKEEYGDAFSEIFKTIT ADNGSEFERLSELEAYGVGVFFAHPYSSWERPQNERHNRLFRRYLPKGRSIDNYTAEQI LQFADEMNALPRRTLGYATPEELFDEFLDQVYSVNKVQIA" /locus_tag="LOCUS_4370" /note="WP_004270929.1 IS30 family transposase (Lactobacillaceae) [pid:41.3%, q_cov:92.4%, s_cov:69.4%, Eval:5.5e-47, partial hit]" /note="MGA_619" ORIGIN 1 cttgaaggcc tggggcagga tgatctcccg catggtctgc ttgtgggaga ggcctatggt 61 ctgcgccgct tcccactgac ctttatccac ggactggatg gcggagcgga acagttccgt 121 cgtgtaggcg ccggagttga ttcccacggc gatggtgccc accaggatgg ggttgggcgt 181 gtatacgtag tggaacaggg ctctggtgac cacagggccg cccaggtaga gcagcaggat 241 ctgcagcatc atgggtgtgc cgcggatgac ctccacatag atgttcgcga tcagcttcgg 301 cagtttgtgc ttgcccatct ttgccatggc ggaaagcagg ccgaggacgg agccgccgac 361 cagggcacat acggccacca agatggaata gccggcgccc ttgatcataa actggagatt 421 ttccggcgtg aggattcttt ggattgcgtt cataaacgga tacctctaag acgacaatca 481 tggcaggaag ggtctccctg ccatgatgct tgcggattcg gatgttccgg tgcgcggatt 541 tttcgcttta gtcgaaccac ttgacgacca gttcgctgta ggcgtcgctg gcgacgaagg 601 acttgatgat ctcgtttacc ttttcctgca gcttcgtgtt gttcaggttc gtgatcgcct 661 tgatctcttc cacggtgagg tcttccgcca ccatctggaa cttgccgggg ttggcggcga 721 tataggaatc ggctacgcac tgctcggtga tgatggcctg catcgcgccg ttcttgagag 781 attcgctcat gacggcgatc tcgccggcct gggtggagaa gccgtattcc ggcgccatcg 841 cttccgcgac ttccataccg gtggtgccgt tgccggcgcc taccaggccg cccttcaggt 901 cttccagctt ggtgatgccg aaatcggtag aagcgaagca gcattgggcg gaggtcatgt 961 aggtctcagt gaagagaacg gatttagcgc gctcttccgt gtaggagaag caggagatgc 1021 ccatgtcgac ggtgcctgcg gtgaccgcgc tgatgatcgt atcgaattcc atgggtacga 1081 tctccagttc tacgcccagc tgttcggcga tcatggctgc gatatcggca tcgaggccga 1141 cgacgttgcc ctgggcatcg taggattcgt agggcggata gtccgccgcc atgccgactc 1201 tcagcttgcc cttcgtgccg agttcgtctt cccaggttgc agtatcgctc gaagagccgg 1261 agcaggctgc gaggcctacg atcatgcaca gtgccagaag cagtgcggtc agtttctttg 1321 ccattttgtt ttccttcttt cttgttggtt aattgtaaaa tcaaattgaa caactgaata 1381 aaaaagtgat ccataggatt cctttggtag aattgagtta ccacactaac aaaacttccg 1441 aaggagaacg ctatggatca actcaatgct accacattta cacccgatcg cgaaagaggt 1501 cagcacttaa aacttgaaga tcgtttcagc attaagattt tcaggaaaca ggggcattcc 1561 cttcgcagta ttgctgcaga acttgattgt tctccgtcga ccgttatgta tgagttgcga 1621 cgtggaaccg gcgagcgcaa tggaaagcgc ggccgcttcc cggaatactc tgcaaagcgc 1681 ggtcaggcga attacgaaat caatcgctca agatgccaca aaccgcacaa ggtcaatgtg 1741 cacagtccgt tcatcgaatg ggtcatccat caggttcggg ttgagcattg gacctttgat 1801 acctgcgtcg gcagagccag acgcaagggc ttgtttccca gagaacaaat cgtttgcgcg 1861 aagaccctct acaacgagtt atgggccgga aatctcccgc ttacgccgtt tgatcttcct 1921 gaagcgctgt ctcgcaagcg caagaacaat cggccccgtc agaacaagag gatccttggg 1981 aaaagcattg atgaacgtcc tgaagaggcc tcactgcgca cagtttgcgg acactgggag 2041 atcgacactg ttgtggggca ccgcagtggc agagaatcgg tggtcttgac tctcgtagag 2101 aagaagaccg atcactacct ggcgatcaag atccccggta aagattcgga ttcggttatg 2161 gccgcaatgg aagtcctgaa agaagagtac ggagatgcat tctccgagat cttcaaaacg 2221 atcacagcgg acaacggcag tgagtttgaa cgcctctcag aacttgaggc ctatggcgta 2281 ggcgtattct tcgctcatcc gtattcttcg tgggaaagac cacagaacga gcggcataac 2341 aggctgttca gaaggtacct tcccaagggc agatcgattg acaactatac tgcagaacag 2401 atcttgcagt tcgcggacga aatgaatgcc ttgccgcggc gtaccctagg gtacgctact 2461 ccggaggaac tctttgatga gtttctggat caggtgtatt cagttaacaa ggtacagatt 2521 gcttaactgt ttgtgttcaa cttgaaattg ctttttacga tatgataaaa tcaaatgaat 2581 tctgcaaaat cgcaaaagaa aggcgctttt cggatgatcc gcatattagg aatagacccc 2641 ggttacgcca tcatgggctg gggggtcatc gaaaaaaacg gaagcagttt taagcccatc 2701 gcctacggat cgctcacgac ggataaggat atgcccatgc ctcagaggct caaaagcctg 2761 tacgcggggc tgatggagat catggcggag taccagccgg aggagatgag catcgagcag 2821 ctctacttca acgataatgc caagacagcg atattcgtcg gccaggccag gggcgtcgcc 2881 atccttgccg gggtcaacag cggccttacg atctacgaat acacgccgct ggagatcaag 2941 atgaacatca ccggttacgg cagggcggac aag // LOCUS sequence131 2960 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence131 VERSION sequence131 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2960 /mol_type="genomic DNA" /organism="" /note="sequence131" misc_feature <1..1081 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011393940.1:elongation factor G" /note="WP_011393940.1 elongation factor G (Moorella thermoacetica) [pid:71.1%, q_cov:99.4%, s_cov:51.6%, Eval:6.8e-148, partial hit]" /note="MGA_621" /locus_tag="LOCUS_4380" CDS 1130..2329 /product="elongation factor Tu" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009887863.1" /transl_table=11 /codon_start=1 /translation="MAKAKFERTKPHVNIGTIGHIDHGKTTLTAAITKVLATRFPSATN QIVAFENIDKAPEERERGITINTAHVEYETAHRHYAHVDCPGHADYVKNMITGAAQMDG AILVVGATDGPMPQTREHILLSRQVGVPYIIVFLNKCDMVDDEELLDLVEMEVRELLDE YEFPGDDTPIIRGSALEALQHPDGPWGDKVMELLDAVDTYIPEPERKSDLPFLMPVEDV FSITGRGTVATGRVERGTIKVGDTVEIVGLTDEKRAVVVTGVEMFRKLLDQAIAGDNIG CLLRGVQRNEIERGQVLSAPGSIHPHTHFKGQVYVLKKEEGGRHTPFFNGYRPQFYFRT TDVTGTLTLPEGTEMCMPGDNVVMEIELITEIAIEEGLRFAIREGGRTVGSGVVTEIIE " /locus_tag="LOCUS_4390" /gene="tuf" /note="WP_009887863.1 elongation factor Tu (Clostridioides) [pid:77.7%, q_cov:100.0%, s_cov:100.0%, Eval:7.3e-178]" /note="MGA_622" CDS 2451..2936 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNISFDKAKEILGGFTAQAQDMLKDGSKVEAALEALEAKMKEIPT IGEGLSRLPLMISMIRAYITKEYTEVSPKVVASMLCAVLYLVKGRDLIRDDIPVVGLVD DIAVAGAAFMLSEKELDAYAAWREAKDCTVTAERALPQTEDVSEALEAQMDEIPTEA" /locus_tag="LOCUS_4400" /note="MGA_623" ORIGIN 1 cgtatactcc ggaacgctcg caagcggttc ctacgtgtac aatccgcgca aggacaggaa 61 ggagcgcata ggccgcatcc ttcagatgca cgccaatcac agggaagaca tagacatggt 121 ctattccggc gacatagccg cagccgtagg acttaaggac accaccacgg gcgacacgct 181 ctgcgacgag aagcatccca tagtcctgga atccatggaa ttcccggatc cggtaataca 241 gatagccatc gagcccaaga ccaaggccgg tcttgaaaag atgggcatcg ctctgtcgaa 301 gctggcggaa gaggatccta ctttcaggac ctggaccgac ccggacaccg gccagaccat 361 aatcgcaggc atgggagagc tccatctgga gatcatcgtg gacagactgt tccgcgagtt 421 caaggtggag gccaacgtcg gaaagccgca ggtatcctac aaggagacca taacccagga 481 gtctgtaagc gagtacaagt acgcgaagca gtcgggcggc cacggtcagt acggacacgt 541 aaagataagg ctctacccca gagaggcagg cgccggctac gagttcgtca acaagatcgt 601 gggcggagcc atccccaagg agttcatacc caagatcgac gaaggtatac gcgaagccat 661 gcagaacggt ccgctcgccg gttatcaggt ggtggacatg ggagtggaac tgttcgacgg 721 ttccttccac gaggtagact cgtccgagat ggcgttcaag atcgccgcgt ccatggcatt 781 ccgcgagggt gccagaaagg caaagcccat acttcttgag ccggtcttca aggtagaggt 841 caccgctccc gaaaactaca tgggagacgt aataggcgac atcagctcca gaagaggccg 901 catagaagga acggacatct tcaacggaat agcaagcgta cacgcaatgg tgccgctgtc 961 cgagatgttc ggctacgcca cggatctaag gtccaagacc cagggaagag gagcatacgt 1021 aatgcagatg gatcattttg aaaaattacc cgattccctg attgaaaaaa tcaacaaata 1081 aagtataatt aatgagttag tactaacatt cattttttgg aggaaaaaaa tggcaaaagc 1141 aaaattcgaa agaaccaagc cgcatgttaa catcggtacc attggtcaca tcgaccatgg 1201 taagaccacc ctcaccgcag cgatcaccaa ggtgctcgct accagatttc cgtccgctac 1261 caaccagatc gtagcattcg agaacatcga taaggctccg gaagaaagag aaagaggtat 1321 tacgatcaat accgctcacg tagaatacga gaccgcgcac agacactatg cgcacgttga 1381 ctgcccgggt cacgcagact atgttaagaa catgatcacc ggtgccgctc agatggacgg 1441 cgctatcctg gtagttggtg ctaccgatgg tccgatgccc cagaccagag agcacatcct 1501 gctgtcccgt caggtaggcg ttccctacat catcgtattc ctgaacaagt gcgacatggt 1561 cgacgacgaa gagctgctcg acctggtcga aatggaagtt cgcgaactgc tggacgaata 1621 cgaattcccc ggcgacgaca cccccatcat cagaggttcc gctctggaag ctctgcagca 1681 tcccgatggc ccctggggtg acaaggttat ggaactgctc gacgctgtcg acacctacat 1741 tcccgaaccc gaaagaaagt ccgacctgcc cttcctgatg cccgtagaag acgtcttctc 1801 catcaccggc cgcggcaccg ttgctaccgg tcgtgttgaa agaggcacca tcaaggttgg 1861 cgacaccgtt gagatcgttg gtctgaccga tgaaaagaga gctgtcgtcg ttaccggcgt 1921 tgaaatgttc cgtaagctgc tcgaccaggc tatcgctggc gacaacatcg gctgcctgct 1981 ccgtggtgtt cagagaaacg agatcgaaag aggtcaggtt ctctccgctc ccggcagcat 2041 tcatccccac acccacttca agggccaggt atacgttctg aagaaggaag aaggcggccg 2101 ccacactccg ttcttcaacg gttacagacc ccagttctac ttcagaacca ccgacgttac 2161 cggtactctg actctgcccg aaggcactga aatgtgcatg cctggcgaca acgtcgtcat 2221 ggagatcgag ctgatcaccg agatcgctat cgaagaaggt ctgcgtttcg ctattcgcga 2281 aggcggcaga accgttggtt ccggcgttgt taccgagatc atcgagtaat tcgaaataag 2341 tcactttaag agagctcttc ggagctctct tttttcgttg agccgctgag ttgaaaaccc 2401 gccgcttttt ttgtacaatc gtagcaggtt ttctagatag gaggcaaacc atgaacatca 2461 gctttgataa ggcaaaagaa attctgggcg ggttcaccgc acaggcacag gacatgctga 2521 aggacggcag caaagtggaa gctgctctgg aagcgctgga agccaagatg aaggagatcc 2581 cgacgatcgg cgaaggcctc tccagactgc ccctcatgat ctccatgatc cgggcataca 2641 ttacgaagga atacaccgag gtgtccccga aggtcgtcgc gtccatgctg tgcgcggtgc 2701 tgtacctggt gaagggcaga gaccttatcc gggacgacat ccccgtcgtg ggcctggtgg 2761 acgacatcgc cgtggcaggc gccgcgttta tgctgtccga gaaggaactg gacgcctacg 2821 ccgcatggcg cgaagccaaa gactgcactg tgaccgctga gagagcgctg ccgcagacag 2881 aggatgtgtc cgaggcgctc gaagcgcaga tggacgagat ccccacggaa gcgtagccgc 2941 acgcacagct acccgaagac // LOCUS sequence132 2951 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence132 VERSION sequence132 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2951 /mol_type="genomic DNA" /organism="" /note="sequence132" misc_feature <1..805 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_004081442.1:ABC transporter ATP-binding protein" /note="WP_004081442.1 ABC transporter ATP-binding protein (Thermotoga) [pid:57.9%, q_cov:97.4%, s_cov:78.1%, Eval:1.1e-82]" /note="MGA_624" /locus_tag="LOCUS_4410" CDS 795..1775 /product="dipeptide ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011172559.1" /transl_table=11 /codon_start=1 /translation="MESKVLVETKDLTKEFPTKSGSFGKNRATVHAVTDVNLQIFQGET LGVVGESGCGKSTLGRLIIRLLDPTRGQVFFEGKDLGKMSVEELRSQRKQMQMVFQDPY ASLNPRLRVRDLIAEPLITHKVNNTAKEDTDRVEDLMRKCGIRPEFMYRYPHQFSGGQR QRVSIARALALNPKLIICDEPVSALDVSIQSQILNLLGDLQQELGLTYVFISHDLSVVR YLSDRVCVMFLGKVCELGITRDIYANPLHPYTKFLLEAVPIPDPKYRKDQKDMLTGEIP SPVNPPSGCHFRTRCPYATERCAKEVPQLHEVEPGRTVACHLFDK" /locus_tag="LOCUS_4420" /EC_number="7.4.2.-" /note="WP_011172559.1 dipeptide ABC transporter ATP-binding protein (Thermus thermophilus) [pid:57.4%, q_cov:97.2%, s_cov:96.6%, Eval:3.7e-105]" /note="MGA_625" ORIGIN 1 cgggcgcgtc gtggacggcg agatcctgct gaagggcgaa aacctgctga agaaaacgcc 61 gcgccagatg tgcgacataa gaggcaacga gatctccatg atcttccagg agcccatgac 121 ctccctcaac ccggtgtaca ctatcggcaa gcaggtgatg gaggccgtgc gccagcacca 181 ggacgtaagc aaggaagaag cgaaaaagat cgccatcgac atctttaagc ggatcggtat 241 ccccgaaccg gaaaagcgct tctattccta tccccaccag ctgtccggcg gtctgcgcca 301 gagagtcatg atcggcatgg ccatggtatg caaccccgcg ctgatgatct gcgatgagcc 361 taccacggct ctggacgtca ccatcgaagc ccagatcctg tacctcatca aggagatgca 421 gaaagaaaag gggacggccg tcatcatgat cacccacaac ctgggcgtcg tggcggagtc 481 ctgcgactac gtctacgtga tgtatgcggg caagatcatg gaagaggcca gcgtctacga 541 gatcttcgag catccgaccc atccctatac ctacggtctt ctgaactcca ttcccaagac 601 caccgaggtg aaggaccatc tgtttacgat ccgcggcctc gtgcccaacc tgctgagcct 661 gcccaagggc tgccggttct gcacccgctg cgacaaagcc atgaagatct gcacggaata 721 cgaaccggat ctgtacgata tcggagacgg acataaagtc cgctgcttcc tggcgaacaa 781 ggaggtgatg gcgagtggaa agtaaagtat tggtcgaaac caaagatctg accaaggaat 841 tccccacgaa atccggatcc ttcggtaaga accgggcgac agtccacgcc gttacggacg 901 tcaaccttca gatcttccag ggcgagactc tgggcgtcgt aggcgaatcc ggctgcggca 961 agtccacctt ggggcggctc atcatccgcc tgctggaccc caccagaggc caggtgttct 1021 ttgaaggcaa agacctcggc aagatgagcg tcgaagaact gcgttcccag cgcaagcaga 1081 tgcagatggt cttccaggat ccgtatgcat ccctgaatcc ccgtctgcgg gtgcgcgacc 1141 tgatcgcaga acccctcatt acccataagg taaacaatac ggcaaaggaa gacaccgacc 1201 gggtcgaaga cctgatgcgc aagtgcggca tccgtccgga attcatgtac cggtatccgc 1261 accagttttc cggcggtcag cggcagcgcg tcagcatcgc cagagccctg gcgctcaacc 1321 cgaagctcat catctgcgac gagccggtct ccgcgctgga cgtctccatc cagtcccaga 1381 tcctcaacct gctgggcgac ctgcagcagg agctgggcct cacgtacgtc ttcatctctc 1441 acgacctgtc cgtggtgcgc tacctgtccg accgggtgtg cgtcatgttc ctgggcaagg 1501 tgtgcgagct gggcatcacg agagacatct acgcgaaccc gctgcacccc tacacgaaat 1561 tcctgctgga agccgtgccc atccccgatc cgaagtacag aaaggatcag aaggacatgc 1621 tcacaggcga gatcccgtct cccgtcaacc cgcccagcgg ctgccatttc cgcacccgct 1681 gcccgtatgc gacggagcgc tgcgcgaagg aagtgcccca gctgcacgaa gtggaaccgg 1741 gacgcaccgt ggcctgccat ctgttcgata agtgatactg tggaaaacga agccgctcct 1801 ttccgggagc ggcttttata tgataaaata aaaagaacat acccgttttt taggagaata 1861 cccatggatt taaaagaact tatcaaaatc gacccggtca tagcggatct tgccgaagcg 1921 aaggaagtct gctggatcaa tccgaagaag atcccctttg ccgaggcaaa ggataagctg 1981 gtcttcggcc ccgaagatat tgcggaagca tccgcccgcc tgcagcgctt tgcgcctctg 2041 ctggcgaaga tctttccgga gacggcggag cagggcggca tcatcgaatc tcctctgacg 2101 gagatccccg acatgaagga tctgttaaag gagaagtacg gcgcggacct gggatctgcg 2161 aggctgttct taaagcggga ttccgatctg gcggtggccg gttccgtcaa agcaaggggc 2221 ggcttccacg acgtgctgaa gcatacggag gacctggcgc tggaggcggg catcttctcc 2281 tcgcgggagg atgacccgat gaagctcctg cagccggaag cgatcgcctt ctttaaaaat 2341 cataaggtgc aggtggcttc caccggcaat ctgggcgtct ctatcggcat gatgagcgca 2401 cacctgggct accaggccat cgtgcacatg tcggcggacg cgaagcagtg gaaaaaggat 2461 tacctgcggg cccacggggt gaccgtcatc gaatacgcag gcgactacgg caaggccatt 2521 acggaaggcc gtgcgatctc cgatgcggat ccggacagct atttcgtgga cgacgaaaac 2581 tccaaggagc tgtttatggg ctatgccgtg gccgcggaac ggctgcagaa gcagctggcg 2641 gatgaagggg tcaccgtgga cgaagcacac cccctgttcg taacgatccc ctgcggcgtg 2701 ggcggcgccc cgggcggcgt ggccttcgga ttaaagcaga tctacggcga caatgtgcat 2761 gtgctgttcg cagagcccgt ccaggcctgc tgcatggtgc tgggcatggc gacggggctg 2821 cacaatcaga tctgcgtgca ggacatcggc ctttccggta agactcatgc agacggcctg 2881 gcggtgggca gggcttccag cctggtagga aagatcatgg aaccgctgct gaccgctgag 2941 gttacgctgg a // LOCUS sequence133 2915 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence133 VERSION sequence133 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2915 /mol_type="genomic DNA" /organism="" /note="sequence133" CDS 1845..2318 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKKEAKTKKDRSIQPALTGVICFALIVIIAISIPLYRHRQYVKF TSELSSLTTRAGGKGAVTCEMDGGTSNVSPDAAYEIYAKLIFSELKKHVKPDPALAESG LRLSYGLLGGELTLAPAEYQGEEALYVEFHSRDMDYTYLAPHLRYKDFEMLVR" /locus_tag="LOCUS_4430" /note="MGA_628" CDS 2370..2780 /product="ASCH domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002354908.1" /transl_table=11 /codon_start=1 /translation="MKLDGLEKWHFELTEKACNELLDLVLQGKKRATSSSLASFRAEGT AVPEEGELSVITDWDGHPCCVIRTTKVRVIPYKDIPFGLARLEGEDDTLASWRKNHEAF FREEGKSLGYSFSEDMEIVFEEFEVVETIKPK" /locus_tag="LOCUS_4440" /note="WP_002354908.1 ASCH domain-containing protein (Enterococcus) [pid:36.1%, q_cov:86.8%, s_cov:76.3%, Eval:4.5e-14]" /note="MGA_629" ORIGIN 1 acgaccatct tgtcgatctt ggcctgggtc tccggggagc aggccagggt ggtgtcgccg 61 cccagatact ggttggtgac ggtctccatg gccaccatgc cgaattcgcc catgccgtaa 121 cgggtgatca tagcccgggc cagcttcgta gcctgttcga tatcgttgga agcgccggtg 181 gtgatggacc cgaagatgag ttcctccgca gcccggccgc ctgtcagcgt cgcgatcttg 241 ttctgcagct cttccttgct catcaggtag tgctcgccct cgtccacctg catggtgtag 301 cccagggcgc cggacgttct cggaatgatg gtgatcttct gcaccggtgc ggaatgggtc 361 tgcatggccg ccaccagtgc gtgacccact tcgtgatagg ccacgatgct cttctccttg 421 tcggagagga tggcgttctt cttctgatag ccggcgatga cgacttcgat gctttcctcg 481 aaatctctct ggctggccat cttgcggccg tcccggacag cccgcagcgc cgcttcgttt 541 acgatgttgg ccagctctgc gccggaggca cctgacgcca tgcgggcgat cttaccgtag 601 tcgatattgg gttcggtctt caacttcttg gcgtggacct tcagaatggc ttctcttccc 661 tttaagtcgg gcagttccac gggcacgcgg cggtcgaatc tgcccggtct ggtgagggcc 721 ggatccagag attcgggccg gttggtggcc gccaggatga tgaccccggt attgccttcg 781 aaaccgtcca tctcggtcag aagctggttg agcgtctgct ctctttcgtc gttgccgccg 841 atgttgccgc cgtttctctt ctggccgatg gcatcgatct cgtcgataaa gacgatacag 901 ggggcctttt ctttggcctg cttaaacagg tcgcgcacct tggatgcgcc cataccgacg 961 aacatctcca cgaattcgga gccgctcatg gagaagaacg gcacgttggc ttcgcctgcc 1021 acggcctttg ccagcatggt cttaccggtt cccggaggac ccaccagcag cacgcccttc 1081 ggcatggaag cgccgatctc ggaatacttg gaggggttgc ccaagtaatc cacgatctcc 1141 tttaaatttt cttcggcttc atccacgccc tccacgtcgg agaaatggat gccgtcggag 1201 gattttacgt agatcttcgc gttgctcttg cccaggttga acatcatgga accggggccg 1261 ccggccttgt ccatcatctt tctggacagg tactggccga ggaagataaa gatgaagatc 1321 ggcaggatcc aggtgagcag aaaactggtg aagggcgacg cctgttccac gatctggctc 1381 gtaaactccg cgccggattc gtgcaggcgc tgcaccagcc ccggatcgtc catgatgccg 1441 gtgcggtaga tctgcggggg atccgccttg tctgtaaaga ggatcatgtt ggagcggact 1501 tccacctctc cgatctgttt tttctccgtc atggtcatga aggtgccgta gtccacctcc 1561 tggatctgct gctttgccag ggacggcagc accagagtgt tgaacaccag catcaggatc 1621 agcatgacga tatagaagat cagcatgggt cttctcggtt gtttgacttc gttcatattg 1681 tctcctttat ataaaaagtg gatcgtctta aatactaacg gtattatggc acaggtttta 1741 gcactcgtca acagagagtg ctaaagttcc gcacattgcc cttggtctgc cccgtatcta 1801 tgctataatg gaacggaggg gtgacccccg gaaaggttgg aatgatgaat aaaaaggaag 1861 cgaaaacgaa aaaagaccgc agcatacagc ctgctctgac aggggtcatc tgttttgcgc 1921 tgatcgtgat catcgccatc tccatccccc tgtaccggca ccggcagtac gtaaaattca 1981 cctcggagct ctccagtctg acgacccgcg ccggcggcaa gggcgccgtc acctgcgaga 2041 tggacggagg gacctccaac gtttcccccg acgccgccta cgagatctac gccaaactca 2101 tcttttccga gctgaagaag cacgtaaaac cggacccggc gctggcagag agcgggctgc 2161 gcctctccta cggactgctg ggcggggaac tcaccctggc gcctgcggag tatcagggcg 2221 aggaagcgct ctacgtggaa ttccatagcc gggacatgga ttatacctat cttgcgcccc 2281 acctgcggta taaggatttt gaaatgttgg tgagataggc atcatagccg tatacgaatt 2341 gtgagcgaag cactgtggag atttaggtga tgaaactgga cggtttggaa aagtggcact 2401 ttgagcttac ggaaaaagcc tgcaacgaat tgctggatct ggtcctgcaa ggcaaaaagc 2461 gggcaacctc gagcagcctg gcaagcttcc gggccgaagg cacggcagta ccggaagaag 2521 gagaactgag cgtgatcaca gactgggacg gacatccctg ctgtgtcatc cggacaacaa 2581 aggtccgggt gatcccatac aaggatatcc cctttggcct ggcacgcctc gaaggagaag 2641 acgataccct cgcctcgtgg cggaagaatc acgaagcctt ttttcgggaa gaaggaaagt 2701 ccttggggta ttcgttttct gaggacatgg agatagtctt cgaagagttt gaagtcgtag 2761 aaacgataaa acctaaataa atggatcgat ccgctgcgca ctgcgcaagg atcgatcctt 2821 ttttaatcct gcgtattgta gaccttggag atctcctccc ggttgccgcc gataaagatg 2881 agggcggccg ccaggcacac gaggttgacg gacat // LOCUS sequence134 2911 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence134 VERSION sequence134 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2911 /mol_type="genomic DNA" /organism="" /note="sequence134" CDS 3..776 /product="RluA family pseudouridine synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_071542473.1" /transl_table=11 /codon_start=1 /translation="MLSKKEKLKEGSEVRIELPPAVPCEAVPQDIPLDIVYEDAHLVVV NKPKGMVVHPAPGNPDGTLVNGLLYHCGALSLINGVERPGIVHRIDKDTSGLLVCAKSD EAHRGLTEQLASHSCTRQYRGVAFYAFKEAAGTVDAPIGRDPSNRLRMAVVPGGKRAVT HWQVSEEFNGFTEIRARLETGRTHQIRVHMASIHHPLLGDTVYGPQKQPYSLHGQMLHA EILGFTHPVTGQYMEFRADPPEEYLQTLEKLRNRK" /locus_tag="LOCUS_4450" /note="WP_071542473.1 RluA family pseudouridine synthase (Moorella thermoacetica) [pid:58.7%, q_cov:97.7%, s_cov:82.4%, Eval:2.4e-79]" /note="MGA_630" CDS 773..1459 /product="flavin reductase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011017175.1" /transl_table=11 /codon_start=1 /translation="MKRTLKPGTMLYPLPAVLVTGGDMENSTLMTAAWTGIVNSDPPMT YVSIRPERYSYDIIRERGEFVINLTTRQLVRETDYAGCVSMRKEDKFKKLGLTKEAADE VAAPLIAQCPVNLECKVVEVKDLGSHSMFLANIVAVHVDEKLFDKNDRICLENADLLAY IHGGYLPLGSKKLGTFGYSVMKPKTKKKKAAESRQASLMKAKAKGNTPAKKKSIFTGKS KLVSKE" /locus_tag="LOCUS_4460" /note="WP_011017175.1 flavin reductase family protein (Fusobacterium nucleatum) [pid:44.9%, q_cov:86.4%, s_cov:98.5%, Eval:1.2e-44]" /note="MGA_631" misc_feature complement(1619..>2911) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010965410.1:NFACT RNA binding domain-containing protein" /note="WP_010965410.1 NFACT RNA binding domain-containing protein (Clostridium) [pid:33.1%, q_cov:99.3%, s_cov:78.6%, Eval:2.0e-64]" /note="MGA_632" /locus_tag="LOCUS_4470" ORIGIN 1 ccatgctctc gaaaaaggaa aagctgaaag agggcagcga agtccggatc gaactgccgc 61 ctgccgttcc ctgcgaagct gtgccccagg acattccgct ggatatcgtc tatgaggatg 121 cgcatctggt ggtggtcaac aagccgaagg ggatggtggt gcatcctgcg ccgggcaacc 181 cggacggcac cctcgtcaac gggctgctgt atcactgcgg cgcgctgtcg ctcatcaacg 241 gtgtcgaacg gccgggcatc gtccaccgca tcgacaagga tacgtccggt cttctggtct 301 gcgccaaatc cgacgaagcg caccgggggc ttacggaaca gctggcgtcc cattcctgca 361 cgcggcaata ccggggcgtc gcgttctacg cctttaagga ggcggccggc acggtggacg 421 cgccgatcgg gcgtgaccct tccaaccgcc tgcgcatggc ggtcgttccg ggcggaaaaa 481 gagccgtaac gcactggcag gtctcggagg aattcaacgg atttacggaa atcagggcgc 541 gcctggagac gggccgcacc catcagatcc gcgttcatat ggcttccatc catcatccgc 601 tgctgggcga cacggtctac gggccgcaga agcagcccta cagcctgcac ggccagatgc 661 tgcacgcgga gatcctggga tttacgcatc ctgttacggg acaatacatg gaattccggg 721 cggatccccc ggaggaatat ctgcagactt tggagaaact gaggaacaga aaatgaagag 781 aacgttaaaa ccgggcacga tgctctatcc gcttcccgcg gtcctcgtga cgggcggcga 841 catggaaaac agcacgctca tgacggctgc ctggacaggc atcgtcaatt ccgatcctcc 901 gatgacctac gtatcgatcc ggccggaacg gtacagctac gatatcatcc gggaaagagg 961 ggagttcgtc atcaatctga cgacccggca gctggtccgg gagacggatt atgcaggctg 1021 cgtctccatg cgtaaagagg ataagtttaa gaaactgggc ctgacgaagg aggctgcaga 1081 cgaggtcgcg gcgcctctga tcgcgcagtg cccggtcaac ctggaatgca aagtcgtgga 1141 agtgaaggat ctgggcagcc attccatgtt cctggcgaat atcgtcgcgg tccacgtgga 1201 cgaaaaactg ttcgacaaga acgaccggat ctgcctggaa aatgcggatc tgctggcata 1261 tatccacggc ggttatctgc ctctgggctc gaagaaactg ggcaccttcg gctattccgt 1321 catgaagccg aaaacgaaga aaaagaaagc agctgaaagc aggcaggcct ctctaatgaa 1381 ggcgaaagcg aaggggaata cccccgcgaa aaagaagagc atctttaccg gtaaaagcaa 1441 actggtatcg aaggaatagc aaaaagccgc ctccggtggg gcggcttttc ccatgtttac 1501 agatctcttc tcggcgcggg agcatacctc atttctgcaa gatttaccgg aatctgttgg 1561 taataattgt aatagcagaa aatggaaacg tcaagagatt tctgtaaaat attactaatt 1621 attttttcat ggtctccgga tcttccgggt cgacccatac ggtacggttg ttcgtgaaga 1681 tcaccatgcc gggcttggct ccggaaggct tctttacata ccgcaggggc acgtagtcca 1741 caggcacgtt ctgggactct tttcccttgg aataccaggc cgcgacggct gccgcttcgt 1801 agatctcgtc ctcgcccggc gtatcgccgt tcataaacag gacaacgtgg gatccgtgga 1861 tgtccttggt gtgcagccaa tagtccgtct tgccgcccac tttgaaggtg atatagtcgt 1921 tctcggcgtt gttccttccc acggcgatct cccggccaca gggcagggta aagcgtctgg 1981 gcttcggttt cgctttcgcg gctgcccgtt ttctgtcctt tgcctgccgg ccccgcagat 2041 agccttcccg gatgagttcg tcccggatca gctccatctc ctcgtaggtg gacgaaagag 2101 agatctggtc ctgcacggtg ctcaggtatt caatgtcctt ctcgcactcc tccagctgga 2161 tgagcttttc ttttttcccg gtctttgcct tcgcatattt cttaaaatag ttctgggcgt 2221 tgcgggccgg ggagaagcgt tcgtcgagct cgatggtaac gggctggccg tcgtagtagc 2281 tcgttacggt gacccgttta tcgccggttt tcgccaggtg aaggttcgcg ttgagcaatt 2341 cccccttcag gcggtaaatg tccgcgtttt cggccttctg gatgtcttcc agcagccttt 2401 gtttcttgag gaggagctta tccaccagcg tggagacgct cttggcaaaa ccttcgctct 2461 tctgcatcac gcggttcgtc tctttgcggt gcgaataaaa gaaatccaga gcgtcgccaa 2521 tctcgtcgaa gggtttgact tcgcagacct ccgccaattt cttcatgggg aagatgtgca 2581 cgtctctcgg ctttccgttt gggtcacaat agacagccgg atacagcctg cccgccagca 2641 cgtcgtcccg gacgcggaag agagaaggta tatcgtcttc gaattccgcg gcagcagcgg 2701 cgctcagtcc ctggatctgt gcagggtccg tcacatcttc cggctttgcg gtccagagat 2761 cttgtctgtc ctggggcggg ggagagacgt agggcatgcc cggcaggatc tggcggtagc 2821 ggttgacgtc gatggagatg cgcttgatcg catcgatgat ctttccgctc gcctcatccg 2881 tcaggatcag gttgctgtgc ttgcccatga g // LOCUS sequence135 2911 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence135 VERSION sequence135 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2911 /mol_type="genomic DNA" /organism="" /note="sequence135" CDS 414..1094 /product="class II aldolase/adducin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004453954.1" /transl_table=11 /codon_start=1 /translation="MFEETKRQIIKAGMSLDRYGLIALSGGNVSVRMPSGEILVTPSGM IYEDLVEDDILVMDLQGKIIEGTRKPSSDTEAILYIFREMPEVTAVIHTHQPYATAIGL VQDEFEVNLTTLANATAGPVRVSPYSSAGSIDMGIDTVKYIGDSLAIIMAHHGVMTVGK DKGLKQALYAAVYLEEAAKCYLAAKACGEMKQMTPEQIQQSIEVFKYYGQGTPTIPKDL VKRV" /locus_tag="LOCUS_4480" /note="WP_004453954.1 class II aldolase/adducin family protein (Clostridioides difficile) [pid:38.1%, q_cov:94.2%, s_cov:98.6%, Eval:1.7e-35]" /note="MGA_634" CDS 1136..1840 /product="response regulator YycF" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000722052.1" /transl_table=11 /codon_start=1 /translation="MTENGRKILIIEDEKPISDIIKFNLTKEGYEVETAYDGQEGLDKA LSCGCDLVLLDIMLPIMSGFEVCKKIREHSEIPIIMLTAKEEEADKVLGLELGADDYIT KPFGMRELLARIKANLRRTEFLEGKAEEPADIQEFGKLQIDMNRYEVRKDGQPLDLTLR EFELLKYLATRDDKVFSREQLLEDVWGYEYYGDIRTVDVTVRRLREKLEDDPGDPKYII TKRGIGYYFSKQ" /locus_tag="LOCUS_4490" /gene="yycF" /note="WP_000722052.1 response regulator YycF (Streptococcus) [pid:61.5%, q_cov:96.2%, s_cov:97.5%, Eval:7.5e-74]" /note="MGA_635" ORIGIN 1 ctcaaggcgg tcaaggtgct gcagaaccac ggcgtatccg tgcagatgct gtccgtttcc 61 accctcaagc ccttcaccga tccccaggtc gtagatgcct taaagaaggt gaagtacggt 121 gccgttacct acgagaacca caacatcatc ggcggtctgg gcacctgcgt ggcggaagtc 181 atggcggaga acggcatcgg taagccgctc atcaaggtcg gcgtaaacga tctgtacacc 241 cacggcgcat ccaagatgtt cctgctcaag aagtacgatg tagacgccat gagctgcatc 301 aaggccgtcg aaaagctcat cggaaaagac cttggcatcg acgagtccga gatcgaggct 361 gtccgcttcg aagatttcaa cggcgtagca taagtttttc aaggagatca tcaatgttcg 421 aagaaaccaa aagacaaatc atcaaagcag gcatgagcct ggaccgttat ggcctgatcg 481 ctctctccgg cggcaacgta tccgtacgca tgccctccgg cgagatcctc gttaccccct 541 ccggcatgat ctatgaagat ctggtggaag acgacatcct cgtcatggac ctgcagggca 601 agatcatcga aggcacccgc aaacccagct ccgacaccga agccatcctc tacatcttcc 661 gggagatgcc cgaggtcacc gcggtcatcc atacccacca gccctacgcc accgccatcg 721 gcctcgtgca ggatgaattc gaagtcaacc tcacgaccct ggccaacgct acggccggcc 781 cggtccgcgt ttctccctac agctccgccg gttccatcga catgggcatc gacaccgtca 841 agtacatcgg cgattccctg gccatcatca tggcccacca cggcgtcatg actgtcggca 901 aggacaaggg actcaagcag gcgctgtacg ccgccgtcta tctggaagag gccgccaagt 961 gctacctggc tgccaaggcc tgcggcgaga tgaagcagat gaccccggag cagatccagc 1021 agtccatcga agtcttcaag tactacggcc agggcacccc gaccattccc aaggatctgg 1081 tcaagagagt ctaaggacgg taaaataata cgtatttcta caggaggcgt cagagatgac 1141 cgaaaacggc agaaagatcc tcatcatcga ggacgaaaag cccatatccg acattatcaa 1201 attcaacctt acgaaggaag gctatgaagt agaaacagcg tacgacggcc aggagggcct 1261 ggacaaggcc ctctcctgcg gctgcgatct cgtgctgctc gacatcatgc ttcccatcat 1321 gagcggtttc gaagtatgca agaagatccg cgaacacagc gagatcccca tcatcatgct 1381 caccgcaaag gaggaggaag ccgataaggt gctcggtctg gagctcggcg cggacgatta 1441 cattacgaag cccttcggca tgcgggagct gctggcgcgg atcaaggcca acctgcggcg 1501 cacggagttc ctggaaggca aggcggagga acccgccgac atccaggagt tcggcaagct 1561 gcagatcgac atgaaccgct acgaagtccg caaggacggc cagccgctgg accttaccct 1621 ccgggaattc gagctgctga aatatctggc gacgagagat gacaaagtct tttccagaga 1681 gcagctgctg gaggacgtct ggggctacga gtactacggc gacatccgga cggtggacgt 1741 tacggtgcgc cgtctgcggg agaaactgga ggacgacccc ggcgatccca agtacatcat 1801 tacgaaacgc ggcatcggct actatttcag caagcaatag ggatcggtcc tgggcagtat 1861 gaatattttc agacgcggca gcgtacgctg gaggatagcg ctcatctact ttatgctgtt 1921 cttcgcggtg ctttccctcg tatccgtgtt cctcgtgaac cgcatcgagc agtaccagct 1981 gtcttcgcta aaagagaata tcgctaagac catcagcgaa agcaatctcc cgtcctatct 2041 gggagcctac gattcgctgt cttcccatgg ggaagagatc caggctgtgc tggattccag 2101 ctggagcagc ttttcggaag aattatccgt ggtggacgag cggatgcaga tctgcgcgtc 2161 caccaattcc aatctggtag gcaggtccgc tgcggacgtg ttcgacgcgt ccatcatcgc 2221 gtcctgcctg cttacgggag attccggcga gtccgattcc gtgctctccg gcggcatccc 2281 cgtcaaaaat ctgtgctacg gcatagagaa tgcgaaagat cccggcgtca tctacgtgcg 2341 ggccgacctt tcgagcatca acgccttcgt gtcgcagagc aaactcatct ttatccgggt 2401 catcctcatc gcgttgctgg cgaccgtcgt gctgggcttc gccctggcgg gcagcattac 2461 gaaacccatc aacgacgtaa cggacacggt cttaaagatg tcggccggcg atttttcgga 2521 aggcgttcag gtaaacagcg acgacgagat cgggcagttg ggagagatgt tcaacctgat 2581 gcgggagaag ctttccgaca cgctgtccga gatcacggga gagaagaaca agctttccac 2641 tatcctggag tacatggcgg acggcctggt ggccatcgac ctgcagggcg gcatcatcca 2701 cgtcaatccg gcagcccggg ccatcctggg cctggatccg gcggatccgc tgcccaaaga 2761 ttacgacgcg ctgatgggtc acatctccga caacatcagc ctgtcgcgca tcaagggcaa 2821 ctgcgagatc cacggcgccc aggacatctt ctcctacggc agcagcatct tcgcgatcca 2881 ctacgaccgg tttaaggacg aagacggcga g // LOCUS sequence136 2902 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence136 VERSION sequence136 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2902 /mol_type="genomic DNA" /organism="" /note="sequence136" tRNA 54..140 /product="tRNA-Leu" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0080" /note="Aragorn_8" CDS complement(248..445) /product="DNA-directed RNA polymerase subunit omega" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005811864.1" /transl_table=11 /codon_start=1 /translation="MLLYPSVDLLKTKVDSKYTLVIMAAKRARDLIDGKPMLINVDSNK PISIATAEIADDLISYKREE" /locus_tag="LOCUS_4500" /gene="rpoZ" /EC_number="2.7.7.6" /note="WP_005811864.1 DNA-directed RNA polymerase subunit omega (Desulfitobacterium) [pid:54.9%, q_cov:78.5%, s_cov:75.0%, Eval:2.2e-08]" /note="MGA_637" CDS complement(446..1054) /product="guanylate kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003388624.1" /transl_table=11 /codon_start=1 /translation="MKHGKLFVFSGPSASGKGTICRELLKEPDTWLSVSLTTRQPREGE LHGVHYYFVTREEYDRTVEEDGFLEHAEIYGNCYGTPKKYALEHMAAGEDVILEIEMQG ALQIKKAYPEAVLIFVLPPSLKELRNRIRKRGTENEEQIAVRMKTTLEEIGLLEKYDYF LINDDLEEAIQTARAIMKAEHCRTAGQAKALIERFKEEE" /locus_tag="LOCUS_4510" /gene="gmk" /EC_number="2.7.4.8" /note="WP_003388624.1 guanylate kinase (Clostridium) [pid:50.5%, q_cov:99.0%, s_cov:95.2%, Eval:9.1e-56]" /note="MGA_638" CDS complement(1111..1998) /product="YicC family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003416240.1" /transl_table=11 /codon_start=1 /translation="MAKSMTGFGRGVYTDELRSVTVELRSVNHRYSDITVKMPRRYQFA EDTIKNIVKGVAPRGKIDVFVNVDNIAADDTAVELNIPLAKRYFETLQTIKAELPQLSG EPTLAMVANFPDVVKSAAAEEDEELVLKALTEATKEAAANLDAMRIVEGAKLMEDILQR GQLIEQTVCGIEVYAPEVAKNYAAKMKERIQELLGDEATIPEDRIVLEAAVFADKSNIT EEMVRLKSHCSQLKSIAADTSGPIGKKLDFLVQEMNRESNTIGSKANDIRITNDVLLLK AEIEKIREQVQNIE" /locus_tag="LOCUS_4520" /note="WP_003416240.1 YicC family protein (Clostridioides difficile) [pid:46.3%, q_cov:100.0%, s_cov:100.0%, Eval:2.4e-68]" /note="MGA_639" ORIGIN 1 caattttata cccttgtttt tcggtccaaa aaatggtacc ataatcgggt aatgccggcg 61 tgatggaatt ggcagacgta cgggactcaa aatcccgcgg tggcgacacc gtgcgggttc 121 gacccccgcc gccggcacca gcaaacggaa aaggtccttc agggcctttt ttgtttgctc 181 cgttctatcg cggtgggtcg aaatccaatg aaaaacggat cctgcgggac ccgttttttc 241 ttttctttta ctcttccctc ttgtaggaga tcagatcgtc tgcgatctcg gccgttgcga 301 tggagatggg cttgttgctg tccacgttga tgagcatcgg cttgccgtcg atgagatctc 361 tggcgcgctt cgccgccatg atcaccaggg tgtatttgct gtcgaccttc gtcttgagca 421 ggtctacgga cggatataat agcatctatt cttcctcctt gaaacgttcg atcagggcct 481 ttgcctgccc tgctgtcctg cagtgttccg ctttcatgat ggctctcgcc gtctggatcg 541 cttcctccag atcgtcgttg atcaggaagt aatcgtattt ttccagcagg ccgatctcct 601 ccagcgtcgt cttcatgcgg accgcgatct gttcttcatt ttcggtgccg cgcttgcgga 661 tccggttccg cagttctttt aaactgggcg gaagcacaaa gatgagcacg gcctcgggat 721 atgccttctt gatctgaagg gcgccctgca tctcgatctc caggatgacg tcttcccctg 781 ccgccatatg ctccagcgca tattttttcg gcgtgccgta gcagttgccg tagatctcgg 841 catgttcgag aaaaccatcc tcttccaccg ttctgtcgta ttcttcccgg gtcacaaaat 901 aatagtgcac gccgtgaagt tccccttccc ggggctgccg ggtcgtgagg gagacggaca 961 gccaggtatc cggttctttc agcagttctc tgcagatcgt tcctttcccg gaagcggaag 1021 gcccggagaa aacgaataat ttaccgtgct tcataatcag tcctcattga aacaattaat 1081 aatataactt tttatccgcc ttttcaagtc ttattcgata ttctggacct gttcccggat 1141 cttttcgatc tccgctttca gcagcagcac gtcgttcgtg atccgtatat cgttggcctt 1201 cgaaccgatg gtgttggatt cgcggttcat ctcctgtacg aggaaatcca gtttcttgcc 1261 gatgggaccg gacgtatccg ccgcgatgct cttcagttgg ctgcagtggc tcttgagccg 1321 caccatctct tccgtaatgt tggatttgtc cgcaaagacc gcggcttcca gcacgatgcg 1381 gtcctccggg atcgtcgcct cgtctcccag cagttcctgg atgcgttctt tcatctttgc 1441 cgcatagttc ttggcgactt ccggcgcata gacttcgatg ccgcagaccg tctgttcgat 1501 cagctgtccc cgctgcagga tatcctccat gagcttggcg ccttccacga tgcgcatggc 1561 atccaggttg gctgccgcct ccttcgtggc ttccgtaagc gctttcagaa ccagttcctc 1621 gtcttcctcg gcagcagccg acttcacgac gtccggaaag ttcgcgacca tggccagggt 1681 cggttcgccg ctgagctgcg gcagttccgc tttaatggtc tgcagcgtct cgaaataccg 1741 cttcgccaac gggatgttga gttccaccgc cgtatcgtcc gccgcgatat tgtccacgtt 1801 gacgaatacg tcgatcttgc ctctgggcgc cacgcccttc acgatgttct tgatggtatc 1861 ttcggcaaac tgatacctgc ggggcatctt gaccgtgata tcggagtacc ggtgattgac 1921 cgaccgtagc tccacggtga cactgcgcag ctcgtccgta tagacgcctc tgccgaagcc 1981 tgtcatactt tttgccatat tctcctcttt tccaacacgc gatttgtttg ggctattcct 2041 tcgatccgtg ttattatgga tacgatttta gcataaataa cacaaaggat aaagaacaca 2101 catggcatat gatggatttc ttgcaggcgc agttgcccgg cagctggaca gcgaactgca 2161 aggtgcgaaa atagaacggg tgcagcagcc cgaaccggat gagatcgtgc tgcagatcta 2221 cagtcctgct acgggtcagc gcaaaaaact gctcctctgc acagcgcctc agggcgcccg 2281 ggtgcactac acgaagctgg cgtacgaaaa cccgcaggac gccccgaatt tctgcatgct 2341 gctgcgcaag cacctgcagg ggggccgcat cctggcggtg acccagccag ccacagaacg 2401 tatcctggaa ttccacctgg aaacgataaa cgaaatgggg tattccgtta acaaactgct 2461 gatctgcgag ctcatgggca agcacagcaa cctgatcctg acggatgagg cgagcggaaa 2521 gatcatcgat gcgatcaagc gcatctccat cgacgtcaac cgctaccgcc agatcctgcc 2581 gggcatgcct tacgtctctc ccccgcccca ggacagacag gatctctgga ccgcaaagcc 2641 ggaggacgtg acagaccctg cacagatcca gggactgagc gccgctgctg ccgcggaatt 2701 cgaagacgac atgccttctc tcttccgcgt ccgggacgac gtgctggcgg gcaggctgta 2761 tccggctgtc tattgtgacc cgaacggaaa gccgagagac gtgcacatct tccccatgaa 2821 gaaattggcg gaggtctgcg aagtcaaacc cttcgacgag atcggcgacg ctctggattt 2881 cttttattcg caccgcaaag ag // LOCUS sequence137 2889 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence137 VERSION sequence137 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2889 /mol_type="genomic DNA" /organism="" /note="sequence137" CDS 260..1534 /product="diaminopimelate decarboxylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011020771.1" /transl_table=11 /codon_start=1 /translation="MEKRPFVTKEQIEEIVKTYPTPFHLYDEKGLRENCERIKRAFAWN PGYREFFAVKACPNPSIMAILKDYGFGCDCASRAELTFAKAMDLPGDKIMFTSNVTPAS EFQYAAKIGAIINFDDISHIDFCEKAIGKLPETVSVRYNPGGSFTINTAIMDNPGEAKY GFTTEQMFEGMRLLKEKGVKHCGIHAFLASNTVTNDYYPTLAGELFELAVKLRDETGMD IPFVNLSGGVGIAYRPDQTPNDIEIIGAKVHEVYDRIFGPAGMTNVAIYTEMGRFVTGP YDLLIGQVLHIKHTHKEFVGLDACCVDLMRPAMYGAYHHVTVLGKEDEPCDHKYDITGS LCESNDRFAIDRMLPGIEVGDYIAIHDAGAHGHSMGSNYNGKLRHAELLLKEDGSVVQI RRAETLADYFKTLDDTEFYKKLDLE" /locus_tag="LOCUS_4530" /gene="lysA" /EC_number="4.1.1.20" /note="WP_011020771.1 diaminopimelate decarboxylase (Methanosarcina acetivorans) [pid:58.9%, q_cov:96.5%, s_cov:96.7%, Eval:2.1e-138]" /note="MGA_642" CDS 1550..2431 /product="2-hydroxy-3-oxopropionate reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861698.1" /transl_table=11 /codon_start=1 /translation="MTGFIGLGIMGKPMAKHLLAKLGELAVYDLQEGPVKELTDLGAVY NTPAEMAKDCEAIHCILPTEAIVQEVLFGEGGVLENAGALRYVCDHSSVTPGESRDCAE KLAAKNIGFVDCPVSGGEPKAIDGTLAFMAGGSQADFEALKPHFLAMGSSAVLVGDVGS GSIAKLVNQVIVNLNIAAVSEAFVLCEKAGADPRKVYDAIRGGLAGSTVLDAKIPKILA GDFAPGGTIKVNRKDINNVLSTAHACECPMPLSSQLFEIMQYLSAHGHLMDDHGGIVQY FEDLAGVQVREH" /locus_tag="LOCUS_4540" /gene="garR" /EC_number="1.1.1.60" /note="WP_011861698.1 2-hydroxy-3-oxopropionate reductase (Clostridioides difficile) [pid:60.1%, q_cov:99.3%, s_cov:98.3%, Eval:7.2e-94]" /note="MGA_643" ORIGIN 1 ccgaaagcgg cgtatataag gttcacgagc ccgttatgat caacggcttc gcctttacgc 61 tcaacaagga gaacgtaacg gatgaggaga tccacgcgct ggagagagcc attcgcgccg 121 aaggtacgac ttacctcaat ccgtccggcg tatgcggcgt gcctcatctg cgctgcagcc 181 tgtccaactg gtccatcgaa gaggcggacg tggagaaggt cgctgctgcg gtcatcgccg 241 tgggaaagga gttcctgtaa tggaaaagag acctttcgtt acgaaagaac agatcgaaga 301 gatcgttaag acatacccga cgccttttca tctctacgat gagaaggggc tgcgggaaaa 361 ctgcgagcga atcaaaaggg cgtttgcctg gaatccgggg taccgggaat tcttcgcggt 421 aaaagcgtgt ccgaatccgt ccatcatggc tatcctgaag gactatggct tcggctgcga 481 ctgcgcgtcg cgggcggaac ttacctttgc gaaggccatg gatctgccgg gggataagat 541 catgtttacg tcgaacgtga cccccgcatc ggagttccaa tatgccgcca agatcggtgc 601 catcatcaat ttcgacgata tttcccacat cgatttctgc gaaaaagcca tcggcaaact 661 gccggaaaca gtttccgtgc ggtataaccc cggcggcagc tttacgatca acacggcgat 721 catggacaac cccggcgaag ccaaatacgg ctttacgacg gagcagatgt tcgaagggat 781 gcgtctgctg aaggaaaaag gcgttaagca ctgcggcatc cacgcgtttt tggcgagcaa 841 taccgttacg aacgattact atccgacgct ggcgggcgag ctgttcgaac tggcggtaaa 901 actgcgggac gagaccggca tggacattcc cttcgtcaac ctgtccggcg gcgtgggcat 961 cgcataccgg cccgaccaga cgccgaacga tatcgagatc atcggtgcta aggtccacga 1021 agtctacgac aggatcttcg gtccggccgg tatgacgaac gtggcgatct acaccgagat 1081 gggccgtttc gttaccggcc cctacgacct gctgatcggc caggtgctgc acatcaagca 1141 cacccataaa gaattcgtgg gactggacgc ctgctgcgta gacctgatgc ggcctgccat 1201 gtacggcgcc tatcaccacg tgacggtcct gggcaaggaa gacgaaccct gcgaccacaa 1261 atacgacatt acgggatctc tgtgtgaatc caacgaccgc tttgctatcg acaggatgct 1321 gcccgggatc gaagtggggg actacatcgc tatccacgat gcgggcgccc acggacactc 1381 catgggaagc aattacaacg gcaagctgcg ccatgcggag ctgctgctga aggaagacgg 1441 cagtgtggtg cagatccgca gagcggagac cctggcggac tacttcaaga cgctggacga 1501 cacggagttt tataagaaat tagatctgga ataggagacg tttggagcaa tgaccggatt 1561 tatcggactt ggtatcatgg gaaaacccat ggcaaaacac ttactggcaa agttgggaga 1621 actggcggtc tacgacctgc aggaaggccc tgtaaaggaa ttaacggatc tcggtgcggt 1681 gtataatacg ccggcggaga tggcaaagga ctgcgaagcg atccactgca tcctgcccac 1741 ggaagcgatc gtacaggagg tgctgttcgg cgagggcggc gtgctggaga acgcaggcgc 1801 gctgagatat gtctgcgacc actcctcggt gaccccggga gaatccagag actgtgcgga 1861 aaagctggcg gcgaagaaca tcggttttgt ggattgccct gtttccggcg gtgaaccgaa 1921 agccatcgac ggaacgcttg ccttcatggc aggcggcagc caggcggatt tcgaggcgtt 1981 aaagccgcat tttctggcca tgggcagttc cgctgtactg gtgggagacg tgggatccgg 2041 cagcatcgcc aagctcgtaa accaggtgat cgtcaatctc aacatcgcag cggtctccga 2101 agccttcgtg ctctgcgaaa aggcgggtgc agacccccgc aaggtctacg acgccatccg 2161 cggaggcctg gcaggcagca cggtgttgga cgccaagatc cccaagatct tagccggcga 2221 tttcgcccct ggcggcacca ttaaggtgaa tcggaaagac ataaataacg ttctgtcgac 2281 cgcgcatgcc tgtgaatgtc ccatgccttt gagctcccag ctgttcgaga tcatgcagta 2341 tctgtcggct cacggccacc tgatggacga ccacggcggc atcgtgcagt atttcgagga 2401 tctggcgggc gtacaggtga gggaacactg atggacatcg acagactctt acaggaacag 2461 tacgcaaaat ttgaccgcaa gatcgtcgtg ctcgacgacg acccaacggg cagccagacc 2521 gttcacgaca tccacgtcta cacagattgg acacaggaga ccctggacga ggcgtttggc 2581 tcggacgaaa agctctttta cattcttacg aactctcgca gttttacggc ggaacagaca 2641 aagaaggtcc atcaggatat cgcagcggcc atccggaatg cttctgcaaa gaccggcaaa 2701 gactacctgg tgatctcccg cagcgattcc atgctcagag gccattttcc gttggaaaca 2761 gaggtgttaa gggcttcttt gggtaaagat atcgatgggg aagttttatg cccctttttc 2821 cccgaaggag gccgttatac gatcggcgac atccactacg taaaacaggg cgacgcgctt 2881 gtcccggca // LOCUS sequence138 2888 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence138 VERSION sequence138 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2888 /mol_type="genomic DNA" /organism="" /note="sequence138" CDS 97..741 /product="phosphoribosylglycinamide formyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964703.1" /transl_table=11 /codon_start=1 /translation="MSAKKERKANIAVLISGGGTNLQAILDAEKAGALHSGTVKLVISN RKGAYGLERAKNAGVKAVAVTRKDCGSQKAFEAELIRLLDEAKTDLIVLAGWLAILSEN FTRHYEKRIINIHPALIPSFCGEGFYGLKVHEAALAKGVKVSGATVHYVNEIPDGGEII AQKAVRVYPGDTPEKLQLRIMKQAEWKLLPKAAEQICSEIVAGKHPGFQED" /locus_tag="LOCUS_4550" /gene="purN" /EC_number="2.1.2.2" /note="WP_010964703.1 phosphoribosylglycinamide formyltransferase (Clostridium) [pid:50.8%, q_cov:87.4%, s_cov:89.7%, Eval:3.1e-44]" /note="MGA_646" CDS 746..1465 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDIYKIHDIAELIRGNSYVGRGIVLGKSEDGKNAVSVYFIMGRSA NSRNRIFTVKDGEVFTEPFDASKVEDPSLIIYAALRSYQNHLIVTNGDQTDTIYEGLQK GKCIRGSLKSRCFEPDAPNFTPRISGDIEFGEDDFCYHMSILKSIDAEGSDCARYTFDY PAKAGLGHFIHTYVCDGSPIPTFQGEPERVAIPNSIDEFTAKLWDALDADNKISLYVRY TDLETKEYKEKLINKNK" /locus_tag="LOCUS_4560" /note="MGA_647" CDS 1526..2710 /product="phosphoribosylaminoimidazolecarboxamide formyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008765038.1" /transl_table=11 /codon_start=1 /translation="MKEFELKYGCNPNQKPAKIYMADGSDLPVQILNGRPGYINFLDAF NSWQLVKELKEATGMPCAASFKHVSPTSAAVGKVLPEKLKKACFVDDIEGLDDSPIACA YARARGTDRMCSFGDWIALSDVCDATTAKIIKREVSDGVIAPGYTDEALEILKAKRKGS YNVVQMDPDYVPDPQETKQVFGITFEQGRNNFKIDRALLSNIVTANKELPDDAAIDLIV ALITLKYTQSNSVCFAVDGQAIGVGAGQQSRVHCTRLAGSKADTWLLRQSDKVLGLPFK EGLGRADRDNAIDGYINQNELDVCADGNWQRYFSRQPEPFTKEEQKAYLATIDGIALGS DAFFPFDDNIERAKLSGVKYIAEPGGSVRDDLVIGCCDKYGMVMAFTGMRLFHH" /locus_tag="LOCUS_4570" /EC_number="2.1.2.3" /note="WP_008765038.1 phosphoribosylaminoimidazolecarboxamide formyltransferase (Bacteroides thetaiotaomicron) [pid:69.1%, q_cov:99.5%, s_cov:99.2%, Eval:2.0e-156]" /note="MGA_648" ORIGIN 1 actgcgaaaa ggcgctggag atcctgcgcg cgaacggcga ggaagcctac cgcatgggac 61 gcatcgtcaa gtccccggaa gaaggagtga gcatcgttgt ccgctaagaa agaacgcaaa 121 gcgaatatcg ccgtgctcat cagcggcgga ggcaccaacc tgcaggccat cctggatgcg 181 gaaaaggcag gcgcgctgca cagcggcact gttaagctcg tcatctccaa ccgcaaaggg 241 gcctacggcc tcgagcgggc gaagaatgcc ggggtcaaag ccgttgccgt gacccgcaag 301 gactgcggca gccagaaagc cttcgaagcg gagctcatcc gcctgctgga cgaagcgaag 361 accgacctca tcgtgctggc cggctggctc gccatcctca gcgagaactt taccaggcat 421 tacgaaaagc gcatcatcaa catccacccc gccctcatcc ccagtttctg cggcgaaggc 481 ttctacggac tgaaggtcca cgaggcggca ttggccaagg gcgttaaagt gagcggtgct 541 acggtacatt acgtgaacga gatccccgac ggcggcgaga tcatcgccca aaaagctgtg 601 cgggtgtatc cgggagacac cccggaaaag ctgcagcttc gcatcatgaa gcaggcagaa 661 tggaaactgt tgcccaaagc cgcagagcag atctgcagcg agatcgtcgc cgggaagcat 721 cccggctttc aggaggatta aacccatgga catctacaag atccacgaca tcgcagaact 781 catccgcggc aattcctacg tgggccgcgg catcgtgctg ggaaagagcg aggacggcaa 841 gaacgctgta tccgtctatt tcatcatggg ccgcagcgcc aacagccgca accgcatctt 901 caccgtcaag gacggcgagg tgtttacgga gcccttcgac gcttccaagg tcgaagaccc 961 cagcctcatc atctatgcgg cgctcagaag ctatcagaac cacctgatcg tgacgaacgg 1021 cgatcagact gatacgatct atgaaggtct gcagaagggc aagtgcatcc gcggcagctt 1081 aaagagccgc tgcttcgagc cggatgcccc gaactttacg ccgcgcatct ccggcgacat 1141 cgaattcggc gaagacgatt tctgctatca catgagcatc ctcaagagca tcgacgccga 1201 aggcagcgac tgcgcccgct acacgttcga ctacccggcc aaggctggtc tgggtcactt 1261 tatccacacc tacgtctgcg acggcagccc catccccacc ttccagggtg aacccgagag 1321 agtcgccatt cccaacagca tcgacgaatt caccgctaag ctgtgggatg ccctcgacgc 1381 ggacaacaag atctccttat acgtaagata tacggatctt gaaacgaaag aatataaaga 1441 aaagctgatc aataagaaca aatagatatt gtttatccgt ccgaggggtg acaggacccc 1501 gaggacgcat cgtaaggaga tcattatgaa agaattcgaa ctcaaatacg gatgcaatcc 1561 gaaccagaaa ccggccaaga tctacatggc ggacggatcc gacctgcccg tgcagatcct 1621 gaacggccgc cccggctaca tcaatttcct ggatgccttc aactcctggc agctcgtcaa 1681 ggaactgaag gaagccaccg gcatgccctg cgcagccagc tttaagcacg tgagccccac 1741 ctccgccgcc gtcggcaagg tccttcccga aaagctgaag aaggcctgct tcgtggacga 1801 catcgaaggt ctggacgact cccctatcgc ctgcgcctac gcaagagcga gaggcaccga 1861 ccgcatgtgc tccttcggcg actggatcgc tctgtccgac gtctgcgacg ccaccaccgc 1921 gaagatcatc aagagagaag tctccgacgg cgtcatcgcg ccgggctaca ccgacgaagc 1981 cctggagatc ctgaaggcca agcgcaaggg ttcctacaac gtggtgcaga tggatccgga 2041 ctacgtgccc gatccccagg agaccaagca ggtcttcggc atcaccttcg agcagggccg 2101 caacaacttt aagatcgacc gcgcgctgct gtccaacatc gtgactgcaa acaaggaact 2161 tcccgacgac gctgccatcg atctcatcgt cgcgctcatc accctcaagt acacccagtc 2221 caactccgtc tgcttcgccg tggacggcca ggccatcggc gtcggcgccg gccagcagtc 2281 ccgcgtgcac tgcacgagac ttgccggaag caaggccgac acctggctgc tgcgccagtc 2341 cgacaaggtc ctgggcctgc cgttcaagga aggcctcggc agagctgaca gagacaacgc 2401 catcgacggc tacatcaacc agaacgagct ggacgtctgc gccgatggca actggcagag 2461 atatttcagc agacagcccg aaccctttac gaaggaggaa cagaaagcct acctcgccac 2521 gatcgacggc atcgccctcg gttccgacgc tttcttcccc ttcgacgaca acatcgaaag 2581 agcgaagctg tccggcgtca aatacatcgc ggagcccggc ggctcggtga gagatgatct 2641 cgtcatcggc tgctgcgaca aatacggcat ggtcatggcc tttaccggca tgcgtctgtt 2701 ccatcactag gaggcaaaat ctatgaacgt aatggtcatc ggcggcggcg gacgcgagca 2761 cgccatcatc aagaagatca aagagaatcc ggaagtgacc gccatctacg ccctgcccgg 2821 caacggcggc atcgccatgg acgcttactg cgtcgacatc aaggcgacgg atctggaagg 2881 catcaaag // LOCUS sequence139 2885 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence139 VERSION sequence139 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2885 /mol_type="genomic DNA" /organism="" /note="sequence139" misc_feature <1..961 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003897464.1:iron ABC transporter permease" /note="WP_003897464.1 iron ABC transporter permease (Mycobacteriaceae) [pid:34.2%, q_cov:96.9%, s_cov:93.6%, Eval:9.1e-45]" /note="MGA_650" /locus_tag="LOCUS_4580" CDS 958..1716 /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003372869.1" /transl_table=11 /codon_start=1 /translation="MIRVHDLHASYEGEEILHGIDASFPEGKISVLMGPNGCGKSTTLR SMLRLVPHSSGTIELNGTPLSALSPQEWARNIAYLPQSRSVPDIAVKTLVMHGRFPYLS YPRRYRPEDHEKVRESLEWVGLTDLADRKMEQLSGGQRQKAYLAMALAQDTDVILMDEP TTFLDIRNQFELLDRSKQLAKQGKTVIMILHDFEAVLRYADHVVLLHNGHVLQEGGAEE VLRSGSIREAFQVTPVFHQGEDGLHCYVRQ" /locus_tag="LOCUS_4590" /note="WP_003372869.1 ABC transporter ATP-binding protein (Pseudomonas) [pid:44.0%, q_cov:92.1%, s_cov:89.0%, Eval:7.4e-54]" /note="MGA_651" ORIGIN 1 agccgctgcc tttatgctgg ctgctgcggt cctgaacatc tgtctcggcg catcccgcat 61 ctcgctcgtg cagctctggg aagccttgct cagcggaccc ggctcatctg ctgcgtcccg 121 catcctctgg tacgtccggc tgccccgtac cgctgcctgt ctgctggcag gttccgggct 181 cgcagtatcc ggaaccgtca ttcaaaaggt gctggccaac aatctggcct ctccggggat 241 catcggggtc aacgcaggag caggtctggc cgttgccgtc tgcagcggcc tcggcatgta 301 ttccgcctgg gtcatcgcag gcgcatcctt cctgggcgcc atgatcgcga catttgttgt 361 ggtgatcgtg gccagaaaga gcaatgcatc ccggacgacg gtcgtgctgg gcggcgttgc 421 cgttacggct ggtttgattg ccgttacaga aaccatcatc gtactcatcc cggatgctgc 481 gctggcaaat gtggatttcc gtgtgggcgg tttctccgcg gtcaaccacg caagactgct 541 cccggctgcg atcctcatct tggcttcaat cattctggtc tgcaccctga cgaacgaact 601 ggacgtgctg tccctgggtg acgacaccgc ccattccctg gggcttcggg tagggcgcat 661 gcggaacggt tttctgaccc tggcagcgct gctggccggc gctaccgtca gttttgccgg 721 cattttggga tttgtcgggc tcatcgtgcc ccatatcgca agacgcttta tcggaaatga 781 gagtggaaaa cttctgccgt tctgcgcact gttgggagcg ggatttgtta cgatctgcga 841 tcttgcggcc cgtctggtct ttgcgcctta cgaagtctcc acaggtatcc tgttgaactt 901 cctgggcgga cccttcttcg tatggctgct gctgaagaga aaggataagc acaccaaatg 961 atccgcgtac acgatttaca tgcttcctat gagggagaag agatcctgca cgggatcgat 1021 gccagttttc cggaaggaaa gatctctgtt ttgatgggac cgaacggctg cggtaagagc 1081 accacgctgc gttcaatgct ccggctcgta cctcattcct ctggaacgat cgaactaaat 1141 ggcacgcctc tatccgcgct ttcgccccag gaatgggcga gaaatatcgc ctatctgccc 1201 cagagcagaa gtgtgccgga tatcgccgta aaaacgctgg tgatgcacgg aagatttccc 1261 tatctgagct atccgaggcg ttaccgaccc gaagatcacg agaaggtgag agagtctctg 1321 gaatgggtcg ggcttacgga tcttgcggac cgcaagatgg aacagctgtc gggcggacag 1381 aggcagaagg cgtatctcgc catggcgctg gcgcaggata ccgacgtcat cctcatggat 1441 gagcccacca cgttcctgga catccgcaac cagttcgagc tgctggaccg ttcgaaacaa 1501 ctggcaaagc aaggcaagac cgtcatcatg atcctgcacg atttcgaagc ggtcctgcgc 1561 tatgcagacc acgtcgtcct tttgcataac ggccatgtgc tgcaggaggg cggggcggaa 1621 gaggtcctcc gctccggatc gatccgggaa gcctttcagg tcacccctgt cttccatcag 1681 ggcgaagacg ggctgcattg ctatgtaaga caatagaaac ggggttgcac ttttcctcct 1741 tctatactaa aatcattatg ttatgccgtg ggcaattccg cccaggcttt aacgtgcaca 1801 actgaataat atccggtgcc tcaaaacgta aagcgcggag aggataatag ggaaacaggt 1861 gagaatcctg tacgatctcg tcactgtcat aggcgagtgt gcggcatagc aatcatcgca 1921 gtcactgatg ctccatcggg aagactgccg cacgcgcaga accttaagtc aggaaacctg 1981 ccgggtatgg tactaagacg tccgtcttgc accacgagga attggttgta ccgccgtgtt 2041 tgttatttca tgtggcacgg cagaaacaag gaggaaaaca tgaaactcaa aagaattttt 2101 gcgctgctgc tggcgctggt cctcatcatg ggatccctgg cagcatgcac caactctcag 2161 cagcctgctg aggaagagga cgaagaaaac tacgagaccg gcgatgcgtc tctggacgat 2221 cctctgaatc aggacggcat cggccccacc gagatcttag tcgtatcttt cggaaccagc 2281 tttaacgatt ccagaagact caccatcggc gccatcgaaa aggatatcgc cgctgctttc 2341 ccgcagtttg acgtccgcag aggcttcacc gcgcagatca tcatcgatca tgtgcagaac 2401 agagacggcg aagtcatcga taacttcgaa caggccatgg accgcgcagt caacaacggc 2461 gtcaagaaca tcatcatcca gccgacccac ctgatggcag gtctggaata caacgacatc 2521 gtcgcttccg cagccaacta tgccgacgcc ttcaacagca tcacgatcgg caagaacctg 2581 ctggataccg acagcgattt cgtgaccgtt gcaagccttc tctatgaaga gaccaagtcc 2641 tacgacgacg gcgagaccgc gatcgttttc atgggtcacg gcaccgaagc cgaatccaac 2701 agcgtctatg cttccatgca ggctaccttc gaccagatgg gtctgaaaaa ctgctacgta 2761 ggcaccgtcg aagcgactcc gtccctggac gacgtcgtag cggcagctaa ggaaggcggc 2821 tataagagag tcgtcctcga acccatgatg atcgtctgcg gcgaccacgc caacaacgac 2881 atggc // LOCUS sequence140 2866 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence140 VERSION sequence140 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2866 /mol_type="genomic DNA" /organism="" /note="sequence140" misc_feature <1..1249 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010963689.1:M20/M25/M40 family metallo-hydrolase" /note="WP_010963689.1 M20/M25/M40 family metallo-hydrolase (Clostridium) [pid:35.6%, q_cov:98.8%, s_cov:75.8%, Eval:1.0e-81]" /note="MGA_653" /locus_tag="LOCUS_4600" ORIGIN 1 ctgccgcggt ctcttcgaca tgaagaccgg cgatgccgcc atcatggccg tcatggaaga 61 catgtccaag cacctggatg agctggaagg caacctgatc ttctccgccg tatgcgacga 121 agaaggcaac tccggcggcg tcctcaactg cgacccggac tatgtccgcc tggcagagga 181 gagaggctac gagtatctgg ccatgctgga tgccgactac atcaccgaag aatacgaggg 241 tgacccgaac aagtacatct acatcggcac cgtcggcaag accatgccca cgttctacat 301 cgtcggcaag gagacccacg taggcgagtc cttcaagggt ctggatccca accagatcgc 361 tgctgcgatc acgatgcggg tcaacctcaa ccccgaattt gcagacgtcg cagacggcga 421 agtcgcgctg cctcccatca cgctcaagca gagagactta aagaccgagt actccgtaca 481 gaccgccaag gctgctacga tctacttcaa ctatgccacc cactgcagca ctcccgagat 541 catcctggaa aagatgctca aggtcggtca ggaatgcttc gaagagacga tggatgtcct 601 gaacgaacgg tataagaatt tctgcgagat ggcaaagcgc gagtacacgc cgctgccctt 661 cgttcccaga gcgatgagct tcgatcagct gatggacgct gtccgcaagg aagttcccaa 721 cctggacgaa ctggtaaagg ccaaggcgga agagctgatg aagaccgata tggactccag 781 agaccgttcc accgcgatct gcgcttacgt gcacgatatg tggagcgacc gcgatcccgt 841 ggtcatcgtc tacttctcca gcccgtacta tccgcacgtc tttatcgaag gcaagagcca 901 gaaggataag aacctgatcg ctgccgtcga aaaggccgtt aacgaggcag agaccgatta 961 ccagatcggc tacaagaagt tcttcccgta catctccgac ctgtcctatg cggcagtgcc 1021 cgatgagacc gtcgtcgaga ccttcaagtc caacatgccc ggttacggca tcacctacga 1081 tctgcccttc gataccatta agaaactgaa tctgcccgta ctggacatcg gcgctttcgg 1141 caaggatgcc cacagatgga cggagcggat cgagaagaag ttctccttca acgttacgcc 1201 ggaactgatc taccgcacgc tgctcaacct gctggagatc tccaaataaa gacatatttt 1261 taagtcattc aagaggtgaa acatgaaaca gaaaatcgac aaactgtttg taaacggcaa 1321 gatctacacc tttatcgaag aaaacgatac cgtggaagcg gtagcggtcg acaagggcta 1381 catcatctgg accggtctta cgaagaacgc gatggaaaag ttcgagcccg cagagatcat 1441 cgatctcgaa ggcaaggcga tggaaccctc catgggcgac tcccatctgc acttctacgc 1501 ctataaccag acgctgttca cggtagatct gggcggcatc accaccagag aagaagcctg 1561 ggcaaaactg aaggccaagt gcgccgaggt tcccgctggt gcctgggtca aaggctccaa 1621 ctacgaccag tccaagtggc aggatatgga tgtggacaga atgcctaccg ctgacgacct 1681 ggatctggtc tccaccgatc accccgtcat catcaagaga tgctgcctgc acgaagtctc 1741 cgcgaaccat aaggcgctgg aagtcgcagg catcggcaac ggctatgtct tcggcgaagg 1801 cggcctcgta gaactggatg aaaacggcga tcccaacggc gttatccgcg aacaggcttc 1861 caagatcttc gacgatatcg tacccgatcc tctcaccgat aagaccgtgc gcgagcagac 1921 catggagaag acctttaagc acgtttccag cgtaggcgtt accatgatgg atacctatgc 1981 cgctaagatc tggaacttct tcgaagaccc cgacgtctac gaaaatctgg acaagaaggg 2041 taagctgccc gtccgtatga gagtctgcct cgaagagatg tacgacaagc ccatcctcac 2101 cgagcagcag aaggctgacc cctacagaaa ggtcgactac ggcaccttca agagctttac 2161 cgacggctcc ttcggtgcca gatccgcagc gctgctggaa gactacgacg acgatcccgg 2221 caacaagggt atcctcgtta tctcccagga tgctctgaac gagcgcattt atcaggcgta 2281 caagcacggt ctgcagcccg cgacccactg catcggcgac gccggtaccg aagcctgcct 2341 gcaggccatc gaatacaccg tcaagaagtg catcgaggaa gacggctata ccatggacga 2401 gatcatgaag ggcccgaagt tccgcgtcat ccacgcgcag ctggtccaca gagatcagct 2461 ggagagattc aagaaggtgc ccgtcatctt cgatatccag cccgtattcc tcaacaccga 2521 cctgcaccgg atcgacgagc gcatcggatc cagagcggac gatgcctaca cctggaagac 2581 ctatctggac gaaggcatca tctgcaccgg cggttccgac tgcccggtag agagctacaa 2641 cccgtggccc ggcatctggg gcgccgtcaa cagaacggat cctctgttcc cggacgaagc 2701 tccctggcat cccgagcaga agctgtccaa gttccaggct gcctgcctgt tctccaagta 2761 catggcttac ggcaaccaga tggaaagata tctgggcacc atcgagccgg gtaagttcgc 2821 cgacatgatc gtcaccgaca gagactggcc caacggtccg gacgac // LOCUS sequence141 2865 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence141 VERSION sequence141 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2865 /mol_type="genomic DNA" /organism="" /note="sequence141" CDS complement(61..798) /product="NAD-dependent protein deacylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963607.1" /transl_table=11 /codon_start=1 /translation="MYEELKEILDKAQRIVFFGGAGVSTESGVPDFRSENGLYHAQHNY GRSPEEMLSIDFFESDPVTFFDYYKNNLIATWAKPNRAHKALAKLEEQGKLIGVVTQNI DGLHQLAGSKKVYELHGSVHRNTCLRCRKKYGLDYILDEANCEKGVPKCSCGGTIKPDV VLYGEMLDDDCIRGAVNAISKADVLIIGGTSLVVYPAAGFVHYFKGDKLVILNKSETAA DDRADLVIHDPIGEVLGECLNIE" /locus_tag="LOCUS_4610" /EC_number="2.3.1.286" /note="WP_010963607.1 NAD-dependent protein deacylase (Clostridium) [pid:61.4%, q_cov:95.9%, s_cov:95.1%, Eval:4.9e-79]" /note="MGA_656" misc_feature complement(1021..>2865) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003428202.1:glutamine synthetase" /note="WP_003428202.1 glutamine synthetase (Clostridioides difficile) [pid:51.0%, q_cov:99.5%, s_cov:96.7%, Eval:4.3e-178]" /note="MGA_657" /locus_tag="LOCUS_4620" ORIGIN 1 ccttctgacc cgcttttttg acgatctgag agctttttct cgcctcgtcg agcatctttc 61 ctattctatg ttcaggcatt ctcctaagac ctctccgatc ggatcgtgga tgacgagatc 121 ggcgcggtcg tccgctgccg tctcggattt gttgaggatc accagcttgt cgcccttgaa 181 atagtgaacg aagcctgccg ccggatacac gaccagggac gtgccgccga tgatgaggac 241 atctgccttg gaaatggcgt tcacggcccc gcggatgcag tcgtcgtcca gcatctcgcc 301 gtagagcacg acgtcgggct tgatggtgcc gccgcagctg cacttgggca cgcccttctc 361 gcagttcgcc tcgtccagga tatagtcgag gccgtatttt ttgcggcagc gcaggcaggt 421 gttgcggtga acgcttccat ggagctcgta gactttcttg ctgccggcca gctgatgcag 481 gccgtcgatg ttctgggtga ccacgccgat cagtttgccc tgctcctcca gtttggccag 541 ggccttatgg gcccggttgg gcttggccca agtggcgatg aggttgttct tgtaatagtc 601 gaagaacgtt accggatcgc tctcgaagaa atcgatggac agcatctctt cggggcttct 661 gccgtagttg tgctgcgcgt gatacaggcc gttttcgctg cggaaatccg gcacaccgct 721 ctcggtggat acgccggcgc cgccgaaaaa gacgatgcgc tgcgctttgt ccaatatctc 781 tttcagttct tcgtacatgg ttgctccttt ctacccaaag caaaagcggc ctcgaaaggc 841 cgcttttccc ggatgtgtgt atctttattg tatagaagga aaactatcgg gaggctcgcc 901 tcccactctt tgctgcttgc tacacctaaa gaatactggc cttttgtgtg tttcctgtga 961 agcccctgtg ggatttgtct tcactttatc tcattattgc cccatttttt cgcatattct 1021 tcagtcaagt atgtttttcc ggtaagtcgc atacagtttt tccagttttt cgatactggc 1081 ctgcgccgcc agctgcatgt cggatgcggt gtcgaaatcg cccgcatcca gcgcgtcttc 1141 cagccgggac aggaagcact tgtgatgcaa tccgtcctgg ataaggtctt tgcggagctg 1201 gcagatctcc gtccagcgct gttcgtccag ctgcttgcag ttgtcgctgt cgtgcacctt 1261 tttcagttcg tgcacccggt ccgccatctg cggcacgatg cggtcgcgca gagacagagc 1321 ccactgctcc acgacggatg cctcgaagga ttccagatcg atcggcgcaa acgcgttgcc 1381 gcgcagcagc accttgtact tctccggata ttccttgaag gagcacaggt tctcccagac 1441 ggtgcccggg cacttgccga acagctttac gcgctcttcc tgcgtgtaat cctcgaagat 1501 gttgttctcc gcccggtaca cgcggtcctt ttccagatag aagtcctcct cgccatattg 1561 cttggagatg gacgcgcaga gctcctccgg cgtcttcttt gccttcagca ccgcctccac 1621 gccgtccagc atggcgagat atccggccgc cagcaccagg taggtgttgc tcttggggtt 1681 gggggcgcgc atctcgaagc gggtcgccag cgggctgttg atgtcgcgga tgagccccag 1741 cagcaccgta cggttgcggg agggcttctc cacactgtga cccagcgccg tacagatgga 1801 gaccggcgcc tcgaaaccgg gctttaatct ctggaacgcg ttgttgcggc agttggcgat 1861 gggcgaaatg acctcgtagt tcttcagaat gcccatcagc gcgccgtagc ccagggggct 1921 gaggtagtcc ttggacgggt caagcgccgt aaacagattg acggtacggc cgtccttcag 1981 cttcgcagcc acgccgaaat gggtgtgctt gccgctgccc gcgacgcctt ccaccggctt 2041 ggacataaag gtaacgtcca gcccgttcct gcggaattcg tccttgatca tgtagcggac 2101 gaaatagtcg ttgtccgccg cctgcagcgc cgtggagtat ttaaagtcga tctccagctg 2161 ctccatgatg tgctcgtagc cgcccttgtg cagctccggc tttacgccgc ccacctcttt 2221 atggcccatc tcgatgtcca ggccgtagtg gtccagcaga agcagcgcct tttccatggc 2281 ggtgcgcacg ggaccgatgg tgcgcttcca gtactgctct ttcagctcct gggacacctg 2341 caggcggtct ctgtccgcca cgtcgtgggg cgtctttacg tagaattcga tctccgtggc 2401 cgaggtcagg gagaggtcct cgatgtcgtc gacactgtcg aacggcagat actcgaagac 2461 gtaaggattt tcgcgcagca tgcgcaggat ctccgattta aaaacatcca ccgcgtcgcg 2521 caggatgacc cgcgagccga cgtcccggga attgttgtgc ttcaggaagg cgggaatacg 2581 caggcttccc acgggaagcc cggtctcgtc gtcgatgtgc ccgaagttat agtccacgta 2641 ccagttgacg tcgcggtcgg ggatcaggtc gaccttggcg tcggagatgt ccgcgatctt 2701 cggcagcagt acggaagaac cgtcggtctg ctggccttct tccaggaact tgtccacatc 2761 cttgagcatg atgcggatgg ggatcttctc gtcggtgtcg ttgccgaaga tgtccgcggc 2821 tgccaggctc acgaaacgga tctcggggtg ttcggaaagc agcgc // LOCUS sequence142 2858 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence142 VERSION sequence142 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2858 /mol_type="genomic DNA" /organism="" /note="sequence142" misc_feature <1..853 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011015666.1:SPFH domain-containing protein" /note="WP_011015666.1 SPFH domain-containing protein (Fusobacterium nucleatum) [pid:57.8%, q_cov:95.4%, s_cov:91.8%, Eval:1.4e-83]" /note="MGA_658" /locus_tag="LOCUS_4630" CDS 857..1360 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDIFDIVGAILGFIASIIPLIVILFIFSRLAKAAKQSQKRSGGSN PWQQPAAQQEKPHLVKSLKNSSSGEYKAEDKQFGFGKSAFAGSRSTSSSLKAEKVSRLS ETFMKDDRKNDWLARQLREEEKILRRGDMLDLGASHAASCDADLLKRYHLFAEHDDSVD SGEY" /locus_tag="LOCUS_4640" /note="MGA_659" CDS 1514..1837 /product="helix-turn-helix transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000827865.1" /transl_table=11 /codon_start=1 /translation="MIENMALTESTYYILLSLVSPQHGYGIMQQAEALSNGRVRLAAGT LYGALSAMVDKGWIRQLPVEEGSRKKEYQLTEKGRSVLDNEVARLRELADNGERILGMA QEE" /locus_tag="LOCUS_4650" /note="WP_000827865.1 helix-turn-helix transcriptional regulator (Streptococcus) [pid:42.9%, q_cov:91.6%, s_cov:87.4%, Eval:6.0e-19]" /note="MGA_660" CDS 1839..2348 /product="DUF2812 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003721612.1" /transl_table=11 /codon_start=1 /translation="MGERKTVRKWFWVWDFDKEERWLNEMALQGWVLDGVGFCTYHFKK CEPGEYAVRLEMRPHDESYIAFMEETGAEFVGRFTMWLYFRKKVEDGAFDLYSDIDSKI AHLDRIGRVLAVIGGLNLLCAFMYSVGVGTWVGVLNTICATVLMYGLGRIHGKKESLQQ ARQLYE" /locus_tag="LOCUS_4660" /note="WP_003721612.1 DUF2812 domain-containing protein (Listeria monocytogenes) [pid:29.3%, q_cov:86.4%, s_cov:88.5%, Eval:8.0e-11]" /note="MGA_661" ORIGIN 1 ctgcatctgc atcgttccgc aggccagcgc atggatcgtg gaagcgttag gtcagtataa 61 agccacgtgg ggtgcgggcc ttcatttcaa ggtgcccatc atccaccgcg tcgtcaagaa 121 agtgtcctta aaggagcagg tcgcagactt cgaaccgcag cccgtgatca cgaaggataa 181 cgtaaccatg atggtggact ccgtcgtatt cttctacatc ttcgacgcca agctgttcgc 241 ctacggcgtg gagagaccga tcgcggccat cgaaaatctg tccgctacga ctcttcgtaa 301 tatcatcggt tccatgacct tagatgagac cctgacgagc cgcgacgaca tcaacagccg 361 catcaccgct atcctggaca acgccacgga caagtggggc atcaaggtga gccgggtaga 421 agtcaagaac atcgcgccgc ccagaagcat ccaggaagcc atggaaaagc agatgaaggc 481 agaacgcgaa aagagagaag cgatcctcac cgccgaaggt aagaagcaga gcgccattac 541 cctggcagaa ggtgaaaagg aagccgcgat cctccgcgcc gaagccgtca aacagcagcg 601 catccgcgag gcagaaggtg aagccgaagc tctgctcgcc gttcagaagg ccagagccga 661 aggtatccgc atgatcaacg aagcggctcc ttccgcaggc tacctcacca tggagagcta 721 caaggctgcc gagaagatgg cggacggcca ggccacgaag atcatcgtgc cctccgacat 781 ttccaatctg gccggtacgc tgagcgccct gagcgccgtc gtaaaagatc cgcaggagcc 841 taagggagag tagcaaatgg atatcttcga tatcgttggc gcgatcctcg gttttatcgc 901 gtcgatcatc ccgctcatcg tcatcctctt catcttcagc agattggcga aggccgcgaa 961 gcagagccag aagagatccg gcggttcgaa cccctggcag cagccggctg cgcagcagga 1021 aaagccccac ctggtaaagt ccctgaagaa cagcagttcc ggggaataca aggcggagga 1081 caagcagttc ggcttcggga agagcgcctt cgcgggcagc cgctccacga gctcttccct 1141 gaaggcggag aaagtctccc gtctgtcgga gaccttcatg aaggatgacc gcaagaacga 1201 ctggcttgcc cggcagctgc gcgaagagga gaagatcctg cgccggggcg acatgctgga 1261 tctcggcgcg tcccacgccg ccagctgcga cgcggacctg ctgaagcgat accatctgtt 1321 cgccgagcac gacgacagcg tggacagcgg ggagtattag aacaattgca tcaagagacc 1381 ggaaccggaa gcggttccgg tcttttcata ttttttttaa aaaggatgtt gacaaatata 1441 tcggcatccg atatactcta atcacgatat atcggacgac gatataacgg gtcacgatag 1501 aaagggtaga catatgatcg aaaacatggc gttgaccgaa tccacctatt acatcctgct 1561 ctcgctggtg agtccgcagc acggctacgg catcatgcag caggcagagg cgctgtcgaa 1621 cggcagagtg cggctggcag ccggcacgct gtacggcgcg ctgagcgcga tggtggacaa 1681 gggctggatc cggcagctgc cggtggaaga gggcagccgc aagaaggaat atcaactgac 1741 ggagaaaggg cgcagcgtgc ttgacaacga agtggcaagg ctgcgggaac tggcggacaa 1801 cggagagcgc attttgggca tggcgcagga ggaataaaat gggcgagaga aaaacggtca 1861 gaaaatggtt ctgggtctgg gatttcgata aggaagaacg ctggctcaac gagatggcgc 1921 tgcagggctg ggtgctggat ggcgtcggct tttgcacgta tcactttaaa aagtgcgagc 1981 ccggcgagta cgcagtgcgg ctggagatgc gtccccacga cgaatcatac atcgcgttta 2041 tggaggagac cggcgccgaa ttcgtaggac gctttacgat gtggctctat ttccgcaaga 2101 aggtcgagga cggcgcgttc gatctgtact ccgacatcga ttccaagatc gcgcatctcg 2161 atcgcatcgg acgggtgctg gcggtcatcg gcggtctcaa cctgctctgc gcctttatgt 2221 acagcgtcgg cgtgggcacc tgggtgggcg tgctcaacac gatctgcgcg actgtgctga 2281 tgtacggtct gggccgcatc cacggcaaga aagaatcgct gcagcaggcg agacagctgt 2341 acgaataacg gcaaggaaga catacaaaaa tctccggtga gtcccggaga ttttttcgtt 2401 tacagttcga tccagtaccg gcgggtgagc gcgtatactc ccggttcgat ctcgttctcg 2461 atcttatcct gcagcacgcc gccgttcgct tcgatcgtct tcgccgagcg gatgttcgtg 2521 tcgtcgcagg tgacgagcac tttctcgaac ccgaaatgtt cccggcagta atccagcgcc 2581 atggccagct gcagtttgcc atagcccttg ccctgttcgg acgggcgtat ggtgtagccg 2641 atgtggccgc cgaagcgcaa aaggctgggg gtgagccggt ggcggatgtt gaccctgccg 2701 ataaagcggt ctccatccac gagccacagc gtcgtagccg gcacgtagcc tgcgggaagt 2761 ccttctccct tgcgctccga ctccgagcgg gcgatggcga tgtccggatg gatcagcatc 2821 tgcagttcac ctttgtttac cgcaatgtct tccgcgta // LOCUS sequence143 2852 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence143 VERSION sequence143 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2852 /mol_type="genomic DNA" /organism="" /note="sequence143" CDS 299..874 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKIVNMYTDGACSGNQNEENVGGWGCILEFAGREKELWDGEVNTT NNRMELSAPIAGLSALKEKSLLVRIYSDSSYLVNCFQQGWHKNWVKNGWKTSQKKPVEN RELWEKLLSLMEGQTCEFYLVKGHLKLTDKDGSPLDETNAALNKAYKAYCSHNGGISFE EFYRIAGYNNRADDLANEFIRRHAAQAM" /locus_tag="LOCUS_4670" /note="WP_010933276.1 ribonuclease HI (Chlorobaculum tepidum) [pid:53.5%, q_cov:66.5%, s_cov:84.2%, Eval:2.2e-32, partial hit]" /note="MGA_664" CDS 993..1568 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLRIRRITAIILAIAVLATGYVFADAAAIVSPAANSIVYTDSLLV SVKVTELKTIRVSVYAEKVTSGDKLVNADVSKFTEADLKAAAGDPKYTDVLLADPAEYT NTLEIGFYTKQIAVSPGLYKVKAETLETVMEWPEGAVEPVEKTIVTETKSSLVAVKKKP TEEKTQVFQNNSTGAITFIRKILKGLLR" /locus_tag="LOCUS_4680" /note="MGA_665" ORIGIN 1 acgatctggt ggtgtcccgg gccgtggcca acatggcgac gctgtcggaa tactgcctgc 61 ccttcgtgaa gatcggcggc ttcttcatcg cctataaaac ggaggatgcg gcggaggaga 121 tcgaggccgc aaaaggggcc atcgccaggc tgggcggcca gatccggcgc attgaaaaag 181 catcgtctaa taacgatgcg cttttgaatg gtcacgtttt cgtcgtggtg gaaaagatcg 241 cgaaaacgcc gaaggaatat ccgagaaaag cgggtacgcc gggaaaggat cccctgaaat 301 gaagatcgtc aacatgtaca cggacggcgc ctgctccggc aatcagaacg aggagaacgt 361 gggcggctgg ggctgcatcc tggaatttgc cggccgggaa aaggagctct gggacggtga 421 ggtgaacacc accaacaacc gcatggagct gtccgcgccg atcgccggtc tgtccgctct 481 gaaggaaaag agcctgctgg tgcggatcta ttcggattcc tcttacctgg tgaattgttt 541 tcagcagggc tggcacaaaa actgggtcaa aaatggctgg aagacgtccc agaaaaagcc 601 ggtggagaac cgggagctct gggaaaagct gctgtctctg atggagggtc agacctgcga 661 attctatctg gtaaagggtc acctgaagct gacggacaaa gacggcagcc ccctggacga 721 gacgaacgcg gccctaaaca aggcctacaa agcctactgc agccacaacg gaggcatttc 781 tttcgaggaa ttctaccgca tcgcgggcta caacaaccgg gcggacgatc tggcgaacga 841 atttatccgc cggcacgccg cacaagcgat gtaaaggcat attaaattgt ttgtaataat 901 tctgtaacat tcctgctgta tactagtagt tgtagcagag gatatcctct gcaggttttg 961 ccttgttaca acagcggaaa ggagttgcgg aaatgttgcg gatccggcgg atcacagcga 1021 tcatattggc catcgccgta ttggcgacag gctatgtttt tgccgacgcc gccgctatcg 1081 taagtcctgc cgccaacagc atcgtctata cggacagcct tctggtctcc gtcaaggtaa 1141 cggagctgaa gaccatccgg gtgtccgtct acgcggaaaa ggtgacctcc ggcgataagc 1201 tggtgaacgc cgacgtgagc aaattcacgg aagccgacct gaaagccgcc gcgggcgacc 1261 cgaaatatac ggacgtgctg ctggcagatc ccgcggaata cacgaatacg ctggagatcg 1321 gcttctatac gaagcagatc gccgtttcgc ccggcctgta caaggtaaag gcggagacgc 1381 tggagaccgt catggaatgg cccgaaggcg ctgtggagcc ggtggagaag accatcgtca 1441 ccgagacgaa gagcagcctg gtggcggtca agaaaaagcc cacggaagag aagacccagg 1501 tcttccagaa caactccacg ggcgccatca cgtttatccg caagatcctg aagggcctgc 1561 tcaggtaagg aatggacgag cgcgcaaaga gacaggaaaa actgaagaat gcggtcatag 1621 tagtattgtt cctgacgaca atactacttt taaatttgac ctggcgcagc gaaggccagg 1681 ggagcttccg cctgtcgtcg gtgctggatt ttatcagccc ggacgtgtgg gtgcccgatg 1741 cggacgaatt cgtgaccgca gacagcgccg tgtacggttt cggcgatgcc acgttctccc 1801 tggacagggt aaatgcggaa cagcagctgc agtctgtttt ggaactgctg cgccgggaga 1861 gcgcgaacgc ctcgttcctg atcaacgaag tgacggacca gcagtaccgg gacatgctgc 1921 gcagctaccg cagtttaaag gtgcggctgt cgtgtccggt gcctttcggt gaattttgcg 1981 accgcaccgg catcaaccgc aattccacct acgaccaggt gaccaccgtg gatgcgttcc 2041 tgatctcgga agcggcgccg gagagcatct tcgtcgaagg cggcggccag tgctggcgct 2101 ttatctccga cagcgaggag gatctggcag gaccgttcct caccggtctc acccggggcg 2161 aacccatcta ctacacggca gccagcatgc tgggcggcga aaatctgtcg ctgctgccgc 2221 tggcgcagac gtcggaactt tcccaggcgg aatgggagag cgaatcgtcg gacgatccgg 2281 agcgggccgg ccgggaaatg gcggagtccg tattcggcga gaacttcgat ttcgtgcgcc 2341 gcatcacgga cagtttcggc aacgtcacgt acatgtacgg gtacggcgag aagacgctca 2401 cctgccttac ggacggttcg ttcgaataca agacggagac ggcggacggg ccggatcctg 2461 gcttttacgg cagcctgcag accgccatcg ccttcacggc gactcacggc ggctggggca 2521 gcgacaggag agatctggac tacgtgctct gcagcgccgt agaatccggc agcggcagaa 2581 gcaaggtcta taccttcgga tttgcgcagg tgctgggcgg cgtcaagctc ctcagcgaag 2641 acggaccggc catcatcgta acggtgtccg gcggcgaagt cagctattac agacgcgctg 2701 tggcaaaagc cacaacggca acggcggaaa cgcagccggc ggcggaagcg gccaacgtga 2761 tcgcaggcaa cagccatctg atctacagcg tgctgacggg caacgtgctt tctgcaaact 2821 ccgacgagga attcgcctat gtggcggatc ac // LOCUS sequence144 2849 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence144 VERSION sequence144 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2849 /mol_type="genomic DNA" /organism="" /note="sequence144" CDS complement(1663..1884) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKSFKVKGIDCANCAAKLEDNLNKMPGVEKATVSFMTEKLTLTA ADDKFEEVLEAAKALTKKLEPDWEIVTK" /locus_tag="LOCUS_4690" /note="WP_002327795.1 heavy metal translocating P-type ATPase (Enterococcus faecium) [pid:42.6%, q_cov:93.2%, s_cov:9.8%, Eval:9.5e-12, partial hit]" /note="MGA_668" CDS complement(1898..2206) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPKKKDKSIITEEDLYDLADLFKAFSDTTRIKLLYALMEGELCVA DLTEKTGATQSAVSHQLRTLKQMDLIRCRKEGKQVIYFLADDHVHTILQMGMDHVKE" /locus_tag="LOCUS_4700" /note="WP_011459353.1 metalloregulator ArsR/SmtB family transcription factor (Desulfitobacterium hafniense) [pid:57.1%, q_cov:89.2%, s_cov:73.4%, Eval:1.4e-23, partial hit]" /note="MGA_669" ORIGIN 1 cttgatgccg atggagaaac tgatgttctc gtagatgatg cgcatcgttt tgcgggcgat 61 ccgtacggca agcgccacat cggaaggctt gtcgttcatc aatacgatgt ccgccgcctc 121 caccgcagcc gcactgccca tggaccccat ggcaatgcct acgtcggcaa gcgccagcac 181 cggcgcgtcg ttgatgccgt cgccggcaaa ggcgaccgtc cggtctttct gcttcgaagc 241 gatcagatcc tttacgcgcg acactttatc ctgaggcatc agctcggcgt gccattccga 301 aaggccgagc gcttttgcga cgtcttgggc gatctccttc ttgtcgccgg tcagcattac 361 tgtgcgggtc acgcccaatg cctgcagcga gctgatcgcc tgtttcgcgt catcttttac 421 gacgtctgcg ataacgatgt gaccctcata gacgccgtcc actgccacat gcaccatcgt 481 gccctggact tcgcagtcct tgtgctgcgc acctgcccgg gtcatcagcc gcgcgttgcc 541 gcaggcgacc tgcttgccat cgaccgtagc gatgatgcct tctccggcga agttctcgaa 601 ctggcccaca cgcgccttat ccgctgtttt tccggtgcgc gcttggtact cctcttccag 661 ggaacgggaa atggggtggt cggagaagct ctctgcagct gctgccagat ccagcagttc 721 ctcttccgtc atgcgttccg gatggactgc aacgacggaa aacacgcctt tcgtaagggt 781 gccggtctta tcgaacacca cggtatccgc cttcgccagc gcttccagat agttgccgcc 841 cttcatcagg atgcccttgg aagaagcgcc gccgatgcct gcgaaaaagc tgagcggtac 901 ggagatgacc agcgcacagg ggcaggacac cacgaggaag atgagcgccc ggtgcaccca 961 ggtcgcccac tgcccggtcg caaggcccgg gaccactgcg agcagcaccg ccagtccgca 1021 aacgatgggc gtatagtagc gggcaaagcg ggtaatgaac tgctccgcct ttcccttgtt 1081 ctctgtcgac tcttccacca gttccaggat gcgggtggcg gtggattcgt cgcaaggctt 1141 ggtgacccgg atcttcagca gtccgttcag gttgatggtg ccggagtaga tctcgtctcc 1201 ctctgccaca tgccgcggca gcgattcgcc ggtgagggcg gccgtatcca ggcgggaatc 1261 cccttctatg acgacgccgt ccacgggcac ccgctcgccg ggtttgaccg tgatgatggt 1321 gccgacttcc agatcgtccg gatccacctg ctgcagctcg ccgttttcgt cttcgatatt 1381 ggcgtagtcc ggccggatat ccatcaacgc cgcgatggac tggcgggact tgtccacagc 1441 cttgtcctga aagtactcac cgatgcggta cagcaccagc acggagatgg cctccaggta 1501 ctcgcccatg gcgagggcgc cgaaggtggc caccaccatc aggaagttct cgtcgaacac 1561 ctggccgttt tttatgttgc gaaaagcctt gcgcaggatc ttatggccga cggccacgta 1621 gatgaccagc gcaatagcca gcttcagata tggattcata gcctacttcg taacgatctc 1681 ccaatccggt tccagcttct ttgtcagggc tttggccgct tccagtactt cctcgaactt 1741 gtcgtcggct gcggtcaggg tcaatttttc cgtcataaaa ctgacagtcg ccttctcgac 1801 gccgggcatc ttgttgaggt tgtcttccag cttggcggcg cagtttgcac agtcgattcc 1861 cttgacttta aaggattttt tcatgatcgg gtcctcccta ctcttttacg tgatccatgc 1921 ccatctgcag gatcgtatgc acgtggtcat cggcgagaaa atagatcacc tgtttgcctt 1981 ccttgcggca gcggatcaga tccatctgtt tgagggtgcg cagctgatgg ctgacggcgg 2041 actgggtggc gccggtcttt tccgtcagat cggcaacgca gagctcgcct tccatgagcg 2101 cgtacagcag cttgatgcgg gtcgtgtccg aaaaggcctt gaacaggtcg gccagatcgt 2161 acagatcctc ttcggtgatg atgcttttgt cttttttctt cggcatgttt cccctccgat 2221 gaacatatga atatctgttc atatttgcat tatatcgggc gggggatgaa atgtcaaccg 2281 aagtagtgaa aaaagatgca cggtatcgta taatgtcgat atcagaatga cccgggagga 2341 gaatcatgac cacggaagaa cgcgcgaaac agatcgtaga agcgatcaaa acagaagaag 2401 gaacggatcc ggcggagatc ttccgccata tggcacggaa ggatttcgtc cgcatgcacg 2461 ggccggaaca tcacattctg gacggcgcag ccatcctgac cgcgtactgc aatgcaggcg 2521 gcgcgatcga cctggaagca gccctgcaga gcatcctgca ggaaggcctc cgcatgcccg 2581 gcgccatgtg cggactgtgg ggcgtctgcg gcgccattgc atccatcggc gctgcgctgg 2641 ccatcatcga cggcaccggt cccctttccg aggacgggtc ctggggcgag cacatggcct 2701 acacatcgga agcgatccgg gagatgggac gggtcaacgg accccgctgc tgcaagcgcg 2761 acgcgatgct ggcgttccgc aacgccgtcg cttacattaa cagccattac gacgtgaccc 2821 ttacatacga ggaaaagcct tgcgagttc // LOCUS sequence145 2844 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence145 VERSION sequence145 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2844 /mol_type="genomic DNA" /organism="" /note="sequence145" CDS complement(208..984) /product="enoyl-CoA hydratase-related protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005901833.1" /transl_table=11 /codon_start=1 /translation="MAFVELEIKGSVGVLTINRPEALNALNDQVISQLGETLDNLDLNT LRCLIVTGSGAKAFVAGADIGQMSGLTKAEGEAFGKLGNDTFRKLETLPIPTIAAVNGF ALGGGCELAMSCDIRLASETAVFGQPEAGLGITPGFGGTQRMARLIGPGKAKELIYSAR NIKAPEALSIGLVQAVYPAEELMPAAEKLANRIAGNAPIAVRACKKAINDGLQVGMDEA VVIEEKLFGSCFETKDQRNAMSAFLEKRPHDPFENC" /locus_tag="LOCUS_4710" /note="WP_005901833.1 enoyl-CoA hydratase-related protein (Fusobacterium nucleatum) [pid:63.5%, q_cov:96.5%, s_cov:96.5%, Eval:2.8e-88]" /note="MGA_672" CDS complement(1065..1949) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MERITKEQIQAWLPKREPDAHKGDFGRILVIAGSRGMMGACILAC RAAFRSGSGLVAACCPPEFFSVVHTGVPEATCVSRDAFDPAKYDAVAIGSGLGVSRENY EMICRILREYAGPVVLDADGLNCLSEYGVPSASETRAHLVLTPHAAEAARLVNASAEAG RPPVTPQDVALDRAFYGKFLAKRLHAACVMKGRGSLICLPDGTVYENTTGNPGMATGGS GDVLTGVTVSLAGQYVAQGVTAESACVLAAVCGVYLHGLAGDIAAEKWGEAGVMAGDIA DGVAIAWKHIDKK" /locus_tag="LOCUS_4720" /note="WP_011109230.1 bifunctional ADP-dependent NAD(P)H-hydrate dehydratase/NAD(P)H-hydrate epimerase (Bacteroides thetaiotaomicron) [pid:40.6%, q_cov:99.3%, s_cov:55.5%, Eval:2.1e-45, partial hit]" /note="MGA_673" misc_feature complement(1950..>2844) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011393448.1:ABC transporter permease" /note="WP_011393448.1 ABC transporter permease (Moorella thermoacetica) [pid:40.5%, q_cov:100.0%, s_cov:89.7%, Eval:5.7e-46]" /note="MGA_674" /locus_tag="LOCUS_4730" ORIGIN 1 ccgcttatcg aaggaagcgg cgagcttgtc cttatgtctc tgcgcagacg ccacgctgct 61 ggcatacatc agagcggtgt gaccattctg agcgaatacc tgtgcgatac cggaacccat 121 ggtgcctgcg ccgaaaattg ctactttcat tttaagttac ctcctaaaat atcgtaaaaa 181 ggtttaaaaa catgtatgtg agactgctta gcagttctca aacggatcgt ggggtctctt 241 ttccaggaac gcgctcatgg cgtttctctg gtctttcgtc tcgaagcagc tgccgaacag 301 cttttcttcg atgacgaccg cttcgtccat gccgacctgc agaccgtcgt tgatggcctt 361 cttgcaggcg cgtacggcga tgggtgcgtt gccggcgatg cggttcgcca gtttttctgc 421 cgcaggcatc agttcctcag cgggatagac tgcctgtaca aggccgatgg acagtgcttc 481 gggagccttg atatttctcg cgctgtagat gagttccttg gccttgccgg gtccgatgag 541 gcgggccatt ctctgggtgc cgccgaagcc cggggtaatg ccgaggccgg cttccggctg 601 accgaataca gccgtttcgg aagcgagccg gatatcgcag ctcattgcca gttcgcagcc 661 gccgcccagc gcgaagccgt tgaccgcagc gatggtggga atgggcaggg tttccagttt 721 tctgaaggtg tcgttgccca gtttgccgaa cgcttcgcct tctgccttgg tcaggccgct 781 catctggccg atgtcggcgc cggcgacgaa ggcttttgca ccgctgccgg taacgatgag 841 gcagcgcagc gtattcagat ccaggttatc cagcgtttcg cccagctggg agatcacctg 901 atcgttcagg gcattgaggg cttcgggtct gttgatcgtc agaacgccga cagatccctt 961 gatttccagt tctacaaatg ccatttaata taatcctcct tacaggtcct tctctgtctt 1021 ccatgatgca tgagaattcc tgcatctccc attatatact ttgtttattt tttgtcaata 1081 tgtttccagg cgattgctac gccgtccgcg atatcccctg ccattacgcc tgcttcgccc 1141 catttttcag cagcaatatc ccctgccaga ccgtgcagat acacgccgca gacggctgcc 1201 agaacgcagg cgctctccgc ggtcacgcct tgggccacat actgcccggc cagggaaacg 1261 gtgacccctg taagcacgtc gccggagccg cccgtcgcca tgccgggatt tccggtggta 1321 ttttcgtaga cggtgccatc cggcagacag atcaggctgc cccgcccctt catgacgcag 1381 gccgcgtgca gcctttttgc gaggaatttt ccgtagaacg cgcggtccaa agctacgtcc 1441 tgcggggtca caggcggtct tcccgcctcc gcggaggcgt ttacgagacg tgcggcttcc 1501 gctgcgtggg gcgtaaggac cagatgcgcg cgagtctccg acgcggaagg cacgccgtat 1561 tctgacagac agttgagccc gtctgcatcg agaacgacag gacctgcgta ctcccgcagg 1621 atgcggcaga tcatttcgta gttctcccgg gagacgccaa gtccggagcc gatggcgaca 1681 gcatcgtatt tcgcggggtc aaacgcatcc cgcgatacac aggtcgcctc cggcacgccc 1741 gtatggacca cggagaaaaa ctctggcggg caacaggcag cgaccagacc gcttccgctg 1801 cggaaagccg cccggcaggc caggatgcag gcgcccatca tgccgcggct gcccgcgatg 1861 acgagaatgc gcccgaaatc acctttatgc gcgtctggct ccctcttggg gagccaggct 1921 tggatctgtt cttttgtaat gcgttccatc tatctttctt ctctgaaata cggaagtccc 1981 aggcttgcgg ggggctgatc ctcccgtttc tggcgcaggg atacgataat gagcacgatc 2041 gccgttacga tgtacggcag cactttatag atctgggacg ggataaagga gaccggcacg 2101 cgcaggtaca tgatcatcag accgccgaac aggatggagc cccagatggc gttgaggggc 2161 ttccacaggc agaagatgac cagggcaacg gctacccagc cttcgccgga cagcgccgtg 2221 tggttccaga ccgtgccggc gatggtcatg gtgtagacca tgccgccgat ggcggagatg 2281 ccgccgccga tgacggtcgc cagatacttg tatttcgtta cgttgatgcc cgctgcgtcc 2341 gccgtggagg ggctttcgcc gacagccttc agatacagtc ctctgcgggt acggttgagg 2401 aacagcgaca tgacgatggc catggcgatg cccagataca cgaacccgtt ataggagaac 2461 agcacctgcc cgaaaaacgg aatgtcctgc agcgccttgg gcaggatggg gttcgcaaac 2521 gaccccttga gcgcgttgga gatggagatg ttgccgccca ccttcaaacg cagctgctcg 2581 cccacgaact ggcccagacc ggtgccgaag atcgtcagcg caagacccgt aacgttctga 2641 ttggccctaa gggagatcgt aaggaagctg aagatgaggg cgccgaacac gccggccagg 2701 aaggagcaga gaagcgcgat gagcaccgcc agaaatccgc tggcggaagc gccggccagc 2761 tggtcgtacc agaacgcgcc ggccagaccg aaggcgccgc ccatgaacat caggccttcc 2821 acgcccaggt tcatgttgcc gctc // LOCUS sequence146 2832 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence146 VERSION sequence146 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2832 /mol_type="genomic DNA" /organism="" /note="sequence146" CDS 3..935 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLLGVLGSEKPWCRYDKIKFLCPVPGYDRHFTICETLGIEMIPVP LTEWGPDMDQIRELVKDETVKGIWCVPKYTNPLGGCYSDEAVKALASMETAAKDFRIFW DNAYCVHYVYEDVPVLNMLEECKKAGHPDRVYMFGSTSKITFPGAGVGFFGASEANVEF IKKQINAEAISWDKMNMLRHVRFFGSAQGILDLMDKHAALLRPKFDAVLNALEEEIGPR GCGSWVRPSGGYFVTFMAPKGCAARVNALCKEAGVTMTGPGATHPYHKDPDDSVLRIAP SFPPAEELQKAMEVFCVAVRLAAVEKLLA" /locus_tag="LOCUS_4740" /note="WP_013224310.1 aminotransferase class I/II-fold pyridoxal phosphate-dependent enzyme (Amycolatopsis mediterranei) [pid:51.5%, q_cov:97.1%, s_cov:72.9%, Eval:9.6e-84, partial hit]" /note="MGA_675" CDS 1025..2038 /product="aspartate--ammonia ligase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011949062.1" /transl_table=11 /codon_start=1 /translation="MSKVIVPENYKAALNPYDTQRAIMLIHSIFEKELCSELDLSRVSA PLMVPTASGLNDNLNGVERPVGFDIKETGEDCQVVQSLAKWKRKALKDYDFHVGKGLYT DMNAIRRDEEMDNLHSVYVDQWDWEKVIRESDRTLNYLKKVVQKIVNAIVDTEDIIREV YPELNVYAPKKRQIKYLTTQELEDMYPDKTAKEREDAVTEQYKTVCLMKIGGALKSGKP HDGRAPDYDDWELNCDILFWNEILHHTIEISSMGIRVSPESLDRQLTIAGCDDRRELPF HKALLAGELPYTIGGGIGQSRLCMLLLGKAHIGEVQSSVWDDDTRKICKEAGITIL" /locus_tag="LOCUS_4750" /gene="asnA" /EC_number="6.3.1.1" /note="WP_011949062.1 aspartate--ammonia ligase (Clostridium botulinum) [pid:57.4%, q_cov:99.4%, s_cov:98.2%, Eval:1.1e-109]" /note="MGA_676" CDS 2069..2827 /product="TraX family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002895510.1" /transl_table=11 /codon_start=1 /translation="MSLVNEKKKGYNQLVLRSIAMVCTILAIASHTVAPTFRFFGYLEW IAFPIFAYLLAEGVENSMARGLYAVRLFLFAVLSEVPYDLMMSGKVMDTRQQNVLFTLF FGYLILLGVDLIRTHADNLILTIVAEVGGIIFGRYLISEMHCAYSRFGMFFIMLFYVAR RVHYEKLMELAVTLYIAFNLSNQTFATPKINGLQYDLSVQLFAVLALILIWLYNGERGP NTLTVRYISYGFFPVSILLFWYLASQGVIY" /locus_tag="LOCUS_4760" /note="WP_002895510.1 TraX family protein (Streptococcus sanguinis) [pid:25.6%, q_cov:93.7%, s_cov:91.7%, Eval:3.4e-14]" /note="MGA_677" ORIGIN 1 ccatgctgct gggcgttctc ggatccgaaa agccctggtg caggtacgat aagatcaaat 61 tcctctgccc cgttcccggc tacgacagac attttacgat ctgcgagacc ctgggcatcg 121 agatgatccc tgtgcctctc acggaatggg gaccggacat ggatcagatc cgcgaactcg 181 taaaggatga gaccgtgaaa ggcatctggt gcgtgcccaa gtacacgaat cccctgggcg 241 gctgctattc ggacgaagcc gttaaagccc tggcatccat ggagaccgcg gccaaggatt 301 tccgcatctt ctgggacaac gcctactgcg tccactacgt ctacgaggac gtgcccgtgc 361 tcaacatgct ggaggaatgc aagaaggcag gccatccgga cagagtctac atgttcggtt 421 ccacctcgaa gatcacgttc cccggcgccg gcgtcggttt cttcggcgca tccgaggcga 481 acgtggaatt catcaagaag cagatcaacg ccgaagccat cagctgggac aagatgaaca 541 tgctgcgcca cgtgcgcttc ttcggttccg cccagggcat cctggatctg atggacaaac 601 acgccgccct gctgcggccc aaattcgacg ccgtgctcaa cgccctggaa gaagagatcg 661 gtcccagagg ctgcggcagc tgggtgcgtc cctccggcgg ctatttcgtc accttcatgg 721 cgcccaaggg ctgtgctgcc agggtcaacg ccctgtgcaa ggaagccggc gtgaccatga 781 caggccccgg cgccacccac ccctatcaca aagacccgga cgacagcgtc ctgcgcatcg 841 cgccctcctt cccgcccgcc gaggaactgc agaaggccat ggaagtgttc tgcgtggcgg 901 taaggctggc agccgtagaa aaacttctcg cttagaagaa aatggaattg cacaatccgg 961 ccggaaagcg taaaattaga tattattttt tatttcacaa gaactgatat agagaggcaa 1021 aaccatgagt aaagtcatcg ttcccgaaaa ctacaaagca gcgctcaacc cttacgacac 1081 gcagagagcg atcatgctca tccacagcat cttcgaaaag gagctgtgca gcgaactgga 1141 cctgagcaga gtttcggcgc ctttaatggt gcccaccgcc tcgggtctga atgacaatct 1201 gaacggcgtg gaacgtcccg tcggcttcga catcaaggag accggtgaag actgccaggt 1261 cgtacagtct ctggcgaaat ggaagcgcaa ggctttaaaa gactacgatt tccacgtggg 1321 caagggtctt tacaccgaca tgaacgcgat ccgcagagac gaagagatgg ataacctcca 1381 ctccgtctac gtggaccagt gggactggga aaaggtcatc cgcgaatccg accgcacgct 1441 caactatctg aagaaagtcg tgcagaagat cgtcaacgcc atcgtcgaca cggaagacat 1501 catccgggaa gtctatcccg agctcaacgt ctatgccccc aagaagcgtc agatcaaata 1561 tctgacgacg caggagctgg aagacatgta tccggacaag actgccaagg aaagagaaga 1621 cgccgttacg gaacagtata aaacggtgtg cctgatgaag atcggcggcg cgttaaagag 1681 cggcaagccc cacgacggca gagccccgga ctacgacgac tgggaactca actgcgacat 1741 cctgttctgg aacgagatcc tgcaccacac catcgagatc tccagcatgg gcatccgcgt 1801 atcccccgaa agtctggaca gacagctcac catcgcgggc tgcgacgacc gcagagaact 1861 gcccttccac aaggcgctgc tggcgggcga gctgccctac accatcggcg gcggcatcgg 1921 tcagagccgt ctgtgcatgc tgctgctggg aaaagcccac atcggcgaag tccagtcctc 1981 cgtctgggac gacgatacga gaaaaatctg caaggaagcc ggcattacga tcctgtaagg 2041 cttctcctct caggaagtta acgtaagaat gagtttagta aacgaaaaga aaaaaggata 2101 taatcaatta gtactgcgga gcatcgccat ggtatgcacg atccttgcga tcgcctccca 2161 taccgtggcg cccacgttcc gctttttcgg ctatctggaa tggatcgcct tccccatttt 2221 cgcctatctg ctggcggaag gcgtcgaaaa cagcatggcc agaggactgt acgccgtccg 2281 tctgttcctg tttgccgtcc tgtccgaagt gccctacgac ctgatgatga gcggcaaggt 2341 gatggacacc agacagcaga acgtactgtt tacgctgttt ttcggctatc ttatcctgct 2401 cggagtcgat ctcatccgca cgcatgcgga caatctcatc ctgacgatcg tagcggaagt 2461 cggcggcatt atcttcggac ggtacctgat ctcggagatg cactgcgcct attccaggtt 2521 cggcatgttc ttcatcatgc tgttctacgt cgcccggcgg gtgcactacg agaagctgat 2581 ggaactggcc gtgaccctgt acatcgcgtt caacctgtcg aaccagacgt tcgcgacgcc 2641 gaagatcaac ggtctgcagt acgatctgtc cgtacagctg tttgcggtcc tcgccctcat 2701 cctcatctgg ctgtataacg gcgaacgggg tccaaacacc ctgactgtcc gctacatcag 2761 ctatggcttt ttccccgtca gcatcctgct tttctggtat ctggcatctc agggcgtaat 2821 ctattaaaat tc // LOCUS sequence147 2819 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence147 VERSION sequence147 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2819 /mol_type="genomic DNA" /organism="" /note="sequence147" CDS complement(224..865) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRFPDAYFITGTAYAGKSTMVKLLAEKYGGILCGENYHNERLEGL DPAEFPGLTYTRDLEDWHDFVRRTPDEYEAWIDRTSKECEILELQMLEDLSKQGRKIFV DTNISVETLRQISDNRHVLIMLADPDVSVRRFFDRPDREKQFLYRLMLEEPDPEASLEN FRQCLMRINSPERCDAFLHCGFPVLLRDEGRTVEQTLALVERSFGLEGNT" /locus_tag="LOCUS_4770" /note="MGA_679" CDS complement(870..2045) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPRPTRCRRIEQMPVYRSFSPDDAPDAETVRMTVDEYEALRLLDD EGLTQEACAAKMNVARTTVTAIYDSARKKIADTIVHGKRLVIAGGRCEYASVDIDQPIR EKGNDMMRIAVSYENGTIFQHFGHTEQFKLYDVEDGKIAAEQIVNTNGSGHGALAGFLK AAKADVLICGGIGGGAQAALQEQGIELCAGASGDADAAVQAYLRGELINTGANCDHHDH HGEGHDCGEHDCGGHDGGCGGCHSPRMEGPNVGKKVRTHYRGTFNDGTQFDSSYDRGEP LEFVCGAGMMIPGFDKAVADMKVGEIRKVHLMPEEAYGIRDLNNVFTLEIQQLPGSQDL NVGERAYLQTMDGRPFEVEVIAKDDKNITLDANHEMAGKELNFEIELVEVL" /locus_tag="LOCUS_4780" /note="WP_010933554.1 peptidylprolyl isomerase (Chlorobaculum tepidum) [pid:45.3%, q_cov:35.0%, s_cov:95.8%, Eval:1.4e-27, partial hit]" /note="MGA_680" CDS complement(2144..2491) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSWMRSVCGRLKSDYRYSKDIVYNNFPWPDPTPEQKVKIEQTAQA ILDARALYPEASLADLYDELTMPPELRKAHQANDRAVMQAYGMPIKETDEAACVAWLMR LYQEKVGELEK" /locus_tag="LOCUS_4790" /note="WP_015613294.1 N-6 DNA methylase (Lactobacillus acidophilus) [pid:66.1%, q_cov:97.4%, s_cov:12.0%, Eval:1.5e-38, partial hit]" /note="MGA_681" ORIGIN 1 tcgtcgcccc gccagcggtt cgacagataa aaatccacgc tgaactctgt gatgtccttc 61 gattcgatca ccttcggcgc gtttgcgtcc gtatgggtcg tcgtgccgcc gtcgatgggt 121 tccggctccg gcgcggcatc ctctttgcat ccgccgagtc cgaaaagcgt cagcaggccg 181 agcaggaccg ccataacgat cactcctttt ctgttcttct tcctcatgtg ttgccctcca 241 ggccgaagct ccgttcgacc agcgccagcg tctgttccac ggtccttccc tcatcccgca 301 gcagcacggg gaagccgcag tgaagaaacg cgtcgcagcg ctccggcgaa ttgatccgca 361 tcaggcactg ccggaaattc tccagtgacg cttccgggtc cggttcttcc agcatcagcc 421 ggtacagaaa ctgtttctcc cggtccggcc ggtcgaagaa gcggcggacg gaaacgtccg 481 gatccgccag catgatcagc acgtggcggt tgtccgagat ctgccgcagc gtctccacgg 541 agatgttcgt atccacgaag atcttcctgc cctgcttcga caggtcttcc agcatctgca 601 gctccagaat ctcgcattcc ttcgacgtgc ggtcgatcca ggcttcgtac tcgtccggcg 661 tcctgcgcac gaaatcgtgc cagtcttcca ggtcgcgggt gtacgtcagg cccggaaact 721 ccgcgggatc cagcccttcc agcctttcgt tatgataatt ctctccgcag aggatgccgc 781 cgtatttttc cgccagcagc ttcaccatcg tcgacttgcc cgcgtaggcg gtgccggtga 841 tgaaatacgc atctgggaac cgcatcgctt tacaggactt ccaccagttc gatctcgaag 901 ttcagctcct tgcctgccat ctcgtggttg gcgtccagcg taatgttctt gtcgtccttc 961 gcgatgacct ccacttcgaa gggacggccg tccatcgtct gcaggtaggc ccgttcgccc 1021 acgttcaggt cctgggaacc gggcagctgc tggatctcca gcgtaaagac gttattcaaa 1081 tcgcggatgc cgtaggcttc ctccggcatc agatgcacct tgcggatctc gcccactttc 1141 atgtctgcga cggctttatc gaagccgggg atcatcatcc ctgcgccgca gacgaattcc 1201 aggggttcgc cccggtcgta ggacgaatcg aactgcgtgc cgtcgttaaa agtgccgcgg 1261 taatgggtgc ggaccttttt gccaacgttc gggccttcca tccggggact gtggcatccg 1321 ccgcagccgc cgtcgtgacc cccgcagtcg tgctcgccgc agtcgtggcc ttcgccatgg 1381 tgatcatggt ggtcacagtt tgcgccggta ttgatcagct cgccgcgcag gtaggcctgt 1441 accgctgcat ccgcatcgcc gctggcacca gcgcacagtt cgatgccctg ctcctgcagc 1501 gcagcctgcg caccgccgcc gatgccgccg cagatcagga cgtctgcctt tgcggccttc 1561 aggaagcctg ccagcgcgcc gtggccgctc ccgttggtgt ttacgatctg ctcggctgcg 1621 atcttgccgt cttccacatc gtacagctta aactgctcgg tgtgtccgaa atgctgaaaa 1681 attgttccgt tttcataact gactgcgatt ctcatcatat cgtttccttt ctctctgatg 1741 ggttggtcga tgtctaccga cgcatattcg cagcggccgc ctgcgatcac caggcgtttt 1801 ccgtgaacga tcgtatccgc aatcttcttt ctggcgctgt cgtatatcgc cgtaacggtg 1861 gtccgtgcga cgttcatctt agccgcgcag gcctcctgcg ttaaaccttc gtcgtccaga 1921 aggcgcaatg cctcgtactc gtccaccgtc atgcgcacgg tctcggcgtc gggtgcgtcg 1981 tccggggaaa agctccggta gacaggcatc tgttcgattc tgcggcagcg ggttggtctc 2041 ggcataggcc ctcctttctg acatatgtca gttatgatgt tatacccggt tttgacttat 2101 gtcaattatt tatatcaccc tgcgcagagg cgggtggagc gcattacttc tccagttccc 2161 ccaccttctc ctgatacagg cgcatgagcc aggcaacgca ggcagcctcg tcggtctctt 2221 tgatgggcat gccataggcc tgcataacag cccggtcgtt ggcctgatgc gccttgcgca 2281 gctcgggcgg catggtgagc tcgtcgtaga gatctgccaa cgaagcctcc gggtagagcg 2341 ctctggcgtc caggatggcc tgcgcagttt gctcgatctt caccttctgt tccggggtgg 2401 gatccggcca ggggaagttg ttgtagacga tgtctttact gtagcgataa tcgcttttta 2461 atcttccaca aactgaacgc atccatgaca tatggcatcc cttattctgc gatatatgtg 2521 ggtagagaag agcgcttttc ttgtgaacgc tgccgtgagc aaggcatgat cgactattgg 2581 aataaagaga agtaattcgc cccccgtttg tgtttttata cttggtatta tgaccatttt 2641 ccctcctaaa taattgtgta ttttattgct ctgataatac ttgctatttc tgccgagtag 2701 agtgatatat gtacacgaca aagggccagg gagcccagat ttaggaggaa agaacatgaa 2761 atacgcagaa tgcaacgccc ggcagaagaa ggccttcaag aatatttttc acgccagca // LOCUS sequence148 2808 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence148 VERSION sequence148 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2808 /mol_type="genomic DNA" /organism="" /note="sequence148" CDS complement(912..1535) /product="epoxyqueuosine reductase QueH" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964885.1" /transl_table=11 /codon_start=1 /translation="MEQKTKKTLLLHACCGPCSSACLERLYPDYDITVFYYNPNITDEG EYRMREEELKHFLQRWQPEGKPTGIAAISGRYDPREYYTCVKGLEQEPEGGARCRACFL LRLEETAKQAAALGFDAFDTTLSVSPYKNSKVLAEIGQSLAETYGVAYLAGNYKKQDGY RRSIELSNEYGLYRQDYCGCEFSKAEAEARRAAKAAQKAVEAAK" /locus_tag="LOCUS_4800" /note="WP_010964885.1 epoxyqueuosine reductase QueH (Clostridium) [pid:50.5%, q_cov:89.9%, s_cov:88.0%, Eval:1.5e-48]" /note="MGA_684" CDS 1569..2486 /product="TIGR01212 family radical SAM protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011461526.1" /transl_table=11 /codon_start=1 /translation="MENTFGSLHYNAIGPYLKRQFGCRVAKLSLDGGFTCPNRDGTKGT GGCTFCSEDGSGRFTGPVSGQMRQLAPKWPEDTKYIAYFQNFTGTYAPAGRLRSLWEEA LSQPGCIGLAVATRPDCLPDDVLDLLSEFNERTFLWVELGLQTANEETADRFNRCWKNA DFEDAMRNLSTRGIKTVIHLILGLPGEDKRQVLSSADYAARFQPFGIKLHMLHLMEGTV MGEAYQNAPFPVLSREEYVSLVCDVLERLPADITVHRVTGDAPRADLIAPLWTGDKRAV LRAIQQEFKRRGTWQGCLCYNQKD" /locus_tag="LOCUS_4810" /note="WP_011461526.1 TIGR01212 family radical SAM protein (Desulfitobacterium hafniense) [pid:45.4%, q_cov:97.7%, s_cov:91.3%, Eval:1.3e-77]" /note="MGA_685" ORIGIN 1 gccctgctcg ctgcggtaga aatcctgtgc agaaggcgtc gcgcttccca gcaccaggac 61 agcgccgtga gccttggcgc gcttcatggc cacttccatg gcatcgtatt tcgcgccgct 121 ctcggattta taggagcttt catgctcttc gtcgatcacg atgaggccaa gtttgtcgaa 181 aggcgcgaac accgcggagc gggcaccgat cacaagatcg acctcgcctc tgcggatctt 241 gccgtattcc acacttttct gcgccggcgt aagcttactg tgcagcaccg cgatgcggtc 301 cttgccgaag cgggccataa accggcttac ggtctggggc gtaagggaga tctccggcac 361 cagcacgatg cccgttcttc cctgctgcag cacggattcc atggcctgca ggtacacctc 421 tgtcttaccc gaaccggtga ccccgaacag cagaaaattc cggttctgcc ggctttcgat 481 ggcttccgcg atctccgcca gcgcgctctg ctgatccgcg ttcagctgct tcggttcttc 541 cggcgcagcc tcgatgccgg cgaagggatc tttcgtcttg cgcttcgcct gggtgttgcc 601 aggcagaaag cactttaccg cctcgatata gcggcagacg tagcggttct tcatccagag 661 ggcggtctcc atcgcttcgg gggtaaggcc ttctccgggg aatgcttcga gcacgtcttt 721 aaaccgcttg acccctgcag ggggctcatc caggatcctg gcgacatacc cttccgtttt 781 gcgatcgtgg atcgagaacg gcactgatac cttgcagcct gctaaaggtt ctgtgtccgt 841 caaatcccac cggtaggtgt acagctcgtc cgttgcgttc gtgttgttgt cgacgacgac 901 ggagacgtag gtcatttcgc cgcctccact gccttctgcg cggctttcgc ggcacgtctt 961 gcttccgctt cggccttgga aaactcgcag ccgcagtaat cctggcggta gagaccgtat 1021 tcattcgaaa gctcgatgga acggcggtag ccgtcctgtt ttttataatt gcctgcgaga 1081 tacgcaacac cgtacgtttc cgcaaggctc tggccgatct ccgccagcac tttggaattc 1141 ttgtaggggc ttacggacag cgtggtgtcg aaggcatcga aacccagcgc agctgcctgt 1201 ttcgccgtct cttcgaggcg cagcagaaaa caggcgcggc agcgggcgcc gccttcgggt 1261 tcttgctcca ggccttttac gcaggtataa tactcccggg gatcgtagcg gccggatatg 1321 gcagcaatgc ccgtaggttt gccttccggc tgccagcgct gcaggaagtg tttcagttct 1381 tcctcgcgca tgcggtattc cccttcgtcc gtgatgttcg gattgtagta aaagaccgta 1441 atatcgtagt ccggataaag acgctctaaa caggcgctgc tgcagggtcc gcaacaggcg 1501 tggagcagca aagttttctt cgttttctgt tccatagagc ctcctttacc aatattttat 1561 tataccatat ggaaaatact ttcggaagtc tgcactacaa cgccataggt ccctatctga 1621 agcggcagtt cggatgccgc gtcgcaaagc tgtccttgga cggcgggttt acgtgcccaa 1681 accgggacgg caccaaaggc accggcggat gcacgttctg cagcgaagac ggcagcggcc 1741 gctttacggg acccgtttcc gggcagatgc ggcaactggc gcccaaatgg ccggaagaca 1801 cgaagtatat cgcctatttt cagaacttta cggggacgta tgcgcctgcc ggcagactgc 1861 gcagcctctg ggaagaagct ctgtcacagc ccggctgcat cgggctcgcc gtagctacgc 1921 gcccggactg cctgccggac gatgtgctgg acctgctgtc cgagtttaac gaaaggacgt 1981 tcctctgggt ggaactgggg ctgcagaccg caaacgaaga aacggctgac cggttcaacc 2041 gctgctggaa aaacgccgat tttgaagatg cgatgaggaa tttatcgacc cgcgggataa 2101 aaaccgtgat tcacctgatt ttaggccttc ccggcgaaga taaacggcag gtcctctcgt 2161 ccgcggacta cgccgcacgc ttccaaccct tcggcataaa gctgcacatg ctgcacctga 2221 tggaaggcac tgtcatggga gaagcgtatc agaatgcccc cttccccgtc ctgagcagag 2281 aggaatacgt atctctggtc tgcgatgtac tggaaaggct tccggcggac atcaccgtgc 2341 accgggtcac cggggacgca ccccgcgcgg acctgatcgc cccgctttgg accggagaca 2401 aacgggcggt gctccgcgct atccagcagg agtttaagcg ccgcggcaca tggcagggat 2461 gtttgtgcta taatcaaaag gattaaaaac aaggagatat tgtcatggct cagctatact 2521 atcgctacag cacgatgaac gcgggaaaat ccatagaatt actgaaggtc gcatataact 2581 acgaagagag aggcaagcac gtgctggtgc tcacgccgtc cttcgatgac cgctacggcg 2641 tgggaaagat caccagccgc atcggcatct cccgggatgc gatcgccatc tccggcgacg 2701 aagacctgct ggagctttat aagaaatacg aagcgcagca gcacatcgac tgcatgctga 2761 tcgatgaatg ccagttcctc aagaagcacc aggtgctgga gttggccc // LOCUS sequence149 2788 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence149 VERSION sequence149 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2788 /mol_type="genomic DNA" /organism="" /note="sequence149" CDS complement(1226..2173) /product="lysine exporter LysO family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005817344.1" /transl_table=11 /codon_start=1 /translation="MYLGSCVLGYFAGLPLRKLRARMGWLDPAQNILVLLLIFAMGLRV GSNEEAVRNIGSYGIYAFAFTAVVLLFSMLSVSIIRRLLGYDRYGEKHGKGAAPKRSED SYAVSGTGSNTLKMVGLVSVGIALSYWLVRSGRVEAETLGSGAGTFITVGLCALLVMIG LSLGLEGKIASDIRSAGQVAFILPLAVAAGTFAGSALCSLFLPLSLRECFAIGSGFGWY SLSSGIILDAGYVVAGTISFMHNVMRELFSVILIPIVAAKCGWLEALGLPGSTAMDVCL PVAARATNARIGICSFVTGFLLSLAVPFVVPLFL" /locus_tag="LOCUS_4820" /note="WP_005817344.1 lysine exporter LysO family protein (Desulfitobacterium hafniense) [pid:30.7%, q_cov:99.4%, s_cov:97.1%, Eval:2.7e-33]" /note="MGA_688" ORIGIN 1 atgccacttt gtactgcacc tgcgttttgc ccgagaccag gtcctgttcc gccagggcca 61 gactgctctc ggcggggccg tcctcccggg tgaccgtcac cagcagcgcg gctgtcccgg 121 cgtttttcag atccgcaaga tcgaagacga actgtgcgcc gccggcttcc ttcagatccg 181 ccctgtaggt cggcatcttt tccatgcctt tgcggcagat ccacacgtaa ccgtcgagcc 241 cggtgccgtt ccggtcgcag acctgcacgt cgatctttcc accgcagcct tcgggcagcg 301 ccggccaggc gagctttacg acatacttgc cgtcttcctt tacgaagcgg gcggacgtta 361 cgacggactg cagataactg cgggccgcat cgtccataaa cgataggact tccgcatccc 421 ccgtcttaac gaggacgcgc tcctcctcgc gctgcagcag ttcttcccgg gtcttcggtt 481 ccgcaggctt tgcgggcacc gggggctccg gttctttcgc aggttccggg tctgccggcg 541 cctccgcgcc ggtgatctgc gccagcgccg tcatcgcagc ggctgcctct gcccgggtca 601 gaaaacccag cggcccgaac gtgccgtcgg gataaccggt gagggcgccg taataggcgc 661 agagcgcgat cggatattcc cgctcatctg ttgcctccac gtccgaaaac aggagatccg 721 cctgctttac gttgcggccg ctcaagccgg ctttgccgag caagcctgcc atgatgagcg 781 ccatatcccg tctggggatg ggttcgtcca ggacgcgcga aggcacctgg gcttcgctga 841 agatctcctg tgccgccgca gcatcgtaga agggtctggc ccagtgggcc ttgtaagggg 901 tcacatcggt gttcgacgtc ccctgcccgc gcatggccat ggcgagaaat tcgccgtagg 961 agacccggcg ggaaggctta aaactgccgt cgggatagcc ggaaacgatg cccagatccc 1021 gggccgtttc cacgtaagac gcaaaccaat ccgtctgccg cacatcggaa aacagagagg 1081 ctgcggagat gggcacggtc agaagaaaga ccagtgccgc tgtgagtagt acggttcttt 1141 tcatcctttc ttcgctccca cgcaaagaaa ctgccattat tatacaggca gtttctggaa 1201 atcgcaagat gaaattggat gatttttaca aaaacagggg gacgacgaag ggcactgcca 1261 gcgagagcaa aaagcccgtc acgaaggagc agatgccgat gcgggcgttg gtagcccggg 1321 cggcgacggg aaggcacacg tccatggccg ttgaccccgg cagccccaaa gcctcgagcc 1381 agccgcattt ggcggcaacg atggggatga ggatgaccga aaacagctcc cgcatcacgt 1441 tatgcataaa ggagatggtc cccgccacca cgtagcccgc atccaggatg atgccggagc 1501 taagggaata ccacccgaag ccggagccga tggcgaaaca ttcccgcagg gaaaggggca 1561 ggaacaggga gcaaagcgcg gagcctgcaa aggtgccggc ggccacagcc agcggcagga 1621 taaaggcgac ctgacccgca gaacggatgt cggaagcgat cttgccttcc aaacccaaag 1681 acaggccgat catgacgagc agcgcgcaga gacccacggt gatgaatgtg ccggcgccgc 1741 tgcccagcgt ttccgcttcc acgcggccgc tgcggacgag ccagtagctg agggcgatgc 1801 cgacggagac cagacccacc atcttcaggg tattggagcc ggttccggag acggcgtaac 1861 tatcctccga acgcttggga gcggcacctt tgccgtgctt ttccccatag cggtcgtagc 1921 cgaggagacg ccggatgatc gagacggaga gcatggaaaa aagcagcacg actgcggtaa 1981 aggcaaaggc gtagattccg taagagccga tgttgcggac ggcctcttcg ttggatccca 2041 cgcggagacc catggcgaag atcagcaaga gcaccagtat attctgggca gggtcgagcc 2101 agcccatccg cgcgcgcagt ttgcgcagcg gcaggcccgc aaagtatccc aacacacagc 2161 tacccaaata catcacagca tcttgcataa aaaaagtccc tttctgctca ttttggggca 2221 tccggggact attgtaccat aatgatcagc ttatttcacg cgttcgtcgt acaggaacag 2281 catccagccg tgggcttcgt ccgccgcaaa gttctgcagc tgttcgtagg tggcgtgcag 2341 ggtgggatag acgtggtctg cgccgttcgc atcggtgtag gtctcgatgg ccgtcgtgat 2401 gttgtgctcc cggccgaagg ctaccagcaa ctctgcgact tccggatcgt ccggatccag 2461 ctgcacctcg tctttaaaga tatccaccca cacgcggtag accgcatcgt ctccgtattc 2521 cttcatggct gcccgcaggg gctcggaata accggcctcg ccgttcttcg gcgccgcata 2581 gcagccgtcc ggcgcgtccg gataggcgga caccagcgtc ttgccgttat acgcatccgc 2641 gtccataccg gcgtatgcat aactatcgct ggtcggcatc tccacccctt ccgtgggcag 2701 aggttcggtt tccgcaggag ctgcttcgtc gagttccgcc acctctgccg gttcttcggc 2761 catttccggc gcatcctctt cctcggca // LOCUS sequence150 2784 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence150 VERSION sequence150 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2784 /mol_type="genomic DNA" /organism="" /note="sequence150" misc_feature <1..585 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011393325.1:selenium metabolism-associated LysR family transcriptional regulator" /note="WP_011393325.1 selenium metabolism-associated LysR family transcriptional regulator (Moorella thermoacetica) [pid:34.0%, q_cov:98.5%, s_cov:63.2%, Eval:3.4e-20, partial hit]" /note="MGA_690" /locus_tag="LOCUS_4830" CDS complement(735..1898) /product="pyridoxal phosphate-dependent aminotransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011016536.1" /transl_table=11 /codon_start=1 /translation="MLKYVDRRGTNCSKWDGLEGVYGEKDLLAMWVADMDFEIAEPIRK AVGNYVDNVPWGYYDPSPSYKQAFIDWEKKYHGYEVKPEWICFSNGIVSAFYWVTCMAA KPGEAVILLAPIYYPMMDGVKFNDRKLVLCDMIHDGNTYRVDYEKFEKQIVENDVKLFI MSSPHNPVGKIWTKEELKTLMDICRKHNVLVVSDEIHQDFEWNGHVHTPTATVGDYDDM LITMCAVSKTFNLASCQNSFIIIPDEKLREQYLTFARNVHGTGGNGFGYVAVEAACREG RPWFEEVKKQIWENYCYVRDTFAKELPDVTVADLQGTYLLWLDFGKYFKTQEEIKAFMQ GKCKLAFDYGNWFGRGGDDYCGFVRMNLATSLENVKEACDRMIKNLK" /locus_tag="LOCUS_4840" /note="WP_011016536.1 pyridoxal phosphate-dependent aminotransferase (Fusobacterium nucleatum) [pid:43.1%, q_cov:99.0%, s_cov:95.7%, Eval:1.6e-94]" /note="MGA_691" CDS 2094..2381 /product="30S ribosomal protein S6" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966984.1" /transl_table=11 /codon_start=1 /translation="MNKYELMFIVEPSLDDAKKDEVVEAVKAIIAEGGEVLDTDVWGMR KLAYPIQKKTEGYYVVMHFNAKPELPKELDRRLRISDNFMRHIIINLDEE" /locus_tag="LOCUS_4850" /gene="rpsF" /note="WP_010966984.1 30S ribosomal protein S6 (Clostridium) [pid:52.6%, q_cov:98.9%, s_cov:100.0%, Eval:1.0e-21]" /note="MGA_692" ORIGIN 1 ccgtccggct acatcctgcc gcggcttctg gaagggttcc gcagcgaatc tccggacgtg 61 gtcatctcca tccgccagtc cgacagcgag gagatcgagt ctgctgtgga acagggcgcc 121 tgcgatatcg gactcgtcgg cgaagaagcc ggcggcggtc tggtgagcaa acccatcgcg 181 gaggacaaga ccgtgctgat cacgccaaac acgcctgcgt tcaaaaagat gatcaaggcg 241 aaggatctga acgctctgct ttcccagccg atgctgttcc gggaaaaagg cagcgccagc 301 cgcaaaagcg cggagaagct gctggaactg ttaggcaagg atctgcagga cgtggacgtg 361 gcagccagtc tgaacgatca ggaagccatc aagaacctgg tggaacacgg cttcgggatc 421 tcgttcatct cggcgctggc cgcggaagac agggtgcggg aaggaaggct gctcctcttc 481 gacacggggc ttgccgaggc aaagcgcacg ttctacctca tccgccgcaa aaacgtgcag 541 ctctccgaaa cggcggagga gttcgtgaag tatatttgta aatagggcgt cttcggaccg 601 tttcgaaccg ctcggcaagg gaagattgcc tcgcttgtcc gaaacggctc ctcaaccgcc 661 tcataattgc taaaaaggcc ctgtccgctt tggacaaggc cttttataaa gcaattcagt 721 agcggccgag gacgctattt cagatttttg atcatcctgt cgcaggcttc cttcacgttc 781 tccagggacg ttgccaggtt catgcggacg aacccgcagt aatcgtcgcc gccgcggcca 841 aaccagttgc cgtagtcgaa ggccagcttg cacttgccct gcatgaatgc cttgatctcc 901 tcctgcgtct tgaagtactt gccgaagtcg agccacagca ggtaggtgcc ctgcaggtct 961 gcgacggtca cgtcgggcag ctccttcgcg aacgtgtcgc gcacgtagca gtagttctcc 1021 cagatctgct tctttacttc ctcgaaccag gggcggcctt ctctgcaggc ggcttccacc 1081 gccacgtagc cgaacccgtt gccgccggtg ccgtgcacgt tgcgggcgaa ggtcagatac 1141 tgctctctga gcttctcgtc cgggatgatg atgaaggagt tctggcagct ggccaggttg 1201 aaggtcttgg agacggcgca catggtgatc agcatgtcgt cgtaatcgcc gacggtcgcg 1261 gtcggggtat ggacgtggcc gttccactcg aagtcctgat ggatctcgtc ggagaccacg 1321 agcacgttgt gcttgcggca gatgtccatg agggtcttca gctcttcctt cgtccagatc 1381 ttgccgacgg ggttatgcgg ggaggacatg atgaacagct tgacgtcgtt ctccacgatc 1441 tgcttttcga acttctcgta gtcgactctg taggtgttgc cgtcgtggat catgtcgcac 1501 agcaccagtt tgcggtcgtt gaatttgacg ccgtccatca tcgggtaata gatgggcgcc 1561 agcaggatga cggcttcgcc gggcttcgcg gccatgcagg tgacccagta gaacgcggag 1621 acgatgccgt tggagaagca gatccactcc ggtttgactt cgtatccgtg atacttcttc 1681 tcccagtcga taaacgcctg tttatagctg gggctgggat cgtaatatcc ccagggaacg 1741 ttgtccacgt agtttccaac ggctttgcgg atcggttccg cgatctcgaa gtccatatcc 1801 gcgacccaca tggccagcag gtccttctcg ccgtatacgc cttccaggcc gtcccacttg 1861 gaacagttcg tccctcttct gtctacgtat ttcagcatat ttcctaacct ccaatgatat 1921 atagaaagag ctgtttttat cctcttaaaa tatagcattt ttgtgttgca attcaaagca 1981 cccctatgta taatgtatag gcattcgtct gctcgggaga tcccgccgcg gacgaagctc 2041 tctgccgcag gggagcactg cggccgcaaa acagaccata gggaggtgaa agaatgaata 2101 agtacgaact gatgttcatc gtagaaccca gcttagacga cgccaagaaa gacgaagtgg 2161 tggaagccgt taaggcgatc atcgcagagg gcggcgaagt gctcgacaca gatgtctggg 2221 gtatgcgcaa gcttgcttat ccgatccaga agaagaccga aggttattac gttgtgatgc 2281 acttcaacgc aaagcccgag cttccgaagg aactggacag aagactccgc atttccgaca 2341 acttcatgag acacatcatc atcaatctgg acgaagaata gagagggaca ttatgaattc 2401 tgtttgctta gtaggaagac ttacgagaga cccggaagtc cggtatggct ctcagtccca 2461 gatggcgatc gccagattct ccatagccgt ggaccgtacg atccccgacc gcaacggaga 2521 aagacagaca gattacccca atatcgtgtg ctttggaaag agcgccgaat tcgtcgagaa 2581 gtattttaag aagggaatgc gcgtcggcgt caccggaagc ctgcgcaccg gttcttatac 2641 caataaggac ggcgccaagg tcttcacgac ggaagtcgcc gcggaccgcg tcgagttcat 2701 ggaaagccgt gccgaaagag agggccgcga ggccaccggt aatttcggcg gaaacttcgg 2761 aggaggctac agccagccgg cacc // LOCUS sequence151 2771 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence151 VERSION sequence151 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2771 /mol_type="genomic DNA" /organism="" /note="sequence151" misc_feature <1..570 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011948262.1:fructose-1,6-bisphosphatase" /note="WP_011948262.1 fructose-1,6-bisphosphatase (Clostridium botulinum) [pid:52.4%, q_cov:100.0%, s_cov:28.1%, Eval:4.7e-48, partial hit]" /note="internal stop codon at [568:570](+)" /note="MGA_694" /locus_tag="LOCUS_4860" CDS 678..1460 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKHARKLRLTSLCLCLCLLLAGAAPVYGLSEDDALTLTFDHIAAH VQPPQAVNGFTDAQVIQYFVEVAMYSEYEGYRGYLMRYEQPRKYCFLGSPDEEDKAQVR ALVAELNQIVGCPDLTETANVNEADIKIMFSDQASYESYFSLRVPAGSWGYASVWYYDQ GYYLGELTATNIWISNDAWPRRDRNSVIAEEFIQGLGLLNDPEYGYYSIFDQNRNDCDW PSELDWAVVNLLYHPWMDRTASESQVRETAQMILDSWK" /locus_tag="LOCUS_4870" /note="MGA_695" tRNA complement(1595..1671) /product="tRNA-Arg" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0090" /note="Aragorn_9" tRNA 1785..1859 /product="tRNA-Gly" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0100" /note="Aragorn_10" tRNA 1895..1971 /product="tRNA-Pro" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0110" /note="Aragorn_11" CDS 2102..2539 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MENNTKRALSVIFAFLLLMSIFPAAAFANGSTESGETLVAVSIEA VAEFEQSEASRNGGAETWALMNVILCVVTFLAAIAALRIRDGRIRTIAILAAAAALVTT AVTQNFGTHIILADKWTVLMAVYAAGCSALNEMRSSKKPRE" /locus_tag="LOCUS_4880" /note="MGA_696" ORIGIN 1 ggcaaggaat ggttcgacta cgccgaccgg ctggtgcgca ctggttactt cggcaaagct 61 tcggacaaga acaagcagag gggcatcgac tttttctggt atctgtggtg cggctataaa 121 tcgccgctgt tcggcaagaa gaagatcacg acgttcgagc gtctgttcgt ggaggacgag 181 agcacctggg tggaggccaa gaacccgtat tacaaactga tcgaaaagcc cggttccgaa 241 gccatcgtag agcatatcct ggcggatttc ggatgcgaca ccgtcaacgg catcatcatc 301 aacggccaca tgccggtcaa gaagggcgcc aacccgatca aggcgaacgg cagggcgatc 361 tgcatcgacg gcggattcgc gaagccttac cagaagacga cgggcatcgc gggctactcc 421 ctcatccaga actcctacgg ctttatcctt accgcccacg aggccttcga atccaaggcg 481 aaagccgtac agcaggagct ggacatccac tccacgcagg tcgcgcggga ggacatctcc 541 atccgcatgc tcaacaagga tacggactag ggtgcggaga tccaggaaaa gatcgacgga 601 ctcaagatgc tgctggaggc gtatcacacc ggccttatcc cgcagacggt aaagcagtga 661 ccctatagga ggatcccatg aaacacgcga gaaaactgcg gctgacaagc ctgtgcttgt 721 gcctctgtct gcttttggcg ggggcagcgc cggtctatgg tctgtcggaa gacgacgcgt 781 tgacccttac attcgaccat atcgccgccc acgtccagcc gccccaggcg gtgaacgggt 841 ttaccgatgc gcaggtcatc cagtactttg tggaagtcgc catgtacagc gaatacgaag 901 gctaccgggg ctacctgatg cgctacgaac agccgcggaa atactgcttc ctgggctctc 961 cggatgagga ggacaaggcc caggtgcggg ctttggtcgc ggaactgaac cagattgtcg 1021 gctgtccgga cctgacggag acggcaaatg taaacgaagc tgatataaag atcatgtttt 1081 cggatcaggc gtcgtatgag agctatttct cgctgcgggt gcccgccggc agctggggct 1141 acgccagcgt ctggtattac gaccagggct attacctggg cgagctgacc gcgacgaaca 1201 tctggatctc caacgatgcg tggccgcgcc gcgaccgcaa ctccgtgatc gcagaggaat 1261 tcatccaggg actgggtctg ctgaacgatc cggaatacgg ctattacagc atcttcgacc 1321 agaaccgcaa cgactgcgac tggccctccg aactggattg ggctgtcgtc aatctgctgt 1381 atcacccctg gatggaccgg accgcttcgg aaagccaggt ccgcgagacc gcgcagatga 1441 tcctggatag ttggaaataa aaaaatccga caggatcgct cagccgtcgc ctgcggctcg 1501 gcttcgcgtg aacctgctcc ggttcgaatc ctttcgatca taactcgaga aaaaacgatc 1561 ccggtcgctg acgcttccgg gattgttttt tctctggtgt atccgacagg attcgaacct 1621 gcggcctttg gagtcggagt ccaacgctct atccagctgg gctacggata catggtactt 1681 tgatagtata acacaagttg atgagaaaat ctaaaaaaat gtacttgaaa taagaaatat 1741 cttttgctat actaatatgc gtcgccggca aagacggcag acatgcggaa gtggctcagg 1801 ggtagagcat cgccttgcca aggcgagggt cgcgagttcg aatctcgtct tccgctccaa 1861 tttttttata aaagtgcagt tcttctgcac atatccgggt gtagcgcagt ttggtagcgt 1921 gcttgactgg gggtcaagag gccgtgggtt caagtcccgc cactcggacc atcacaacac 1981 agaactttcg ggttctgtgt ttttttttag aaaatgcggg aacattcctt tatgcggaac 2041 gtctaacgag tgtaagacaa aaccaaacgc aggacgtttc gaaccataaa ggagaacaga 2101 aatggaaaac aatacgaaga gagcgctatc cgttatcttt gcctttcttc tgctgatgag 2161 catcttcccg gcagcagcat ttgcgaacgg cagtaccgaa agcggcgaaa cgctggtagc 2221 tgtcagcatc gaggctgtag cggaattcga gcaaagcgaa gcatcccgga atggcggcgc 2281 agagacctgg gctcttatga acgtcatcct gtgtgtggtc acctttctgg cggccatagc 2341 agccctccgg atccgggacg gaaggatccg caccatcgcc atcctggctg ccgctgcagc 2401 gctcgttacg accgccgtga cccagaactt cggaacccac atcatcctgg cagataagtg 2461 gaccgtcctg atggcagttt acgcagccgg atgctccgcc cttaacgaga tgagatcctc 2521 caaaaagcct agagaataag caaataggaa tataattaca aagaatccca cacctgaaag 2581 cggccctcct cctggccgct tttcccttgc agggctttat ggtatactgg tagggcagct 2641 tgccttggca ggctgcgatc ccaacgtatc aaaggagttt tatctatgac cgttttcgaa 2701 gcaaaagaga aactgacagc gcttcagcgc aagatggctg cttacgagca tgcgcagagc 2761 ctgctgtatt a // LOCUS sequence152 2759 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence152 VERSION sequence152 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2759 /mol_type="genomic DNA" /organism="" /note="sequence152" CDS complement(545..1255) /product="CoA transferase subunit A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002983642.1" /transl_table=11 /codon_start=1 /translation="MKNKMVTAAEAVSAIKDGDMIAVGGFLGTGSPEILMDALVAQGTK HLTVIANDGGLNEENAPTNGKLKGIGKLLANHQIDHLIASHIGVNPEINRQIAAGTLTY ELFPQGSLAEKLRAAGAGLGGVLTPVGLGTPMEKDWQGNAKEIIEIDGVRYLLEKPLRP KFALVRADYCDKYGNFTMLRATKNFNHVMAMAAEHTLLASEKVYEIGEKDPDEYQFSGV YVEKIVEGEKPWEI" /locus_tag="LOCUS_4890" /note="WP_002983642.1 CoA transferase subunit A (Streptococcus pyogenes) [pid:42.3%, q_cov:96.2%, s_cov:98.6%, Eval:1.3e-44]" /note="MGA_699" CDS complement(1351..2130) /product="B12-binding domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005902977.1" /transl_table=11 /codon_start=1 /translation="MSNFTTATSTVDLTKIKPYGDTYNDGKVQMSFTLPVPDGEEAQEA ARQYAKLMGMDEPSVTHHSDLGIGYTFFVVYGPVHHTVDYTKIRVTKVESHVFDRVECG EWIAKNIGRTITMVGASTGSDAHTVGIDAIMNMKGFHGHFGLERFKNVNAINMGSQVPN EELIAKAIEVNADAILVSQTVTQKDVHIKNLTNMVELCEAEGIRDHMLLLCGGPRISHE LAQELGFDAGFGPETYAEHVCSYVMQEIVARGWVNKK" /locus_tag="LOCUS_4900" /note="WP_005902977.1 B12-binding domain-containing protein (Fusobacterium nucleatum) [pid:61.0%, q_cov:95.0%, s_cov:93.5%, Eval:4.7e-83]" /note="MGA_700" misc_feature complement(2130..>2759) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011015881.1:D-lysine 5,6-aminomutase subunit alpha" /note="WP_011015881.1 D-lysine 5,6-aminomutase subunit alpha (Fusobacterium nucleatum) [pid:71.0%, q_cov:99.0%, s_cov:39.8%, Eval:2.2e-79, partial hit]" /note="MGA_701" /locus_tag="LOCUS_4910" ORIGIN 1 agggtgagct tgccgtcgat gtacttcata acgcccattt cggtgatgat ctcatcgact 61 accttttctg cggtgagggg cagcgtgcac ttcttcatga tcttgtagtt gcccttctgg 121 gtgtgggtca tcgcgatgat aaccttctta gcgccgcaga ccaggtccat agcgccgccc 181 atacctgcaa cagccttgcc cgggatgatc cagttggcca ggttgccttc ttcgtctacc 241 tgcatagcgc ccagaacggt tgcgtctacg tggccgccgc ggatgatgga gaaggattct 301 tcggaaccga agaagttagc gtacggagtg taggttaccc agttcccgcc gctgtcgatg 361 actctgtagt cttccttgcc cggttcagcc ttgccggaca ggccggtgaa gccgttctcg 421 gactgcaggc aaatgtctac gccttcggga aggtagctgg tgcacatggt cggaagacca 481 atgccgaggt tgacgacgtc gccgtcatgg aattcctgcg ccgctctctt ggcgattcta 541 gcttttaaat ctcccatggt ttttctcctt ctacgatctt ttctacgtat acgccggaga 601 actgatattc gtcaggatcc ttttcgccga tctcgtatac cttttcggat gccagcaggg 661 tgtgctcagc agccatagcc attacgtggt tgaagttctt ggtagccctc agcatggtga 721 agttaccata cttgtcgcag tagtctgctc ttacgagagc gaacttcgga cggaggggct 781 tctccagcag atagcgaacg ccgtcgatct cgatgatctc cttagcgttg ccctgccagt 841 ccttttccat aggagtacca aggcctaccg gggtcagaac gccgcccagg cctgcgccgg 901 cagctctcag cttttcagcc agagatccct gcgggaacag ttcgtaagtc agagtgcctg 961 ctgcgatctg tctgttgatc tcggggttaa cgccgatgtg ggaagcgatc aggtggtcga 1021 tctggtggtt agccaggagc ttgccgatgc ccttgagctt gccgttggtc ggagcgtttt 1081 cttcgttcag gccaccgtcg ttggcgataa cggtcaggtg cttggttccc tgtgctacga 1141 gagcgtccat caggatctcg ggggaaccgg tgccaaggaa tccgccgact gcgatcatgt 1201 cgccgtcttt gatggcagat acagcctcag cagctgttac cattttgttt ttcataaaaa 1261 tctcccttta actatataag atgcttctga agtcgacggt ccctgagccg tgtcgaaggg 1321 accgccgctg cagaaaattt ataccgaaag ttacttcttg ttgacccatc cacgggcgac 1381 gatctcctgc atgacgtagg agcaaacgtg ttctgcatag gtctcgggac cgaaaccggc 1441 gtcgaagccc agctcctgcg ccagctcgtg ggaaatacgg ggaccgccgc acagcagcag 1501 catgtggtcg cggatacctt ccgcttcgca cagctctacc atgttggtga ggttcttgat 1561 gtgaacgtcc ttctgggtta cggtctggga aacgaggatg gcgtcggcgt tgacctcgat 1621 ggccttcgcg atcagctctt cgttggggac ctgggaaccc atgttgatgg cgttgacgtt 1681 cttaaagcgc tccagaccga agtggccgtg gaagcccttc atgttcatga tcgcgtcgat 1741 gcctacggtg tgggcgtcgg aaccggtgga tgcaccgacc atggtgatgg tgcggccgat 1801 gttcttcgcg atccattcac cgcattctac gcggtcgaat acgtgggatt ctaccttcgt 1861 aacgcggatc ttggtgtagt ccaccgtgtg gtgaacgggg ccgtagacta cgaagaaggt 1921 gtagccgatg cccaggtcgc tgtggtgggt cacggagggt tcgtccatac ccatcagctt 1981 cgcgtactgg cgggcagctt cctgcgcttc ttcgccgtcg ggtacgggca gggtaaagct 2041 catctgaact ttcccgtcgt tgtaggtatc gccgtaaggc ttgatcttgg taagatcgac 2101 ggtgcttgta gcagtcgtga agttactcat tacttggcac ctcccagcat cttttcgata 2161 aacggattga agtagaaatc gttgtccttc gtggctacgc cttccagacc cttgccgccg 2221 tcgaacggtc tcttgactgc ggcgaattta cctgcctcga tggtcgggaa caggccgtcc 2281 ttttcgatct gagccagcag ctcgtctgcg tcgtgcagaa ccttctgggc tctcttctgg 2341 atgatgccgt ctttcttata ttcgatctcg tcgcccaggt ggcgtgcgtt attgaatacg 2401 tacttggcgt tctcgatgga cagcatacgg tcctggagga acggggtgtg aatggcttcg 2461 gtgagcatgc ccagcagctg cagggactga cccgtccaga cggagaccag gttgaacaga 2521 gcatcctgga tatggccgcg gaagatgttg ccggtcatga acttcgtggg aggcatgtac 2581 ttcagggaag cgttggggaa gatctctctt gccatctgcg cctgggacag ctccagcagg 2641 aagccgtctt cggtcatggg atccatttcg aacgcgtggc ccagacccat ctgccattcc 2701 tggatgttgg ccagaacagc gaactgttcg ttgatcatct gggaagccag aacggtgtg // LOCUS sequence153 2738 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence153 VERSION sequence153 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2738 /mol_type="genomic DNA" /organism="" /note="sequence153" CDS 2..1138 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLGVATVILVLPSLLLLADKWVAKWHHKPLIPDLEGLNEHTIRRR WVFVLIAAILFVPAVYAKNNAAVYYKLDESLPQDLPSIVANHRLKDEFGMSVSHFAVVS DDLTAAQLAEMEGRIEAVDGVTDLISYHKLLGSGIPEFFVPEELRSMVKAGGHQLMMIN SEYDTASDEVSQQVAQLRTILKDYDPDAMLTGEAVLTDDLIVTTAVDFRTTNYISMAAI FLIIAIVFKSVTVPLVLVAVIELAIFINLGIPYFTGSEVAFITPTVISCVQLGATVDYA ILMTSRFQDELRAGKDRFEAIRIAAKASDPAIITSSLVMLCATLGVSFVSSIDLIGSIC TMLARGSVISAVMSIVFLPAILCAAEPLFRRTSYHWLG" /locus_tag="LOCUS_4920" /note="WP_164930970.1 MMPL family transporter (Dictyoglomus turgidum) [pid:29.1%, q_cov:80.7%, s_cov:44.1%, Eval:1.7e-32, partial hit]" /note="MGA_702" CDS 1251..2558 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKYLSILLCLALCASMAACSSGEPTPEPEEPAVSGEPEDQVKLI AENKDLWLVTDVNEADQYQYAVTDLDENGRLELIATITEGSGQFSTTHFYEVSEDFSKL EPLEYAYGETHSEPDIGWYNALRCYKGEYGNFVIAMDEMRNGYAENYYTQDLIVLKDGV VDAHSISYCMVLAEDSNGDGEPEMHAYYYTSGGDQEEELTSEQFATSVDDFFGYDYDRY VMDVEWQRFSAEERDSEVDIPAALLDSWKAFGFRKDMDEFNGLFVAPSSYYEELYENGE KADITYGMESLADYWQLVEAATELEVRTAEDFGELDCHLIIGQDGMADFYWNDPADARG EISLEGMPISMAEDGMGQAAEEPAEAADPEVTEAPADENAAGWMVVFNTEDGLNRFEAT IGPDDGRLYVNWYWWSEEDPGADPQIMKLTFTNGVA" /locus_tag="LOCUS_4930" /note="MGA_703" ORIGIN 1 cgtgctgggc gtcgccaccg tcatcctggt gctgccttcg ctgcttctgc tggcggacaa 61 atgggtggcg aagtggcatc acaagcccct cattccggac ctggaaggcc tgaacgagca 121 cacgatacgc cgcagatggg tcttcgtgct catcgcggcc atcctgttcg ttcctgcggt 181 ctatgcgaag aacaacgcgg cggtctatta caagctggat gaatctctgc cccaggacct 241 gccctccatc gtggccaacc accgtctgaa ggacgaattc ggcatgtccg tgagccattt 301 tgccgtggtc tccgacgacc tgacggcagc gcagctggcc gagatggaag gccggatcga 361 ggcggtggac ggggtcacgg acctcatctc ctaccacaag ctgctgggca gcggcattcc 421 ggaattcttc gttcccgaag agctccgcag catggtgaaa gccggcggcc atcagctgat 481 gatgatcaac tcggaatacg acaccgcatc cgacgaggtt tcgcagcagg tcgcacagct 541 gcggaccatc ctgaaggact acgacccgga cgccatgctg acgggcgaag ccgtgctgac 601 ggacgacctg atcgtgacca cggccgtgga tttccgtacg acgaactaca tctccatggc 661 ggccatcttc ctgatcatcg ccatcgtgtt caagtccgtt acagtgcctc tggtgctggt 721 ggcggtcatc gagctggcca tcttcatcaa cctgggcatc ccgtacttta cgggaagcga 781 agtggcgttc attacgccga cggtcatcag ctgcgtgcag ctgggtgcca cggtggacta 841 cgccatcctg atgacgagcc ggttccagga cgagctgcgg gcgggcaagg accggttcga 901 ggccatccgc atcgcggcaa aggcgtctga cccggccatc atcaccagtt ccctcgtcat 961 gctgtgcgcc acgcttggcg tgtcctttgt gtcgtccatc gacctgatcg gttccatctg 1021 caccatgctg gccagaggat ccgtcatctc tgcggtcatg agcatcgttt tcctgccggc 1081 catcctgtgc gcggcggagc ccctgttccg caggaccagc tatcattggc tcggataacg 1141 gccacgcaat tttctcattt ccctgaggcg gagcattcgt gctccgtctc ttttttatgg 1201 tatacttata ctgagaaaga attgtcccgc agcaaaaggg ggaggaacgc atgaaaaagt 1261 atctcagcat tttgctttgc cttgcgctct gcgcgtcgat ggcggcctgt tcgtccggcg 1321 aacccacgcc cgaaccggaa gagcccgctg tcagcgggga gccggaggat caggtaaagc 1381 tcatcgcaga aaataaagac ctgtggctgg tcaccgacgt gaacgaggca gaccagtacc 1441 agtacgccgt aacggatctg gacgaaaacg gccggctgga actgatcgcc actattaccg 1501 aggggagcgg ccagttctcc acgacccatt tctacgaagt aagcgaggac ttcagcaagc 1561 tggagcccct ggaatacgcc tacggcgaga cccacagcga accggacatc ggctggtata 1621 acgcgctgcg ctgctacaag ggcgagtatg gcaacttcgt gatcgccatg gacgagatgc 1681 gcaacggcta cgcggaaaat tactataccc aggacctgat cgtcctgaag gacggcgtcg 1741 tggatgccca ctccatctcc tactgcatgg tgctggcgga ggattccaac ggcgacgggg 1801 aaccggagat gcatgcctat tactacacct ccggcggtga ccaggaagag gagctcacct 1861 ccgaacagtt cgcgacttcc gtcgacgact tcttcggcta cgattacgac cgctatgtga 1921 tggacgtgga gtggcagcgc ttcagcgcag aggaaagaga cagcgaagtg gatatccctg 1981 cagcgctgct ggattcctgg aaggctttcg gcttccgcaa ggatatggac gagttcaacg 2041 gcctgttcgt ggcgccttcg tcctattacg aggaactgta cgaaaacggc gaaaaggccg 2101 acatcaccta cggcatggag agcctggctg attactggca gctggtcgag gccgccacgg 2161 aactggaagt ccgcacggcg gaagacttcg gcgagctgga ctgccatctg atcatcggtc 2221 aggacggcat ggcggatttc tactggaacg atcccgcgga cgcccggggc gagatcagcc 2281 tcgaaggcat gcccatctcc atggcggagg acggcatggg gcaggctgcg gaggaaccgg 2341 cggaagcggc cgatccggaa gtgacggaag cgcccgcgga cgaaaacgcg gcaggctgga 2401 tggtcgtgtt caacacggaa gacgggctca accgcttcga ggccaccatc ggccccgatg 2461 acggcagatt atatgttaac tggtattggt ggagcgaaga ggatcccggc gcggatccgc 2521 agatcatgaa gttaacgttt acgaacggtg tcgcgtaaca ccggggaggt gctccatgaa 2581 gaaatggttt gcaattttcc ttgcagctgc gatggtcttc ggacttgccg cctgcacgtc 2641 ttccgaaaac accccggaag tggaacagga accggaagtc gtccgcagcg acgtgcccgc 2701 agaggaccag atcgatgtga tcgtcgccag taaggatc // LOCUS sequence154 2717 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence154 VERSION sequence154 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2717 /mol_type="genomic DNA" /organism="" /note="sequence154" CDS 47..853 /product="pyrroline-5-carboxylate reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009898446.1" /transl_table=11 /codon_start=1 /translation="MDKKILFLGGGNMAEGIIGGLLKHKVFEPGNITVYDVIPARLEYL KNTYGLQTTDKGIAAAADQDVVFLAVRPQDVDNACRGLDAYLRPDTIVMSIISSTDIAK LESCAGKGAKIARIMPNTLIKTGNGFSAAAVNGNVDEGDKKTITAVLDALGQTMYIREE MFDRFTAYSCAGPMFLYMMAHALIEAGIHCGFSKKESYDIVIKNMIGTGENLDLTGSHP LQLIDTMTSPAGVTIESLKVLEEEAFTGIVMKAMEAGVKRAEDMGK" /locus_tag="LOCUS_4940" /gene="proC" /EC_number="1.5.1.2" /note="WP_009898446.1 pyrroline-5-carboxylate reductase (Clostridioides difficile) [pid:32.7%, q_cov:99.3%, s_cov:99.6%, Eval:1.8e-40]" /note="MGA_705" CDS 855..1340 /product="Cys-tRNA(Pro) deacylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000710860.1" /transl_table=11 /codon_start=1 /translation="MKKDSTEKTNVMRLLDQKKAAYKVHSYASTGAISGVDVAAALGQD PARVFKTLVTVGKTGQHYVFVIPVAKELDLKKAAKAAGEKSIEMIKSKELLPLTGYIHG GCSPLGMKKFFPTCIDQTAEHCETICFSAGKIGYQVEMSPETLAKMIRYSFADLTEE" /locus_tag="LOCUS_4950" /gene="ybaK" /note="WP_000710860.1 Cys-tRNA(Pro) deacylase (Bacillus cereus group) [pid:47.2%, q_cov:99.4%, s_cov:100.0%, Eval:1.1e-35]" /note="MGA_706" ORIGIN 1 gcggaaaaat acaaggtgga ataaacgaac ccgtaaggag ggcataatgg ataagaagat 61 cctgttttta ggcggcggca atatggcgga aggcatcatc ggaggcctcc tgaagcacaa 121 ggtttttgaa ccgggaaaca tcaccgtata cgatgtgatc ccggcaaggc tggaatatct 181 gaaaaatacc tatggcctgc agacgacgga taagggcatc gcggcagcag cagatcagga 241 tgtggtgttc ctggcggtac gcccccagga cgtggacaac gcctgccggg gactggatgc 301 ctatctgaga ccggacacca tcgtcatgtc catcatctcc agcacggata tcgcaaaact 361 ggagagctgt gccgggaagg gcgcaaagat cgcccgcatc atgcccaata ccctcataaa 421 gaccgggaac ggcttctccg ctgctgcggt caacggaaat gtcgacgagg gggataaaaa 481 gacgatcacg gctgttttag acgccttagg acagacgatg tacatcaggg aggagatgtt 541 cgaccgcttt acggcttaca gctgcgccgg ccccatgttc ctgtacatga tggcccacgc 601 cctgatcgag gccggcatcc actgcggctt ctccaagaaa gagagctacg atatcgtcat 661 caaaaacatg atcggcaccg gggagaacct ggatcttacc ggaagtcatc cgctgcagct 721 gatcgatacc atgacgtctc ctgccggggt cacgatcgaa tccctgaaag tcctggaaga 781 ggaagccttt accggcatcg tcatgaaggc gatggaggcc ggcgtaaaac gcgcggagga 841 tatgggaaaa taagatgaag aaagattcca cagaaaaaac aaacgtcatg cgcctgctcg 901 atcagaagaa ggcggcgtat aaagtgcata gctatgccag caccggggcg atctccgggg 961 tggatgtggc agccgcgctg gggcaggacc ctgccagagt cttcaaaacg ctggtgaccg 1021 tcggcaagac aggacagcac tacgtgttcg tcattccagt ggcgaaggaa ctggacctga 1081 agaaggcagc gaaagcggcg ggggagaaga gcatcgagat gatcaagtcc aaggaactgc 1141 tgcctctgac aggctatatc catggcggct gctcacccct aggcatgaag aagttcttcc 1201 ccacctgcat cgatcagacg gcggaacact gcgaaaccat ctgcttttcc gccgggaaga 1261 tcggctatca ggtggagatg agcccggaaa cgcttgcgaa aatgatacgg tattcttttg 1321 cggatctgac agaagagtaa cgatccgata gaagacggcc ccaaacagag agagggattc 1381 tctctgtttt tatttaccaa aaagtggttg ctaaattctg gaacgtaaga tagaataatg 1441 taaattattg ctagtacaag aagaaagagg tttatatgta cgcgagagta cttacatcct 1501 gcctttatgg cctgtcggga gagcctacct gggtggaagc agatgtggac aacggactgc 1561 cgggcttttt tatggtggga cttgcggacc aggccatccg ggaagcgaag gaacggatcc 1621 ggtccgctat ccgaagcgga gggcacaagt tcccggacaa acggatcacg gtaaacctta 1681 ctcctgcgaa caagaaaaag gagggaagcc atttcgatct tccgatcgcc ataggcgttc 1741 tgctcgcatc cgaatccgtc ctatgccggg gcgatctgtc caaaacggcg tttttgggcg 1801 agcttacgct ggatggacgc gtgcagccct gcgagggtgt gctgcccatg gtcatcggtt 1861 tgcagcgccg cggcatcggg cgggtcgtcc ttccgcaggc caacgcagcg gaagcggggc 1921 tcgtcaaggg catggagatc atgccggtag agacgctggg agaggcggca gagttcatcg 1981 aaggcggact cgcgttaaaa gccttcatcg cggaagggta tcagccggac gatcttccgg 2041 tccaggcgcc ggatttcgcg gatatccgcg gtcagcagac cgtaaagagg gcagcgcagg 2101 tagctgctgc cgggggtcac gggctgctga tgatcggccc gcccggcgta ggcaaaagca 2161 tggccggcaa gcgcattccc ggcattttgc cgcctcttac ctacgaagaa cagctggagg 2221 tgacccagat ctacagcgtc gcgggtgaat tggatgctca gaggcctttt cttacggagc 2281 ggccgtaccg ggcgccgcat cataacatgt cgccggcggc gctggcaggg ggcggcaccc 2341 atccaaaacc cggggagatc tccttgagtc actgcggcgt gctgttcctg gacgaactgc 2401 cggaatttgc gccgtccgcg ctggagtgtc tgcggcagcc cctggaggat ggacagatca 2461 cgatttccag ggcaggcggc cgctgcacct atccggcccg gtttatgctg gtcgcggcca 2521 tgaatccctg ccgctgcggc tacttcggag accctgtcaa ggtctgcacc tgtaacgaaa 2581 gcgaccgcaa acgctatctg aacaaggtct ccgggcctct tttagaccgc atcgacatgc 2641 atgtggcggt agagcggacg acataccggg agatgagcgg tccgggacct gcgatcgctg 2701 cgccgccgga cgaagca // LOCUS sequence155 2711 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence155 VERSION sequence155 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2711 /mol_type="genomic DNA" /organism="" /note="sequence155" CDS complement(893..1213) /product="V-type ATP synthase subunit F" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986934.1" /transl_table=11 /codon_start=1 /translation="MYRIAVIGGSDTVIGFKALGLDTFPVNSAEEASAAFKQVFQGDVP YAIVYIEETWAQSLQSAIHKFRSDPQLAIILIPGREGSLGLGRQALKDAVEKAVGSDIT GE" /locus_tag="LOCUS_4960" /EC_number="7.1.2.2" /note="WP_011986934.1 V-type ATP synthase subunit F (Clostridium botulinum) [pid:37.9%, q_cov:97.2%, s_cov:99.0%, Eval:3.1e-15]" /note="MGA_709" CDS complement(1206..2189) /product="V-type ATP synthase subunit C" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986935.1" /transl_table=11 /codon_start=1 /translation="MSKIRDNDYLCISAMLRGKEAHMIGADAFARMAEAENAQAAAKIA EEYGYTDLDLSTPQTVDASLGRIRAAVYEDLAGILPQRALLDLFRLKYDYHNAKILVKN ASRDQDVSGMLSSEGRLSVDEIRELFASETASGVLKDAMTEAADTLAKTQNPQLSDFGL DLAYFKEMRACAQQLGGTSEDYIRLLIDCANLNSYVRSVRMGKSADFLKFALTEGGSID PDVLLNRWPDTDVTDLYAGTALESASKFAGEAMGGWKITPFELACDNALTACLADTRYV PFGADAVVSYLASLDTEIMDLRMVLSGKICGISTEAIKERLRDVNV" /locus_tag="LOCUS_4970" /EC_number="7.1.2.2" /note="WP_011986935.1 V-type ATP synthase subunit C (Clostridium botulinum) [pid:26.1%, q_cov:95.4%, s_cov:96.4%, Eval:5.0e-30]" /note="MGA_710" ORIGIN 1 atgtcggagg tgttggcgat gagcacggta cgcttcatca gaggctcgcc gttatgcggg 61 tcgatgagtt cggggaattc gttgagtacg tccgtcatct cgttgccgcg ctcgccgcag 121 ccgatgtaga tgacgatatc cacgtcggac cacttagcca gctggtgctg gaccaccgtc 181 ttaccggagc cgaagggccc ggggacggcc gctgtgccgc ccttcgccag ggggaacagg 241 gtgtcgatga tgcgctgacc cgtggaaagc gggatctccg gcacgaactt tttaacatag 301 ggacgggcca cgcgcaccgg ccacttctgg gccatggtga gttcgcggat ggtgccgtct 361 tccgtttcga tctttgcaat gacctcgtcc acgttgaaca tgccgccccg gatctccttc 421 agggtgccgt ctgcaccaag gggaaccatg atgcggtgtt cgatggcgct ggtctcctgg 481 accgtgccca ggaaatcgcc ggcctttaag acgtcccctt ccttggcggt gggaacgaac 541 tcccaggtct tttcccggga gagggccggt acggagatgc ctctggcaat ggtatcgccg 601 gagagcttac ggatctccgt cagaggacgc tggatgccgt cgtagatgcc ttccagcatg 661 cccggcccca gttccacgga cagagggtat cccgtcgttt ccacgacggc gcccggtccc 721 agacccgagg tctcttcgta gacctggatg gaggcgctgt ctccggtcat gttcaggatc 781 tcgccgacca gatgctgttc gccgacccgt actacgtccg ccacgttggc atcggacagg 841 ccgtctgcca ccaccagcgg accggatact ttgattactt ttccgctcat acttactctc 901 ctgtgatatc ggaacccacg gctttttcca cggcgtcctt cagggcctgt ctgcccaggc 961 ccagacttcc ttcccgtccg ggaatgagga tgatcgccag ctggggatcg cttctgaatt 1021 tatggatggc agactgcagg ctttgcgccc aggtctcctc gatatatacg atggcgtaag 1081 ggacgtcgcc ctgaaacacc tgtttgaacg cggcggatgc ctcttctgcc gagttcaccg 1141 ggaacgtatc caggcccagg gccttgaacc cgatgacggt gtcgctgccg ccgatgactg 1201 ctattctata catttacgtc acgcagcctt tccttgatcg cctctgtgga gatgccgcag 1261 atcttgcccg acagcaccat gcgcagatcc atgatctccg tatccagcga cgccagatag 1321 gagactaccg catccgcccc gaagggcacg tagcgggtat ccgccaggca cgcggtaagc 1381 gcgttgtcgc aggcaagttc gaagggcgtg atcttccatc cgcccatggc ttctcccgca 1441 aatttcgagg cgctttccag cgctgtcccc gcatacagat ccgttacgtc cgtatccggc 1501 cagcggttta gaagcacgtc cggatcgatg ctgccgccct ccgtgagcgc aaacttcaga 1561 aaatccgcgc tctttcccat gcggacggac cgcacgtagg aattcaggtt ggcgcagtcg 1621 atcagcagac ggatatagtc ttccgaggtg ccgcccagct gctgtgcgca ggcccgcatc 1681 tccttgaaat acgccaggtc gagaccgaaa tccgaaagct ggggattctg ggtcttcgcc 1741 agcgtgtccg ccgcttccgt catggcgtcc ttcagaacgc cggaagcggt ctcggacgcg 1801 aacagttccc ggatctcatc gaccgagagc cgcccttccg aagaaagcat gccggacaca 1861 tcctgatccc gggatgcgtt cttcaccagg atcttggcgt tgtgataatc gtatttcagc 1921 cggaacagat ccagcagcgc gcgctggggc aggatgcccg ccagatcctc ataaacagcc 1981 gcacggatgc gtccgaggga tgcgtccacc gtctggggcg tgctcagatc cagatccgta 2041 tagccgtatt cttccgcgat ctttgccgct gcctgggcgt tttccgcctc tgccatgcgg 2101 gcgaaggcgt ccgcgccgat catgtgcgct tcttttcccc gcagcatggc ggagatgcag 2161 aggtaatcgt tatccctgat cttggacaaa ccgtacctcc tctcttaccc gaacagcatc 2221 gccgcgacct ggggcacgag ggcgtctttg ccggcatcga tcagcgtacc gatgctgcag 2281 ttcgtctcga cgctgccgga gcggagcttg catccgcctt cgatgtctgc aggttcgctg 2341 cacagcgtaa gctgcgccgt cttccctgct ttggccagcg cctcgttgat ctcatcgcac 2401 agtccctggc cgtagcgggc cagatccttc gcgttcagca ccagttcttc ttttccggaa 2461 acgctggcct tgcttgccag ttttacgaga aatgcccggt aagcctgttc atccatgttc 2521 agcagttcct gctgcgcagc ctcgaaagcc ttctgcatta aagactgctt ttcctccagc 2581 agcgcgctgc gggcccgcat gtccgcttcg cccttcatgc gcttgatcag ctcgccggct 2641 tccttttccg ctgcttccag gatggatgcg gccgcgtctt tggcctgttt ctcgtattgg 2701 gcatcgatga c // LOCUS sequence156 2687 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence156 VERSION sequence156 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2687 /mol_type="genomic DNA" /organism="" /note="sequence156" misc_feature <1..721 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003428218.1:recombinase RecA" /note="WP_003428218.1 recombinase RecA (Clostridioides difficile) [pid:65.0%, q_cov:89.1%, s_cov:64.1%, Eval:5.5e-80, partial hit]" /note="MGA_712" /locus_tag="LOCUS_4980" CDS 864..1358 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MYAVVVTGGKQYRVCPGDKIRVEKLNVEAGESVCLDKVLVLGGEG ETMVGAPYVEGAAVDAEVVANGKADKVIIFKYKAKKDYRKKQGHRQPYTELKINGISVN GEVKAKAEEAPKAEAAEAPVDLKSMKKAELAEFAAAKGIEVDSKLKKEEMIAAIEAALN K" /locus_tag="LOCUS_4990" /note="WP_011392094.1 50S ribosomal protein L21 (Moorella thermoacetica) [pid:55.3%, q_cov:62.8%, s_cov:99.0%, Eval:3.1e-25, partial hit]" /note="MGA_713" CDS 1383..1643 /product="50S ribosomal protein L27" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000916187.1" /transl_table=11 /codon_start=1 /translation="MASKKGVGSSKNGRDSEAKRLGVKRADGQFVSAGTILVRQRGTKI HPGNNVGIGGDDTLFAKQDGVVKFERKDKTRKQVSVYSQEA" /locus_tag="LOCUS_5000" /gene="rpmA" /note="WP_000916187.1 50S ribosomal protein L27 (Bacteria) [pid:79.3%, q_cov:95.3%, s_cov:87.2%, Eval:3.1e-31]" /note="MGA_714" ORIGIN 1 gaaggggatc ggcgtcgaca tcgacgacct gctcgtatcc cagcccgata ctggcgaaga 61 tgccctggag atctgcgaaa tgctggtgcg ttccggcgcg atctccgtgg tggtcatcga 121 ctctgtcgct gcactggtgc cgaaggccga gatccagggc gacatgggcg attcccacgt 181 aggtctgcag gcaagactca tgtctcaggc cctcagaaag ctcaccggcg tcatcaacaa 241 gctgcgcgaa aagttcggcg tcatgttcgg caatcccgag acgacgaccg gcggcagagc 301 gctcaagttc tacagctccg tgcgtctgga cgtgcgccgc atcgaatcca tcaaggtggg 361 cgacgccatc gtaggtaacc gcacccgcgt taaagtcgtt aagaacaagg tggcgcctcc 421 gttcaagatg acggaattcg acatcatgta cggcaagggc atctcccgcg cgggcgacgt 481 gctggactgc tccgtggaag caggtctgct ggaaaagagc ggtgcctggt acagctatgc 541 cggcgaacgc atcggacagg gcagggagaa cgtcaagaac tatctggacg aacatcccga 601 actcatggcc aagctggaag agcagatccg cgccaaatac gtggcaaaga aggacgatac 661 gctggtggac gattccgatt ccatcaaggt cgatgcagac ggtgtcgtca tcgaagaata 721 atttcaaaaa gggcgaaaat ctttcttgac actgcatccg caaaccttta tactatttgc 781 gttgccgctc tgaacgggta ctttttaagt gtctgaaaaa gaccaccccc gatggcgaga 841 ccggatagag gaggtaaaat atcatgtatg cagtagtagt taccggagga aagcaatacc 901 gcgtttgccc cggagacaag atccgtgttg agaaactcaa cgtagaagcc ggcgaatccg 961 tatgcctgga caaggtcctg gtcctcggag gagaaggcga gaccatggtc ggcgcaccct 1021 atgtggaagg cgctgccgta gatgctgaag tcgttgcaaa cggcaaggca gacaaggtca 1081 tcattttcaa gtataaggcc aagaaggact atcgcaagaa gcagggtcac agacagccct 1141 acaccgagct gaagatcaat ggcatctctg taaacggcga agtcaaggca aaggctgagg 1201 aagctcccaa ggcagaagca gcggaagctc ccgtagacct gaagtccatg aagaaggccg 1261 agctggctga attcgcagcc gctaagggca tcgaagtgga ttccaagctc aagaaggaag 1321 aaatgatcgc agcgatcgaa gccgcgctca acaagtagtc aagggatcgg aggtaaaaac 1381 ttatggcaag taaaaaaggt gtaggcagct ctaagaacgg ccgcgattcc gaggcgaaac 1441 gtcttggagt caagagagca gacggtcagt tcgtcagcgc aggaacgatc ctcgttcgcc 1501 agagaggaac caagatccac ccgggcaaca acgtaggcat cggcggagac gataccctgt 1561 tcgcaaagca ggacggcgtc gtcaagttcg agagaaaaga caagacccgc aagcaggtca 1621 gcgtttattc tcaggaagca tagttctcac aggcctctgg caattccaga ggccttgctt 1681 tttctcagag gaaactcatg tttgtagata aggcaacgat cttcatcaag tcgggcaagg 1741 gcggaaacgg ttccgtgtcc ttccgcaggg aaccctatat tccccagggc ggtccggacg 1801 gcggaaacgg cggcaagggc ggcgacatcg tcatccaggc cgaccgcaac ctgcgcacct 1861 tgatggattt ccgttataaa agaaaatacg aggcggagag cggagaagac ggcagaggcc 1921 gccagcagtt cggcaaggac ggcgcggatc tggtcatcaa ggttcccgtc ggcaccgtgg 1981 tgcgcgacac tgaaagcaac gcggtcatgg cagacctgac ggaggacggc cagtccttcg 2041 tggcagccaa aggcggcaga ggcggcaaag gcaacgtcat gttcaagaat tccgtccgcc 2101 aggcgccgaa tttcgccgaa gccggcggat ttgccaggga acggcagatc gagctggagc 2161 tcaagctgat cgcggacgtg ggcctcgtgg gctatcccaa cgtgggcaaa tccacgctgc 2221 tgtccgtatc caccagcgcc aaccccaaga tcgcgaatta ccacttcacg accatcacgc 2281 cgaacctggg cgtcgtatcc atgtacgact ccagcttcgt catggcggat attccggggc 2341 tcatcgaagg cgcttcggaa ggcgcaggcc tcggcctgga ctttctgaag cacatcgaac 2401 gcacgcgcat cctcatccac gtggtggacg tatccggaag cgagggcaga gatccgaagg 2461 aagatctgga caagatcaac gcagaactgg ctggctacag cgaaaaactg gcgaagaagc 2521 cccagatcgt ctgcgccaac aagatcgaca tggcggatga cgagatctat gaggaattca 2581 aggcctacgc ggaaagcaag ggctacgacg tctatccctg cagcgcaccc atccacgagg 2641 gcgtggacga gctgctgcgg gccgcttata agctgctgct ggagacc // LOCUS sequence157 2660 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence157 VERSION sequence157 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2660 /mol_type="genomic DNA" /organism="" /note="sequence157" CDS complement(244..1704) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKEDQKRMPLYEAILEYNEKSPAFFHIPGHRYERGINETWRAKVG DEIFKFDLSETPLTDDLHHASGPIKEAEQLAAELWGADYTHFLVNGSTCGNQAMVVTAS HGGAKIAIPRNAHKSVLMGLIIGGGKPVYIMPQIEPEWGLHGGITPGQVEEMFRQNPDC KGVLVVSPTYYGITSDLEGIAKVCHAHDAILMVDEAHGAHCYFSEKLPRGAIEQGADMA VQSIHKVTGSLTQSSMIHIKSDRVTKNLLEANLTLVQSTSPSYILMTSLDCARQHMALH GAEMIDRAVELSDDARKRINRIPGMSCAGKELIGRAGIHDLDTTRLIISADDIGITGFE LKKMLFDEYDVEVELPDYRNVVAIVTYANEQDEIDKLVEALEDISRRFAPEGEPLPPGE KLPPQPDYVLSPRAAYFLERERVPWVETRGRIVAEMIAPYPPGIPVIYQGERMSAEVWD YIEAFRQRNGHIHGPSDPTLSTLLVIKE" /locus_tag="LOCUS_5010" /note="WP_005903647.1 aminotransferase class I/II-fold pyridoxal phosphate-dependent enzyme (Fusobacterium nucleatum) [pid:42.3%, q_cov:99.8%, s_cov:62.2%, Eval:4.0e-120, partial hit]" /note="MGA_717" CDS complement(1794..2204) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPDFIKKLYDKYFHQLLRFGIVGCTVTALDFIMLHLFVERVKIWY LAAAALAFTISTIINYILSMTFVFKGREGRDKKEEFIVFAILNLIGLGLTTLLMWLLVD KAGLYYMFAKVFTSATVMFWSFFSRKIFLEQR" /locus_tag="LOCUS_5020" /note="MGA_718" ORIGIN 1 cgtcgcctcc gccagatcga taccgtcttc gcacagcagg ctgccccggc ttcccgtggt 61 gatgcctatc acttttacgt cgattccttt gtccgagagg atctgttcgt gcgtcttctg 121 caggatgcgg gcaaaggctt tgcctgccac gccgtatccc agcatcagaa ctttgcattg 181 cttcattcca tcgcctcctc ttcccgtaaa aaaaccgcat tccaaaagaa tgcggtataa 241 gatctattct ttgatgacga gcagcgtaga caacgtcggg tccgaaggtc cgtggatgtg 301 gccgttcctc tggcggaacg cctcgatgta atcccagact tcggcgctca tgcgctcgcc 361 ctggtagatg acggggatgc ccggcggata gggagcgatc atctcggcga cgatacggcc 421 tctggtctcc acccagggaa ctctttcccg ttcgaggaaa taggcggctc tcgggctcag 481 cacatagtcc ggctgaggcg gcagcttttc gccagggggc agcggttccc cttccggtgc 541 gaaccggcgg gagatatcct cgagcgcctc taccagcttg tcgatctcgt cctgctcgtt 601 ggcataggtg acgatggcga ccacgttgcg gtagtccggc agctccactt ccacgtcgta 661 ttcgtcgaac agcatcttct tcagttcgaa accggtaatg ccgatatcat ctgcagaaat 721 gatgagtctc gtggtatcca gatcgtggat gccggctctt ccgatgagtt ccttgcctgc 781 gcaggacatg ccgggaatgc ggttgatccg tttgcgggcg tcatcggaaa gttccaccgc 841 ccggtcgatc atctccgcgc cgtggagcgc catgtgctgg cgggcacagt cgagagacgt 901 catgaggata taggacggcg acgtgctctg caccagcgta aggttcgcct ccagcagatt 961 ctttgtgacc cggtcggatt tgatgtggat catggaactc tgcgtcaatg acccggtcac 1021 tttgtggatg ctctgcaccg ccatgtccgc gccctgttcg atggcgcctc tgggcagttt 1081 ctcagagaaa taacagtgcg cgccgtgggc ttcgtccacc atcaggatgg cgtcgtgcgc 1141 atggcagacc ttcgcgatcc cttccagatc gctggtgatg ccgtaatatg tcggcgaaac 1201 gaccagtacg cccttacagt ccggattctg ccggaacatc tcctccacct ggcccggcgt 1261 gatgccgccg tggagacccc attccggctc gatctgaggc atgatataga ccggcttgcc 1321 gccgccgatg atgagtccca tcagcacgga tttgtgggcg ttgcggggaa tggcgatctt 1381 agcgcctccg tgggacgcgg tgaccaccat agcctggttg ccgcaggtgc ttccgtttac 1441 taaaaaatgc gtataatccg caccccaaag ctcggcagcg agctgctcgg cttctttgat 1501 gggaccgctg gcatggtgca ggtcgtcggt gagcggcgtt tcggagagat cgaacttaaa 1561 gatctcatcc cctactttcg cccgccacgt ctcgttgatg ccccgctcgt aacggtgccc 1621 gggaatgtgg aaaaacgcag gacttttctc gttatattcc aggatagcct cgtataaagg 1681 catgcgcttc tggtcttctt tcatcgccgg tatcagctcc tttattttat aaaaatcgcc 1741 ccggcccgaa cagaccgagg cacaatttca ttatggactt ttctgggtaa aagtcaacgc 1801 tgctccagga atattttgcg ggagaaaaag ctccagaaca tgacggtggc agacgtaaag 1861 accttggcga acatgtaata aagtccggcc ttgtccacca gcagccacat gagcagcgtc 1921 gtcagcccca gaccgatcag attgaggatg gcaaatacga taaactcctc cttcttgtcc 1981 cgtccttccc tgcccttgaa tacgaacgtc atggacagga tgtagttgat gatcgtggag 2041 atcgtgaacg ccagcgccgc cgctgccaga taccagatct tcacacgctc cacaaagaga 2101 tgcagcatga taaaatccag cgccgttacc gtgcatccga cgatgccgaa gcggaggagc 2161 tggtgaaaat atttatcgta aagcttcttg atgaaatcag gcattgggca gttcgatctc 2221 gattcctttc tcggtatacg ttattacgtc tttgtccatg tacagcgtat cgataaagtc 2281 cagatattcg cggatggagg caaacggcgg ctcgtactgc gccaggatct ccttcgcctt 2341 ggctgcgcca tccgatagca gcgcgtcggc gataaagagt tccgcttttg ccgggttcac 2401 gcaggctctt tccgggtccg ccacgcagaa atcgatgccg tggcccagcc ccgtgtggcc 2461 gttcgcgtag aactgcacgc cgggcatcac catcgtaagg tcgccgaagt ccgaagaccc 2521 cttgctccag gcgttgtggt cgaactttac tttttccttg ccggagagat cctcgcagca 2581 cttctggcac agatccatga acatgtggtc gtggtactcc gtcgcgtagc cgggcatgtc 2641 gcagatatgc agctgcgcac // LOCUS sequence158 2644 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence158 VERSION sequence158 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2644 /mol_type="genomic DNA" /organism="" /note="sequence158" misc_feature <1..558 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000503960.1:amidohydrolase" /note="WP_000503960.1 amidohydrolase (Bacillus cereus group) [pid:40.2%, q_cov:91.4%, s_cov:32.0%, Eval:1.3e-31, partial hit]" /note="MGA_720" /locus_tag="LOCUS_5030" CDS 600..1313 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MALTALLAVSVCGCKASVDPAQAEAAQAAKEAQQAAENGTTAEEA EAETIEDLYNEAGLTPAAEDDPLWADAEFELPAIAQLLAYKATFADTFNENDPSADDFW TVTAMGVVAIPPENATDPFKIVHAKEALVLDYSAALLPSYEPGDAAPKLEDVYGISGNP RSDIIDIDSLSINVESSIVLLGTDEKNGNTVMRVHIEDKEGLITQTDWDVLVERWGDGA EHALPLKVVQFYNVN" /locus_tag="LOCUS_5040" /note="MGA_721" CDS 1324..1767 /product="DUF523 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009932058.1" /transl_table=11 /codon_start=1 /translation="MRKKKLLISNCLLGIPCRYDGSCKKIDCLDALDEKYNLIGVCPEE LGGLETPREPSEIFLGRVLTKSGRDVTYEYDYGADVVLSIVKGHAITKALMQDRSPSCG CGVIHNGKFDGGLVEGDGVTVKLLKANGVEVIPASRAEELLEE" /locus_tag="LOCUS_5050" /note="WP_009932058.1 DUF523 domain-containing protein (Listeria monocytogenes) [pid:41.1%, q_cov:89.1%, s_cov:95.9%, Eval:5.1e-25]" /note="MGA_722" ORIGIN 1 agaaagaaca atccgggctg cggcaagggc agagacggca tcatccactg ccagatcatg 61 aatccggacc agtacgaaaa gatgaaggac atgggcctca tcgggtacat ccagcccatc 121 ttcctgaatt acgactataa gatcctggtg gacagagtcg gagaagagaa agccgcgacg 181 agctacggct ggaagaccat gttcgacatg ggcatccccg cttgcggcgg ttccgactgc 241 ccggtggagg acatgaacat cctgcagaac atccactgcg cggtcacccg caagggcaac 301 gacctgaatc ctcccggagg atggcagccc gagcaggatc tgacggtgga gcaggcggtc 361 tccctgttta cgactcaggc agcctatgcg gcctggagag aagattgggc aggcagcatc 421 aaagccggca agtccgcgga cttcgtcgtc atcgacaagg atatcttcgc catcgaaccg 481 gacgatattc tgaagaccaa cgtagagcgc acgtacgtca agggaacctg cgagtactgc 541 gcggaaaagg aaagataaca ggacacatgc attcagagaa actgaaaaaa ctttgctgca 601 tggcgctgac cgcattgctt gcggtcagcg tttgcggctg taaagcatcg gttgaccccg 661 cccaggcgga ggcggcgcag gctgccaagg aagcgcagca ggccgcagaa aacggaacga 721 ccgcggaaga ggcagaggcg gaaacgatcg aagatctgta taacgaagcc gggctgaccc 781 ctgcagcaga agacgacccg ctgtgggcgg acgccgaatt cgagctgcct gccatcgcac 841 agctgctggc gtataaggcg acgtttgcgg atacgttcaa cgaaaacgat ccgtctgccg 901 acgacttctg gaccgtaacg gccatgggcg tcgtggcgat cccgccggaa aacgcaacgg 961 atccgtttaa gatcgtccat gcgaaggaag cgctggtgct ggattattcc gcagcgctgc 1021 tgccttccta cgagcctggc gatgctgcgc cgaaactgga agacgtgtac ggcatctccg 1081 gcaatccccg ctcggatatc atcgatatcg attccctcag cattaacgtg gaatcctcca 1141 tcgtgctgct gggaacggac gaaaagaacg gcaacaccgt catgcgggtg cacatcgagg 1201 acaaggaagg gctcatcacc cagaccgact gggacgtgct cgtcgagcgc tggggcgacg 1261 gcgcggaaca cgcgctgcct ttaaaagtgg tgcaattcta caacgtgaat taagagagat 1321 atcatgagaa agaaaaaact gctcatctcc aactgcctgc tgggcattcc ctgccgctac 1381 gacggcagct gcaagaagat cgactgcctg gatgcgctgg acgaaaagta caacctgatc 1441 ggcgtctgcc cggaggaact gggcggcctg gagaccccga gagaaccctc cgagatcttc 1501 ctggggcggg tgctcacgaa gagcgggcgc gacgttacgt acgaatacga ttacggcgcg 1561 gacgtcgtgc tgagcatcgt aaagggtcac gccattacga aggctctgat gcaggacaga 1621 agcccttcct gcggctgcgg ggtcatccat aacggcaaat tcgacggcgg cctcgtagaa 1681 ggcgacggcg ttaccgttaa gctgctgaag gctaacggcg tggaggtgat cccggccagc 1741 cgggcggaag agctgctcga agagtagaac gtgacaaggg acagccatgc ttcgctgccc 1801 ctttattgtg ttgaaaatgc ataaatattc atcattgcat aaatatgtct tctgcgatat 1861 aatggaccca taggaatcta acacctgttt gtatagaaaa ggagaacccc atgaagaaca 1921 agagaatcga ccttatcggc gccaagatcg accagggcgc ctccaagcgc ggcgtctgca 1981 tcggacccga agccatccgc ttcgccggca tctgccaggg catccgcgat ctcggttacg 2041 aactgaacga caagggcaac ctcgtgcagc tcgacagcgg ccgcaccagc gaaaaactgc 2101 gcaattacga tcaggtgatc gatatgaata agcgcctgta cgaaagcacg aaacagagcc 2161 tggaagaggg cgcgttccct atcatgctgg gcggcgacca ctccgcagca gctggcaccg 2221 caagcgctgt tgccaaggct catggcggca atatcggcat catctgggtg gacgcccacg 2281 gcgactggaa taacgacgag tcttctgaga ccggcaacat gcacggcatg cccttctccg 2341 ccctgtgcgg ctggggtccg gactgcatgg tggactatgg ccagggtccc gctttcgttg 2401 acccgaagca ttgcgtccag atcgcaggcc gcgacatcga tatggaagag cgcaagcgca 2461 tgaaggaagc cggcgttacc gtcttctcca tcgacgtgat cgaccgcctc ggcatgcggg 2521 aagtcgtcaa gcgcgccatc gagatcgcaa gcaacggcac cgacgggttc cacatttcct 2581 tcgatatcga ctgcgtatcc cccgagtatg cgccgggcac cggtacgacg gtccacgacg 2641 gcct // LOCUS sequence159 2640 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence159 VERSION sequence159 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2640 /mol_type="genomic DNA" /organism="" /note="sequence159" misc_feature <1..1027 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002384134.1:YcjF family protein" /note="WP_002384134.1 YcjF family protein (Enterococcus) [pid:29.5%, q_cov:37.5%, s_cov:50.4%, Eval:3.7e-07, partial hit]" /note="MGA_724" /locus_tag="LOCUS_5060" CDS 1146..2504 /product="sodium-dependent transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011020940.1" /transl_table=11 /codon_start=1 /translation="MDNRESFKSRLGFLLVSAGCAIGIGNVWKFPYVTGANGGGIFVVW YLIFLIIMGIPVMTMELAIGRSSRKSMIRGYEALEKPGAKWHIHGWLCMIGNYLLMMYY TTVSGWMFCYFWKFLTGGFTAGMTADEVSSVFGSMLGDPKLMMIWMTVNVVLGFAICGG GIQNGVEKVTKFMMLALLGLMVILGIHSLTLPGAAEGMKFYLLPSMERASEVGMGKVMT AAMNQAFFTLSLGIGSMEIFGTYMSKDNTLPSEAVRICGLDTFVAIMAGIIIFPACFSF GVEPGAGPGLIFVTLPNIFVNMAGGRIWGTLFFLFMMFASFSTVIAVFENIAAFSIDTF GMSRKKSVIMNCILVWILSIPCVLGYNVWSNIHLIRGGDILDSEDFIVSNLLLPIGSLL FLLFCVTKWGWGFDNYMKEVNDGKGLKFARGLKVYFQFILPILILILVWQGLR" /locus_tag="LOCUS_5070" /note="WP_011020940.1 sodium-dependent transporter (Methanosarcina acetivorans) [pid:49.8%, q_cov:98.9%, s_cov:96.5%, Eval:9.2e-132]" /note="MGA_725" ORIGIN 1 atcgggcaag agcacgctca tcgaggccat cctgccctat gcggacgcgg acagcgccct 61 ggagctgatc gatgcgccgg agtcttccgc caaactgagg gccctgcgca aagagcctgt 121 gagcatcgtc tggtactgcc tggacggcat gcagaccgcc atcctggaag aggatctgga 181 cgggctgcgg acggccgcga agctgtggcc ggatctgccg ctgatcgcgg tgttcacccg 241 gtcgctgggc accgacgagc gcgatgtttc caacatcctg atgctgcagg acgccttcgc 301 ggaatacaag ccggcgaagg atctggcgct gcgcacgaag gacatcatct gcgtgctggc 361 tcacgagttc gaaacgccgc tgggcatcgt gcccgtgcgt ggtctggacc gcctgatgga 421 gcgcacccgg gaatgcgcgg cggaggccgg taaggccgcg tcggagcggc aggtgcggag 481 cgtggtctgg gatctgaagc gcaaggaagc caacgcgacg gtagcggcat cggcggcgct 541 ggctgcgacc atcggcgccg tgccggtgag ttttccggac gccacgcttt tagtgccggt 601 gcagaccgcc atgctggcga agatcacgcg gctgtacgac ttaaaagata aaaacgccgc 661 atcgcaaatt accgatgcag ccttaaaagc gggggctacg accatcgtag gccggtcgct 721 gctggtggcg ctcaagggca tccccgtggt cggcaccatc gggggcagcg tgctgaatgc 781 ggcggtagca gccgcagtga ccgcagcagt aggcgagacc accgtggcgg tctacgataa 841 gatccaccgc ggggagctcg tgatcgacga gagcacggac tttggccgca tcgtgggtga 901 gatcttctcc ggccgcctgc cggacatcgt gtccgtggtg gcgaagacct ttgccggcaa 961 gaaagcctcc gatattccca agaatctcgc gaaactcgta tacgagatgg ttgtaaaggg 1021 aaaataggtc gttttttaac cgcttaaccc tttaacgcgt taaatatctg tggtacaata 1081 aaccacgtaa atcggccggt ccggtttcgg gccggtcttt tgttttcgtt ttaacggtaa 1141 taggtatgga caacagagag agttttaaat cgagacttgg tttcctgctg gtgagcgcag 1201 gctgcgccat cggcatcgga aacgtttgga aattccccta cgtaacgggg gccaatggcg 1261 gcggcatctt cgtcgtctgg tatctcatct tcctgatcat catgggcatc cccgtcatga 1321 ccatggagct ggcgatcggc cggagcagcc gtaagagcat gatccgcggc tacgaagcgc 1381 tggaaaagcc gggcgccaaa tggcacatcc acggctggct ttgcatgata ggcaactacc 1441 tgctgatgat gtactacacc accgtatccg gctggatgtt ctgctacttt tggaaattcc 1501 tcaccggcgg ctttacagcc ggcatgactg cagatgaagt gagcagcgtg ttcggcagca 1561 tgctgggcga tcccaaactc atgatgatct ggatgacggt caacgtcgtg ctgggctttg 1621 cgatctgcgg cggcggcatt cagaacggcg tggaaaaagt cacgaagttc atgatgctgg 1681 ccctgctggg tctgatggtc atcctcggca tccacagcct tacgctcccc ggcgcggcag 1741 agggcatgaa gttctacctg ctgcccagca tggaaagagc atccgaggtg ggcatgggca 1801 aggtaatgac cgcagccatg aaccaggcgt tcttcaccct gtctctgggc atcggctcca 1861 tggagatctt cggcacttat atgtccaagg ataacacgct gcccagcgaa gcggtgcgca 1921 tctgcggcct ggacaccttc gtcgccatca tggcgggcat tatcatcttc cccgcctgct 1981 tctccttcgg cgtggagccg ggtgctggtc cggggctcat cttcgtgacc ctgcccaaca 2041 tctttgtgaa catggccggc ggccgtatct ggggcacgct gttcttcctg ttcatgatgt 2101 tcgccagctt ctccacagtc atcgcggtgt tcgagaacat cgcggcgttc tccatcgaca 2161 ccttcggcat gagccgcaag aagtccgtca tcatgaactg catcctggtc tggatcctct 2221 ccattccctg cgtgctgggc tacaacgtct ggagcaacat ccacctcatc cgcggtggag 2281 acatcctgga cagcgaagac tttatcgtct ccaacctgct gctgcccatc ggttcgcttc 2341 tcttcctgct gttctgcgta acgaagtggg gctggggctt cgacaactac atgaaggaag 2401 tcaacgacgg caagggcctc aagttcgcca gaggcttaaa ggtctacttc cagtttatcc 2461 tgccgatcct cattctcatc ctggtctggc agggactgag ataatttaaa aaatataaaa 2521 tacgacacaa aactgccgcg ctgcaaagcg gcagtttttt ctttgcgggc tttaatggta 2581 taatggattc acgacagcga ggctgccgca ggtattttta tggaaaaaaa tcggactata // LOCUS sequence160 2638 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence160 VERSION sequence160 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2638 /mol_type="genomic DNA" /organism="" /note="sequence160" CDS 419..1012 /product="Holliday junction branch migration protein RuvA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048089.1" /transl_table=11 /codon_start=1 /translation="MLHYIKGVITDTMPGMVCIENNGIGYEVYVPETSRAYLTQDGEII TLYTAMVVREDDVSLYGFTEKEALNMFRLLQTVPGVGAKAAMAILSALSLRDLKRAIAF EDVGSITRAQGVGKKTAQMVVVKLKDKMGDVSDLDLPQGAPMPSVVPGSNKEQAVSALM ALGFTKAEAMASMAGITDEGLTTQEYIKLALRNR" /locus_tag="LOCUS_5080" /gene="ruvA" /note="WP_012048089.1 Holliday junction branch migration protein RuvA (Clostridium botulinum) [pid:41.0%, q_cov:99.0%, s_cov:98.0%, Eval:8.0e-33]" /note="MGA_727" CDS 1012..2055 /product="Holliday junction branch migration DNA helicase RuvB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003426579.1" /transl_table=11 /codon_start=1 /translation="MDTENRVVGANLQGDEELMERSIRPKRFEDYVGQTNVTDNLKVYI QASKMRGEPLDHVLFYGPPGLGKTTLAGIIAEEMGVDLRITSGPAIGRAGDLAAILTNL NEGDVLFIDEIHRLNRAVEEVLYSAMEDFALDIVTGKGPGASSIRFELPRFTLIGATTR AGSLSAPLRDRFGILAKFELYNENELAAIMRRTARILNVEIDEESTRMLATRSRGTPRV ANRLLKRVRDFAQVLGSGKIDPPIVESTLRSLGIDELGLEELDRRILKLIIEQFQGGPV GIDTIAASLGEERVTIEDAYEPYLMQAGLLHRTLKGRMASINAYRHLGLDVPKSMMPEE EQLTLGK" /locus_tag="LOCUS_5090" /gene="ruvB" /EC_number="3.6.4.12" /note="WP_003426579.1 Holliday junction branch migration DNA helicase RuvB (Clostridioides difficile) [pid:60.2%, q_cov:95.7%, s_cov:97.9%, Eval:4.9e-111]" /note="MGA_728" ORIGIN 1 tcacgacgga taaggatatg cccatgcctc agaggctcaa aagcctgtac gcggggctga 61 tggagatcat ggcggagtac cagccagagg agatgagcat cgagcagctc tacttcaacg 121 acaatgccaa gacggcgatc ttcgtcggcc aggccagggg cgtcgccatc cttgccgggg 181 tcaacagcgg ccttacgatc tacgaataca cgccgctgga gatcaagatg aacatcaccg 241 gctacggcag ggcggacaag aaacagatcc agtttatggt gaagaccatg ctgggtctga 301 aggaagtccc caaaccggac gacacggcgg acgccatcgc ggcagccatc tgccacgggc 361 gcaacggcga tgcgaagaag aaactgttcg agatgagata gacagaagaa aggacgacat 421 gctgcactat atcaaagggg tcatcaccga taccatgccc ggcatggtgt gcatcgaaaa 481 caacgggatc ggctacgagg tctacgtgcc ggagacgagc agggcgtatc tgacgcagga 541 cggcgagatc attacgctct acacggcgat ggtcgtgcgg gaggacgacg tgagcctgta 601 cgggtttacg gagaaggaag ctctcaacat gttccgtctg ctgcagacag tgcccggcgt 661 gggtgcgaag gccgctatgg ctatcctgtc ggcgctgtcg ctgagggatc tgaagcgggc 721 catcgcgttt gaagacgtag gttccatcac gagagcccag ggcgtcggca agaagaccgc 781 gcagatggtt gtggtcaagc tgaaggataa gatgggagat gtttcggatc tcgatctgcc 841 gcaaggcgcg ccgatgcctt ccgtcgttcc cggcagcaac aaggaacagg cggtgtctgc 901 cctcatggcc ctgggcttta cgaaggcgga agccatggcc tcgatggccg gcatcaccga 961 cgaaggcctt acgacgcagg aatacattaa actggcatta aggaaccgat aatggatacg 1021 gaaaacagag tggtcggcgc gaatctgcag ggcgacgagg aactgatgga gcggtccatc 1081 cgccccaaac gcttcgagga ttacgtagga cagaccaatg taacggataa tttaaaagtg 1141 tacatccagg cgagcaagat gcggggagaa cccctggacc acgtgctctt ctacggtcct 1201 ccgggactgg gcaagacgac gctggccggc atcatcgccg aagagatggg tgtggatctt 1261 aggatcacct ccggccctgc catcggaaga gcgggagacc tggcagccat cctgacgaac 1321 ctcaacgaag gggacgtgct gtttatcgac gagatccacc gccttaacag ggccgtggaa 1381 gaagtgctgt actccgccat ggaggacttc gcgctggaca tcgtaacggg caagggaccc 1441 ggtgccagct ccatccgctt cgaactgccg cgttttaccc tcatcggcgc tacaacgagg 1501 gcaggcagcc tgtctgcgcc gctgcgcgac cggttcggca tcctggcgaa gttcgaactg 1561 tacaacgaga acgaactggc ggcgatcatg cgccgcacgg cccgcatcct caacgtggag 1621 atcgacgagg aatccacgcg tatgctggcg acaaggtcac gcggcacgcc ccgtgtggcg 1681 aaccgcctcc tgaagcgagt gcgcgatttc gcccaggtgc tgggttcggg aaagatcgat 1741 ccgcccatcg tggagagcac gctgcggtct ttaggcatcg acgaactggg tctggaggaa 1801 ctggaccgcc gcatcttaaa actcatcatc gaacagttcc agggcggccc cgtgggcatc 1861 gataccatcg ctgcatctct gggcgaggaa agagtgacga tcgaggacgc ttacgagccc 1921 tatctgatgc aggcaggact gctgcaccgc acgctgaagg gccgcatggc atccatcaac 1981 gcataccggc atctgggcct ggacgtgccc aagagcatga tgccggaaga agaacaactg 2041 acgctgggaa agtaaaggat tgggggatcc ggacatgaag agactgacaa agaccatatg 2101 catcgttctg gcgctctgcc tgatggctgc gggactcgtc ttcgcggagg gcgaagaagg 2161 ggaaacggaa gaccctgcct cgcaggcggt ccgttcggac gacagcactt acctgtggat 2221 cggccttcaa tacggcagca gcgctgtgga taagatcacg gtaaggagcg cagacggatt 2281 cctgatcgtc aagggcaaca acaaggggtg gacggagacc gatatcaaga cgtccagcac 2341 gaccctgacg atcgtgcctt ccgggggtca ggccacggtc gtggatgaaa acggcgaaac 2401 gatcctcggc ggcatgggca acggcggcta catcttgctg agcgccgcgg aagatccgga 2461 ggaccggctc atcaccatca acggcagccg ttaccgggac ggcgcgacgg cgacggtcac 2521 cggcggcagg ctgaacgtca tcaacgtcat cgaactcgaa cactacgtgc ggggcgtcgt 2581 cgccaacgag atgggctata cctatccgct ggaggcgctc aaagcccagg cgatcgca // LOCUS sequence161 2626 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence161 VERSION sequence161 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2626 /mol_type="genomic DNA" /organism="" /note="sequence161" misc_feature <1..1791 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012048038.1:DNA polymerase I" /note="WP_012048038.1 DNA polymerase I (Clostridium botulinum) [pid:47.1%, q_cov:84.4%, s_cov:54.9%, Eval:2.3e-128, partial hit]" /note="MGA_730" /locus_tag="LOCUS_5100" CDS 1817..2407 /product="dephospho-CoA kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393338.1" /transl_table=11 /codon_start=1 /translation="MIFGLTGGIGSGKSTVANILRDKGYIVLDADAIGREVTAKDEPLL RMLVKEFGIEIINEDGTLDRRTLARLVFGDKWKTHRLNELVQTAILVRAMAKFHNLELG GEKKVMFFDVPLLFEAGWDKYVQEVWLVTAPEDIRIQRIEVRDGLTEEEIRSRIKLQMS EEEKMERSDVIIENDEGMAKLMGQVEKAIAERL" /locus_tag="LOCUS_5110" /gene="coaE" /EC_number="2.7.1.24" /note="WP_011393338.1 dephospho-CoA kinase (Moorella thermoacetica) [pid:37.8%, q_cov:98.5%, s_cov:91.0%, Eval:8.7e-32]" /note="MGA_731" ORIGIN 1 gaagaggctg caccgggatc tgtcccggat gacccggaac agatcgcgat cgaagagccg 61 gacagccgcg agctgacgga cgacgtgctg cgtggactga aggacgggca ggagatctat 121 atcgacctcg agacagatgg aaaccacaag gagatgccca gtctggatct gctgcagatc 181 tgtgacgcaa aaacggtcta tacgggtctg gcggatcttg cgctgctgtc gggcaaagcc 241 cttaaactgt gcggctgcgg cctggaaaag gtctggtacg tactgaagag tcgtggcgtg 301 gatacgtccg caatggaaac aggcagcgac ctgcagctgg catactacgt gctggatccc 361 gcagccaaga cgcctacgct ccgcgacctg gcattctccg aacttaagac ggacattgct 421 tccggaacgc agcaggagaa ggagacgcag atcgatctct tttccgctgt tgcagatccc 481 ttcgacgaag ccagaaagag cgcaggcttg aaatttggca ccatgatggc tctgcgaaag 541 ctactggaaa gccggatcga agagaatagt ttacagaaag tatattatga tatcgaatta 601 cccctgtgca aagtgctgtc cgaaatggag aagaacggca tagacgtgga cagcgaagcg 661 ctggcggact tcggaaaaga gctgaaagtc cgcatcgacg tgctcgtccg ggagatctac 721 gatctggcgg gagaagaatt caacatcaat tccccgatgc agctgggcaa catcctgttc 781 gaaaaactgg gtctacctgc cggtaaaaag acgaaaaagg gctattccac gaacgccgag 841 atcctggaaa agctggcgcc ggactatccc atcgtcgaaa aagtgctgga attccgcacg 901 ctgtccaagc tcaacagcac ctatgtggaa ggtatgctgc ccctgatcgg ttctgacggc 961 cgcatccatg cgcatttcca gcagactgtt acggcaacgg gacgcatcag ctgcacggag 1021 cccaacctgc agaacatccc agtccgtcag gaactcggaa gacagctgcg caaggtcttt 1081 acctccggca gcagcgatat ggtgctgatg ggtgccgact actcccagat cgaattgcgg 1141 gtgcttgccc acatgtccaa ggatcccacg ctcatcgaag cgttcaacga aggactggac 1201 attcaccgtg agacggcggc caaggtgttc ggcgtgcccc aggatgaagt gaccccgctg 1261 atgagatcga acgcaaaggc agtcaatttc ggggtcatct acggcatgag cggcttcggt 1321 ctatccgaag aactctccat tactaggaag caggcggagc agtacatcaa agactatttc 1381 caccgttttc ccggggtcaa acagtttatg gacggctgca tcgcggactg caaggcaacc 1441 ggcgagatcc gcaccctgta cggcagacgg cgcagtgtgc cggagatcca cgcgtcgcag 1501 tatatggtgc gccagctggg cgaacgcctc gcaatgaaca cgcccatcca gggaaccgct 1561 gcggacatca ttaaactcgc gatgatccgc acggaaaaag cgctgcggga acaatgtccg 1621 gaagctcagt tgatcctgca gatccacgac gagctcatcc tgcgggtgcc gaaagcaaaa 1681 gaagaagagg caaagcgcat cctgcgggaa agcatggaaa acgccgcttg cctggacgta 1741 aaactggatg tagacttaaa cgtaggccaa aactggtacg aattgaaata aaaatagata 1801 agaaagaggt aatgaaatga tatttggatt aacagggggc atcggctccg gcaagagcac 1861 ggtggcaaac attctgagag ataaaggata tatcgttctg gacgccgacg cgatcggcag 1921 agaagtgacg gcgaaggacg aaccgctcct ccgtatgctg gtcaaggaat tcggcatcga 1981 gatcatcaac gaagacggca cgctggaccg cagaacgctg gccaggctcg tcttcggcga 2041 taagtggaag acccatcgcc tcaacgaact ggtgcagacc gccatcctgg tccgcgccat 2101 ggcgaagttc cacaaccttg agctgggcgg agagaagaag gtcatgttct tcgacgtacc 2161 gctcctgttc gaagccggct gggacaagta cgtccaggaa gtctggctcg ttacggcgcc 2221 ggaagacatc cgcatccagc gcatcgaagt ccgggacggc ttaacggaag aagagatccg 2281 ctcccgcatc aaactgcaga tgagcgaaga agagaagatg gaacgttccg acgtcatcat 2341 cgaaaacgac gaaggtatgg cgaagctgat gggccaggtg gaaaaagcca tcgcagaaag 2401 gctgtaatat gccccagaaa aagtttgaaa ataaagtaga agttatcaaa tacaaggttt 2461 taagagagct ggcccgggcg atctgggagg atcacgatcc gttcaccgtg ttcaacgaca 2521 tcgcaggatc cgtcatcaag aagggtgaac cgcccatgag ctgctgcatc tacaaggaca 2581 gagccatcgt ggcggaccgc atgcgcatgg gtatcggcga atacca // LOCUS sequence162 2622 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence162 VERSION sequence162 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2622 /mol_type="genomic DNA" /organism="" /note="sequence162" misc_feature <1..1092 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011016536.1:pyridoxal phosphate-dependent aminotransferase" /note="WP_011016536.1 pyridoxal phosphate-dependent aminotransferase (Fusobacterium nucleatum) [pid:41.8%, q_cov:99.7%, s_cov:90.5%, Eval:6.3e-85]" /note="MGA_733" /locus_tag="LOCUS_5120" CDS complement(1179..2054) /product="selenium metabolism-associated LysR family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010938626.1" /transl_table=11 /codon_start=1 /translation="MESKMLRSFIAVVDSGSFTKAAEKTYTSQPTVSAHIKALEEELGV QLIARDTKNLRVTQKGKELYDCACQMLALQQNMLDKWAGEEQNGIRIGVSTIPSAYILP ALLEGFCKEHPDVPVSIHQSDSEAIEAAVEKGTFDLGFVGEKPGVSLDSTPVAEDKTVI IAPNTESNRRLLKKGDLKALLAQPILFRERGSASRKSAELLLESLGLDLRDLDVAASLN DQEAIKNLVEHGFGISFVSALAVEDRVREGRLLAFDTGLPEAKRTFYLIRRKNTKLSES AESFVRFVLS" /locus_tag="LOCUS_5130" /note="WP_010938626.1 selenium metabolism-associated LysR family transcriptional regulator (Desulfovibrio vulgaris) [pid:33.0%, q_cov:98.3%, s_cov:93.5%, Eval:3.8e-31]" /note="MGA_734" misc_feature complement(2058..>2622) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000503960.1:amidohydrolase" /note="WP_000503960.1 amidohydrolase (Bacillus cereus group) [pid:39.5%, q_cov:91.4%, s_cov:33.0%, Eval:1.5e-30, partial hit]" /note="MGA_735" /locus_tag="LOCUS_5140" ORIGIN 1 aaagatctgc tggccatgtg ggtcgcggat atggacttcg agatcgcaga accgatccgc 61 aaagcggtcg gcaactacgc agccaacatt ccctggggct attataatcc cggcccgggc 121 tacaaacagg ccttcatcga ctgggaggag aagtatcacg gatataaact ggatccggac 181 tggatctgct tctccccggg catcgtcgca gcatttttct gggtcacccg catgaagacc 241 cagcccggcg acgccgttat cctgctggcc ccgatctact atcccatgat gaacgcggtc 301 aaattcaacg accgcaagct ggtcctgtgc gacatggtac acgacggcaa cacctaccgg 361 gtggattatg agaagttcga gaaggacatc gtagacaaca acgccaaagt ctttatcctg 421 tcctcccctc acaatcccgt gggcaagatc tggacgccgg aagagctgaa gaagctcatg 481 gagatctgcc gcaagcacaa cgtgttcgtc atctccgacg agatccacca ggacttcgaa 541 tggaacggtc acgtccacgt gcccaccgcg acgctgggcg actacgacga catgctcatc 601 accatgtgcg ccgtctccaa gacctttaac ctggcagcat gccagaactc cttcatcatt 661 atccccaacg cggagctgag agaatccttc aagaagttcg cagccagcat cagctgctcc 721 ggcggcaacg gctttggcta tgtggcggtg gaagctgcct gccgggaagg ccgtccctgg 781 ttcgaggaag tcaagaagca gatctgggaa aactattgct atgtgcgcga cacctttgcc 841 aaggagctgc ccgacgtggt cgtcgccgac ctgcagggca cctatctgct gtggctggac 901 ttcggcaagt actttaagac gcagaaggag atcgaagaat tcatgcaggg caagtgcaag 961 ctggccttcg actacggcaa ctggttcggc gccggtgggg acgactactg ccagttcgtg 1021 cgcatgaacc tggcaacatc cctggagaac gtcaaggaag cctgcgaccg catgatcaag 1081 aatctgaaat aattcggaac cgaaataatt tcaaaaccct ccggaaatac tccggagggt 1141 ttttcttttc aacacagtgt acctgtcccc gcgtgctctt acgaaaggac gaaccgcacg 1201 aagctttccg cgctctcgga gagcttggta ttcttacggc ggatcaggta aaacgtacgc 1261 ttcgcttcgg gcagacccgt gtcgaaggcg agcagtctgc cttcccggac gcggtcttcc 1321 acggccagcg cggatacgaa ggagatgccg aagccgtgtt ctaccaggtt tttaatggct 1381 tcctggtcgt tgaggctcgc ggcgacatcc agatcccgca ggtcgagacc gaggctctcc 1441 agcagcagtt ccgcgctttt gcggctggcg cttccccgct cccggaacag gatgggctgt 1501 gccagcagcg ccttcagatc gccctttttc agcagacggc ggttgctttc cgtgttcggc 1561 gcgatgatca ccgtcttatc ctcggctacg ggagtgctgt ccaggctcac gccgggcttt 1621 tcgcccacga aacccagatc gaacgtgcct ttttccaccg ccgcctcgat cgcttcgctg 1681 tcggattgat ggatggacac cggcacgtcc ggatgctcct tgcaaaaacc ctccagcagc 1741 gccggcagga tgtaggcgga cgggatcgtg gatacgccga tgcgtatgcc gttctgttcc 1801 tcgccggccc atttatccag catgttctgc tgcagtgcga gcatctggca ggcgcagtcg 1861 tagagctcct tgcccttctg cgtcacgcgc aggttcttcg tgtctcttgc gatcagctgc 1921 acgccgagtt cttcctccag cgccttgatg tgggcgctga cggtgggttg agacgtatag 1981 gtcttttccg ccgccttcgt aaagctgccg ctgtccacga ccgcgataaa ggagcgaagc 2041 atcttgcttt ccatatctta tccttcgtaa actgtcttgc cgttgacgac ggtcatcagg 2101 accttcgtgt tcagcagttc ttcgggggga ttctccatga tgttcttgtc gagcacggta 2161 aagtccgcgt acttgccgat ggtgatggaa cctctctcag cctcttcgaa agcggaatag 2221 gcgccctcga tcgtaaacat gcgcagcgcc tcttccatgg tcaccgcgtt ctccggatac 2281 cagggcttgc cgtccatgcc catacgggta acggcgtagt acatgttggc cagcggatcg 2341 cagtcttcca cggggcagtc ggaaccgccg ctcatgtgaa cgccgagatc gatgtagcgt 2401 ctccagttat aggaggtctt agccagttcg gaaccgacgc aatcgtccac gatctgggag 2461 tcgtagcgga cgaagacggg ctgtgcatag gcgagcaggt tgagctttac gaagcggtcc 2521 tgctgggcct cgtccatgat ctggcaatga atgatgccat ggcgcatgtt gggcttgggg 2581 ttctcgttca tcacgagctc gtagccgttg acgacctgat cc // LOCUS sequence163 2620 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence163 VERSION sequence163 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2620 /mol_type="genomic DNA" /organism="" /note="sequence163" CDS complement(880..1359) /product="peptide deformylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003431159.1" /transl_table=11 /codon_start=1 /translation="MALRNIVTDEDPSLKKKSRPVTEVTDRIRVLVEDMIETMRAADGV GIAAPQVGVLRRIAVVEVEDLYVLINPVITEREGDQFNEEACLSVPGRAGKVHRPTRVV CEAMDLDGNMQRYEVEGLTAVCFCHEIDHLDGILYTDKAEEIRSTEGDYEEEDEE" /locus_tag="LOCUS_5150" /gene="def" /EC_number="3.5.1.88" /note="WP_003431159.1 peptide deformylase (Clostridioides difficile) [pid:52.7%, q_cov:91.2%, s_cov:100.0%, Eval:1.1e-35]" /note="MGA_737" misc_feature complement(1382..>2620) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003232079.1:primosomal protein N'" /note="WP_003232079.1 primosomal protein N' (Bacillus) [pid:47.0%, q_cov:99.3%, s_cov:50.7%, Eval:2.2e-108, partial hit]" /note="MGA_738" /locus_tag="LOCUS_5160" ORIGIN 1 catccatagc ctttttgccg ggcagctgca cttttgtcag cagcagaaca ccgccatctc 61 cacaggcgac gccgatgcct tccttgccgg aagacaccac ggtgcccgga gccgcttttg 121 tcctgcggtc cgccgctttt gcggcgtgga tcttaaagac ttctccgttc agggatgtaa 181 atgcgatggg ccagctgtac atgcccagca cgtgggattc caacgctttt gcgctgcggt 241 cccagtcgat ctgtccttct tccttggcga tcatggccgc gtgcgtcgcc agagacgcat 301 cctgcggaac gcccttaagt tcaccggaaa cgatttttgg taaacactcg accaaaaggt 361 ctgcgccgag cacggacagc tcgtcaaata cctgttccga ggtctttccc gcgatgggga 421 tagccctttg cgccagcatg tcgccggcgt cgcactcctc cgccatgtac atgatcgtaa 481 cgccgctctc ggggtcaccg gcaaggacgg aacgctgaat aggcgccgcc cctctgtatt 541 tgggcagcag cgaaccgtgg atgttgatgc agccgtacgc cgggatgtcc aggatctctt 601 tgggcaggat cttgccgtaa gccgccacca cgataaaatc gggcgcgatc tcgcgcagtc 661 tggccgcaaa ttccgggttg ttcttcacct tttccggcga ttccaccgca agtcccagct 721 ccagcgcctt cttttttacg tcgcattgct ggatcttatg accgcggctg gcgggccggt 781 cgggtttcgt gaccacgaga ggcacgtccc agccgcagga tacgatcttt tccagggcag 841 gcaccgcgaa atccggcgtg cccatgtaga cgatcctcat tattcttcgt cctcttcttc 901 gtagtcgccc tcggtggaac ggatctcctc ggccttatcg gtgtagagga tgccgtccag 961 gtggtcgatc tcgtggcaga agcagacggc ggtaaggcct tccacttcgt agcgctgcat 1021 attgccgtcc agatccatcg cctcgcatac gacgcgggtg ggacggtgca ctttaccggc 1081 tctgccgggg acggacaggc aggcttcctc gttgaactgg tcgccttctc tctccgtgat 1141 gaccgggttg atgagcacgt acagatcttc tacttccacg acggcgatgc ggcgcagcac 1201 gccgacctgg ggcgccgcga tgccgacgcc gtccgccgcg cgcatggtct cgatcatgtc 1261 ttcgaccaga acgcggatgc ggtccgttac ttccgtaacg ggtctcgatt tcttcttcag 1321 ggaaggatct tcatcggtaa cgatatttct taatgccatt gtttcctcca aatggtagtg 1381 attatatgaa tgaaaacgga ttgatatccg tcgtcaacag ttttgccgcg gtcttttcct 1441 cttcgaatac cctgcgcagc ttcgcagctg ccgccgtgca ttctctgcgc tttccggcag 1501 gcgccttgac gatcacctgg tagcgcgaca tgccggactg tctggcgatg ggagccgcgg 1561 acgggcccat cacgatatag tccttcgaca ggactttttt gagccatgca gccgtacggg 1621 acgcgctgtc catggctttt gcctcgtctt cgtcccagag gacgaaccgg aacagatccg 1681 aaaacggcgg gtacagcgcc gcttcgcgga tgccgatctc ccgctcgtag aacgcgcggt 1741 aatcctgggc ggcggccgcc tgaacgacgg cgttttccgg gctgtaggtc tggatgatga 1801 cttcgccctg ttcgtcgccc cggccggccc ggcctgctgc ctgggtcacc agctggaacg 1861 tccgttcccc gctgcggtag tcggggatgt tgagcgtaac gtccgcggag atgatcccca 1921 cgagtgccac gttggcgatg tccagtccct tggccaccag ctgcgtaccg atgaggatat 1981 cggtcttgcc ggctgcaaac cgttttagaa tgccctccag actgcctttt ttgcggacgg 2041 tatccaaatc caggcgttcg atcttcgcct ccggaaacag ctccttcgcc ttttcctcca 2101 cctgctcggt gccggcgccg aaccgcccga tgatcttgct ccggcaggtc ggacagaccc 2161 tgggtaccgc ttcttttcta ccgcagtaat ggcagacgag agcgccctct tctttatgat 2221 acgtgagcga gatgccgcac tccgggcacc gcggcacgta gccgcattcc cggcaggaca 2281 cgaaggaaga gtagcctctg cggttcaaaa acaggatggc ctgcttcttt tctcccagcg 2341 tcttttccaa tgcatccgta agcgcctgcg aaaaaagact gcggttgccg gcttttacct 2401 cttcccgcat gtctacggtg cgcacccggg gcaacggcac ccggttgtag cgctgcggca 2461 gttccagcct gcggaagatg ccctgctcgc tgcggtagaa atcctgtgca gaaggcgtcg 2521 cgcttcccag caccaggaca gcgccgtgag ccttggcgcg cttcatggcc acttccatgg 2581 catcgtattt cgcgccgctc tcggatttat aggagctttc // LOCUS sequence164 2606 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence164 VERSION sequence164 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2606 /mol_type="genomic DNA" /organism="" /note="sequence164" misc_feature complement(2103..>2606) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010965059.1:signal recognition particle-docking protein FtsY" /note="WP_010965059.1 signal recognition particle-docking protein FtsY (Clostridium acetobutylicum) [pid:64.2%, q_cov:98.8%, s_cov:54.5%, Eval:2.2e-58, partial hit]" /note="MGA_740" /locus_tag="LOCUS_5170" ORIGIN 1 ccccaatagc cggcgtacca gttcttgggc cagggtttgc cgcccatgac gacgggtctg 61 tcgtccagag gcatggcagc ggtaaacgga atgccgtcct tgcctgcctt gccgtcctgt 121 ccagcctgca gcgcggtgct gtagatggag atcggcttaa tggaagaacc cggctgccgc 181 ggcgccgttg ctctgttgta gagcagcttg ccttccacgt ttctgccgcc gatcatgccc 241 agcacgtagc cggtgcgatg gtccatgatg accatggcgg actggggctg gatcgtgggc 301 ttgcggagcg taaagtagtc ggacgtaagg taaaggcgtc cgtcttccag tctgtggatg 361 acgtcgggat gatcctcgaa gaacttggcg ctgatgatca tatcgccgtt gtcatcgcgg 421 gtcttatatt cggaggccac agcccagttg ccgccctcga tgctgtacag aaggccttcg 481 ctcttctcgt acatgttctt gaattcgatg gtgtagtccg tgccgttgcc gctggtcgtc 541 ttatagaaat tgaggcgttt gtccttcagc agcttgaggt cgccgttgcc ctgccactcg 601 aactcctcga gcggcatcac aaagtcgccg tcctcgtcga acatcacgct cttgctgtag 661 agcatgatct tgccgttgtc gccgatgatg ttgccgcttc cgtccgtgcg gtagccgctg 721 atggtgggcc agccggaatt gtccgcccat accgcttcca tgatctcctg gatctcgcgg 781 ttcatggtcg tgttgatgtg caggccgccg ttgtacagca tgcggtccgc ttcttcctcg 841 gagaggccca gctcccgcat catgtcctcg cggacctgct ttacggcgca gtccgtgaaa 901 taggaggtga cccccgcatc cgccagggcg ttgctgcccg ggttgatatg ctctctgagg 961 gtcgccggat ccgcagcggc atactgctca tccgtaatgt agccctggtc gtgcatgttg 1021 cgcagcacca gcttcatgcg gtcgacgcag gcgtcgttgt aatatgtgat gtattcgtcg 1081 ttgcgctcga tgatatccag tgcgtcgata tcctccactg cggaagtctc gatgcgcttg 1141 atgggcgcat aggtgctggg cagctgaggc agcgtcgcca ggcacgcgca ttcgatcaga 1201 tccagatccg cagcgtcttt ggagaaatat gcctgggaag ccgcctgcac gccgctggag 1261 ttgaacccca gaccgatggt gttcaggtag gcctcgatga tctgttcctt cgtcagattg 1321 cgctcgatga tcatcgtgta gtacgcctcg atgatcttac ggttcatgga gcggacgctc 1381 tttacgtccg gcagatacag gtttctggcc agctgctgcg taatggtgga cgtaccggag 1441 atcttcgtgt cgtacttcag ggcgtcgcgg atggcgccga tgatacggat gacgttgaat 1501 ccgtggtgtt cccagaacgt cttgtcttcg atggagacga aggcgttgat catgtccttc 1561 gggatatcct tgtactccag gttggagcgc agcgaatcgc cggaatacag attgtccagc 1621 acgtttccgt ccgcgtcgaa caccgtggaa ttctcggaga gcaggtcgta caggttgtcc 1681 ggattgatct ccggcgcttc cttgatgatg cccatcacgt aatatcccgc tacgcctgcc 1741 gcgatgatgc caaggccaag cagcgtaagc aggatgccga gaatgatctt ccctgccttc 1801 ttctttttct tcttcttttc cggctttttc ttctcaggag ccttcttttc cggctttttc 1861 gtttccttct tttccggctc cttcgctgct ctgccgcttt ttttatttct ggcagaacgt 1921 cctactaaag gctccgaagc cgcctgcatc tcgtaggcag ccgctgcgcc tccttcgtcc 1981 tggacagaaa acgccggctc ttcggcttcc tccgccgcgg cgagaaattc gcctcccagg 2041 cggtcgaagg cctgcagcac ttcatcttcg tgctgtctgc ctaaattttc atccatgctt 2101 ttttacccct cgaaaatgtc ttctgcaaaa ctctgcgggt cgaacggctt taagtcgtcc 2161 ataccctctc ccaaccctat atacttcacg ggcaagtcca gctcgtccgc gatcgtcact 2221 acgatgccgc ccttcgccgt gccatccagt ttcgtgagga tgatgccggt gagttcggct 2281 acttcgttga attctctcgc ctgggacacc gcgtttttcc ccgtggtggc atccaccacc 2341 agcagcgttt ccctggcagc cccttcgaat tcccggtcga tgaccttgtt catcttcgca 2401 agctccgcca tgaggttctt cttgttctgc agtctgcctg cggtgtcgca gatgaccaca 2461 tccacccctc tggccttcgc cgcgttgcag ccgtcgaaga tgacggcgga aggatctgcg 2521 ccttccttat gcttgatgat gggcacgccg acccgttcgc tccagatcgt cagctgttcc 2581 gacgccgcgg cgcggaacgt atccgc // LOCUS sequence165 2604 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence165 VERSION sequence165 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2604 /mol_type="genomic DNA" /organism="" /note="sequence165" CDS 233..1762 /product="DNA methylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_013363706.1" /transl_table=11 /codon_start=1 /translation="MCMDKKNWSKTYIAIDLKSFYASVECRERGRDPLTTNLVVADRSR TNKTICLAVSPALKTFGIPGRPRLFEVDQKVAQINAERLRLAPGRRFAGSSDNINLLAA DPSLKLDFITAVPRMAKYIEYSTKIYQIYLKYAAPEDIHVYSIDEIFLDATLYLRASGK TAHEYAMTIIQDVLKNTGITATAGIGPNLYLCKIAMDIEAKHIPADEDGVRIAELDERS YREKLWGHRPITDFWRVGPGIARRLAQHGMYTMGDVARCSIGNPRDPHNEDLLYKLFGV NAELLIDHAWGWEPCEIRHIKAYKPEENSLSSGQVLSHGYKIAEARTVVREMADALSLD LAAKGLVTDQIVLSLGYDAESLSKGYEGQVQADWYGKTVPKMAHGSENLERHTASTRLI TEAAMRLYDRIADPTCLVRRMYVVAAHTLREESVKEEKEQGEQLDLFTDYEAAAKEKKA EDAALEKEGQLQQALLAIKKRYGKNAVMPGTSYKEEATGRERNEQIGGHRA" /locus_tag="LOCUS_5180" /note="WP_013363706.1 DNA methylase (Bifidobacterium bifidum) [pid:54.3%, q_cov:97.8%, s_cov:98.7%, Eval:6.9e-155]" /note="MGA_741" CDS 1759..1986 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTDKFMPGRGSYDDMLDLPHPVSKKHPQMSLDKRAAQFSPFAALT GFEGAIEKAGLLFEEEADRGNAEYLEFEDI" /locus_tag="LOCUS_5190" /note="WP_003813910.1 hypothetical protein (Bifidobacterium) [pid:57.1%, q_cov:74.7%, s_cov:77.8%, Eval:1.2e-11, partial hit]" /note="MGA_742" ORIGIN 1 atatccatgc tgtgtcctcc tatgttaagt gcttagcact tccattataa tcctaaatcc 61 aaccgattcg cagattattt cgtaatgcta cgattatagt ttgtcttgca caaataatca 121 agtgaaatat ttgtgtgctg caacaaagat aaaacgcaaa aatcaatgca aagtgctcat 181 cacacggtac ccgatatcgt gtataataga accgagagaa cgaacatttg ttttgtgcat 241 ggataaaaag aattggtcga aaacctatat cgccatcgac ttaaagtcgt tctacgcctc 301 ggtggaatgc cgggagcggg ggcgtgaccc actcaccacg aatctggtgg tggcagaccg 361 cagccggaca aacaagacca tttgtctggc ggtttcgcct gccttgaaaa ccttcggcat 421 cccgggaagg ccccggctgt tcgaggtgga tcagaaggtt gcgcagatca acgcggagcg 481 gctgcggctg gcgccgggca ggcgctttgc gggcagttcg gacaatatca acctgctggc 541 ggcggatccg tccctcaaac tggatttcat caccgccgtg ccccgcatgg ccaaatatat 601 cgaatacagc acgaagatct atcagatcta tttaaaatac gcggcgcccg aggatatcca 661 tgtctattcc atcgacgaga tcttccttga tgctacgctg tatctgcggg ccagcggcaa 721 gaccgcccac gagtacgcca tgaccatcat ccaggacgtg ctgaagaaca cgggcatcac 781 tgcaacggcg ggcatcgggc cgaatctcta tctgtgcaag atcgccatgg acatcgaagc 841 caagcacatc cccgcggatg aggacggcgt acgcatcgcg gagttggacg agcgcagcta 901 ccgggagaag ctctggggtc accggcccat taccgacttc tggcgcgttg gccccggtat 961 cgcaaggcgc ctggcgcagc acggcatgta caccatgggc gacgtggccc ggtgcagcat 1021 cggaaatccc agagaccccc acaacgaaga tctgctctac aagctgttcg gcgtaaacgc 1081 ggagctgttg atcgaccacg cctggggctg ggagccctgc gagatccggc acatcaaggc 1141 gtataaaccg gaggagaaca gcctgtccag tgggcaggtg ctgtcccatg ggtataagat 1201 cgcggaggcc cgcaccgtcg tgcgtgagat ggcggacgcg ctgtctctgg acctggcggc 1261 taagggattg gtgacggacc agatcgtcct cagcctggga tatgatgccg aaagcctgtc 1321 gaagggctac gaagggcagg tgcaggcgga ctggtacggc aagaccgtgc cgaagatggc 1381 gcatggttcg gagaatctgg agcggcatac ggcatctacg cggctcatca cggaggcggc 1441 catgcggctg tacgaccgta tcgcggaccc gacctgcctc gtgcggcgca tgtacgtggt 1501 ggcggcccac acgctgcggg aggagagcgt aaaagaggaa aaagaacagg gcgaacagct 1561 ggatctgttc accgattacg aggctgcagc taaggagaag aaagcggagg atgcggcgct 1621 cgagaaggaa ggccagctgc agcaggcgct gctggccatc aagaagcgct acggcaagaa 1681 tgcggtgatg cccggcacca gttataaaga agaggcaacc ggacgggaac gcaacgaaca 1741 gatcggaggg cacagagcat gacggacaaa tttatgcccg gaaggggctc gtacgatgac 1801 atgctggacc tgccccatcc ggtctcgaaa aagcatccgc agatgagcct ggacaagcgc 1861 gcagcgcagt tttcgccttt tgccgccctt accggcttcg aaggcgccat agaaaaagcc 1921 ggtctgctct tcgaggaaga ggcagaccgg ggcaatgccg agtatctgga atttgaagat 1981 atctaaactt actcgttcgg gtggacgagc tcgtccacgt tgtgccaggg caggtcgatg 2041 ggcgcattgt cgccgaagac gccggagcgc cattcctgat agatcgcatc gtctgcgtag 2101 aaaggcgcat cgtcgccatt gatgatctcg tagacgatgc cgttgccgtc ttcatccacg 2161 tcggcgggga attcgtccgc tttttccctc agcgttaaga cttccagcgt gtactgggag 2221 acggagccgt agaagtaata gttgtcgttc tcctcgtcgt agacaaaggc gttgaagggc 2281 cagaaatcgt ccgtctccat gcccgttccg tgggaccatc cgctctcgat ggcgtgggtg 2341 tcgtaataat tgcagaccgg gaaggcgacc aacacgtcgg tgacttctcc cgtctcttcg 2401 ttatagacgt acacgttttc ctgcatgctg gccatgatcg agtccgctgc gcggatcacc 2461 agttccagct ttccgtcttc atccaggtcg cagatcgcat acaggttgtc ccattcgtcg 2521 tagccgtaac cttcgaccgg gataacttca tcgctgccgg gcagcgtgcc catgtccacg 2581 aaggtctgca cggcggccag atag // LOCUS sequence166 2601 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence166 VERSION sequence166 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2601 /mol_type="genomic DNA" /organism="" /note="sequence166" misc_feature complement(630..>2601) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002989648.1:DNA helicase PcrA" /note="WP_002989648.1 DNA helicase PcrA (Streptococcus pyogenes) [pid:42.1%, q_cov:96.8%, s_cov:85.2%, Eval:1.5e-144]" /note="MGA_745" /locus_tag="LOCUS_5200" ORIGIN 1 gccggatcca attgacgcag cgtgcccgct gcgctgtttc tgcggttctg ataggtcttg 61 ccgccccgtt ccgcctctct ggcgttcatc gcttcgaaac tctccgtgga catgtagacc 121 tcgccccgga cttccagata gggcagtttc tccggcacct ccttggggat ggtgcggatc 181 gccagagcgt tctcgtacac gctttcgccg atagcgccgt cgccgcgggt gatcgcatcc 241 accagttttc cgtcccggta gcgcagcacc agcgtaaggc cgtcgatctt cttttcgacg 301 atgaaccggg cgttcggcat ctccttcttc acccgctcca cgaaagcgta cacgtcctct 361 ttggagaaca cgtcctgcag ggagatgacc ggcacgtcgt gctgcacctt cttgaggtcg 421 cgccgggcgg tgccgcccac atgctgcgtt aagctgtcct tgtgcatcca ttcgggatgc 481 tccgcttcca ggcggcgcag ttccaggctc agctggtcgt attcgtagtc ggagatctcc 541 ggttcatcct ggttataata gcgttcgttg tgatacgcga ggagcttgta cagttcctcc 601 atccgttgtc ttgaatccat cggtttctcc tagagcttct taagcggggc caggtctttg 661 gccagtttct tcgttcccac cgtattgaaa attacggtga gcacgttgcc cttgcattcg 721 atgacggtgc ccttgccgaa tttggggtgt tccaccgtgt cgccgggcag cacgttgacc 781 ccggccagcg tctccttctt cgcacccatg gcggtctgcc ggacggcgtt ggcctgggcg 841 atcggagaga cgtagggacc ggcggcgtag ggagcctttg tatcgtagcg gtcgaacgcg 901 acgccctgcc cccgtttttc gtacagcgca tcgcccttca tgtattttct gtcgatctcc 961 ttcaggaacg gagattcggc ggtaaagtcg gtcttgccgt agagcatgcg catctcggca 1021 ctgctcataa agaggcgttt ttttgcccgg gtcatgccaa cgtagcacag cctgcgctcc 1081 tcctccagcc cttcgccgcg gtccagcgtg cggtagctgg ggaagatgcc cagttccatg 1141 ccgggcataa agaccacagg gaattccagg cctttggcgg agtgcagcgt catgagggtg 1201 acggcatccg catcggcgtt gtggttatcc acatcggaca gcagcgccag gccttccatg 1261 aatttttcca gcgtaagggc ttcctgagcc tcatccgcct ccttctgttt ttcggagatg 1321 acggtcttga attccagcag gttttcgatg cgggcatccg cctccaccgt ctccatatcc 1381 tgcagcgcct gcaggtagcc ggagcgggcc agcaccgtat cgtagatgtc ttccacgctc 1441 atgcgctctt gttcgagcgc cagcgacgag agcatctccg taaaggcctt aacagccgtc 1501 tcgctcttgg cggacaggct gccctgcacc tccggatcgg acagggtctg cagcaggctg 1561 cggccggtgg cggtcgccat ggcccgcagc ttttcctcgg tcttggcgcc gatgccgcgt 1621 ttgggctcgt tgagcacgcg cagcagcgcc acgtcgtcca aaggattgag gatgagccgc 1681 atatacgcca gcatgtcctt gatctccttg cggtcgtagt agcgcaggcc ggacagcacc 1741 tggtagggaa tgcccttacc ggacaggctg tcttcgaaac gccgcgactg cacattcgtg 1801 cggtacagga tggcaaaatc cgagtatttc aggtccgggt cgttgcgcat gaccgtgcgg 1861 atcttctcgc aggtccagcg ggcttcttcg cggtcgtcgg aagcgcggta gtattcgatc 1921 ttctcacctg ccggtgcctg ggtccacagt tttttcgcct tgcggccccg gttgcgggag 1981 atgacgctgt gggcggcctc gatgatgttg gaggtggagc ggtagttctg ctccagtttg 2041 atgaccttcg ccccggggaa atctttttca aattccagga tgttgcggat gtccgcgccg 2101 cgccactggt agatgcactg gtcgtcatcg cccaccacgc acaggttgcg gtgcttctgc 2161 gacagcaggt agaccaggcg atactgcagc atgttggtgt cctggtattc gtccaccatg 2221 acgtatttaa acttctgctg atactttagc agcgtctctt cgtcgcgctc aaacagcctc 2281 accgtattga ggatgaggtc gtcgaagtcc atggcgttgt tcttttttaa ggccttctcg 2341 tagcggtcgt acagcgtaca gatgggctgg tatttatcga tattgccgta tttgcgggtg 2401 tattccgcgc tggagatatt cttctccttg gcatcggaga tctcggacag cacgtaagcc 2461 ggcgcatact gcttttcgtc gtactgcagc tccttaacga tgctcttcat cagagccttc 2521 tggtccgcgg ggtcgtagac gacgaaattg cgttcgtagc cgatcttgtc cgcgtccatg 2581 cgcaggatgc gaaggcaggc c // LOCUS sequence167 2596 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence167 VERSION sequence167 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2596 /mol_type="genomic DNA" /organism="" /note="sequence167" CDS complement(600..1166) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLAGIAVSALFGAITNLMIYHTKTGSDKVKTASYWMMGSLSGSSW EKLKYATIAFLVCFALIMLLTRQLDVLMLGDDVASTVGVNTDKLKLMIILLATLLTGVI VSVSGPIGFVGLTFPHITRSIVGTKHRRLVPAAVLVGGTFLVVADIISRVIVAPEELPI GVVSAFFGAPFFLYLIRKGNKKAGG" /locus_tag="LOCUS_5210" /note="WP_011986194.1 iron ABC transporter permease (Clostridium botulinum) [pid:43.1%, q_cov:100.0%, s_cov:52.7%, Eval:1.1e-44, partial hit]" /note="internal stop codon at [1170:1172](-)" /note="MGA_747" CDS complement(1170..1676) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEKRKTALFPLHKESHFLIFCILMVCLMGIAMFTAMRMGSVEIDP DTIQGILVNKLTSREYYPVTWEYSLESIVWDIRTPRVFTAFIVGAGLTMCGILMQVLTK NSLADPYVLGISHGASAGAVSVIMYGYLWFLGGYGTMAGAFLGALISITLAMKIASVRK KITAT" /locus_tag="LOCUS_5220" /note="WP_011986194.1 iron ABC transporter permease (Clostridium botulinum) [pid:42.1%, q_cov:88.1%, s_cov:42.8%, Eval:2.3e-26, partial hit]" /note="internal stop codon at [1170:1172](-)" /note="MGA_748" misc_feature complement(1697..>2596) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011948657.1:ABC transporter substrate-binding protein" /note="WP_011948657.1 ABC transporter substrate-binding protein (Clostridium botulinum) [pid:30.4%, q_cov:92.6%, s_cov:81.2%, Eval:5.2e-31]" /note="MGA_749" /locus_tag="LOCUS_5230" ORIGIN 1 cgacgcgatg ttgaggtcgt gaatggagga aaacacggta aggtcctgat tcttgaggat 61 gttcatgatc tggtactgat atccgatgtc cagatggttg gttggttcgt ctaagatcac 121 aagctccgcc ttctgcacca gggctcgggc gacgagcgtc cgctgctttt cgccgccgga 181 cagcgacaaa aagctgcgct cctcgtagcc ggaaagccct acttccgcca gggcgtcctt 241 tacgatgcgt ccttccgcca ccatgtcggt gccgaacatc ttctggtgag agtagcggcc 301 cagcattacc atatcgaaga ccagcatgtc gaactctaca ttgttctcct gctgcatcac 361 ggacatctcc ttcgccgtct ccttgttgga gagctgcgcc aggtccttgc cgtcgataaa 421 cactttgccg ctgtcgggct tgtagacttt atagatattc tttaaaagcg tggattttcc 481 gcagccgttg gggccgacga ggcccacgaa ggacccctct tccactccca ggctcacgcc 541 gtccacgatc agcttggcgc cgatggaata gcttacgttt tctacgttga gtttcatcct 601 cagccacctg ccttcttgtt gcccttgcgg atcaaataca ggaagaacgg cgcaccgaag 661 aacgcggaca cgacgccgat gggcagttcc tccggggcaa cgatgaccct tgagatgatg 721 tctgcaacga ccaggaacgt gccgcccacc agcaccgccg ccggaaccag ccgccggtgt 781 ttcgttccca cgatacttcg cgtaatgtgg gggaaggtga gcccgacaaa gccgatgggg 841 ccggagacgg acacgatgac gcccgtcagc agcgtagcca gcaggatgat catcagctta 901 agcttatccg tattgacgcc caccgtggat gccacgtcgt ctccgagcat caacacgtcc 961 agctgccgcg taagcagcat gatgagcgca aagcacacca gaaatgcgat cgtcgcatac 1021 ttcagcttct cccaggaaga gccggacagc gagcccatca tccagtaaga tgcggtcttc 1081 actttgtccg agccggtctt cgtgtggtag atcatcaggt tcgttatggc gccgaacagc 1141 gcggagaccg cgatgcctgc cagcaccagc taagtggctg taatcttttt gcgcacgctg 1201 gcgatcttca tggccagcgt aatggagatg agagcgccta aaaatgcgcc cgccatggtg 1261 ccgtagccgc ctaaaaacca cagataaccg tacatgatga cggataccgc accggcggat 1321 gcgccgtggg agatacccag cacgtacgga tccgccaggg aatttttcgt gagcacctgc 1381 atcaggatgc cgcacatggt aagacccgcg cctacgataa aggccgtaaa gacgcggggc 1441 gtgcggatgt cccagacgat ggactccagg ctgtattccc aagtgaccgg gtaatactct 1501 ctgctggtga gtttgtttac cagtatgccc tgaatggtgt ccgggtcgat ctccacgctg 1561 cccatgcgca tcgccgtaaa catggcgatg cccatgagac agaccatcag gatgcagaag 1621 atcagaaaat gcgattcttt gtgcagcgga aacagcgctg tttttcgttt ttccatcttc 1681 gctaattgtt taaatcttag aacttatcgg gatagaactg ctttgccatg atctcgacgg 1741 taccggcgga accggcagag ccctgcatgt cggcgcagca ggcggaatag atccggcctt 1801 ccttgaccgc tctcagattc ttggtgaagt cgttgttctg caggaattcg atcttggcgt 1861 cggtgtcgta gtcgtagtcc aggatgagga tgacatccgg gtcacgcgca acgacctctt 1921 cccaggaggg cgtcgcccag cccttttcga tgtcgtcgaa gatggagatg ccgccggctc 1981 tcttgatcat gtcgccgggc atgccctggc aggcggtgaa aggagcgtcc tcgccagagt 2041 cgtagacgaa cacgcggatg gggttctcgt aaacttctgc gcccagcgtc tcttcgacgt 2101 aagccaactt gtccttcata gcctggacct tttctgcggc cagttcctgc acgccgaaga 2161 cgttgcccag cacttcgtag tccttataga tatcctcgaa ggtggcggag tcggagcagc 2221 agtacgggaa gtacgggatg atgccgtgct ccaggcagaa gctgacggag aagttattgt 2281 cggagaacag ggagtcccag cccatcataa agtcgcagcc ggtggcgatg atgtcttcct 2341 tggagacctt ggcaagaccg gttccgtccg gagccatctt gtgaacggtg tctctagcgg 2401 gatactggct aacggtggac cagcaggatc ctctggtgaa gcctgccatg ttgttttcca 2461 ggcccagatc gaagaagaag tccgccatct ggtcgccgga ggcgatggcg tgggtgggag 2521 cggaggtaaa ggtctcctcc atgttctggc cgatgccgga acgctccagg ttcagggtga 2581 tggtgtacgg ttcgta // LOCUS sequence168 2582 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence168 VERSION sequence168 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2582 /mol_type="genomic DNA" /organism="" /note="sequence168" CDS 249..1799 /product="glutamine-hydrolyzing GMP synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048241.1" /transl_table=11 /codon_start=1 /translation="MTQEKILVLDFGGQYDQLIARRVRDLRVYAELQPYNKITVEEIKA EGYKGIIFTGGPNSVYDPASPHYDPALLDAGIPILGICYGHQLLAWMADGKIGSAGNFS EYGKVTVTHRGGVLFEGVPEECVCWMSHTDSVMELPQGFESVASTGMCAVAAMEDVSRK LFGVQFHPEVQHTQYGKTILGNFLFKVCGCSGDWHMENYCKQAVEAIRAKVGDGKVLLA LSGGVDSSVCAALLAEAIGPQLTCVFVDHGMMRKNEPEEVRKAFEGWDIHFVGIDASER FLEALRGVTDPEVKRKTIGEQFIRVFEEEGKKIGSVDFLAQGTIYADVIESGAGDAATI KSHHNVGGLPDFVDFKEIVEPLRDLFKDEVRQLGRELGLPEYLVSRQPFPGPGLGIRCI GEVTREKLDILRDADAIFREEVDRAAAVDPDAPWTANQYFAVLTDTRSVGVMGDMRTYG YTVALRCVTTDDFMSADWTRLPYEVLEAAGTRIPNEVKQVSRVVYDITSKPPATVEWE" /locus_tag="LOCUS_5240" /gene="guaA" /EC_number="6.3.5.2" /note="WP_012048241.1 glutamine-hydrolyzing GMP synthase (Clostridium botulinum) [pid:57.3%, q_cov:100.0%, s_cov:100.0%, Eval:1.6e-170]" /note="MGA_751" CDS 2399..2536 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MYREQISEGLAKIIEDLEKALQERKKSFTDNVKRSDSNTKVRERV " /locus_tag="LOCUS_5250" /note="MGA_752" ORIGIN 1 aagcccgggg agccgttgtg acggctctgg tcccggaagg ggcggaaggc accgaagcgg 61 cgtacactta cgcggaccgc tgcgttgccg tacctgccct gcgggacatc ttcgcctcca 121 tcgcggccgt cgtccctctg cagctgcttg cctatcatac ggcaaaggcg aggggctgca 181 gcatcgacaa gcctaagaac ctggcgaagt ccgttaccgt ggaataggaa tagaagagga 241 aagagactat gacacaggaa aagatcctgg tgctggactt cggcggccag tacgatcagc 301 tgatcgcccg cagagtgcgc gatctgcgcg tctacgcgga actgcagccc tataacaaaa 361 ttacagtcga agagatcaag gcggaagggt ataaggggat catctttacc ggcggtccca 421 actccgtgta cgatcccgct tcgccccatt acgacccggc gctgctggac gccggcatcc 481 ccatcctggg gatctgttac ggtcaccagc tgttggcgtg gatggcggac ggaaagatcg 541 gttccgccgg caacttctcc gaatacggca aagtgaccgt gacccaccgc ggcggcgtcc 601 tgttcgaagg cgtgcccgaa gaatgcgtct gctggatgag ccacacggat tccgtcatgg 661 agcttccgca gggattcgag agcgtggcga gcacgggcat gtgcgcggtc gcggccatgg 721 aagacgtctc ccgtaaactc ttcggcgtgc agttccaccc ggaagtgcag catacgcagt 781 acggcaagac catcctcggc aatttcctgt tcaaggtctg cggctgcagc ggcgactggc 841 acatggagaa ctactgcaaa caggccgtgg aagcgatccg cgcgaaggtc ggagacggca 901 aggtgctgct ggcgctgtcc ggcggcgtgg attcgtccgt gtgcgcggcg ctgctggcgg 961 aggccatcgg accgcagctc acctgcgtgt tcgtggacca cggcatgatg cgcaaaaacg 1021 agcccgaaga ggtgcgcaaa gccttcgagg gatgggatat ccatttcgtg gggatcgacg 1081 cgtctgagcg gtttttagag gctctcaggg gggtcacaga tccggaggtc aagagaaaga 1141 ccataggcga gcaatttatc cgcgtgttcg aggaagaagg gaagaagatc ggctccgtgg 1201 acttccttgc ccagggcacg atctacgccg acgtcatcga atccggggcg ggtgacgccg 1261 ccacgatcaa gagccatcac aacgtgggcg gcctgcccga cttcgtggat ttcaaggaga 1321 tcgtcgaacc cctgcgcgac ctgttcaagg acgaggtgcg ccagctgggc cgagaactgg 1381 gcctgccgga atatctggtc agccgccagc cgttcccggg accgggcttg ggcatccgct 1441 gcatcggcga agtgacccgc gaaaagctcg acatcctgcg cgacgccgac gccatcttcc 1501 gggaggaagt ggacagggct gccgccgtgg atccggacgc gccctggacc gcgaaccagt 1561 acttcgccgt gctgaccgac acgaggagcg tgggcgtgat gggcgacatg cgcacctacg 1621 gatacaccgt ggcgctgcgc tgcgtcacca ccgacgactt catgagcgcc gactggacga 1681 gactgcccta cgaagtgctc gaggccgccg gcacccgcat ccccaacgag gtgaagcagg 1741 tgtcccgcgt ggtatatgat attacgagca agccccccgc gacagtggag tgggagtaga 1801 acgtaaaggc ttgctggttg cacaaaaaac gccgaaaagc cctgtaatta caggcaattc 1861 cgggttttga cgagttagcg ggaatggtgc cgtgcaaccg ccgtgcaacc gcgagagccg 1921 ggaaaagacc gtttggttgc acagaggcga ttttaatggt agccagtggc taaccgcgaa 1981 aagccggaaa acgtatataa attgctatta agccagttcg ttttgacaac ggactggctc 2041 tttttttatg ccaaaaaata tttttggagg gaccctaaaa aatggtcgag ttattcccat 2101 tacctaatga aggggttctc ctcccgacaa ggagtgccac ttcgcgctac ttgaaaactg 2161 aatatacaga tcatcaggta cgttacttgc tcttcagacg ctttttagaa cgaactacct 2221 tgaaggcaaa gaagtctcca tgcttcctgc tgaaacagag acactggttc gcttgtttat 2281 ggttggagaa agtgatgaga aacgatttga cgagatgatt aaagtcgctt ccgagagcag 2341 gcgcaagccg gatctgcaga cttgctttaa catgcgagag cgtcttccaa aagaaacaat 2401 gtatagggaa cagatttctg aaggattggc aaaaataata gaagatctgg aaaaggcgtt 2461 gcaggaaagg aagaaatcct ttacggataa tgtcaagaga agcgattcga acacgaaagt 2521 gcgcgagcgt gtgtgacaga cagtgcagga aaaaatggta ctcaagaggg aaaacatgct 2581 at // LOCUS sequence169 2566 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence169 VERSION sequence169 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2566 /mol_type="genomic DNA" /organism="" /note="sequence169" CDS complement(657..1658) /product="3-deoxy-7-phosphoheptulonate synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003439427.1" /transl_table=11 /codon_start=1 /translation="MIVVLKHNVQDEKRDQLVEWLKQQGLTVHISQGDYQTVLGLVGDT TRVDMDLIESLGIVDSVKRITDPFKKSNRKFHPDDTIVEVGDVKIGKGNFVVIAGPCSV ETEDQIVTVAKAVKASGADMLRGGAFKPRTSPYDFQGLRGEGLRLLEIAKQETGLPLVT ECMGVDDLPLFENVDVIQIGARNMQNYELLKAVGKLDKPILLKRGLANTLKELLMSAEY IMAGGNEKVILCERGIRTFDDYTRNTLDLAAVSMLRELTHLPIIVDPSHATGIARLVPP MAMAATASGCDGLIIEVHNDPMHALCDGAQSLKPEEFDALMGKVRQIREIVQ" /locus_tag="LOCUS_5260" /gene="aroF" /EC_number="2.5.1.54" /note="WP_003439427.1 3-deoxy-7-phosphoheptulonate synthase (Clostridioides difficile) [pid:58.0%, q_cov:99.7%, s_cov:98.8%, Eval:6.8e-107]" /note="MGA_754" ORIGIN 1 ggggttcagc caggcgacgc gggtcatgtc ctggtagctg ccggcagaga aacccttgtg 61 cgacgccgcc gtatcgctct tgatataggc gttggacacc acgtgggcca tctgggacgt 121 aaaagcgatc atctcgtcgt gtttgtccgc cgtcgtaaag gaaaagcgcc cgaatcccgc 181 gggcttcagc agttcctccg ccctgcccag caggtttacg tcgtccgcat ccatcggcac 241 cagcaccatg ggcgcgttgt gatacagatt cgcccgggcg tatttaaagc cggaatactg 301 ggtgccggcc atggggtgac cgcccacaaa gtgaaatccg tactcttccg ccaccgggaa 361 cagcgcttcg cacaccgccc gcttcgtgcc gcagcagtcg atgacgatgg gctttttgcc 421 gaaatacggc gacatgcgtt tgacccattc aatggcagcc tccggataaa tggtgaccag 481 caccagatcg cagctgccca cgttctcctg ggtcagttcc ccgtccacgg ctccgctgat 541 cctggcaaag tccaggacgg acgctgtgcg gttgcaggcc agcacttccc agcccgcctc 601 tttgtatgcc ttggcaaagg agcctccgat gaggcccagg cccacgatgc cgcagatcat 661 tgtacgatct cccggatctg gcgcaccttg cccatcaaag catcgaattc ttccggcttt 721 aaggactggg cgccgtcgca cagcgcgtgc atcgggtcgt tgtggacttc tatgatgagt 781 ccgtcgcagc cgctggccgt ggccgccatg gccatgggag gtacgagtct tgcgatgccg 841 gtcgcgtggc tgggatccac gatgatggga agatgggtga gttcccgcag catggagacc 901 gccgccaggt ccagcgtgtt tcttgtgtag tcgtcgaaag tgcggatgcc gcgctcgcag 961 aggatcacct tctcgttgcc gcccgccatg atgtattcgg cgctcatcag cagttctttc 1021 agggtattgg cgagacctct cttcagcagg atgggcttat ccagcttgcc aacggccttc 1081 agcagctcgt aattctgcat gttgcgggcg ccgatctgga tgacgtccac gttctcgaac 1141 agcggcaggt cgtccacgcc catgcattcc gttaccagag gcagtcccgt ctcctgcttt 1201 gcgatctcca gcagacgcag gccttcgccc cgcagtccct ggaagtcgta gggcgaagtt 1261 ctgggcttga aagcgccgcc ccgcagcatg tccgcgccgg aggccttgac ggcctttgct 1321 acggtcacga tctgatcctc tgtctccacg gagcagggtc ctgcgatgac cacgaaattg 1381 cccttgccga tcttcacatc ccccacttcc acgatggtgt cgtcgggatg gaatttacgg 1441 ttgctcttct tgaacggatc cgtgatccgc ttgacggaat ccacgatgcc cagggattcg 1501 atcagatcca tgtccacccg ggtggtgtcg cccaccaggc ccagcacggt ctgataatcg 1561 ccctgagaga tatgtacggt aagaccctgc tgtttgagcc attccaccag ctggtctctc 1621 ttttcgtcct gtacgttatg cttcaatact acgatcattg gtaaatactc ctttaacctt 1681 ataagtatac ctgaaatctt ccggatatga tactgcaggg atacaaagaa aagcggtcct 1741 gcacgatgca ggaccgcttt tggacttgta tctcttccgg cagtctatgc tcgcgcagcg 1801 tctatgggaa aggcaccgta aaagtagcct ccgaaataga agccaaagaa agcatcataa 1861 aagaagccgg aaactgcgct gtaaagtgtc ttgctatttt tgttcatcgt ctctgactcc 1921 tttctgccga aattatggat atacgataac acttccgttt tgtttagtca acaaatattc 1981 cggaaattta ttgttcttct gcaacacttt cttccgggtc aggctctgcc tgcaccgcct 2041 ctggcgagac gctctgggtg ttgggcttca tctcctgata gtagctggag atgcccgtcg 2101 tgtcttcggt gtagcccggg ttcggcggcg tctggttcgt gatctcctcg cccttgtgat 2161 tcttccacag gatcaggatg accaccacca cgagcagcgt cgctacgaca gcgatgatca 2221 gcaggccttt gagcacggag gtcgccaccc ctttggcctt atccgtcttg tccttgaacg 2281 cggagagcgg attgtcggcc tgccagaacg gatcttctcc gagagcatgt tccccacctt 2341 ccgcatattc cgcgtagttt tcgtcgaaat agtcgtagat gtcgtccgac agatctccta 2401 ttgcggaaga gttgcggaaa tccatcagac cgcaggcctc gaccgcctcc agatatccca 2461 tgtcgctagg cagtgcggtc acctgcatgt agcggtccac cgctccgtcc cagtcctcca 2521 gagactggcg ccagatatcc agcgcagaca gcgcggaagt ggcata // LOCUS sequence170 2563 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence170 VERSION sequence170 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2563 /mol_type="genomic DNA" /organism="" /note="sequence170" CDS complement(539..931) /product="cation:proton antiporter subunit C" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010902377.1" /transl_table=11 /codon_start=1 /translation="MSVFFANLPEYAAMILFGIGLSNLMLAKNLVKKIIGLNIMDTSVY LFLAAKGYVENSVAPIVSASDLGHIEHTLYTNPVPAGLVLTGIVVSVSVTAVLLSLIVR LNEEFHTLDIDEIIHILRQRDREDLK" /locus_tag="LOCUS_5270" /note="WP_010902377.1 cation:proton antiporter subunit C (Halobacterium) [pid:40.2%, q_cov:78.5%, s_cov:80.5%, Eval:4.1e-15]" /note="MGA_757" CDS complement(928..1692) /product="Na(+)/H(+) antiporter subunit B" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004080100.1" /transl_table=11 /codon_start=1 /translation="MNKEKRDRLYAVLCTVLTIVFISVMLFTVEKMPDLGRADNPDINE VMEFYVEEGPEETGALNAVTGMILHYRAFDTLGESCVLFVSAVCVFILLRIDGEASNDT LVAIDRRYEPTDDPILTQTFKLLVPAVFMFGIYITMNGHLSPGGGFSGGAIIGAALLLF LNAYGLEKTERFMSSQLYRRVTTMALCFYAVAKSYTFYTGANGLDSFEGAGTPGNILSA GLILPLNICVAVVVSMTIYSMYIMIRKGGFNK" /locus_tag="LOCUS_5280" /note="WP_004080100.1 Na(+)/H(+) antiporter subunit B (Thermotoga) [pid:23.8%, q_cov:96.1%, s_cov:98.8%, Eval:3.0e-10]" /note="MGA_758" CDS complement(1685..2002) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MQGLMAVLLLLLVICAVAVSATRKLLPAVIIFMSYSMIMSIVWLL LRAPDLAITEAAVGAGITSVLFFITMRRLGLLKKNLQEDEAEVQAHFAAHSGKLEEESD E" /locus_tag="LOCUS_5290" /note="WP_010902379.1 DUF4040 domain-containing protein (Halobacterium) [pid:43.5%, q_cov:59.0%, s_cov:35.2%, Eval:1.4e-10, partial hit]" /note="MGA_759" CDS complement(1990..2334) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="METIRFVLGTLLILSGLVIFIIEVFGNYRFGYVLNRMQAAAIGDS FGIVLCLLGTMLYFGWSVACLKLLFVEIFLWFSSPVSSHLVAKLEAETNEDLAKEVKMR TQKEDDPCKD" /locus_tag="LOCUS_5300" /note="MGA_760" ORIGIN 1 gagatgagga acaggccgga gccgatgagg ctcatgataa agtagcgcat ggaggcagcc 61 agcgtgtagc cgtcctcctt gctcatgacg atgccgcagg ccgtgatggt gttgatctcc 121 acgaacacgt atgccgtaaa gatgtcgttc gtgtacacga gcgccaacat ggaacacagc 181 agaaacaacg tcgagatata gtacaggttt acctttaagc ggccgatgtc gctgcgcagg 241 tgtgccctgc cgcccatgag agacagcagc gtaacgatgg agaacagcgt cgcgacggca 301 gcctcgagca tgccggcccg cagttcgttg ccgaaaggcg cgccgatctc gcccatgctg 361 taggtgtacg cggctccgcc ctgcagaaaa tagaccagca gcgcgacgga ggcagcggcc 421 accagcgcga tggcgcagtc cgccagatgt cttgccgccc tgcggggaag cacgaggcac 481 acgatgccgc acagcatcag cagcagtatg gaaaaggcag ggacgttctg gaccaggctc 541 atttcagatc ctccctgtcg cgttgtctca agatgtggat gatctcgtcg atatccagag 601 tgtggaactc ctcgttcagc cgcacgatga gagacagcaa taccgccgta acggatacgg 661 agaccacgat gcccgtaagc acaaggcctg ccggcaccgg gttcgtgtac agcgtatgct 721 cgatgtggcc gaggtcggac gcgctcacga tgggcgcgac ggagttctcg acgtagcctt 781 tggccgccag gaacagatac accgaggtat ccatgatgtt gaggccgatg atcttcttga 841 cgagattctt cgccagcatc aggttggaga gtccgatgcc gaacaggatc atggccgcat 901 attcgggaag gtttgcaaag aagacgctca tttgttgaac cctcctttgc ggatcatgat 961 gtacatggaa tagatcgtca tggagacgac gaccgccacg cagatgttga gcggcaggat 1021 gagccctgca gacaggatgt tgccgggcgt gcccgctccc tcgaagctgt cgaggccgtt 1081 ggcgcccgtg tagaacgtat agctcttggc gacggcgtag aagcacagcg ccatggtcgt 1141 aacgcggcgg tacagctggc tgctcataaa gcgctccgtc ttctccaggc cgtaggcgtt 1201 gaggaacagc agcagcgcgg cgcctatgat cgccccgccg gaaaatccgc cgccggggga 1261 caggtggccg ttcatcgtga tgtagatgcc gaacatgaag accgccggca ccagcagttt 1321 aaaggtctgc gtaaggatgg ggtcgtccgt gggctcgtag cgccggtcga tggcgaccag 1381 cgtgtcgttg ctggcctcgc cgtcgatgcg cagcaggatg aacacgcaca cggcggacac 1441 gaacagcacg caggattccc ccagcgtgtc gaaggcgcgg taatggagga tcatgccggt 1501 gaccgcgttc agcgccccgg tctcctccgg accctcttcc acgtagaatt ccatgacctc 1561 gttgatgtcc gggttgtctg cgcggcccaa gtcgggcatc ttctcgacgg taaacagcat 1621 gacgctgata aaaacgatgg tgagcaccgt gcagagcacg gcgtagaggc ggtcgcgttt 1681 ttccttattc atcgctctcc tcctccagtt ttccgctatg ggcggcgaag tgcgcctgca 1741 cttccgcttc gtcttcctgc agattcttct tcagaagacc cagccggcgc atcgtgataa 1801 agaacagcac ggacgtgatg ccggcgccga cagctgcctc cgtgatggcg aggtccggcg 1861 cccgcagcag cagccatacg atggacatga tcatgctgta ggacatgaag atgatgaccg 1921 caggcaggag cttccgggtc gcggagaccg ccacggcgca gatgacgagc agcaaaagaa 1981 gaacagccat caatccttgc atgggtcatc ctccttctgc gtgcgcattt ttacctcctt 2041 cgccagatct tcgttcgtct ccgcctccag cttcgccacc aggtgggagc tgacgggcga 2101 ggagaaccac aggaagatct ccacgaacag cagtttaaga caggcgacgg accagccgaa 2161 atacagcatc gtgccgagaa ggcataaaac gatgccgaag ctgtcgccga tggcggcagc 2221 ctgcatgcgg ttgagcacgt agccgaaacg gtagttgccg aacacttcaa tgatgaaaat 2281 gacgagcccc gacaggataa gcagggtgcc cagcacaaat ctaatcgtct ccatcgctgt 2341 gcagcccctc ctccgtagcc tgggccgtct gggcctcgat ctcctgccgt tcatcgtctt 2401 ttaacgataa gtattcgccc cggtagatgc gggaaaagac cacgaccgca agaaagctga 2461 tcatggcgta gagcagcccg atgtcgatca ggctgggatc tttaaggatg gcggacataa 2521 agacgatggc ggagatgacc atcgtgccgg ccatgttgat gga // LOCUS sequence171 2556 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence171 VERSION sequence171 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2556 /mol_type="genomic DNA" /organism="" /note="sequence171" misc_feature <1..1063 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011987043.1:pyruvate:ferredoxin (flavodoxin) oxidoreductase" /note="WP_011987043.1 pyruvate:ferredoxin (flavodoxin) oxidoreductase (Clostridium botulinum) [pid:51.9%, q_cov:97.7%, s_cov:31.5%, Eval:3.1e-105, partial hit]" /note="MGA_762" /locus_tag="LOCUS_5310" CDS 1124..1888 /product="amidohydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010867222.1" /transl_table=11 /codon_start=1 /translation="MGKIIDSHAHIGGSWMGKVKNPYSPERMKEIMQSFGIDYACISTW DVLNDIERGNADVCALAKRDPFYIPYVVVCPVHEKDSVEAIKRYVGGEGFKGIKMHPTA NYYRVDSLKMMEPVMNLAAEYDVPLLFHGEEDGYGSPCQFAALAEAFPECKIIVAHMCH GLWLDAIEVCRSHENIWLDTAECSPHNFKMERAIRLCGPDKIIFGTDTPVTDIGAHLAI FDNMNTYFPGTLTDEGLEKILHGNIEKLLKMA" /locus_tag="LOCUS_5320" /note="WP_010867222.1 amidohydrolase family protein (Pyrococcus abyssi) [pid:29.1%, q_cov:98.4%, s_cov:92.7%, Eval:5.6e-17]" /note="MGA_763" ORIGIN 1 cgagacgccc tacgccaagc tgatgaccca gctcttcggc gagcgcgtct actgggccaa 61 cggcacgggc tgctcccagg cctggggcgc ctccatgcct ggcatcccct acaccaccaa 121 ccgcagagga ttcggccccg cctggaccaa ctccctgttc gaaaacaacg cggagctctg 181 cctcggcatg ctcctgtccg tcaagcagca gagaaacgcc gtcaaggcgc aggtggaaag 241 cctttgcgcg ggcgcttccg gcgaactgaa ggcggcctgc gaagcatggc ttgcggcctt 301 cgacgatttc gacgggtcac gcgagacggc ggacgccctc tgcgccctcc tggagcagga 361 agacacgccc gaagcgaagg cgatcctcgc ccataaagac cagctggcga gaaagacttt 421 ctggatgtac ggcggcgacg gctgggccta cgatatcggc ttcggcggcc tcgcccacgt 481 catcgccagc ggcgagaacg tcaacgtctt tatcatcgac acggaagtct attccaacac 541 cggcggccag agcagcaagg cgacccaggt cggcgcggtg gcgcagttcg cgtccagcgg 601 caagcgcacc cggaagatgg acatcggcgg catcatgatg agctacggca acgtctacgt 661 ggcgcaggtc gccatgggtg cagacccgaa ccagctcatc aaggccatca aggaagcgga 721 ggcgttcgac ggccccagcg tcatcgttgc ctacacgccc tgcacgtccc acggcatccg 781 agccggcatg agcaaggtgc aggaggagat gaagcgggcg gtcgaatccg gctattggct 841 gctctaccgc ttcgatccgc gccagagcca gccgctgcac ctggattcca aggaaccgaa 901 gatgggctac gaggagttcc tggacggcga gacccgctac agcgccctca agctcacctt 961 ccccgaaaac gcgaaggcgc tcttcgccat cggcagcgac gaagccgcca agcgctacgc 1021 gcagtacaag cacatggagg cgtcgcagaa gaccggggat tgatgtgccc gccctgtccg 1081 attcgtggta aaatgagggt gcttcggcaa gaaaggagac catatgggca agatcatcga 1141 ttcccatgcg cacatcggcg gctcatggat gggtaaagtc aagaatccgt attctcccga 1201 gcgaatgaag gagatcatgc agagcttcgg catcgactat gcctgcatca gcacctggga 1261 tgtcttaaac gacatcgaaa gaggcaacgc ggacgtctgc gccctggcga agcgcgaccc 1321 gttctacatc ccctacgtcg tcgtctgccc ggtccacgaa aaggattcgg tggaggccat 1381 caagcggtat gtgggcggtg aagggttcaa gggcatcaag atgcatccga cggccaacta 1441 ctaccgggtg gacagcctta agatgatgga gccggtcatg aacctggcag cggaatacga 1501 cgtgccgctc ctgttccacg gcgaagagga cggctacggc agcccctgcc agttcgcagc 1561 gctggcggaa gccttcccgg aatgcaagat catcgtcgcc cacatgtgcc acggcctgtg 1621 gctcgatgca atcgaggtct gccggtccca cgaaaacatc tggctcgaca ctgcggaatg 1681 ctctccccac aacttcaaga tggagcgggc gatccgcctc tgcggtccgg acaagatcat 1741 cttcggaacg gatacgccgg tcaccgacat cggcgcccac ctggcgatct tcgacaacat 1801 gaacacctat ttccccggca cgctcaccga tgagggcctg gagaagatcc tgcacggcaa 1861 catcgaaaag ctgctgaaaa tggcgtaagc gttcgacaga aaggataaca ctatggcaac 1921 gatctattac gataaggact gcgatctcga tctggtgaag gacaagacca tcgcgatcat 1981 cggctacggc aaccagggcc gggcgcaggc gctcaacatg aaggattccg gctgcaccaa 2041 gatcatcgtc ggaagccgca aggacagctc ctacgaccag gccgtcgagg atggtttcgc 2101 ggtcaagccc atcgaagagg cgtccaagga ggcagatatc ctctttatgc tgctgccgga 2161 tgaatatgcg ccggccatct tcaacgaaca gattgcgccg gggcttgaac cgggcaacat 2221 cgtcaatttc gcctccgcct acaacatcac cttcaagaag atcgttccgc ccgcctttgt 2281 cgacgtcgtg atggcggtgc cccgcatgat cggcgacggc gtacggcaga tgttcctgcg 2341 gggcgagggc ttcccctcct tcgtaggcgt tgcccaggac gcttccggca aggcgctgga 2401 atacggcaaa gcgctgtgca aggcgatcgg gtctaccaag aagggcgcca tcgaggtcag 2461 cttcgacgac gagaccatgc tggatctgat ggcggagcag ggcacctggc ccatcatcta 2521 ccatgtgttc gacgagtcct tcaagctgct ggcgga // LOCUS sequence172 2536 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence172 VERSION sequence172 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2536 /mol_type="genomic DNA" /organism="" /note="sequence172" misc_feature <1..523 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_009891775.1:ribosome biogenesis GTP-binding protein YihA/YsxC" /note="WP_009891775.1 ribosome biogenesis GTP-binding protein YihA/YsxC (Clostridioides) [pid:52.4%, q_cov:97.1%, s_cov:81.3%, Eval:2.8e-46]" /note="MGA_765" /locus_tag="LOCUS_5330" CDS 526..1062 /product="hypoxanthine phosphoribosyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003359412.1" /transl_table=11 /codon_start=1 /translation="MAARKKYSFEEVLISKEQLAAKVAELGAQISKDYEGEELFLIGIL KGSVPFMADLMRAITLDVEMDFMSVSSYGSGTKSSGVVRILKDLDSDIAGKNVLIVEDI IDSGLTLAYLKEYLAKRNPKSIKIVTMLSKPARRKADLEADYTGFVIDDMFIVGYGLDI DQKYRNLPYISWIKE" /locus_tag="LOCUS_5340" /gene="hpt" /EC_number="2.4.2.8" /note="WP_003359412.1 hypoxanthine phosphoribosyltransferase (Clostridium) [pid:61.5%, q_cov:94.9%, s_cov:93.4%, Eval:1.3e-54]" /note="MGA_766" CDS 1069..2295 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKHLEKYIDHTLLKPAAGIADIEQLCKEAKEHGFYAVCVNSRFVP VAKKALQGTDVKIASVIGFPLGAMSTAAKVFETENSCENGAEEIDMVMEYGLLKEGHKQ AVFDDIKAVVDAAAKYGAIVKVILETGALTDGEIVDACKLSEEAGAAFVKTSTGFGEGG ATVHAVELMRKSVGPNVKVKASGGIRDRETALAMIEAGADRIGASAGIAICTVPEGEEE EGPFEKEGPKNILVLNGSPKMSGNTAALVDAFCRGAQEAGHTVHVFNVANLNVHPCTDC RYCFDHAGECVLQDDMKRIMPHLYADDVIVFATPVYFYGFSAQIKTVLDRMICMQPSKM TVKGSILLSPYGDTDTTVPKPMIAMYKAFTGYIGWKNLGIVTAENCMDPGDIQGHRALA EAEALGKNL" /locus_tag="LOCUS_5350" /note="WP_012028213.1 deoxyribose-phosphate aldolase (Streptococcus suis) [pid:56.7%, q_cov:51.5%, s_cov:94.5%, Eval:6.5e-57, partial hit]" /note="MGA_767" ORIGIN 1 gggcaagtcg tctctcatca acctgctcac caaccggaag aagctggcca aggtctccca 61 gaatccgggc aagacccgca ccatcaactt ttttacggtg aacgggacgt tccgcatcgt 121 ggaccttccg ggctacggct atgcgaaggt ctccaaggcg gaagcggaga agtggggccc 181 catgatggag gactatctgt cttcccggcc agacctgctc aaggtggtgc agctggtgga 241 catccgccac gctccctccg ctcaggaccg gcagatgtac gagtatctgc agtattacgg 301 tctggacggc ctcgtcgtcg ccacgaaggc ggataaggtg agccggggag aagcggcgaa 361 gaatatcgcg gtcatccgcc gcgatctgaa actgaagaag ggcgaccggg tgatcccggt 421 atcggctttg aataaaacag gcacggaaga gatcctcgcc gccatggaag agatccttct 481 ggccggaaaa caagagaaca cggaaaacgg ggaggatgca tagtcatggc tgccaggaag 541 aagtacagtt ttgaggaagt tctgatctcg aaggaacagc ttgcggcaaa ggtcgcggag 601 ctgggcgcgc agatcagcaa ggattatgaa ggcgaagagc tgtttctcat cggtattctg 661 aagggatccg ttccctttat ggcagacctg atgcgcgcca tcaccctgga cgtggagatg 721 gacttcatgt ccgtttcctc ctacggcagc ggcacgaaat ccagcggcgt cgtccgcatc 781 ctcaaggatc tggacagcga catcgcgggc aagaacgtgc tcatcgtcga ggatatcatc 841 gacagcggcc ttacgctggc gtatctgaag gagtatctcg ccaagagaaa ccccaagagc 901 atcaagatcg ttacgatgct gtccaagccc gccagaagaa aggcggatct cgaagcggat 961 tataccggtt tcgtcatcga cgacatgttt atcgtgggtt acggactgga tatcgaccag 1021 aaatacagaa atctccctta tatctcttgg atcaaggagt gatgtcttat gaaacatctg 1081 gaaaagtaca tcgatcatac gctgctgaag cccgctgcgg gcatcgcgga tatcgaacag 1141 ctctgtaagg aggcgaagga gcacggcttt tacgcggtct gcgtcaacag ccgcttcgtt 1201 cccgtggcga aaaaggcgct gcaaggtacg gacgtaaaga tcgcatccgt catcggtttc 1261 cccctgggtg ccatgtccac cgctgcaaag gtgtttgaga ccgaaaattc ctgcgaaaac 1321 ggcgcggaag agatcgatat ggtcatggaa tacggtcttc tgaaagaagg ccacaaacag 1381 gccgtttttg acgatatcaa ggccgtcgtg gatgcggcgg caaagtacgg agccatcgtt 1441 aaggtcatcc tggagacggg agctcttacg gacggcgaga tcgtggacgc ctgcaaactg 1501 tcggaagagg caggagcggc gttcgtcaag acctccacgg gattcggcga aggcggagcg 1561 acggtgcatg ccgtggaact gatgcgcaag tccgtgggtc cgaacgttaa ggtaaaggcc 1621 tccggcggca tccgtgaccg cgaaacagcc ctcgccatga tcgaggccgg cgcagaccgg 1681 atcggcgcct ccgcaggcat tgccatctgt acggtaccgg aaggggagga ggaagaaggc 1741 ccttttgaga aagaggggcc gaagaatatc ctcgttctga acggaagccc caagatgagc 1801 ggcaatacgg cggctctggt ggacgcattc tgccgcggtg cgcaggaagc gggtcatacg 1861 gtgcacgtgt ttaacgtggc gaatctcaac gtacatccct gcacggactg ccggtactgc 1921 ttcgaccatg ccggcgaatg cgtgctgcag gacgacatga agcgcatcat gccgcatctg 1981 tatgcggacg acgtcatcgt atttgcgacg cccgtatatt tctacggctt ctctgcgcag 2041 atcaagaccg ttctggaccg catgatctgc atgcagccct cgaagatgac ggtaaagggg 2101 agcatcctgc tgtcgcccta cggcgatacc gatacgactg tgcccaagcc catgatcgcc 2161 atgtacaagg cgttcaccgg ctacatcggc tggaagaacc tcggcatcgt gaccgcagag 2221 aactgcatgg accccggcga tatccaggga catagggctc tggcggaagc ggaagcgctg 2281 ggaaagaacc tctagtaaaa atacgtgcaa aaaagatcaa aaaaccgcaa aaatagttgt 2341 tgacattcga tctgaagtgc gtataataga ttttgcgcgt cagccaaggt gctgcgaggc 2401 acctaaaaaa cttctcaaaa aactttaaaa agttgttgac aagtaagggc cagatgcgta 2461 taatcttaaa tgttccgcgt caaacggagc acgaaccttg aaaacaacat agtgtagaaa 2521 ttgagtctta aagacc // LOCUS sequence173 2533 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence173 VERSION sequence173 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2533 /mol_type="genomic DNA" /organism="" /note="sequence173" CDS complement(533..1411) /product="LysR family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_132283172.1" /transl_table=11 /codon_start=1 /translation="MEIRTLRYFMAVAREENMTRAAEQLHVSQPTLSKALRSLEEELGK KLFTRHSFSIKLTEEGVLLRNRAEDLVSMADKIEQEFLSLDDISGGDIYFGLAETYQIR YLAREIRRFKELYPDLRYHITSGDTEQVTEKLDKGLLDFAVICETPDDRKYHHILFPES DYFGVVLPKDSPLAEKESITAEDLAGLPLFCSEQSWENDIRPWAKELFDQFHMEGSFRL SYNGSLFAREGLGLLLTLNDLVDTSPESGMVFRPLSPHLEMKMYLIWKKYQNFTPIAER FLKQLQQSFAG" /locus_tag="LOCUS_5360" /note="WP_132283172.1 LysR family transcriptional regulator (Natranaerovirga hydrolytica) [pid:44.4%, q_cov:98.3%, s_cov:99.0%, Eval:7.5e-67]" /note="MGA_769" CDS 1548..1784 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEQDYKQILTGLEDAGCTPKEIRDAERLCDRKDPDALVRHLRRCR CSRMEELHESQRKVDCLDYLIRQTEKTKKANIG" /locus_tag="LOCUS_5370" /note="MGA_770" ORIGIN 1 gaaggcatta cgggcggcaa gacgaaaacg ctgtttgccc ccgcagacac ctgtacccgt 61 gcgcagatgg taacgttcct gtgggcagcc agcggcaagc cggagcccaa gacggcagaa 121 aacccgttca aggacgtacc cgagggctac tacaccaagg ctgtgctgtg ggctgtggag 181 aacggcatta cggcaggcgt ttctgcagat gaattcggtc ccagccgcac cgtgacccgg 241 ggccaggcca tgacgttcct gtacggagca aagggccgtc ccgaggcggg tacggcacct 301 ttcgaagatg taaaggagag cgattatttc gcaaaacctg tcgcctgggc ctttgaaaac 361 ggcatcacca gcggcaagac gaagaccgcc ttcggtccga atgacccctg caccagagcg 421 cagatcgtaa ccttcctgta tctgctcttc gcagaataga aaagcatatt aaacacaagg 481 ggacaggtat actgtgtgca cgacacagcg tacctgtccc tttgtgcttt ttttatcccg 541 caaacgactg ctgcagctgc ttcagaaagc gctctgcgat gggggtgaag ttctgatact 601 ttttccagat caggtacatc ttcatctcca gatggggcga cagaggccgg aagaccatgc 661 cgctctccgg agaggtgtcg accaggtcgt tcagcgtaag gagcagtccc agcccttctc 721 tggcaaacaa ggagccgttg taggaaagcc ggaaggatcc ttccatatgg aattggtcga 781 aaagctcctt tgcccagggg cggatatcgt tctcccagct ctgctcggaa cagaagagag 841 gaaggcccgc aaggtcctct gccgtaatgg actctttttc cgccaatggg gagtccttgg 901 gcagaacgac gccgaaatag tccgattccg ggaaaaggat atggtgatac ttgcggtcat 961 ccggtgtttc gcagatcacg gcgaagtcca ggagcccctt gtccagcttt tccgtcacct 1021 gctcggtgtc gccgctggtg atgtggtagc gcagatccgg atacagttcc ttaaaccggc 1081 ggatctctct ggcgagatag cggatctgat acgtctccgc cagtccgaaa tagatgtccc 1141 cgccggagat atcatccaga gacagaaatt cctgctcgat cttatccgcc atgctcacca 1201 ggtcttcggc ccggttgcgg agcagcaccc cttcttccgt gagctttatg ctgaaactgt 1261 gccgggtaaa cagcttcttc cccagctctt cctccaggga tcttaacgcc ttggacagag 1321 tcggctgcga aacgtgcagc tgctctgccg cccttgtcat gttctcttcc ctggcaactg 1381 ccataaaata tcgcaatgta cggatctcca cgggtcatgg ccctcccttt ctcgtctctt 1441 ttgatattct aaaaatgaat accatgatat tcattataac cattagcgcg gatttctcca 1501 agcccttata ctgaccgtgt aagaaaaacg tgcacaggag aagaaatatg gaacaggatt 1561 ataaacagat cctcaccggg ttggaagatg ccggatgcac gccgaaagag atccgggatg 1621 cggaaaggct ctgcgaccgg aaggatcccg acgcattggt ccgccatctt cgcaggtgcc 1681 ggtgcagccg gatggaggag cttcacgaaa gccagcgcaa agtagactgc ctggattatc 1741 tgatccggca gacagaaaag acaaagaaag caaatatcgg atagagaaca aaggagagca 1801 agactatgat gtacaaagaa gaactcaaac tgacacagga atgggacaag accttcccga 1861 agagcgaaaa ggtcgatcac tgcaaggtga ccttcacaaa ccgctatggc attacgctgg 1921 ctgcagatat gtacgtgccc aaagaggcgg aaggcaaact tcctgcgatc gcggtctgcg 1981 gacccttcgg cgcggtcaag gaacagtgct ccggcctgta cgcgcagacc atggcggaac 2041 gcggcttcct gacgctcgcc ttcgatccct ccttcaccgg agagagcggc ggcaacgtgc 2101 gctatatggc atctcctgat atcaataccg aagatttcat ggcagcggta gacttcctgt 2161 ccctctgcga aaaagttgac cccgaccgca tcggcattat cggcatctgc ggctggggcg 2221 ggatggcgct caatacagcc gcgctggaca cccgcatcaa ggcgaccgtc gcctccacca 2281 tgtacgacat gacccgggtc aacgccaagg gatacttcga ttcggaagac agcgaagagg 2341 cccgctacca gaagaaggcc gccatgtgcg cccagcgcct ggccgatctg aaagccggcg 2401 aatacaccct cggcggcggc gtggtcgatc ccctgccgga agatgcgccc tacttcgtaa 2461 aggattacta tgactattac aagaccggcc gcggctacca cgcgagatcc ctgaattcca 2521 acggcggctg gaa // LOCUS sequence174 2532 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence174 VERSION sequence174 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2532 /mol_type="genomic DNA" /organism="" /note="sequence174" misc_feature <1..1771 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011391795.1:excinuclease ABC subunit UvrB" /note="WP_011391795.1 excinuclease ABC subunit UvrB (Moorella thermoacetica) [pid:68.4%, q_cov:99.5%, s_cov:89.0%, Eval:1.5e-228]" /note="MGA_772" /locus_tag="LOCUS_5380" ORIGIN 1 ggcgcagctc tgcggggagt tcaaggagtt cttcccccat aacgccgtgg agtatttcat 61 ttcctactac gattactacc agccggaggc ctacgtgccc tcgactgaca catacataga 121 aaaggactcg gacatcaacc aggagataga ccgcctgcgc tattccgcga cggcggctct 181 ggcggagcgc cgggacgtca tcatcgtggc gtcggtctcc tgcatctacg gtctgggcag 241 ccccttcgac tataaaaacc agatgctgtc gctgcggccc ggacagacca agagccgcct 301 ggacatcctg cgcaagctga cggacatcca gtacacccgc aacgacctgg gtttcgagcg 361 cggcacgttc cgggtgcggg gcgatatcat cgacattatt cccatcgggt cggagtcggc 421 ggtgcgcatc gagctgttcg gcgacgaggt ggaatccatc aaggagatga acccggtcac 481 cggcgagatc accggcaccc gcaaccacat cgcgatcttc ccggcgtcgc attacgccac 541 gtccaaagag aacatggacc gcgctctcgt tacgatcgag gaggaactgg aggagcggct 601 ggtgtggctg cgtgaccgcg gcaaactctt ggaagcccag cggctggagc agcgtacccg 661 ctacgatctg gagatgatgc gggagatcgg ttcctgcaag ggcatcgaga actattcccg 721 ccacatcgtc ggaaatccgc caggagcgaa gccctatacg ctgatcgact atttccccaa 781 ggactttctc gtggtcatcg acgagagtca cgtgatgctg ccccagctgc gggccatggc 841 tcacggcgac aagtccagaa agaccgccct ggtggactac ggcttccgtc tgccgtcggc 901 gctggacaac cggccgctgc ggttcgagga attcgacgcc atgatcaacc aggcgatctt 961 tatctccgcg acgccggcag cctatgagag agaagtgtcc ggcggcatct ccgcggagca 1021 ggtcatccgg cccacgggac tgctcgatcc tcccatcgag atcgtgccga cggaagggca 1081 gatcgaccac ctcatcggcg agatccacaa agaggtggac aagggtcacc gggtgctggt 1141 aacgaccttg acgaagaaga tggcggaaaa cctgacggaa tacctgaaga acgcggggct 1201 gaaggtccgc tatatgcact ccgaagtgga tacgctggaa agaaacgaga tcctgcgcga 1261 tctgcgactc ggcgtcttcg atacgctggt gggtatcaac ctgctgcggg aaggcctgga 1321 tctgccggag gtggcgctgg tcgccatcct ggatgcggac aaagaaggtt tcctgcgtac 1381 ggagacatcg ctcatccaga cgatcggccg cgctgcgaga aacgcggaag ggcgggtcat 1441 catgtatgcg gatacgatct cgcccgccat gcgcacggcg ctggacgaga cggaacgccg 1501 ccgcagcatc cagatgaagt acaacgagga gcacggcatt acgccggaga ccatcaagaa 1561 ggcagtccgc gatgtgatcg aggtgaccca gaaggtcgag gaagacctgg acagctacga 1621 aggcaagagc gtgctggagc tcacgaagag agagcttacg gattacgcca agaagctgga 1681 gaaggagatg aaggcagctg ccaaggatct gcagttcgaa cgggctgcga tactgcgcga 1741 caagctgctg gaagtacggg cgaagctgta aagcaatgaa taaacaaaag accggagcat 1801 ggcgctccgg tctttttatg cgcttttaag cgtttagggc tgataggtgt gggcttcgct 1861 gtacagttct tcccaggcat cgtcgtccat cgccttgagg gtgaaggcga cgtcttcgac 1921 ggtctcgatc tcgttgtctt ccagttcgtt gacgccgaac atcatctcgg aaacggtccg 1981 ctggccagcc gggatcgtta cgccgaagta cggatcgagg tccttgccgt tgacggtaac 2041 gtcttcccag gctacgtaca aaggcttgtc ggtcttgttc tccacatagg cgtggatctc 2101 gaaactgccc caggtctcgt ctttttcacc ttccaggatc acgaaggtaa agacgtcgtt 2161 gtctgcaacg gtgacctcgt tcgcaccggt gcgtctctcg ggaacgacga tctggtcttc 2221 cgtcaggcct gtgggataga tggtgtaggt ctcgttcatc agatagacgt cgtcccacca 2281 gccttcctca tcgtagaggc ggaagctcat cacgacctga tcgggattct ccaggccgac 2341 gttttccatg tcggaggccc agatgtccag ggtgccgacg gtgctttcgc ccggctcgac 2401 ttcggttccc agatagccgc ctacggacca gccgttgacc acgagactgt ccgcggagaa 2461 ggtgagcttc ttgtcggtct tgttctcgca gagcacgtcg aaggagatgt tgccccattc 2521 gtcgcagccg cc // LOCUS sequence175 2523 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence175 VERSION sequence175 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2523 /mol_type="genomic DNA" /organism="" /note="sequence175" CDS complement(268..681) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNGNMGQLLGDALLVVFTFFGVVPVLLNTVSQFGVLKRFADEMVR EGVISEEKVKALLPKKQIAGVVISALMLFVLFTACIKTAPFGWVCAGVPFLLGLFKYRN IVEFNSFTVQRFQNNFKGEYDKRKMQKYIETHF" /locus_tag="LOCUS_5390" /note="MGA_775" CDS complement(695..1597) /product="PHP domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012870266.1" /transl_table=11 /codon_start=1 /translation="MINPDLHLHTYYSDGKESPAVVVARAKAMGIDVMAITDHDGMGGV EEAVEEGRRLGVRVVRGVEFSAEYAEDVPGFEGCTHYMHILGYGMDPSNPELDKALAYI QERREWRNEALRQVFCELGYPMTMEELKAQSINGFVGKVSFARLLVAKGYCETVVDAFD DDKMLMHPKVKAIHRYKIPAAEAIRVIREAGGKAFFAHPFQLSFKPPKREESEVYRQRQ EAVIRALKDLGMAGIECWYPTHTPEQTAYLLDLAKRLGMLVSKGSDDHGANARPVKKMG NFSTEVDLSMLQWVEEYLD" /locus_tag="LOCUS_5400" /note="WP_012870266.1 PHP domain-containing protein (Thermanaerovibrio acidaminovorans) [pid:32.4%, q_cov:93.7%, s_cov:93.8%, Eval:3.3e-33]" /note="MGA_776" misc_feature complement(1590..>2523) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003233100.1:helicase-exonuclease AddAB subunit AddA" /note="WP_003233100.1 helicase-exonuclease AddAB subunit AddA (Bacillus) [pid:32.4%, q_cov:75.2%, s_cov:18.9%, Eval:1.2e-20, partial hit]" /note="MGA_777" /locus_tag="LOCUS_5410" ORIGIN 1 ccccaacggt tccgcctacg ccatcgaagg catcacttcc ccggacggcc gtgtcttcgg 61 caagatgggc cacatcgagc gctacagcaa gggcatcttc cgcaacatcc cgggcaacta 121 cgacccgaag ctgatggaag cagctgtgga atactttacg aagtaagtgt aagaccataa 181 cacaaaggga caggtacgtt gtgcctgtcc cttttatgat cgctgagtat tgtcgctgag 241 aaccgtcccc ggcggcaact gacgacatta aaaatgcgtc tcgatatact tctgcatctt 301 ccgcttgtcg tactcgccct tgaaattgtt ctggaagcgc tgcaccgtaa agctgttgaa 361 ctccacgatg ttgcggtact taaacagccc cagcaggaag ggcacgcctg cgcacaccca 421 gccgaaaggc gcggtcttga tgcaggccgt aaacagcacg aacagcatga gcgcggagat 481 gaccacgccg gcgatctgct tcttcggcag aagcgcctta actttctcct ccgagatgac 541 gccctcgcgc accatctcgt ccgcaaagcg ttttaagacg ccgaactgcg ataccgtatt 601 cagcagcacc ggcacgacac cgaagaaggt gaacaccacc aacagcgcgt cgcccaggag 661 ctgtcccata tttccgttca taaacacaca ctcctcaatc gagatattct tctacccatt 721 gtaacatgga taggtcgact tctgtcgaaa agttgcccat cttcttgacc gggcgggcat 781 ttgccccgtg gtcatcggag cccttcgaca ccagcatgcc cagccgcttt gccagatcca 841 gcagatacgc ggtctgctcc ggcgtatggg tgggatacca gcactcgatg ccggccatgc 901 ccagatcctt cagcgcccgg attacggcct cctgccgctg ccggtacact tccgattcct 961 cccgcttcgg cggcttaaac gacagctgga acgggtgggc gaagaaggct ttgccgcccg 1021 cctcgcggat gacccggatc gcctccgccg ccgggatctt atagcggtgg atggccttta 1081 ccttggggtg catcagcatc ttgtcgtcgt cgaacgcatc gaccaccgtc tcgcagtacc 1141 ctttcgctac cagaagccgg gcaaaagaca cctttcccac gaacccgttg atggactggg 1201 ccttcagttc ctccatcgtc atggggtaac ccagctcgca gaacacctgc cgcagcgcct 1261 cgttgcgcca ctcgcggcgt tcctggatgt aggccagcgc cttatccagc tcgggattgg 1321 acggatccat gccatagccg agaatatgca tgtagtgggt gcagccctca aagccgggta 1381 catcctccgc atattccgcg gaaaactcga cgccccgcac cacgcggacg cccaggcgcc 1441 tgccctcttc tacggcttct tccacgccgc ccataccgtc gtggtccgta atggccatca 1501 cgtcgatgcc catggccttg gcgcgcgcca cgacaacagc cggcgactcc ttgccatcgc 1561 tgtaatacgt atgcaaatgc agatcgggat taatcatcta tggaaatttc cttgtctatg 1621 ccgaacagat agagtacggc cttcttgacc ggcaccccgg tgaccccctc cagagcctcc 1681 cggtacagcg ccagctgggg caggtaatcc gcccgcagcc gctccatctc ggcctctaag 1741 ttttctttat cgatatagtt ggacttatag tccacgagca cccagccgtc cccctgcata 1801 aagcagcagt cgatggtgcc ctggaccagc acctgccggc cctccagctc gtggcggatc 1861 gtaaagggct gctccttgta cagttccttt gcggccagcg cttcgcgccc cgtctgtgac 1921 ccgaagaacg cgctcacgcg atgcggatcc accgccgcga attccgcgtc cgtcagcagg 1981 cctttttcca cgagatcttc cataaaggcg cggatgctct ccgcatcctt gccttcgggc 2041 gtaaagggca gatgctccat caccgtgtga tacgccgtgc cgcgggcggc ggcattcagt 2101 cctttctgtg cagagaggaa cgcgggcagc ttatcccggg cggatgccgg aaagatctgc 2161 tcctgcaggg tctcttcctc tccttccgcc gtgagcacct tcggcagcgc ctgccttctt 2221 tcgcgctcca tggccgcgat ctgcgacacg ctgtacttgc gtttttcctt ctgctcttcg 2281 ggcggttcgt aatcgaagtt cagccggtag gcgatctcct ctttcgtgac aggcagttcg 2341 tcttccgcga catggaagcc ttccgccagt ttcttcgcca gctttctgcg gtcgagggtc 2401 tgcgcggcat gctgcgctgt gaccttctcc cgcggcacga tctccacgct ctctttcggc 2461 agcagcggca gcaaagcgtt cacgtagccc gagcagctct ctacgtcacc gggcagcgtg 2521 caa // LOCUS sequence176 2511 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence176 VERSION sequence176 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2511 /mol_type="genomic DNA" /organism="" /note="sequence176" ORIGIN 1 tcatgggtga accacagatt cagcagctcc gtgtaagtgt gatcgccgat catgatgtcg 61 gtcttcatct gctcgttggc cggggtcacg tggccgttct ggtgcagcag cgccttaaca 121 tcgcagccgc agcgcaggaa cgcatcccgc atcaggtcga aatccttcgg gcgcacgttg 181 acgtcgttta agccctgaac gatgagggcg gagcatttca gcccgtccgt cttcgagaag 241 tcccgctgcg cccagaaatc gccgtagtcc ccttccagcg cgatctgttc gtcccgtagc 301 gttgccaggt atttttcata ggtcttcacc agttccgggt ccacgtccga gaacatccgg 361 ctggcgcagg tcgccgcgag atccgtaatg aagtcgtatt tgtcgaacag ccccgaggga 421 atgccctggg tgttgttgta ttcgtaccag caggaaggcc ccgccacggg aacgatggtc 481 tccacgcctt tgacgccgga ggcagccact tcaaaggcca tggcgccagc gtaggatctt 541 ccggtcatgc cgatgcgccc gctgctccag tccgccgcga tctcgatgtt gttttcctta 601 tcggtgtacg ccttgcggtc gcccgtgagc cattcggcga tgcagcggaa cgcgtctgct 661 tccgcctggc tgcagcacac ttccagccct tcggagcccc aggtaccaag acctgcggac 721 tgcacaacgg catagcctct tacgagatag tagtcgtagg tcgttagatt tcccatgaac 781 tgctgctgga aggggtcgtt ctcgaaggta tagacccagt cggagggatc gaccgccgct 841 gcatgctgca gcgtgctgac gctgccggca ggcgtgcgct tctcaggctg cgcgtacatg 901 tccgcgatgt cgaattcgta ctcccctgcg gccggaagct gcggctggta ggcatacatg 961 ccgccgatgt agggccgggc ttcgtagatc accggtgctt tatacacgcc ggaggccgcc 1021 tgcagcggca cctgtaccat ggtctttacg agatccggtt ttccgtccat atccgtatcg 1081 ttatccgttt ccacatagac ggcgaaccgc aggagctcgc tcccctcgtt cgtgtaatcc 1141 tctttcatcg gatcggtgta ggatgcgatc tgctgtgcca taccgttttc gatgacgaga 1201 ccgtccccgg aaatgggttc tatggcagga gtttccacta caggttcttc ctgtgagccc 1261 tgctgacccc cggaacaggc cgtaaacaat agcataaatg cgagaaaaag tgcgaatccc 1321 cgtagttttt tcatggaaag tctccttttg ttatgaaacc ttttttatta tagcaaattc 1381 gtcgcataat ttggaaaata agcacaaaat gcgagaatga attgtgaagg ttgtgtgaag 1441 atgtagtata atagtatatg tattgatact gcatattgca gtatagatgc gtattttcat 1501 aaggaggaaa attatgaaga agtatcttgc actgctgctt tcagtggtca tggtcatcgg 1561 aatgtttgcc ggctgcaccg gcggcggttc cgaccagcct gcaggcggcg aaggcggaga 1621 agctgccggc gcagatccct acaccggtat tccttactcc agcgacacgg aatatgacta 1681 tctgtattcc gaagagatca ccagcatgaa ctatctggcg acctccgtat cggcgaacca 1741 gaagcccctg gcaaacttcg tcgataccct gatcgagtac gacaacttag gcaacatcgt 1801 tcccgacctg gctaccagct gggaagagag cgaagacggt ctcacctgga ccttccatct 1861 gagagatgac gccaagtggt atacctgcga aggcgaagag tatgcacccg ttaccgccaa 1921 cgacttcgtt atggcggcta gactggtcgc agacgttaag ttcgactccg atatgcccga 1981 catgctcacc tcttacatcg tcaacggctc cgaactgtac aacggcgtca tcgacgactt 2041 tacgcagctg ggcgtagaag cggtggacga ctacacgctg gtctatcact taaagcagcc 2101 ctgcgcttac ttcctcaccc tgctcaccta cggctgctat ctgccggtca acgaggaatt 2161 ctataattcc tgcgaagtcg agaatccgac tccgaccatc aacgacagcg gcgaagaaga 2221 gctcgtcacc aacgaattcg gtaccgacta cgacaagatc ctgtactgcg gcgcttacat 2281 ctgccagagc tggctgcccc aggaagagat gatctgggtc aagaacgaga attacttcga 2341 cgcagacaag gtctacatca ccaaggtaaa cggcaagtat aacgctcagg cagactccat 2401 cgctccggaa atgttcctgc gcggcgagat cgactcctgc tccgtcacca ccaacatcct 2461 ggatgaatgg ctcaacggcg acaacgccca gtacgtccac cagtccaaga a // LOCUS sequence177 2506 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence177 VERSION sequence177 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2506 /mol_type="genomic DNA" /organism="" /note="sequence177" CDS 28..1248 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPDCLLVNAHREDSRYPFPGLSGCGVAFKLAQAIQRRLTAAGDDR FTRQDITDLLDLVAISTVADVVPLLDENRSLVKYGLRVINSRKRRGLRILLDMVGLERK EVDADDIGFILAPHINSCGRMATADRAVQLLAGLEDDGTLEDKAAFMVECNRNRRFAQD RTRDICMEAIAAGDCGELFSVIEAPGAHEGVAGIVAGSLKEQFHRPVCIVTPSENGLLK GTGRCIPGLDLHGMLSTCGELFERYGGHAGACGFSLPKENLEALRSRMDDLMRSILAER PDALDEKLSIEKVLEPSEKTLEFANALKLLEPFGEANPKPLFAIGGAGVYNVQYMGSEG QHVRFTAAGSDGVEVSCVLFRRAADFADLLRSAAKLDVAGELGINEFNGHRKLQLTVKD IKRSGSL" /locus_tag="LOCUS_5420" /note="WP_012257020.1 single-stranded-DNA-specific exonuclease RecJ (Chloroflexus aurantiacus) [pid:36.6%, q_cov:99.0%, s_cov:68.6%, Eval:5.5e-56, partial hit]" /note="MGA_780" CDS 1245..2456 /product="S41 family peptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010963821.1" /transl_table=11 /codon_start=1 /translation="MIKIKKSTLIILLILAVVCGGAGLLTLQMSGVLGQLGIASSHMLN EEQYQEYRHMTQTYGKLDELRDYVMKRFYIDVDEDALETGMLKGLFEGLGDVYSYYMTP SEYEQTMISLTGVYSGVGVTISAGDSGYVEVVTPTKGSPAEEAGIRKGDLVLAVDGTEY VGADLDTCAAAIRGDEGTNVTLTIRRGEDIFDVTLTRRTIVAQTVDHKMLEDGIGYIAV SGFEEKTVEAFEEAMADIQAQGAKSFILDLRDNGGGLVDSAVGIADILLDQGVVAYTED HDGNRDYYRTKAGKTDLPYVVLVNEASASSSEILSAGIKDNGGGPLVGVTTYGKGIIQT VEQLTDGSGIKLTILQYYSPNGSVIHKQGIEPDYVVELTEDCYDEEGNLVNDLQLQKAL ELLK" /locus_tag="LOCUS_5430" /note="WP_010963821.1 S41 family peptidase (Clostridium) [pid:38.2%, q_cov:86.1%, s_cov:86.8%, Eval:6.2e-60]" /note="MGA_781" ORIGIN 1 gatcaccacg aactggaggc gggtgcgatg ccggactgcc tgctggtgaa cgcccacagg 61 gaggacagcc gctatccgtt cccggggctg tcgggctgcg gcgtcgcctt taagctggcc 121 caagctatcc agaggaggct gaccgcagca ggagacgaca ggtttacccg gcaggacatc 181 acagatctgc tggatctggt ggcgatctcc accgtggcgg acgtggtgcc tctgctggac 241 gaaaaccgca gcctcgttaa gtacggtctg cgggtcatca attcgagaaa gcgcagaggc 301 ctccgcattc ttctcgacat ggtagggctc gaacgcaaag aggtggatgc ggacgacatc 361 gggtttatcc tggcgcccca catcaattcc tgcggccgca tggctacggc ggacagagcc 421 gtccagctgc tggcaggttt ggaagacgat gggaccctgg aagacaaagc cgccttcatg 481 gtggaatgca accgcaaccg ccggtttgcc caggaccgca cgagagacat ctgcatggaa 541 gcgatcgctg ccggagactg cggcgagctg ttctccgtca tcgaagcacc gggcgcccac 601 gagggcgttg ccggcatcgt ggcgggatcg ctcaaggagc agttccaccg gccggtctgc 661 atcgtaacgc ccagcgaaaa cggactttta aaaggcacgg gacgctgcat cccgggactg 721 gacctgcacg gtatgctctc cacctgcggc gagctgttcg agcgctatgg gggtcacgcg 781 ggggcctgcg gtttctccct gccgaaggag aatctggagg cgctgcgcag ccgcatggac 841 gatctgatgc gcagcatcct ggcggaacgg cccgacgcgc tggacgaaaa gctttccatc 901 gaaaaggtgc tggagccttc cgaaaagaca ctggaattcg cgaacgcact aaagctgctg 961 gagcccttcg gcgaggcaaa cccgaaaccg ctgtttgcca tcggcggcgc aggcgtgtac 1021 aatgtccagt atatgggcag tgaaggccag cacgtgcgct ttaccgcggc cggcagcgat 1081 ggcgtggagg tctcctgcgt cctgttccgc agggcggcgg acttcgcgga tctgctgcgc 1141 tccgccgcaa agctggacgt ggcgggcgag ctgggcatca acgaattcaa cggtcaccgc 1201 aaactgcagc tgaccgtaaa agatatcaag aggagcggat ccttatgatc aagatcaaga 1261 aatcaacact tatcatctta ctgatcctgg ccgtcgtgtg cggcggcgca gggctgctga 1321 ccctgcagat gagcggcgtg ctcggccagc tgggcatcgc gtcgtctcac atgctcaacg 1381 aagagcaata ccaggaatac cggcacatga cgcagaccta cggcaagctg gacgagctgc 1441 gggactacgt catgaagcgt ttctacatcg atgtggatga agacgccctg gagaccggca 1501 tgctgaaggg cctgttcgaa ggcctgggcg atgtctattc ctactacatg acgccctccg 1561 aatacgagca gaccatgatc tcccttaccg gcgtgtattc cggtgtaggg gtcacgatct 1621 ccgcaggcga ctccggctac gtcgaagtgg tgacgcccac caagggcagc cccgccgaag 1681 aagcgggcat acgcaaaggc gatcttgtcc tggctgtgga cggcaccgag tacgtgggcg 1741 cggacctgga tacctgcgcg gcggcgatcc gcggtgacga gggcacgaac gtgaccctta 1801 cgatccgcag aggagaggat atcttcgacg ttacgctcac ccggcgcacg atcgtggcgc 1861 agacggtgga ccataaaatg ctggaggacg gcatcggcta cattgcggta agcggattcg 1921 aagaaaagac cgtggaggcc tttgaggaag ctatggccga tatccaggca cagggagcca 1981 agtcctttat cctggacctg cgcgataacg gcggcggtct ggtggattct gcggtcggca 2041 tcgcggacat cctgctggat cagggcgtcg tggcctatac ggaagatcac gacggcaacc 2101 gggattacta ccgcaccaaa gccggcaaga cggatctgcc ctacgtagtt ctcgtgaacg 2161 aagcttccgc ttcttcctcc gagatcctgt ccgcaggcat caaggataac ggcggcggac 2221 cgctggtggg ggtcaccacc tacggcaaag gcattatcca gaccgtcgag cagcttacgg 2281 acggctccgg catcaagctt acgatcctgc agtactactc tccgaacggc agcgtcatcc 2341 acaagcaggg catcgagccc gactatgtgg tggagctcac ggaggactgc tacgatgaag 2401 agggcaatct cgtgaacgac ctgcagctgc agaaggcgct ggagctgctg aaatagaaga 2461 cagatataga tagtgcggat gagcatatga gcaaaaagat cgtagc // LOCUS sequence178 2502 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence178 VERSION sequence178 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2502 /mol_type="genomic DNA" /organism="" /note="sequence178" CDS 306..1808 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNRKKHLSILLALALALAMLPLTVFAEDALPVPVEEASIVWDSE AGTLTMPGASGQEYAAIEYNDGVLDWTQAIEPDAEGNVQFTGIMKNNTYDIFTRIKGAE GAAMTLFYTHESDGSQEPDPAEGEGLEEPKWFSQIPEYPEEGDAETVTVSFAGNAEQEY VICEKGETPDWAADGDAIVRPDEDGAVGFDGLTPATVYTIYTRAAGTESPVVSADVVTM LCGSEAVCDAYEVGRVLTVTPVPANAKVTYQWCRQIATPIIAGEYEGMTRNDYFPIEGA TAASYTMTEDDLGKMLAVKFLAGGEEVHMAEDLGPVEAFGTDEEAFPFLDVPLNAYYRA AVEWATENGITGGTSKTTFGPAAPATRGQMVTFLWAAAGSPEPESTENPFADVKESDYF YKPVLWAVEKGITAGVTADKFGPAQTVTRAQAVTFLYGAAGRPEAGSEPFEDVADTDWF AAPVAWAFNNGITSGTTKTTFGPEQLCVRSQIVTFLYGSVQH" /locus_tag="LOCUS_5440" /note="MGA_783" ORIGIN 1 gggagagcac gcgaaattca tcaccggcac cgaccttctg atcgacggcg gcgtgatcgc 61 atccatccgc accggcgttt acaaactgca cggatgtgca aaatattgtg caatttccgc 121 gtttttgctc aggttcggca tggttccctc cgtaaatggt ttaattgatt caggatatat 181 ttttatgtcc cgttctgtcc aacagatgtc cagcaggcag aaaaaagaac ggaatttttg 241 tgaaaaacag atataataaa agatacaata tttattcaca tgatcttatt aaaggagtaa 301 aagggatgaa aaacagaaag aaacatctga gtatcctgct ggcgctggct ttggcgctcg 361 ccatgctgcc gctgaccgtc ttcgcggaag acgcgctgcc ggtccccgtg gaggaagctt 421 ccatcgtctg ggacagcgaa gcgggcacgc tgacgatgcc cggcgcttcc ggtcaggaat 481 acgccgccat cgaatacaac gacggcgtgc tggactggac gcaggcgatc gagccggatg 541 cagagggaaa cgtgcagttt accggcatta tgaagaacaa cacgtatgat atctttaccc 601 gcatcaaagg cgcagaaggc gcggccatga ccctcttcta cacccacgaa agcgacggtt 661 cccaggagcc cgatcccgcg gagggcgaag gcctcgaaga gccgaagtgg ttctcccaga 721 taccggaata tccggaagaa ggggatgcgg agaccgttac ggtgtccttt gccggaaacg 781 cagagcagga atatgtgatc tgcgaaaagg gtgagacccc ggattgggca gcggatggcg 841 atgccatcgt ccgtcctgac gaagatggag cggtcggctt cgacggttta acacctgcaa 901 ccgtctacac gatctacacc cgcgccgcag gcacggaaag cccggtggtt tccgcagacg 961 tagtgacgat gctgtgcggc tccgaagcgg tatgcgatgc ctacgaggtg ggcagagttc 1021 ttacggtcac cccggtgccg gctaacgcga aagtcaccta tcagtggtgc cgccagatcg 1081 cgacacctat tatcgcaggc gaatacgagg gcatgacccg caacgattac ttccccatcg 1141 aaggcgcgac ggcagcttct tataccatga ccgaagacga tctcggcaag atgctcgcgg 1201 tgaaattcct cgcgggcggg gaagaggtcc acatggcgga agacctgggc ccggtggaag 1261 ccttcggaac cgacgaagag gcgttcccgt tcctggacgt tcctctcaat gcctactacc 1321 gcgcagcggt ggaatgggct acggagaacg gcattaccgg cggcacgtcg aagacgacct 1381 tcggcccggc cgctcctgcg acccgcggac agatggtcac cttcctgtgg gcggcagccg 1441 gctcccccga accggagagc acggaaaatc cgtttgcaga tgtaaaggag agcgactact 1501 tctataagcc cgtgctgtgg gccgtggaga agggcatcac tgcgggggtc accgcggata 1561 agttcggtcc ggcgcagacc gtgacccgcg cacaggctgt tacgttcctg tacggcgcag 1621 ccggccgtcc cgaagcgggc agcgagccct tcgaggacgt tgcggatacc gactggtttg 1681 cagctcccgt agcctgggcc ttcaacaatg gcattacctc cggcacgacg aagacgacct 1741 ttggtccgga gcagctgtgc gtcagaagtc agatcgttac gttcctgtac ggcagcgtgc 1801 agcactgaga gcggatattg aacagccgtt cagcatcttt tttctgaggc ggaatcataa 1861 aaaaattcaa tcaaaaaccc cttgcaaaag gcgaaatacg gcaaaagact tgaaaatcgg 1921 gcattctgcg gaatgcccga tatttagtgt gcggagtgta accacaccac tatatattga 1981 cattcacagg cgcgaggagt acattatata gcggcgggag tgctcccgtt ttttcggtgt 2041 aacaaccact gtgtatcttt tatataaatg aggtgaaagt tatgtatcat gtcgtaaaaa 2101 gggacggaaa ggtcgctgaa ttcaacatcc gcaagatcag cgacgccatc acgaaggcat 2161 tcgaagcgca gggaagacag tatcatccca gcaccatcga tatgctggct ctgcgggtca 2221 catccgaatt cgaacccctc atccaggacg atcagatcca ggtcgaacag atccaggact 2281 gcgtcgaaaa ggtgctgtcc gaagccggct atgcggacgt cgccaaggcc tacatcctgt 2341 acagaaagca gagagagaag atccgcaacg tcaattccgc gctgctctcc tacaaggaca 2401 tcgtcgataa ctatctgaag atcaacgact ggcgcgtaaa ggaaaattcc accgttacgt 2461 attccgtcgg cggtctcatc ctgtccaatt ccggcgccat ta // LOCUS sequence179 2502 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence179 VERSION sequence179 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2502 /mol_type="genomic DNA" /organism="" /note="sequence179" CDS 410..1348 /product="bifunctional riboflavin kinase/FAD synthetase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003438310.1" /transl_table=11 /codon_start=1 /translation="MNIYRNLNEIANMSPTAVALGNFDGVHKGHQMLIRECVAVAKEKG LQPSVFTFTNHPVNEIAGKTVIKNIMTFEEKAEQLEKLGVENLFSPVFDDTIRTKSAFD FVKDILVDRFRTKHAVCGFNYRFGYKAEGDADRLAQLGREFGYGVSVIPEIRINGNTVS STLIRTIIDEGKIDEYKDYTGRLYCIDGKVVQGKHLGRRIGFPTVNLSLDTTEAFPKNG VYITQTTVNKRKYQSITNVGNKPTVGEFAKNAETHIFDFDGDLYGQKVRIEFIKMLRPE RKFDTLEDLQAEIHRNCLQAQEYFRTERSQS" /locus_tag="LOCUS_5450" /EC_number="2.7.1.26; 2.7.7.2" /note="WP_003438310.1 bifunctional riboflavin kinase/FAD synthetase (Clostridioides difficile) [pid:40.7%, q_cov:95.2%, s_cov:95.8%, Eval:9.4e-63]" /note="MGA_786" CDS 1345..1581 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKYANGFTINATGHECFLTFLQTRPNGETKQTEEVETIVMTEQMA RQMIVALAKVYNKVDSDRAAKKKVDVKENAQLS" /locus_tag="LOCUS_5460" /note="MGA_787" CDS 1711..1977 /product="30S ribosomal protein S15" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012869466.1" /transl_table=11 /codon_start=1 /translation="MIAKDVKTNIIKEYATHEGDTGSPEVQVAVLTHRINELNEHLKKN PKDFHSRRGLLKMVGQRRNLLAYLRDKDIERYRSLISRLGLRK" /locus_tag="LOCUS_5470" /gene="rpsO" /note="WP_012869466.1 30S ribosomal protein S15 (Thermanaerovibrio acidaminovorans) [pid:66.7%, q_cov:98.9%, s_cov:98.9%, Eval:2.2e-29]" /note="MGA_788" ORIGIN 1 tcctggcatg gaacggaccg tccgaacctt ttaagatgga gatcgtctgc agccgcggca 61 cgtatatccg ttcgatctgc cacgatctgg gcgaagccct gggctgcggc gcctgcatga 121 gcagcctcgt tcgcacggag acctgcggtt ataagatcga agaggcggcg gatctggagg 181 cactgcgcgg gatgaccccg gagcagatcg aagcgctgct ggatcctctg gaatccgccg 241 taagccatct gccgcgcctg gatcttaccg aggaacaggc caagcctttc ctcaacggca 301 atccggtgtg gagcgaagat ctgccgctgg aagaacgcaa ttacgctgtc ttcggtgacg 361 gcggattgct tggcatctgc aaaggccatc tcatttcgaa agtactgaaa tgaacatata 421 cagaaactta aatgaaatcg cgaatatgtc tccgactgcc gttgcgttag gcaatttcga 481 cggcgttcat aagggtcacc agatgctcat ccgggaatgc gtggctgtgg caaaggaaaa 541 agggctgcag ccctccgttt ttacgtttac gaatcatcct gtaaacgaga tcgcgggaaa 601 gaccgtcatc aagaacatca tgaccttcga agaaaaggcg gagcagctgg agaaactggg 661 ggtcgaaaac ctgttttccc cggtgttcga cgataccatc cgcacgaaga gcgcgtttga 721 tttcgtcaag gatatcctgg tggaccgctt ccgcacgaag cacgccgtgt gtggtttcaa 781 ttaccgcttc ggctataagg cggaagggga tgcggaccgg ctggcgcagc tgggaaggga 841 gttcggctac ggcgtgtccg tcatcccaga gatccgcatc aacggcaata ccgtatccag 901 cacccttatc cggactatta tcgatgaagg caagatcgac gaatataagg attataccgg 961 caggctgtac tgcatcgacg gcaaagtggt gcagggcaag catctgggcc gccgcatcgg 1021 atttccgacc gtcaatctga gcctcgacac gacggaagcg tttccgaaga acggtgttta 1081 cataactcaa acgaccgtaa acaaacggaa atatcagtcc atcacaaacg tgggaaacaa 1141 gccgacggta ggagaattcg ccaaaaacgc ggaaacgcac atcttcgact tcgacggcga 1201 tctctacgga cagaaagtgc gcatcgagtt tatcaagatg ctgcgtcccg agcgcaagtt 1261 cgatacgctg gaagacctgc aggcggagat ccatcggaat tgtttgcagg cacaggaata 1321 ctttagaaca gaaaggagcc aatcatgaaa tacgcgaacg gattcaccat caatgcaacg 1381 ggtcacgaat gctttttaac gttcctgcag acccgcccca acggagagac caaacagacg 1441 gaggaagtgg agaccatcgt catgaccgag cagatggcgc gccagatgat cgtggccctt 1501 gccaaagtct ataacaaggt cgattccgac agggctgcca agaagaaagt cgacgtgaag 1561 gaaaacgccc agctgtctta aatttcccgc tttacaaacc attgcgggct gtgctaatat 1621 atatcgtctg tttataagta cccagtgctt aggctgccga cgctccgacg ctgcctcggc 1681 cttgggcgga tctagaaaag gagattacaa atgatcgcaa aagacgtaaa gaccaacatc 1741 atcaaggaat atgccaccca cgaaggagac accggttctc ccgaagtcca ggtcgcagtc 1801 ctcactcacc gcatcaacga actgaacgaa cacctgaaga agaaccccaa ggacttccac 1861 tccagaagag gtcttctgaa gatggtcggt cagagaagaa atctgctggc ttatctgaga 1921 gataaggaca tcgagcgcta cagaagcctc atctcccgtc tcggcttaag aaagtaaaca 1981 gagaaaacgg cggggcacaa aagccccgcc ttgttgttat tatttttcat caggggccgg 2041 gcttgagaat taaattcata tgcgcagatc ctgtgcaatg agtttacttg tcaagccggg 2101 cctgatacga aaggcaaggt taacatttat gagatttaca gattaccgga cattccgcac 2161 tgccgtaggc ggcagactgc tggaagtcga gatcggcaag gtctgcgaac aggccaacgg 2221 ccagtgctgg gtccgctacg gcgataccgt ggtcaactgc actgccacca tgtccaagac 2281 cccgagagaa ggcgtggact tcttcccgct ttcctgcgac ttcgaagaaa aaatgtacgc 2341 tgccggcaag atccccggcg gattcatcaa gagagagggc agaccctccg aaaaagccat 2401 cctcacgtcc cgtctgatgg acagaccgct ccgtccgctg ttccccaagg gattctataa 2461 cgacgtccag gtcgtagcga cctgcatgtc catggatcac ga // LOCUS sequence180 2498 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence180 VERSION sequence180 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2498 /mol_type="genomic DNA" /organism="" /note="sequence180" CDS complement(4..735) /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_211328137.1" /transl_table=11 /codon_start=1 /translation="MGILTVLWEKWVEFRRDFYKITVAAMISPLMYLIIFGMGIQTTSH GEPYLHFLIPGVVAMSTMTGSFSAIAQNMSVQRLYEKALDQVMVSPTPLWQFILGQVIG GSLRGMYAGGIILLLTMPIRTDLTFNALSLFIMFLNGLVFSTIALTLSFLAKSYTDAPR FTSYIITPMSFLCNTFFSTEQMPAGFQQAVSVLPLSQSAGMIRAIANGEDPGWIGFAIL AAYLLVFGLLSMNFIYKKKNL" /locus_tag="LOCUS_5480" /note="WP_211328137.1 ABC transporter permease (Thermodesulfitimonas autotrophica) [pid:34.3%, q_cov:93.8%, s_cov:94.7%, Eval:7.6e-40]" /note="MGA_790" CDS complement(740..1585) /product="daunorubicin resistance protein DrrA family ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011022097.1" /transl_table=11 /codon_start=1 /translation="MIELKGLTKKFGDFTAVDGLDLRVETGEFFGLLGPNGAGKTTTIS MVSTVLLPTSGEILVDGKKLDRKASEQKRKLSVITQEYSMRQDMTMDEVMEYQARLYML PKREWKPKADELLEFTGLTEYRRRTVRHLSGGMKRKLMICRALLIEPQILLLDEPTAGM DAISRRQMWNLLRRLNERDITIILTTHYMEEAQALCDRVALINRGKLQKLDTPQALIEE LGAFAVDETSEDSLKSRYFSTRQEAIAYLQTADHSAMLRQTTLEDVFVECAGRKLDSGR " /locus_tag="LOCUS_5490" /note="WP_011022097.1 daunorubicin resistance protein DrrA family ABC transporter ATP-binding protein (Methanosarcina acetivorans) [pid:44.8%, q_cov:82.2%, s_cov:86.9%, Eval:4.4e-53]" /note="MGA_791" CDS complement(1582..2268) /product="precorrin-2 C(20)-methyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011461549.1" /transl_table=11 /codon_start=1 /translation="MKGIAYGVGVGPGDPKLMTLRAIELIRENDVIAVPGKEPKESVAY KIAAAVVPEIADKELVPVYMPMIKDRALIDEEHKKGAALLKKYLDQGKNVVYITLGDPT IYCTFSYLQHYLEADGYPVKLVPGISSITAAAARLNLPLTEWDEPLHVLPAVHKTDAAM DLPGTYVLMKSASHMKDVKETLRKSGKDVQAVIDCGMPTEQVYRSLEEIPDDAGYFALV IAKEPK" /locus_tag="LOCUS_5500" /gene="cobI" /EC_number="2.1.1.130" /note="WP_011461549.1 precorrin-2 C(20)-methyltransferase (Desulfitobacterium hafniense) [pid:36.2%, q_cov:97.8%, s_cov:90.7%, Eval:9.5e-34]" /note="MGA_792" ORIGIN 1 ctcctacaga ttctttttct tatagataaa gttcatcgac agcaatccga acacgagcag 61 ataagctgcc agtatggcaa acccgatcca acccggatct tccccgttgg cgatagcgcg 121 gatcatgccg gcgctctggg acagcggcag cacggatacc gcctgctgga atcctgccgg 181 catctgctcc gtagagaaga acgtattgca cagaaagctc atgggcgtaa tgatgtacga 241 tgtaaaccgc ggcgcatccg tgtagctctt tgcgaggaac gaaagcgtta gcgcgatcgt 301 ggaaaacacc agtccgttga ggaacatgat gaacagcgat agcgcattaa acgtaagatc 361 cgtgcggatc ggcatcgtaa gaagcaggat gatgcctccg gcgtacatgc cgcgcaggct 421 gccgccgatc acctgaccaa gaatgaactg ccacagcggc gtcggcgaga ccatcacctg 481 gtccagcgcc ttttcgtaaa gcctctgcac gctcatgttc tgggcgatcg cggaaaaact 541 gcccgtcatg gtggacatgg ccacgacgcc ggggatcagg aagtgcagat acggctcccc 601 gtgggacgtg gtctgaatgc ccatgccgaa gatgatcaga tacatcagcg gcgagatcat 661 ggctgcgacc gtgatcttat aaaaatcccg gcggaactcc acccattttt cccaaagtac 721 agtaagaatg cccatgccgt tacctcccgc tgtccagctt gcggccggca cattccacga 781 acacgtcttc caacgtcgtc tggcgcagca tagcgctgtg atcggccgtc tgcagatagg 841 cgatcgcttc ctgccgcgtg ctgaaatacc ggctctttaa gctgtcttcg ctggtctcgt 901 ctacggcgaa ggcgcccagt tcttcgatca gcgcctgcgg cgtatccagc ttctgcagtt 961 tgccccggtt gatgagggct acccggtcgc agagggcctg ggcttcctcc atgtagtggg 1021 tcgtcaggat gatggtaatg tcccgttcgt tgagccggcg cagcagattc cacatctgcc 1081 ggcgggaaat ggcgtccatg ccggccgtcg gttcatccag caggaggatc tgcggctcga 1141 tcaacagcgc ccggcagatc atgagttttc tcttcatgcc gccggacaga tggcgcaccg 1201 tccgtctgcg gtattccgta aggccggtaa attccagcag ttcatccgcc ttcggcttcc 1261 actcccgttt tggcagcata tagagacgcg cctggtattc catcacctcg tccatggtca 1321 tgtcctggcg catggaatat tcctgggtga tgacgctcag ttttctcttc tgctcggagg 1381 ccttgcggtc cagtttcttt ccgtccacca ggatctctcc ggatgtaggc agaagcaccg 1441 tggataccat gctgatcgtc gtggtcttcc ctgcgccgtt cggtccgagc agcccaaaaa 1501 actctccggt ctccacgcga agatccagcc cgtctacggc ggtaaaatcg ccgaatttct 1561 ttgtgaggcc tttcagttcg atcatttcgg ttcttttgcg atcacgaggg cgaaatatcc 1621 ggcatcgtcc gggatctctt ccagactgcg atagacctgc tctgttggca tgccgcagtc 1681 gattacggcc tgcacgtctt ttccgctctt tctcagcgtt tcctttacgt ccttcatgtg 1741 gctggcggat ttcatcagca cgtaggtgcc gggaagatcc atcgcggcgt ccgtcttatg 1801 gacggcgggc agcacgtgga gcggttcatc ccactccgta aggggcaggt tgagcctggc 1861 agcggcagcc gtaatggaag agatgccggg caccagtttc accggatatc cgtccgcctc 1921 cagataatgc tgaagataac tgaacgtgca gtagatggtg gggtcaccca gggtaatgta 1981 aacgacgttc ttcccctggt ccaggtattt cttcagcagc gccgcaccct tcttatgttc 2041 ttcgtcgatg agggcgcggt ccttgatcat gggcatgtag accggcacca gttccttgtc 2101 cgcgatctcg gggacgacgg ctgctgcgat cttataagcg acggattctt tgggttcctt 2161 tcccggcacg gcgatcacgt cgttctcccg gatgagttcg atggctctca gggtcatcag 2221 tttggggtct ccggggccta cgcccactcc atatgcaatt cctttcatag atctatgctc 2281 cttttattgt tctttttctg cggtttcaaa ccaggaaaat gtatcggcca gttcgcagac 2341 tctgccgacg atgaggatgg ccggcgtctg cacgcaggct tctttgcacg ccatttcgag 2401 ggtcccgacg gtagcggcga tccgccgctg ttctttcgtc gtcccttttt ccagaacggc 2461 agccggcata tccggatcca ttcccgcgcg cagaagtc // LOCUS sequence181 2495 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence181 VERSION sequence181 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2495 /mol_type="genomic DNA" /organism="" /note="sequence181" CDS 1376..2017 /product="flavodoxin family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459715.1" /transl_table=11 /codon_start=1 /translation="MKVILVNGSPHEKGTTWAGLDEIARTLQAEGIEAEIFWIGNKAVG GCIGCGGCETTGRCVFGGIVNEFLDKAESADGFVFGAPVHYAGPNGNMKSFMDRVFYAD AHSFRLKPGACIAAARRAGVVTTMDDLNKYLTISEMPVVSSTYWNMVFGFNAEEAKQDA EGMRTMRNIGHNMAYLLKCMEAAKAAGIEKPEGEPGVWTHFIGNGTVSKR" /locus_tag="LOCUS_5510" /note="WP_011459715.1 flavodoxin family protein (Desulfitobacterium hafniense) [pid:52.2%, q_cov:96.2%, s_cov:99.5%, Eval:1.1e-57]" /note="MGA_795" ORIGIN 1 cgtctgcgtc ttggagatct ggggcgggat gacgccttcc acgcccgtta aggaaaggat 61 gcacaccaga ttcttctgca cgcccttgta ggcatccgtc gggtcgtacc attcgctgat 121 atcgtgcgtg ccgccgctgt cgcccccgga ggtgatggtc gctgccggga tccccaggga 181 aaggggaatg ttggcgtcgg tactggccag ttcccgcatc ttcggttcga tgccgcagat 241 ccggaaggca tctttcagaa gtgcaatgat ctcgcagttt tcatcctgca cgccgccggt 301 ggagccgccc agttcctccg tgctcatctg aatgcgggct tcgggatcga agcggagctc 361 cttgctgttc tttacggcga actctctttc cactgtccag cgttcgtact cttcctccgc 421 gcattcctcc gcgatcttca ggcatttcgc atggaaatcc tccatgatct tcgtgtcttt 481 gctgcgcacg tccatggtaa aagagcattc gctggcgatg gacgtgaccc cggtaccgcc 541 ctgcaccgtg gaaacgttga agatcgtaaa tggctcaagg ggaacgcgtt cctgggagat 601 ccgggcgatg gcccgtccca tgcattctac cgggttcacc aggccgtagg cgccgacgga 661 atggccgccc ggcccccgga acgcaatgcg gaactgcacg tcggacaaag ctccgtaggt 721 cagatgatcg ccgtgtccat cgatggaaat gaaggcgtcc accttcgtct gttttgtgtt 781 gaagatatgc cgcacgcccc ggaaattgcc gacgccttct tcgcccacat cgccgccgat 841 caggagggtg caggcggggc ggatctccgc ttccttcatg gcccgcagga tcgagagcac 901 ctccgcacag cctcttgtat cgtcgcagat gccgggcatg cagatgcggc tgccttcccg 961 gcgcatcgtc aggtccgtgt ccatgggaaa gacggtgtcc agatgggcgg tgaccatcac 1021 aacaggcgcg tctttgggcc cctcgatcac ggcgaagacg ttgcccactt catcctgtac 1081 cgtccggtaa cccatcccat cgatgatctc ccggaaccgg gctgcctttt tctcttcgtg 1141 attcgaatag gcgggaatgc cggccagttc gatctgctgt gccaccgtat tttctgcatc 1201 ttccttcaga aaggacagag ccttttggat cttttcggaa tcatataaga tttggatcgc 1261 ttcgttcata ctatcgcttg cctcctgttt tgcgtaaaat cactgccttc attatagcag 1321 aaagcacccc cgcctatgct ataatactaa ctggttttaa agttaaggag gaactatgaa 1381 agtaatactc gtaaacggca gccctcacga aaaaggcacg acctgggcgg gactggatga 1441 gatcgcaaga acgctgcagg cagaaggcat cgaggcggag atcttctgga tcggaaataa 1501 ggcggtcggc ggctgcatcg gctgcggcgg atgcgagacg accggacgct gcgtcttcgg 1561 cggcatcgtc aacgaatttc tggacaaagc ggaaagtgcc gacgggttcg tattcggtgc 1621 tcccgttcat tacgcaggac ccaacggcaa catgaaatcc ttcatggacc gggtgttcta 1681 cgcagatgcc cacagtttcc ggttaaagcc gggtgcatgc attgcggcgg cccgcagggc 1741 cggcgtggta accacgatgg atgacctcaa caagtatctc accatcagtg aaatgcccgt 1801 ggtctcttcc acgtactgga acatggtctt cggttttaat gcggaggaag caaaacagga 1861 tgcggaaggc atgcgcacca tgcggaatat cggtcataac atggcttacc tgctgaaatg 1921 catggaggcg gccaaggctg ccggcatcga aaaaccggaa ggtgaaccgg gcgtatggac 1981 tcactttatc ggaaacggga cggtctccaa acgttgatcc gcaccttcat caaaaaagaa 2041 cccgtgctcg tcatcgcggc gctggctgct gcggtcagct gctttttcgt ctcgccggac 2101 gggacttact tttcgtacct cgatctccgc acgctggcgc tcctgtactg cctcatgacc 2161 gtggtggcgg ggctgcgtca ggctggattg tttgaacacc tggcccagga agtctgcgaa 2221 cgctccggca gtctccggat gctgagcata ttgctggtcc tgctctgctt ctttacgtcc 2281 atgctcatca cgaacgacgt ggcgctgctc acgttcgtgc cgtttgcggt catcgtgctg 2341 ggcatgtcgg gaagactgca gcacctgatc cgcgtcgtcg tgctgcagac tgtcgccgcc 2401 aacctgggca gcatgctgac gccggtcggc aatccgcaaa atctgtacct gtattcctat 2461 tacggcctgg ggatgggcga gtttctgggg atcac // LOCUS sequence182 2494 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence182 VERSION sequence182 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2494 /mol_type="genomic DNA" /organism="" /note="sequence182" CDS complement(132..524) /product="30S ribosomal protein S9" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966378.1" /transl_table=11 /codon_start=1 /translation="MAKMQFCGTGRRKSSVARVRLVPGNGNITVNKKPLDDYFGMELLK REVRRPLQLVAADSKFDVIATVYGGGTTGQSGALRHGISRALCQADPENRPALKAAGFL TRDPRMKERKKYGLKKARRASQFSKR" /locus_tag="LOCUS_5520" /gene="rpsI" /note="WP_010966378.1 30S ribosomal protein S9 (Clostridium) [pid:66.2%, q_cov:100.0%, s_cov:100.0%, Eval:2.5e-44]" /note="MGA_797" CDS complement(543..971) /product="50S ribosomal protein L13" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005396465.1" /transl_table=11 /codon_start=1 /translation="MSSYIAKPSEIERKWYILDAEGKTLGHLASEAASILRGKKKPTYT PYIDCGDYVIVINAEKIEVTGKKAKEKIYKHHTGYPGGLKEITFEKLQAKDPEEIIRHA VKGMMPKGPMGRQMYKKLKVYAGPEHKHAAQKPEVWEF" /locus_tag="LOCUS_5530" /gene="rplM" /note="WP_005396465.1 50S ribosomal protein L13 (Vibrio) [pid:63.3%, q_cov:97.9%, s_cov:97.9%, Eval:2.5e-50]" /note="MGA_798" CDS complement(1165..2490) /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011459130.1" /transl_table=11 /codon_start=1 /translation="MSNKDILQLCFGNLLRRRTRTILSVIGVIIGTTAIIVMISIGMGL SYGYQEQLESFGNLHMVEVYNYGGGGGGAGGQPSKLDDRTIAKMEKIDGVTVISPQISQ YAIIAGDHKRTECQIIGIRTEMLQALNLELEKGRMPVASDKSPLLFGRNAAASFYDPRK SQGMDWGNTEPTVDPLQKFIITNDWDYGTNQEGQNMGETVPIQIDAQGVGMMASTDNEY AYNIYTTLEFAQKLKEEWDKAQNGGRPVGNSSQGTEYQNVMVYVADLEKVASVSETIRT EYGFSTFSLNDMLKEMQKTANMIEAVLGGIGGISLLVAAIGIANTMIMSVYERTREISV MKVIGASLKDIRKMFLLEAGMIGFGGGVIGVALSYGISYVMNHFLAGAIGGAFGMGSKV SIIPIWLVLAALAFSTMVGVVSGYSPAQRAMNMSVLEGLKNE" /locus_tag="LOCUS_5540" /note="WP_011459130.1 ABC transporter permease (Desulfitobacterium hafniense) [pid:32.4%, q_cov:100.0%, s_cov:100.0%, Eval:9.2e-52]" /note="MGA_799" ORIGIN 1 acatgctgca tgcatgcttc atatacacaa tcagtgagta taatgaagag catctcacag 61 ctacatattg tacaaaacct tgtgttttgg acgccatata gagcatatga acgtcctggg 121 acccatacag actaacgctt ggagaactgg gaagctcttc tggccttctt cagaccgtac 181 ttctttcttt ccttcattct cgggtctctg gtcaggaaac cggcggcctt cagggcaggt 241 ctgttctcag gatcagcctg gcacagagct ctggagatgc cgtggcgcag agcgccgctc 301 tgaccggtgg tgccgccgcc gtaaacggta gcgatcacgt cgaacttgct gtcggctgca 361 accagctgca ggggtcttct gacctctctc ttcagcagtt ccattccgaa atagtcgtcc 421 aggggcttct tgttaacggt gatgttgccg ttaccgggga cgagtcttac tctggcgacg 481 gaagactttc ttctgccggt tccgcaaaat tgcattttag ccattttcta ctcctccctt 541 ccttagaatt cccaaacttc aggcttctga gctgcgtgct tgtgctcggg gcctgcatag 601 accttcagct tcttgtacat ctggcgaccc atgggtccct tgggcatcat gcccttgact 661 gcgtggcgga tgatctcttc cggatcctta gcctgcagct tttcgaaggt gatctccttg 721 agtccgccgg gataaccggt gtgatgcttg tagatctttt cctttgcctt cttgccggta 781 acttcgatct tctcggcgtt gatcacgatg acataatcgc cgcagtcgat gtacggggtg 841 taagtcggct tcttcttgcc tctgaggatg gaagcggctt cggacgccag gtgaccgagg 901 gtcttgcctt cagcatccag gatgtaccac tttctttcga tctcagaggg ctttgcgatg 961 taactggaca tggttcaaat acctccttgt ctactcatat gtgcggggcg tgacccgccc 1021 atagatttcg acgcctactc tgatgggtcc aaccatcggt ttcggcacta ctacgaatag 1081 ctcggcctag ggcctctggg gcctgtgcct ttgttgtcac gctcgattat tttatctgtt 1141 tcgtcaaggc atgtcaagcc ttaattactc atttttcaag ccttccagca cggacatgtt 1201 catggcgcgc tgggccgggc tgtagccgga cacgacgccc accatggtgg agaacgccag 1261 cgctgccaag accagccaga tcggaatgat ggagaccttg cttcccatgc cgaaagcgcc 1321 gccgatggcg ccggccagga agtggttcat cacgtaagag atgccgtagc ttaaggccac 1381 accgatgacc cctccaccga agccgatcat gccggcttcc agcaggaaca tcttgcggat 1441 gtccttgagg ctcgcgccga tgaccttcat gacggagatc tcccgggtgc gttcgtacac 1501 ggacatgatc atggtgttgg cgatgccgat ggccgcgacc agcagcgaga tgccgccgat 1561 gccgccgagc acggcctcga tcatgttggc ggtcttctgc atctccttga gcatatcgtt 1621 cagggagaag gtagagaagc cgtactccgt gcggatggtc tcgctcacgg aagcgacttt 1681 ttccaggtcc gccacgtaga ccataacgtt ctggtattcc gtcccctggc tcgaattgcc 1741 tacggggcgc ccgccgttct gggccttgtc ccattcttcc ttgagcttct gagcgaattc 1801 cagcgtggtg tagatgttat aggcgtactc gttatcggtg ctggccatca tgccgacgcc 1861 ctgtgcgtcg atctgaatgg gcaccgtctc gcccatgttc tggccttcct ggttcgtgcc 1921 gtagtcccag tcgttcgtga tgatgaactt ttgcagcgga tcgacagtcg gttcggtgtt 1981 gccccagtcc ataccctggg atttgcgggg gtcatagaac gacgctgccg cgttgcggcc 2041 gaacagaagc gggcttttat cggatgcaac cggcatgcgg cccttctcca attccagatt 2101 cagagcctgc agcatctccg tccgtatgcc gatgatctga cattccgtgc gcttgtggtc 2161 tcccgcaatg atcgcatact gggagatctg tggagatatg acggtaacgc cgtcgatttt 2221 ttccatcttg gcgatggtgc ggtcgtccag cttgctgggc tgacctccgg cgccgccccc 2281 tccgcctcca tagttgtaca cctccaccat gtgcaggttg ccgaaggact ccagctgttc 2341 ctggtagccg taggacaagc ccatgccgat ggagatcatg acaatgatgg cggtggtgcc 2401 gatgatgacg ccgatgacgg acaggatcgt ccgcgtgcgg cggcgaagga gattcccgaa 2461 gcagagctgc agaatatcct tgttactcat cgag // LOCUS sequence183 2492 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence183 VERSION sequence183 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2492 /mol_type="genomic DNA" /organism="" /note="sequence183" CDS 1..378 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKAGFDTLVEAGYAPEMAYFECIHEMKLIVDLINSGGFAMMRYSI SNTAEYGDYRSGKRIITEETRKEMKKMLGEIQDGTFASEFIQEFKAGGKAKFLASRNKE ANHPLNKVGDELREMMSWLKK" /locus_tag="LOCUS_5550" /note="WP_010938673.1 ketol-acid reductoisomerase (Desulfovibrio) [pid:69.6%, q_cov:100.0%, s_cov:37.5%, Eval:4.6e-43, partial hit]" /note="MGA_800" CDS 392..2053 /product="dihydroxy-acid dehydratase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393742.1" /transl_table=11 /codon_start=1 /translation="MRSDNVTKGVERAPNRSLLYALGYSKEEIERPLIGVVCSYNEIVP GHMNLDKIADAVKTGIEMAGGTAVMFPAIAVCDGIAMGHIGMKYSLVTRDLIADSTESM AIAHQFDGLVMIPNCDKNVPGLLMAAARVNVPTIFCSGGPMLAGRLNDGRRTCLSHMFE AVGAYKAGKLDDAGVEEYEQNACPTCGSCSGMYTANSMNCLTEGLGMALRGNGTIPGVY SARLRLAKHTGMQIMELVKKNIRPRDIMTEQAFHNAETLDMALGCSTNSMLHLPAIAHE CGIELSFDMANEISEKTPNLCHLAPAGNTYMEDLDRAGGVYAVMTELCKKDLLDTSVMT CTGKTMKENLEGVVNRDPELIRPIENPYSPYGGIAVLKGSLAPEGCVVKQSAVAEEMMV HQGPARVFDSEEDAIAAIYEGKIVAGDVVVIRYEGPKGGPGMREMLNPTSAIAGMGLDK DVALITDGRFSGATRGASIGHVCPEAAQGGPIAFVEEGDQIAIDIPNKTIELLVDEETL AARKAAWVCPEPKVKTGYLARYAKLVTDSSRGAVLE" /locus_tag="LOCUS_5560" /gene="ilvD" /EC_number="4.2.1.9" /note="WP_011393742.1 dihydroxy-acid dehydratase (Moorella thermoacetica) [pid:61.7%, q_cov:100.0%, s_cov:100.0%, Eval:5.3e-196]" /note="MGA_801" ORIGIN 1 atgaaggccg gtttcgatac gctggtggaa gcaggctacg ctcccgagat ggcatacttt 61 gagtgcatcc acgagatgaa gctcatcgtt gacctcatca actccggcgg ctttgccatg 121 atgcgttact ccatttccaa taccgccgag tacggcgact acagaagcgg caagcggatc 181 atcaccgaag agacccgcaa ggagatgaag aagatgctgg gcgagatcca ggacggcacc 241 ttcgcttccg agttcattca ggaattcaag gccggcggaa aagccaagtt ccttgcttcc 301 cgcaacaagg aagccaatca tcctctcaac aaggtgggcg acgagctccg tgagatgatg 361 agctggctga agaaataagg aaggcatcat tatgagaagt gataatgtaa caaaaggcgt 421 agagcgtgct cccaaccgct ccctgctgta cgctctcggc tattccaagg aagagatcga 481 acgtcctctc atcggcgtgg tctgctccta taacgagatc gttcccggtc atatgaatct 541 ggacaagatc gccgatgcgg tcaagaccgg catcgagatg gccggcggta ccgccgtcat 601 gttccccgcc atcgcagtct gcgacggcat cgccatggga catatcggca tgaaatactc 661 cctggtcacc cgtgatctga tcgcggactc cacggaatcc atggccatcg cccatcagtt 721 cgacggactg gtcatgatcc ccaactgcga caaaaacgtt cccggtctgc tcatggcggc 781 agcccgtgtc aacgttccca ccatcttctg ctccggcggt cccatgctgg ccggccgtct 841 caacgacgga cgccgcacct gcctgagcca catgttcgaa gcagtcggcg cctacaaagc 901 cggcaagctg gatgatgcag gcgtcgagga atacgaacag aacgcctgtc ccacctgcgg 961 ttcctgctcc ggcatgtata ccgcaaactc catgaactgc ctcaccgagg gtctgggcat 1021 ggcactgcgc ggaaacggca ccatccccgg tgtctactcc gcccgtctgc gccttgccaa 1081 gcacaccggc atgcagatca tggaactggt gaaaaagaat atccgtcccc gcgacatcat 1141 gaccgagcag gcattccaca atgccgagac tctggacatg gcactgggat gctccaccaa 1201 ctccatgctt catcttcccg ccatcgccca tgagtgcggc atcgaactga gtttcgatat 1261 ggcaaacgag atctccgaga agactccgaa cctgtgccac ctggcaccgg ccggaaacac 1321 ctacatggaa gatctggacc gcgccggcgg tgtttacgcc gttatgaccg agctgtgcaa 1381 gaaagacctt ctggacactt ccgtcatgac ctgcaccggc aagaccatga aggagaatct 1441 ggaaggtgtg gtcaaccgtg atcccgaact gatccgaccc atcgagaacc cctactcccc 1501 ttacggcggc atcgcagttc tgaagggctc tctcgctccg gaaggctgcg tcgtcaagca 1561 gtctgccgta gcagaggaaa tgatggttca ccagggtccc gcccgtgtct tcgacagtga 1621 ggaagatgcc atcgccgcca tttacgaagg caagatcgtt gccggcgacg tggtggtcat 1681 ccgctacgaa ggtcccaaag gcggccccgg catgcgcgag atgctcaatc ccacctctgc 1741 catcgccggc atgggactgg acaaggacgt tgccctcatc accgacggac gtttctccgg 1801 agcgacccgc ggcgcctcca tcggacatgt gtgtccggaa gcggcacagg gcggtcccat 1861 tgccttcgtg gaagagggtg accagatcgc catcgacatc cccaacaaga ccattgagct 1921 tctggtggat gaagagaccc tcgcagcccg caaggccgca tgggtatgcc ccgagccgaa 1981 agtgaagacc ggttatctgg cacgttatgc caagctcgtt accgattctt cccgcggtgc 2041 ggttctggag taattacatt attaatgaaa gaaccctttc ctgtctcatt ggacggaaag 2101 ggttcttttt ttccttttgt gacaataaac agacaatgtt gacaaacaca atttagggta 2161 ttaaagttag gaacaatgag aattttcttc agaagatata aaaggagtac tctaacatga 2221 tcaaaaagta ttatgacaaa gactgtgatc tgagcctgtt cgaaggcaag accgtagcaa 2281 tcctgggcta tggctcccag ggccacgcac atgcacagaa cctgaaggaa tccggcgtca 2341 acgtgatcgt tggtctgcgc gagacctcct ccagcgttca gaaggccaag gatgtcggcc 2401 tggaagtatt cagcatcgaa gaagctgccg agaagggcga catcgtcatg atgctcgttc 2461 ccgacgagat gcaggctgac gtttacaaga ac // LOCUS sequence184 2489 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence184 VERSION sequence184 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2489 /mol_type="genomic DNA" /organism="" /note="sequence184" CDS 415..1314 /product="DMT family transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_164921808.1" /transl_table=11 /codon_start=1 /translation="MNDKDKRTGLLLAALAAIFFGLSSITAKLASTNAGGNGISIAFYR NLSVLPVLAIILKVKGYGFKLTRKQLIALFFIGMTCGGLTAMLLYLSYDYISVGLTLCL HFTYPAIVALVYALFFKQKLTKIQGCSLLLACLGIWVMMFGGLEANPVGLILALLSAVA YSSYLIITDKSGIRELTGFKISFYNTLFGTVFLFIFGKIFGYSFGECRPAGWIWLFLTG LMVVCIGNVMTPEAVKRVGPTVTGILGILEPITSLVCSILLLNEPLTPRTLVGGLLVLV SAFLITLGDHKKSSAKES" /locus_tag="LOCUS_5570" /note="WP_164921808.1 DMT family transporter (Rhodopirellula baltica) [pid:23.4%, q_cov:93.0%, s_cov:91.8%, Eval:3.2e-12]" /note="MGA_804" CDS 1319..2191 /product="Cof-type HAD-IIB family hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003568028.1" /transl_table=11 /codon_start=1 /translation="MKMYYKTPLFKERLDKIKILAFDMDDTLLDGHGKLSDGNRAALDR AIEKGYHVVIASGRVWSALPKDVLAVPGIQYAITSNGARIRDVHADKILYENLLEASSV EACYPWMKDPKVMLEIFYDDQVVADRYCMEHLAEFGRVRPKSQHYVLTTRIPVDNLWEL IEENKNKLENINLIFADQEKRLRYLKEIKEQVKGVTAVSSTPENIELGGPTTSKANALD ALAQMLGCTKENIMAFGDSTNDEQMLLHAGIGVAVGNAVPELLDIADYIAPTHDDDGVA YTLEHLLGI" /locus_tag="LOCUS_5580" /note="WP_003568028.1 Cof-type HAD-IIB family hydrolase (Lacticaseibacillus) [pid:29.7%, q_cov:91.4%, s_cov:93.8%, Eval:2.8e-26]" /note="MGA_805" ORIGIN 1 ctgtgcacga atccggagaa cgacgactat attacgaaac tcgtgacccc ggtcaaggaa 61 aagcgcctgt cccaggcagc gctggaggtg ctggcggtca tcgcatataa gcagcccgtt 121 acgaaggcgc agatcgacgc tgtccgcggc atcaagagcg accgggtgct ggagaccctc 181 atgaagaagg atctcgtgga ggaaaagggc agaagcaagc agatcggacg ccccatcctg 241 tacggcacca cccgcaactt cctgttcacg ttcggcttcg aatccctgga cgagctgccc 301 gagctcgagg acatcggaag ccttacgctg gacgacgatc cggagggcct ggagctgctg 361 cgcgaagtcg atccggacca gctgaccctg cctctttccg aggaataaaa aaccatgaac 421 gataaagaca aacgtaccgg attgctgctg gctgcgctgg cagcgatctt tttcggactt 481 tcttccataa cagcaaaact ggcgtctacg aacgctggcg gcaacggcat ctccatcgct 541 ttctaccgaa acctgtccgt gctgcccgtg ctggccatca tcctgaaggt gaaaggctac 601 ggttttaagc tcacccgcaa gcagctgatc gccctgttct tcatcggcat gacctgcggc 661 ggcttaacgg ccatgctgct gtacctgtcc tacgactaca tctctgtggg ccttacgctg 721 tgcctgcact ttacgtatcc ggccattgtt gcgctggtct acgcgctgtt cttcaagcaa 781 aaacttacga agatccaggg gtgctcgctg ctgctggcat gcctgggcat ctgggtgatg 841 atgttcggcg gcctggaagc gaaccctgtg gggctcatcc tggcactgct gtccgccgtg 901 gcctattcct cttacctgat cattacggac aagagcggca tccgggaact gacgggcttt 961 aagatctcgt tctacaacac cctgttcggc acggtcttcc tgtttatctt cggcaagatc 1021 ttcggctatt ccttcggcga atgccggccg gcgggctgga tctggctgtt cctgaccggg 1081 ctgatggtcg tctgcatcgg caacgtcatg accccggaag cggtcaaacg cgtcggccct 1141 accgttaccg gcatcctggg catactcgag cccatcacca gcctcgtgtg cagtattctg 1201 cttcttaacg aaccgcttac gccgcggacg ctcgtcggcg gcctgctcgt gctggtctcc 1261 gcattcctga tcaccctcgg tgaccataag aaatcttcgg caaaggagtc gtgatcccat 1321 gaaaatgtac tacaaaacgc ctctcttcaa ggagaggctc gataagatca agatcctggc 1381 gttcgacatg gacgatacgc tgctggacgg ccacggcaag ctgtcggacg gcaaccgtgc 1441 cgcactggac cgcgccatcg aaaagggata tcacgtggtg atcgcctcgg gccgcgtctg 1501 gtcggcgctg ccgaaggacg tgctggcggt gcccggcatc cagtacgcca ttaccagcaa 1561 cggcgcccgc atccgggacg tccacgcgga taagatcctg tacgaaaacc tgctggaggc 1621 ctcctctgtg gaagcctgtt acccgtggat gaaggatccg aaagtcatgc tggagatctt 1681 ctacgacgac caggtggtgg cggaccgcta ctgcatggag catctggcgg aattcggccg 1741 ggtgaggccc aagagccagc attacgtact tacgacccgc atcccggtgg acaacctgtg 1801 ggaactgatc gaagagaata agaacaaact ggagaatatc aacctgatct ttgccgacca 1861 ggagaaacgc ctgcgctatc tgaaggagat caaagagcag gtgaaggggg tcaccgcggt 1921 aagctccacc ccggaaaaca tcgagctggg cggcccgacg acctccaaag ccaacgcgct 1981 ggatgcgctg gcgcagatgt tgggctgcac gaaggagaac atcatggcgt tcggcgattc 2041 caccaacgac gagcagatgc tgctgcacgc cggcatcggt gtcgccgtgg gcaatgctgt 2101 gcccgagctg ctggatatcg cggattacat cgcacccacc cacgatgacg acggcgtggc 2161 gtacacgctg gagcacctgc tggggatcta gccccagcac agggggacag gtacactgtg 2221 tggcctgcac ctatccaaat cgcaaaaata gccccttgag atagggatcc ctatctcaaa 2281 gggctttttt aatacataga taggtaaatt gccgggtcat caagggattt cgcctatccg 2341 gatgctgtct ttgcaacgct cagataggtt tccctatcca aagccccttt tccacgatcg 2401 tggataagga cccttgtaaa gacaagacgg ctttaccggc actcctccac caatctccta 2461 aagatcggca gcacggcatg cttgtccgc // LOCUS sequence185 2483 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence185 VERSION sequence185 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2483 /mol_type="genomic DNA" /organism="" /note="sequence185" CDS complement(691..1344) /product="HAD family hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005785068.1" /transl_table=11 /codon_start=1 /translation="MEKKYKIVLFDMDGTILDTLRDLSDSVNWALAECGLPQRTFAENR RFLGNGIINLIHRAVPEGTPEDLELQVRTVYKHHYEQHCNDTTKPFDGIPEALAELRRR GYKLACVSNKPDDDVARLAERYFGGLLDDWSGPLPGMPIKPAPDLCDRILARQGLTRAE AIYVGDTEVDIKTAENGGMECIVCAWGFRDEDWLVASGAKTIIHRPQELLELLP" /locus_tag="LOCUS_5590" /note="WP_005785068.1 HAD family hydrolase (Bacteroides fragilis) [pid:37.1%, q_cov:97.2%, s_cov:99.1%, Eval:3.3e-33]" /note="MGA_807" misc_feature complement(1357..>2483) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011726996.1:PucR family transcriptional regulator" /note="WP_011726996.1 PucR family transcriptional regulator (Mycolicibacterium smegmatis) [pid:25.9%, q_cov:97.3%, s_cov:85.9%, Eval:1.1e-15]" /note="MGA_808" /locus_tag="LOCUS_5600" ORIGIN 1 cccggaacgt cacgtccttt cccgcgaaag gaaagccgta gatgcgggcc ggatcgtcct 61 ggtagcccgg cctggggtcc agctccagga tggccctcag agcctctgtt ttgccctctg 121 ggaggcattt gatccattct tcgggtattt ccaccttcag agtctccacg ttgcgcaaac 181 ggccgattcc gcgttccgca tccggaatgc tctcggtaga cggcaggtag ggtttgatgt 241 cgaagatggg cgtaccgtcc atcagatcca ccccggacac gcggatgacc ggtccatcgg 301 cgctgtcgag ctcgatccct tcgatcttta cgaccgacag ccccagccgg ttgggccggt 361 tgggcgaccg cgtcgcgaac acgccgaccc gggtgttgcc gtccatcttc ggcggacgca 421 ccgtggggct ccaggacggc gtttctgcgg cctcttcgtg accgtcgtag cggccttcct 481 gctttgccga agcgaaacct tcggagaaat gccagatgag ccagatatgg ctgtagttct 541 ccagcccccg cagcgcgtcg ggattgcggt acgccggctc gaacacgatg gtgccttcca 601 gttcgggcac gagcccggac tgccggggaa tgccgaactt ggaggatagg tccgtgcgga 661 tatgggcgat cgggtgaatg atatgctgcg tcatggtaac aactccagta gttcctgcgg 721 cctgtggatg atggtcttcg caccgctggc gacgagccag tcctcgtccc gaaagcccca 781 ggcgcagacg atgcattcca tgccgccgtt ctccgcggtc ttgatatcca cttccgtatc 841 gccgacgtag atggcttctg cgcgggtcag cccctggcgc gccaaaatgc ggtcgcacag 901 atccggcgcc ggcttgatgg gcatgccggg cagcggaccg ctccagtcgt ccagcaagcc 961 gccgaaatac cgctccgcca gccgggccac gtcgtcatcc ggcttgttgg agacgcaggc 1021 cagcttatat ccccggcggc gcagttcggc aagcgcttcg ggaatgccgt cgaagggctt 1081 cgtcgtgtcg ttgcaatgct gttcgtaatg gtgcttgtac accgtgcgga cctgcagttc 1141 cagatcttcc ggcgttcctt ccggcacggc ccggtggatg agattgatga tgccgttgcc 1201 taaaaaacgg cggttttcgg caaatgttct ctggggcagg ccgcattcgg ccagcgccca 1261 gttgacggag tccgacagat cccggagcgt gtccaggatg gtgccgtcca tatcaaataa 1321 aacgatcttg tacttctttt ccataatttt tttactctac tcgtcccgga tcatgcgtac 1381 gcacagctga agcagaagac ggtccctgtg atccttcagg gagagcccgg tgagcgcctc 1441 gatcttctcc aggcgctgga gaagtgagat ccggtggatg tgcagttcct ccgccgcctt 1501 gctggcattg ccgcagcagc ggaaatacac tgcgaggctc ttcagatatt cgctgccctt 1561 cccgtccgcg gaaagcaggg gctgcagcgt ctgtgcggca atggagaccg cctgctcgtc 1621 cctcagcagc gccgcgatga gcgccgcttc cttcgcgtct ttatacgtat acatcccgcc 1681 gggagaatcc gccgcgtacg ccagcgccat ggcagcctgg cgggccagca gcggaaagtc 1741 cgcaggcgca tcgcccgctg gacagatccc aaacgtgagt gccgcatccg ccaggttctc 1801 ctgcagtttg ctgcgcagca cttccgttat gcgctgcagg tcctccgcct ccctgctctg 1861 ccggacctgc acgtaaagca gaaactccag cgacatggcc gcatacatgc cccgcagccc 1921 gcagagccgg caggcgcttt cgatcgcatt ctccgccaag gccgctgcct ccgctgcccg 1981 ggcggaatat tccggcacgt cttccggcag cgcagcccgg aaacgaatgc aggcgtagtt 2041 cagactcaga tcgaacttca gccggagccc ctggaccgcc atctgctgca gatcttcccc 2101 gccggatgcc agattccaaa caaagtcgtt cttcagcttc cgttccgtca gatattccac 2161 gttgcgccgg tggatgcgcc ggatgaggtc cgtctggacc tgagcaaacc ggactttcca 2221 ggggatgcgg aacacaggta gtccctgctt ttgagcctgc agccgcaaag ccagcggaaa 2281 tttgtaggcg gggtcgcgga acgcaaacag cacgccgcag gcaccgctcg ccgcaagttc 2341 ctgcagaaaa gcagaaaact tcgtttcgtc ctccgtgcac ccttctgccg tggatagcac 2401 aagatccccg ggctggacga agtcgtccgc cgggtattcc tgcacggtaa cggcagagat 2461 ctcggcgctg gccgggtcac cgg // LOCUS sequence186 2471 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence186 VERSION sequence186 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2471 /mol_type="genomic DNA" /organism="" /note="sequence186" CDS 423..1595 /product="YgeY family selenium metabolism-linked hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003421980.1" /transl_table=11 /codon_start=1 /translation="MQNEKLVPFLQSLIRAGSVSGEEGGVAALLEEFFTQNGFDEVKVD EYGSITGCIKGKRPGKKVLFDGHMDTVPVADPTKWTMDPWAADIKDGKMYGRGTSDMKG ALSAMCMAAADFAKETGKDFAGEIYVAGVVHEECFEGVASSKISKEVQPDIVVIGEASD LNLKIGQRGRAEIVVETFGKPAHSANPDKGINAVYKMAKVIEEIRKLVPEEHPVLGKGI LELTDIKSSPYPGASVVPEYCRCTYDRRLLTGETKESVLAPIQALLDKMMAEDPQLKAK VSYAVGEEDCYTGAKIRGERFFPGWLYKEDDDFVQAAYQQLKADGYDPSITIYNFCTNA SHYAGEAGIPTLGMGPSNESQAHVVDEYIELSQLDGVYGCYKSIMKALLK" /locus_tag="LOCUS_5610" /note="WP_003421980.1 YgeY family selenium metabolism-linked hydrolase (Clostridioides difficile) [pid:66.8%, q_cov:98.7%, s_cov:98.5%, Eval:1.5e-148]" /note="MGA_810" ORIGIN 1 tcaatcccgg caggatctgc agttccagga cctcgcactc ctttgcggtc tcgtcgatcc 61 atgctttgta ttcttccggc gttctgcgga taaagtcgtg ccaatctttc agatcgcggg 121 tgtaggagag acccggaaat ttggtccggt ccactttggg gaaaaacctg tcatggtagt 181 tttcttcgca caggatgccc tggtgcttct ccgccagcag acgcaccata gtggatttcc 241 ccgcatacgc gttgccggta ataaaatagg tgtttttgat ttgttccata gtagccctct 301 tttgtatccg tttctatcat aacatacttc acccgaaccc tcgtccggat acactgattt 361 gcgcctattt gtgctatact gaatacagac gccgcagttt tgcggcagag aggagcatac 421 atatgcagaa cgaaaaactc gtaccgtttt tacagtctct catccgggcc ggcagcgtct 481 ccggtgaaga aggcggcgta gcagccctcc tggaagagtt ctttacacag aacggctttg 541 acgaggtcaa ggtcgacgaa tacggcagca ttaccggctg catcaagggc aaacgccctg 601 gtaaaaaggt gctgttcgac ggtcacatgg acaccgtccc cgtggctgac cccaccaaat 661 ggaccatgga cccctgggct gctgacatca aggacggcaa gatgtatggc cggggcacgt 721 ccgacatgaa gggcgcgctt tccgccatgt gcatggccgc tgcggatttc gccaaggaga 781 ccggcaagga tttcgccggc gagatctacg tggcgggcgt cgtgcacgaa gagtgcttcg 841 aaggcgtggc aagttccaag atcagcaagg aagtgcagcc cgatatcgtg gtcatcggcg 901 aagcttccga cctcaactta aagatcggcc agcgcggccg cgcggagatc gtcgtggaaa 961 ctttcggcaa acccgcgcat tccgccaacc ccgataaggg catcaacgcg gtgtacaaga 1021 tggcgaaggt catcgaggag atccgtaaac tcgtacccga agagcatccc gtgctgggca 1081 agggcattct cgagctcacg gacatcaagt ccagcccgta tcccggcgcc tccgtcgtgc 1141 ccgagtactg ccgctgcact tacgaccggc gtctgctgac gggcgagacg aaggagagcg 1201 tgctcgcgcc tatccaggct ctgctggata agatgatggc ggaagatccc cagctgaaag 1261 ccaaggtctc gtacgctgtc ggagaggagg actgctacac cggcgcgaag atccgcggcg 1321 agcgcttctt cccgggctgg ctgtacaagg aggacgacga cttcgttcag gcggcgtatc 1381 agcagttaaa agcagatggg tatgacccat ccatcaccat ctacaacttc tgcaccaacg 1441 cgtcccatta cgcgggcgaa gcgggcatcc cgaccctggg catgggtcct tccaacgaga 1501 gccaggccca cgtcgtggac gaatacatcg aattaagtca gctggacggc gtgtacggat 1561 gctataagtc catcatgaaa gcactgttga aataaggagt accatgaaag caagagacgt 1621 aaaagtagat cagtggctgg cggcgcacca gcccgaagtt ataaaagacc tgcagaccct 1681 gctgcgctac cgcaccgtgg aagacgagac ggccgtgccc gaacccggca agcccttcgg 1741 gcccatcacc tacgactgcc tgcaggaagc cctgggcatc gcgaagcgcc tgggcttcga 1801 cggcgagagc gtggacggct actgcggcag catcgtcgtt cccgcggaga agtgcgagag 1861 cgaaaagccc cagactttcg gcattttagc ccacctggac gtcgtgcctg agagcaccgg 1921 ctgggactat cctccgtatg gggcagagat cgcagacggc aagctctacg gaagaggcgc 1981 catcgacgac aagggccctg ccgttgcctc cctgtgggca ctcaaagccg ttctggagtg 2041 cggctataaa ctcaagaaga acgtcaacgt catcctgggc tgcaacgaag agaccggcat 2101 gcgctgcctg gaatacttta aggaacaccg tcccgtgccc gatttctcta tctcgccgga 2161 cggggaattc ccgctcacga attccgaaaa gagcagggcg gaagctgcct ttgaaagacg 2221 ctatgcctcg aagatccgcc tgcattccgg caccgtggtg aacgcggtcc ccggagaagc 2281 ggaaggcttc gtgcctctgt ctctggatgc ggtcaaagcc gcggcggaaa cctatgccga 2341 agaaagtccc ttcgctgtcg ttgcaacggc ggaagagggc ggcacgaaga tcaaggtgat 2401 cggaaggacc gcccacgcct ccatgccggc ggacggcgaa aacgccatgc tgggcatgct 2461 gcagctgctg a // LOCUS sequence187 2466 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence187 VERSION sequence187 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2466 /mol_type="genomic DNA" /organism="" /note="sequence187" CDS 1089..1406 /product="thioredoxin" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012545412.1" /transl_table=11 /codon_start=1 /translation="MNEITYLTEETYETVLSGAEAAVVDYYADWCGPCKAMLPIFEACA AEYDKIAFCKINVDDHKKLAIQNRVMGIPCFMFFKNGKMVKRIDGAVDETTFKAALNEL L" /locus_tag="LOCUS_5620" /gene="trxA" /note="WP_012545412.1 thioredoxin (Thermodesulfovibrio) [pid:41.6%, q_cov:94.3%, s_cov:91.8%, Eval:3.7e-16]" /note="MGA_813" ORIGIN 1 atcgtaatac ccggcgttta cgctgtactt tgcgtagagc cagcggctcc gggaattgct 61 gggccagtat ccctcttcgt tctggcagag gatcatacgg tccagtacga agcagttcag 121 cgtatccata acggggcatt ccgcggcatg gcgcgcatag acccaggcca aatagcaggc 181 gggccggttg gcgtaaacgt catctcccca gggttcgtaa ttggcggcgg attcgtaata 241 gtacccatcg tacagcatgc gccacgcgcc gtcgttcgtc aggatctgcc agagggccga 301 tacttcgtcg tcttcccagt cgatcgcagc ggcatccgtg cggcaaagga agaaatcaga 361 ggaggcattt tctccgggag gcatcgcgta cagggagatc ttccacatgc catccgccgt 421 tttgcggacg tccatccacc cttttgcatc tttgagcacc cggatgcatc cgttttcgat 481 gtgttcatac ccctggggca gatagaggat atagctgcct tcgtccgtgt cgaggaacag 541 gcatccggag cggtatatgc ccttctgcga agacctgtgc cactcgccgc cgcggaaaaa 601 gcgcagttcc atgctgcggc agacagtctc aaaaaccggg atggcatcgc cgccggtctc 661 cgaccgcaga gaacctgcga aaacggtatc gccgttgtcc agctcgtagt aactagcgtc 721 cagcaccgcg tccccgtgca gctcgtcgcg gaattccgtg acccgcacag gaacgtcgtt 781 cacttcgaac tgccgggacg atccgggggt caccgacact gcggcataat acgccggcag 841 cggacactgt acaggttctt ccgcagccgt atccgtacag gcgcacagaa gcgccgtcaa 901 aagcagtacc gttatgaaga ttgtaatggg tctgcgtcga tccattgcgt ccctttacct 961 cacagaataa gtattatatt ataccatcaa ttgccccgct ttgtcagtcc tgccgggcgc 1021 ttgcaacggc gtcccctccg tgatatcata aagtgctaaa atatgttgca aatcatgagg 1081 aggaaaaaat gaacgagatc acatatctga ctgaagagac ctacgaaacc gttttatccg 1141 gcgccgaagc tgccgttgtc gactattacg cagactggtg cggcccctgc aaggccatgc 1201 tgcccatttt cgaagcctgc gctgccgaat acgataagat cgccttctgc aagatcaacg 1261 tagacgatca caagaagctt gccatccaga acagagtcat gggcatcccc tgctttatgt 1321 tcttcaagaa cggcaagatg gtaaagcgca tcgacggcgc tgtagacgag accaccttca 1381 aggcagctct caacgaactg ctgtaagatc ttttggccgc cgcgcggccg cagcataaga 1441 aagtattccg aaaatgctca ctgccctgta cagattgatc actctctatg aaaattcccc 1501 tacggcgatc atcacgacga tcttcgtcat cgatcttctt ttgagcttcg ccgtcatctt 1561 cctggagaga aagagcccgt ccgccacgct ggcgtggctc atggtcatca atctgctgcc 1621 gggcctgggc atttttcttt atttcttcct ttcccagaac atcacgaggc agaagctgtt 1681 caaacggtcg cgcttcgaga tgcagaaagc cggagaggat ctgagcatcc agatggacga 1741 catggcctac ggccggtacc gccacatgaa cccggagggc gaaaaatgga aggatctgat 1801 ctacctgaat caggtccacg ccatggcctt ctactcccag aacaacgacg tgcgcatctt 1861 tacggagggc cgggcgaagt tcgaccagct ggtccgggat ctggaggcgg ctgagaagtt 1921 catcaacatg gagtacttca tcatgaagcc cgacgacgtg ggtctccgca tccttcgcgt 1981 gcttcgcaaa aaagccgagg aaggcgtgga agtacgcctg cttctggatg ccatgggctc 2041 gcggcagatc aaggaaaaac atctgaaggg tctgaaggca gccggcggca aggtagcctt 2101 cttcttcccc gccaacgtgt tcaagatcca gctgaagccg aactaccgca accaccgcaa 2161 gctggtcatc atcgacgaaa aagtagctta cgtgggcggg ctgaacgtcg cctccgaata 2221 cgaaggccgt tccacgaagt tcaacggctg gcgcgatacc catctgcgcc tggtgggagg 2281 ctgcgtcgag gacgtggatg accgcttcct tctggactgg cgctacgcca gcggcgagga 2341 tttccacggg gacgatctgg actacaaggt cctcatccct gccggcagca gcggcgtgca 2401 gatcgtgtcc tgcggcccgg acagccccga agaagagatc aagcggctct atctgaagat 2461 gatcac // LOCUS sequence188 2464 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence188 VERSION sequence188 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2464 /mol_type="genomic DNA" /organism="" /note="sequence188" CDS complement(915..1685) /product="gamma-glutamyl-gamma-aminobutyrate hydrolase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003438111.1" /transl_table=11 /codon_start=1 /translation="MKKPVIGVTMNHFMSVTGSEFDNVGFSRSPWTTGADEYANSVEKA GGLPVLMPFYLDQENIKEFVNTLDGLLVTGGDDVGPWLYGEDIIKESNAVNIVRDTQEI ALLRYVLDETDLPVLGICRGMQMLNVAYGGKLEQDNKRNGFWHSTGPNVPLYDLAHKVE FAPGSKIEKIVGKSCLYTNSYHHQNVLPDHVGKGLKITGCVKDTAKGLPYDMPEVIELE GDRFVLGVQWHPEWMPQFEEHQAIYRALVDAARK" /locus_tag="LOCUS_5630" /note="WP_003438111.1 gamma-glutamyl-gamma-aminobutyrate hydrolase family protein (Clostridioides difficile) [pid:38.1%, q_cov:93.0%, s_cov:92.1%, Eval:3.7e-32]" /note="MGA_816" ORIGIN 1 agcggtaggt cttgcacacg ccgtcgatca gttcgcggat gcgctcgcgc acctgcgcgt 61 cgtcgttatg cagacagcgg atggagcctt ccattaagca gtcgtcgggc acgacgatgt 121 tgaattcgcc ggcctgcagc ttgcccaccg taacggtcgt gggcttcttg gcatccatct 181 ccagggtgtg gaaggtctgg aacgcctgca gcacgtgcat cgcgcagtcg atggggttga 241 tgcaggaatg gggggaaccg ccgtgaccgc ccttgccgtg gatcgtcagt ttgaagtacc 301 agctggaagc catcagcgcg ccgggcacga tgccgatcca gccttccttc gtgtagctcc 361 agacgtgcat gcccatgatg gcatccggcc ggggatcatc cagcgcaccg gcgtcgatca 421 tgtcctgggc accggcgtct tcctcgttcg tctggaacag gaacacgata gtaccgggga 481 tctcttcgcg gtggttcgcc atcagccgcg cggtcgtcag caggcaggcc atgtggttat 541 cgtggccgca ggcgtgcatg acgccggggt tctcggaagc aaacggcaga cccgtctctt 601 cctgaacggg cagcgcgtcg atgtcggaac gcatgcagag ggtcttgccc ggttttccgc 661 ccttcagcac gccgatgacg cctgtcggca ggcatctgcg cacttccatg cccagagact 721 tcagctcgtc ttcgatcttc tgcgccgtgc ggaattcctg cgtgcccact tcgggatgcg 781 cgtggaaatc gcggcggagt gcaatcaggt tcggggtaag ttctgcgatc tcttttctca 841 ggtccattct ggttcctccg tggtaaaaat gtgacccgcc catgggcggg tcacgcaaaa 901 atggtacgcg gtcgttattt gcgggcagcg tctaccagcg ctctgtagat cgcctgatgc 961 tcttcgaact gaggcatcca ttcggggtgc cactgaacgc cgagaacgaa gcggtcgcct 1021 tcgagctcga tgacttcggg catgtcgtag ggcagaccct tggcggtatc ctttacgcag 1081 ccagtgatct tcaggccctt gccgacgtgg tcgggcagga cgttctggtg atgataggag 1141 ttggtgtaca ggcaggattt gccgacgatc ttctcgatct tggagcccgg tgcgaattcg 1201 accttatggg ccagatcgta cagaggaacg ttcgggccgg tgctgtgcca gaagccgttt 1261 ctcttgttgt cctgctccag cttgccgccg taagcgacgt tcagcatctg catgccgcgg 1321 cagatgccga gtacgggcag gtctgtctcg tcgaggacat agcgcaggag agcgatctcc 1381 tgggtgtcgc ggacgatgtt gaccgcattg gactccttga tgatatcttc gccgtagagc 1441 cagggtccta cgtcgtcgcc accggtgacg agcaggccgt ccagggtgtt aacgaattcc 1501 ttgatgttct cctgatccag atagaagggc attaggacgg gaagaccacc agccttctcc 1561 acggaatttg cgtattcatc cgcgccggtc gtccaagggg aacgggaaaa gcccacgtta 1621 tcaaattcag atccggtaac ggacatgaaa tgattcatgg tcacgccaat aacaggtttt 1681 ttcattcttt cctccttcag gttatgctaa acatacttca ctgttgagca cacacatatt 1741 gctacgctaa ctataccata ctttacagtt attttgcact tatatttctg ttgtaagaaa 1801 actgacgcag ccccttcaaa ttgtggtatc atctagccat gaagaccata caggaaagga 1861 tgcgcggatt ccacgacaac gcgggagaac tgcacaagga tgtggatgaa cgcatcagaa 1921 aagtcaatag aaaaagactg aaaaaaacgg tcgtagccct caccatgacg gctgcggtcc 1981 tcgtgggcag tctgttctcc gggcccgatg acatcaccgg aggaaacatg cagcagatcc 2041 tggagcccac accggtcgtc atggatatcg attccttcga cgcggaggtg caggacgagg 2101 aaccggcccc ggaggaggca aagaaaaacg gcatcaaggc aaggatacgc gctgctattt 2161 tagccatgcc caaatggctg cgctacgtgg tcgtgctgcc gctgtgggct ttgggctacg 2221 cgctgcttct gctgggcagt tttctgcagc agacggtgct ggcgcccttt gtgggggtca 2281 tcgtttcggc cctcatcggc atcgccgcca tgatcgggct gtttgccgtg accgccaaga 2341 tgctgttccc ggacatgccc tggcggaaga tcttcagcaa gggcaacctg atcgccctga 2401 tcgtgaccgg cgcagcgctg gcggcggcgg atgttatcgt gccccgctac tacagcggct 2461 atcc // LOCUS sequence189 2456 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence189 VERSION sequence189 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2456 /mol_type="genomic DNA" /organism="" /note="sequence189" misc_feature complement(1742..>2456) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011860813.1:ornithine racemase Orr" /note="WP_011860813.1 ornithine racemase Orr (Clostridioides difficile) [pid:51.9%, q_cov:100.0%, s_cov:66.9%, Eval:3.1e-67, partial hit]" /note="MGA_819" /locus_tag="LOCUS_5640" ORIGIN 1 gtctctgcgc gggtcacaag agcatccggt gcgtatttgc cgtcgccctt tccgccgacg 61 atgtcggcct tcgccagcgt gaggatgtcg gacgcgtaat cgctggagga aatatcgctg 121 aattccacgg ttttcttttc cgtatagtaa cggacttcca gcgtgtgcgc gaaatagtac 181 gccatctctg cgcggctcac gttctgcatc tccttgccgt cgaaacggtc gtcgatgatg 241 ccctcggcct tgcagtagtc ctcatatgcc tggtaccagg cgctgccggc cggcttattc 301 gccaggaaat catagttgtc gcccttctgt ttgctgtgca gctgggagac catcaccatg 361 atctgggcat gggtcagctg cgcatccggg ctgtaggtgt cggcgctggt gccgcccacg 421 atcttgttgt cgtaggcgct ctgcaggtac ttttcgtacc aggcgccgga ggaaacatct 481 ttaaagataa acgaaacttt atcggtgacc ccgggaatgt tcggtgccgg aacaacgccc 541 ggcagcttga cgccgtccat caccttgacg aatgtcttgg tatccgaata cgttccgttg 601 cccaggctgc cgctgccgac tccccagagc gcgccgtctt tcttcagaac atacaggctc 661 gtagatccaa acaccgctgc ggatacatta tccagcacct tgacgggctt cgcctggtct 721 gtcgtatttc cggtgcccag ctggccccgc tcgttctgac cccaggtcca gagcgtgccg 781 tctttcttta cgaccgcaaa acggttgtcg aagatgctga cagaggctgc cccgtccatc 841 accttcgacg gggtgtcgtg gtagctgcgg acgaggttgc cgcccttaac gccttcatac 901 ttgaccagtc cgatatgcca gaccgaacca tccgccttaa ccgccagaag accctgaccg 961 gaaatgctga aggatacgac gccgtccatc tgctttgcag gcttcgaagt ataggcgtag 1021 gtgctgtgga agaacaggct gccccaggcc cacaggctgc cgtccttttt cagggcgccg 1081 gcacagtcgg aatgcgcctg gatcgcggcc acattgtcca tcagcttaac gggcgctgcc 1141 gcattttcgt tggtgccaag gcccagacag gacgttctgc cgcagcccca gagggtgccg 1201 tcgtacttca ggatgagcgt atatccgttg ccgcaggaca cggcctgcac gccgtccatg 1261 atccggacag gggtctcgac gaaatccccg gccgcaccgg tccccagctg gccgctgttg 1321 ttctttcccc acatccagag agaaccgtcc gatttgataa aaccggcgtg gtcgctgccg 1381 ttgcttgcgg tcacgacatc gtccgccacc tttaccggcg aaaggcctcc gtttttatac 1441 agcgtggaac tgccccaccc ccagagagtt ccgtccgatt tgatgacggc tgtcccgccg 1501 tattccgtcg agatcgtatt tgcaaagcgc tcttttgcga attccgaacc tgccatggcc 1561 gggctggcga gggacaggca gaggatcgat ataagcagta atgagatgag gtttttcatg 1621 gtaagccttc ctttctttcc atcttatagt ttaccgcgtt ccggcgcttg tgcgcaatac 1681 gaaaacggga ccgccatcgc ttgcggtccc gctttcgtta ttcagtatat ctatggagaa 1741 tttagatgta tgcgcgttcg atataggcgc tggtgaagag cttcaacagc gcgccgtagt 1801 ccagggagaa gtccacggta tcgcccagct tgtagttctc cttcgtcacg tccatgatca 1861 gatggtcgga ggaagcgccg agcacgtccg ccttggtgtt gagcggggtg agcccgtcgg 1921 gattcatatc ctgcttgccg acggcgaaga tggcccggtc gatccagccg cggtcctcat 1981 aggatggcac ctggccgaag gcgtccacac ctacgtcgcc gatgggaagg gagggcttgt 2041 gcttcagctc gatgatctgc gcgcgcaggg tgaccgcatc attgtaagtg ccggggatgc 2101 gctggctgta agccgtctcg ttgccgagga taaaggattc accgaggcgc aggttgttga 2161 tcttcgcagg cagctcgccc ttggggatga ggtagacgga ggagctgttg ccgccggaga 2221 cgatgttcag gcggatggag aacttcttct cgatcttctc cgcgatggcg cacaggccgc 2281 ccagattgtc gggcttgggg atgatggccc cgtagcagga cagattgacg ccgatgcctt 2341 ccagcaccac atgctccatc ttgaggatct cgcagcaggt cttgaggatg gcttcttcgt 2401 cctggaagaa catgccttcc cgcaggtcgc ccatgtcgat catcaggatg acttta // LOCUS sequence190 2440 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence190 VERSION sequence190 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2440 /mol_type="genomic DNA" /organism="" /note="sequence190" CDS 11..1189 /product="pyridoxal phosphate-dependent aminotransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966253.1" /transl_table=11 /codon_start=1 /translation="MKYNFDEIIDRRGTDCLKYDFGPKRKGRSDLLPMWVADMDFKLPD EILADLHKRVEHGIFGYTDPLDDYFEALNHWFFTRYGYTVEPEWVTLGAGLVYAVHLSV QAFTKPGEGVMVMQPVYYPFSEAIKQNGRKLVNCQLHYDGAYSIDFEKMEKQIKEEDVK VLIFCSPHNPVGRVWTKEELTKVADICLENGVILMIDEIHCDFIFPGHKFTSIMNLDEK YHKIIALYSSPGKTFNVAGLQSANVIIPDPELRAKFKKANTSAGYSQANCMGQCALMSC YTKGAEWVDELVEYIWGNVCYMKDFVEKNFPKAHFVDPDGTYLTWVDFSGYGLEDDDLE HLMVEEAKLWLDSGAIFGPETKQFERFNLGCPRSVVEQAMKQLKAAFDARGL" /locus_tag="LOCUS_5650" /note="WP_010966253.1 pyridoxal phosphate-dependent aminotransferase (Clostridium) [pid:41.4%, q_cov:99.0%, s_cov:99.7%, Eval:5.8e-95]" /note="MGA_820" CDS complement(1238..1555) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFTILKACLLTVLIETVLFYLLGYRTKDDITIVACANVVTNLSLN LILAISGTRATYWNIVVPLELAVVFAEFLIYARAFGPSKPLFWKVLATNALSFGIGLLL F" /locus_tag="LOCUS_5660" /note="MGA_821" CDS complement(1559..1750) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MRHFRKILPALLLILSAGGYSYADIAPLPEPQEAGINFIPILFLI ALIVAAALIIRAILRKRK" /locus_tag="LOCUS_5670" /note="MGA_822" CDS complement(1747..1962) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKNISRIWLLILCMFALFTAPVFADAAIGPAFAIVGAGFILAVAG LIICLVLLIKTIRRRKNSRTQEEDKK" /locus_tag="LOCUS_5680" /note="MGA_823" ORIGIN 1 aggagaaaac atgaagtaca attttgacga gatcatcgac cgccgcggta cggactgtct 61 gaaatacgac ttcggtccca agcgcaaggg cagaagcgac ctgcttccca tgtgggtcgc 121 ggatatggac tttaaactcc ctgacgagat cctggccgac ctgcataagc gcgtcgagca 181 cggcatcttc ggctacaccg atcctctgga cgactatttc gaagccctca accattggtt 241 cttcacccgc tacggataca cggtagagcc tgaatgggtc accctgggtg caggcctcgt 301 ctacgccgtg catctgagcg tacaggcctt taccaagccc ggcgaaggcg ttatggtgat 361 gcagcctgtt tattatccgt tctccgaagc cattaagcag aacggccgca agctcgtaaa 421 ctgccagctg cattacgacg gcgcgtattc catcgacttc gaaaagatgg agaagcagat 481 caaggaagag gatgttaagg tcctcatctt ctgcagcccg cacaaccccg tcggccgcgt 541 ctggacgaag gaagaactca ccaaggtcgc cgacatctgc ctcgagaacg gcgtcatcct 601 gatgatcgac gagatccact gcgactttat cttcccgggt cacaaattca ccagcatcat 661 gaacctggac gagaagtatc ataagatcat cgccctgtac agctccccgg gtaagacctt 721 caacgtggcc ggtctgcagt ccgccaacgt catcatcccc gatcccgaac tgagagcgaa 781 gttcaagaag gccaacacct ccgccggtta cagccaggcg aactgcatgg gtcagtgcgc 841 actgatgagc tgctacacca agggcgccga gtgggtggac gagctggtcg aatacatctg 901 gggcaacgtc tgctacatga aggacttcgt ggaaaagaac ttcccgaagg cccacttcgt 961 ggatccggac ggcacctacc tcacctgggt cgacttctcc ggctacggcc tcgaggacga 1021 cgatctggag cacctgatgg tggaagaagc caagctgtgg ctggattccg gcgccatctt 1081 cggcccggag accaagcagt tcgaacgctt caacctgggc tgcccgcgca gcgtcgtgga 1141 gcaggccatg aagcagttga aggctgcctt cgacgccaga ggactgtaaa agcaagacat 1201 aacaaaagcg ggtccgcgag ggcccgcttt ttgcgtgcta aaagagcagc agaccgatcc 1261 caaaggagag ggcgttggtt gctaaaacct tccaaaataa gggcttcgac ggtccgaaag 1321 cccgtgcgta gatcagaaac tccgcgaaaa cgacggcgag ttccaacggc acaacgatat 1381 tccagtaggt ggcgcgggtg ccgctgatcg caaggatgag gttgagcgac aggtttgtta 1441 cgacattggc acaggcgacg atcgttatgt cgtcctttgt ccggtatccg agcaggtaaa 1501 acagaacggt ctcgatcagc acggtcagaa gacatgcttt caggatcgta aacatcgtct 1561 attttctctt ccggaggatc gcacggatga tcagggctgc tgcaacgatc agggcgatga 1621 ggaataggat ggggatgaaa ttgatgccgg cctcctgcgg ttccggcaga ggcgcgatat 1681 ccgcgtaaga atagccgcct gcgctcagga tgagcagcag ggcaggcagg atctttcgaa 1741 agtgtctcat tttttatcct cctcctgggt gcggctgttt ttgcgcctgc ggatcgtctt 1801 gatcaaaaga acaaggcaga tgatgagccc cgcgaccgcc aggatgaatc cggcgccgac 1861 gatggcgaag gccggcccga tcgccgcatc ggcgaagacc ggtgccgtaa acagggcaaa 1921 catacaaaga atcagtaacc agatccggga aatgtttttc atggtcgatc tcctttcttc 1981 ttcagaaaga ttacgctata ccaaacggag acaagcccca aaagaaaact gaacaggatg 2041 agcgccttct gcgccgcgcc ggtcagctgg atgagctgac ccagcagggt gcccggccaa 2101 agcgccgagg ccgccaggcc gaaggcaaaa ccgggctcgt ccggcagcag ccggtacagc 2161 agccagagcg taacgggcat gctgaggtta agaagaaact gccccagcag cgatccgccc 2221 atactgaacc cgcagaacgc gatcagaatc gctgatggaa cgatcgaaac ggcggaagac 2281 tttaccgcgc cggtccggtc gcacaggaag ccgcctgccg cctttcccgc aaacacgaag 2341 acagccgtcg cgactgccgt ggcgatgccg gtattccagg gaaagactgc cgcacagccg 2401 ccgatcgccc gcaccgcaac ggcgatggta agggctgcga // LOCUS sequence191 2396 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence191 VERSION sequence191 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2396 /mol_type="genomic DNA" /organism="" /note="sequence191" CDS 517..1485 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAIRKARLLCMTLAILLASTACSSGAEKTNTQVPQVRSESAVEVA DSASGVQMSDTTSSGFLGSQFNQEKAVAKGTAYIDVSSVANGYVAVSAVADKRLKFQVI CGNATYNYDMSNTGKPSIFPLQSGDGQYKFRIMKNVQDKKYAEIHSVVCDVKLSDPFQP FLRPSDYANYSQNSRCVAKAAEITKGMTNDLAKIKAVYEYVCKTVKYDRQKAATVKSGY LPTPDETMATGKGICFDYASLAASMLRSQGIPTKVIFGYVSPDGLYHAWNMFYTKESGW VTVSYSINPSNWTRMDLTFSANGADGKFIGDGGNYKDVYMY" /locus_tag="LOCUS_5690" /note="WP_010965705.1 transglutaminase domain-containing protein (Clostridium) [pid:31.3%, q_cov:41.9%, s_cov:33.2%, Eval:4.4e-10, partial hit]" /note="MGA_826" ORIGIN 1 accatcacct tcgatctgcg cgttcccatc tccatgaagg gagaagaggt acagagcaaa 61 ctggaagccg gcatggcgaa agccggcgca tccctgaagt cgttcgaatt cggcgaaggc 121 tactgcattc cggacgatac gcctttcgtg cagaaactga tggacgtgtt caacagccgc 181 actggggaga acatgagccc caagtacatc ggcggcggca cctacgcccg tcatctgccc 241 aacgcggtaa gcttcgggcc ggaaggctat ctgtgcgaag cgcatgccca cgtcgccaac 301 gagtttatcg atctggaaca gctctacttc aactgctgcg tactggcgga cgcgatcatc 361 gcgctgtgct gcgaatagac gccaaaaaaa tttaaaaaat tttgcgggga cggggaaccg 421 tccccctttg ttttgcgtct aacaggtgaa aggcaattct atagcataat tttcaggaat 481 cctgtataat acacagtgaa ggaaaaggag actcacatgg cgatcagaaa agcgagactg 541 ctctgcatga cactggcgat cctgctggca tcgacggcat gctccagcgg agcggaaaaa 601 acgaataccc aggttccgca ggtccgcagc gaaagcgccg tggaggtggc ggacagtgcg 661 tccggcgtgc agatgtccga cacgacctct tccggtttcc tcgggtcaca gttcaaccag 721 gaaaaagccg tggcgaaggg cacggcctat atcgacgttt cttctgtggc aaacggctat 781 gtcgccgtat cggcagtcgc agataaacgc ctgaaattcc aggtcatctg cggaaacgcc 841 acgtataact acgatatgtc gaacaccgga aagccgtcca tctttccgct gcagagcgga 901 gacggacagt ataagttccg gatcatgaag aacgtgcagg acaagaaata cgccgagatc 961 cattccgtgg tctgcgacgt taagctgtcc gatccgtttc agccgttcct ccgccccagc 1021 gattacgcca actactcgca gaattcccgc tgtgtggcga aggctgcaga gatcacgaag 1081 ggcatgacga acgatctggc aaagatcaag gctgtttacg agtacgtatg caagaccgtc 1141 aagtacgaca gacagaaggc tgcgaccgtt aaatccggtt acctgccgac acccgacgag 1201 accatggcta ccggtaaggg gatctgcttc gactacgcgt cgctggcagc ctccatgctg 1261 cgcagccagg gcatcccgac gaaagtcatc ttcggttacg tctctcccga cggactgtac 1321 cacgcgtgga acatgttcta cacgaaggag agcggctggg tgacggtgag ctattccatc 1381 aatcccagca actggacccg catggacctg acgttctccg ccaacggcgc ggacggcaag 1441 ttcatcggcg acggcggcaa ctataaagac gtttacatgt attaggagcg atcacgatct 1501 atgagtaaac agttagatca tatgggagta agcgcctttt gcgaaagcat gggcatgatg 1561 atccgctcgg gcatccaggt ggatgaggcg gtcgacctgc tgcagcacgg caggacgaag 1621 accggcggcg ttctggaatc cggattggcg gtcataaagg agcacgtgga taatggagaa 1681 gggttagccg ctgccatgaa ggcaagcggc attttccctg attacgcgct gcagatggtc 1741 gaggccggcg agacgtccgg caaactggaa ggcatcctgt tccggctggc ccgctattac 1801 gcggatcaga agaccatctc cgaaaagctg aagaatgccg ttacgtatcc ggcggtcatg 1861 atcctgctca tcatcgtgct tctcgcggtg atgatccgca tggtgctgcc gtcgttctcc 1921 gcggtctacg agagactgac gggcagcctc gccgcgtcgt cctacggcta tgtccgctgg 1981 gcctacgtgt tctgctggat cgcgcttatc gcgctcatca tcatcgcagc ggcgctgctg 2041 atcggctacc ggatgtggaa aggcggcaaa cgggaatccg tggaagcgct gctgaggaag 2101 tcccccgtct gcgcgtccat cctggagaat atggctatgt tccggttcac gtcggctctg 2161 gccaccttta tcgccagcgg cgacatgcag gacgaagccg tggagaagag cattcccatg 2221 gcggattacg gtcctgtgga ggagaaactc aagcgtgtcg catccggcat gctggaaggc 2281 cacagcatcg cccaggctgc ctacgacgag gaactgttcg agcccactta cggccgcatg 2341 ctgctggcag gcgaacgcag cggcaatctg gaaaacgtgc tggagaggct caccga // LOCUS sequence192 2356 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence192 VERSION sequence192 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2356 /mol_type="genomic DNA" /organism="" /note="sequence192" CDS 574..1515 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLKYSIKRLARSLITLVILITIVFALLRFMPEEGYFTNYEKMSPA QIELGLTKMGLKDPLYLQVVRFIGKILKGDLGVSYRYRVNTPIARIIAPKIAISAKLGL ICMAISLPLGLALGVLMARYKGRFWDRLGNAYIVFIQAVPNAVYFIFIQLYGSTWLKIP MLYNENDWRTLILPTISLALPSISSYAMWLRRYMVDETNKDYIKLARAKGVPNTTIWFR HVFRNAVVPIVNLIPGSLLMTISGSIYTESFYSIPGMGGLLVDVIKRQDNNMVLVLVVL FAAVGIVGLLLGDIAMAIVDPRISFTKKEGSR" /locus_tag="LOCUS_5700" /note="WP_002902452.1 ABC transporter permease (Streptococcus) [pid:36.0%, q_cov:78.0%, s_cov:48.2%, Eval:5.0e-40, partial hit]" /note="MGA_829" ORIGIN 1 cggcaactac gccatccagg aactgaactg gggcgctgac ttcatggatc ccgagacctg 61 ggcggatccg ttcgacagag agaactccta taacttcttc tgccacgata ccgacaccta 121 cagagtcttc caggatacca agtccgacga gaccaacgct ctcatcgacg agtactacag 181 actgtgcgac tatgcccgta cctgtgtcga cgatttcgac gaaagatacg aagcgttcgc 241 agcagccgaa tccttctacc tcgatcacgc gatcgtggtt cccggcttca tctccggcgg 301 ttcctaccag gcaacgaagc tgaacggctt cgaaggccag tacgccatga tgggccagtc 361 ctccagcaga tacaagggac agcacgtcta cgcggaagcc atgtcccagg atatgtacga 421 cgaacagtac gaagcctgga cggaagcgct cggcggcaat taagacctgc ccccttctga 481 caccgaagga caactgatca aaccaactgt aagcggctct gctgccaggc acggcgcgga 541 gccgctttcc tttataagtg aaggagactt aacgtgctga agtattcgat caaacgtctt 601 gcacgatcgc tcataacgct ggtcatcctg atcaccatcg tcttcgccct tctgcggttc 661 atgccggaag aaggctactt cacgaattac gagaagatgt cccctgcgca gatcgaactg 721 ggcttaacga aaatgggcct gaaggatccg ctgtacctgc aggtggtgcg ttttatcgga 781 aaaatcctga agggagatct gggtgtctca taccgttacc gggtcaatac tccgatcgcc 841 aggatcatcg cgccgaagat cgcgatctcg gccaaactgg gtctgatctg tatggcgatc 901 agcttgccgc tcggccttgc cctcggcgtg ctgatggcgc gctacaaagg cagattctgg 961 gaccgtttag gcaacgccta catcgtcttt atccaggccg taccgaacgc ggtctacttt 1021 atcttcatcc agctgtatgg ttccacctgg ctgaagatcc ccatgcttta caacgaaaac 1081 gactggcgga cactcatcct gcccaccatt tcccttgccc tcccctccat ttccagctac 1141 gccatgtggc tgcgccggta catggtggac gagacgaaca aggactatat caaactcgcc 1201 cgcgcgaagg gcgtgccgaa caccacgatc tggttccggc acgtgttccg caacgcggtc 1261 gtgcccatcg tcaacctcat tcccgggtcc ctgctcatga ccatctcggg ttccatctac 1321 acggaatcct tctactcgat cccgggcatg ggcggacttc tcgtggacgt catcaagcgc 1381 caggacaata acatggtgct cgtactcgtc gtcctgttcg ctgctgtcgg catcgtcggc 1441 ctgctgcttg gcgacatcgc catggccatc gtcgacccgc gcatcagctt cacgaagaag 1501 gaggggtcca gatgagcaag tattcaccga aagaaaggat caccggcaaa ctggtatccg 1561 cgcaggagga attcctcaag aagcacggca tcctcaccgg cgacctgatg gacgacaacc 1621 tctgcgagga acagatcgcg ggtctggaca aagacctgtt cggcctggcc atcgtcgacg 1681 agagcgaggc ggagcgcacc gggtattcca actactccta ctggggctcc accgtccgca 1741 tgttcttcaa gaacaaggtg gcggtcttca acctcatcgt catgctggcg ctggtgctgt 1801 tcacgttcat ccagccccac ctgccgaacc agttcgaccc gaacctggtc aattactacg 1861 attcgaaggc ggtctggttc caggtcgaag acgacggcgg ctacaccgtg gacggcatga 1921 agcgcacgaa gggcgattac gccgtcgaac ctgccgcgga cgagatcctc gcctacatcc 1981 agacgccctc ttcctggggg acgcccgaag cgttctccta caacgaagaa ggcgaagaaa 2041 cgcagctggc cgtttccgct gacccggcca acaagggctg gttctactgc ctgctcagca 2101 aagacgcgcc gcatctggcc gtcatgtcgg aagaccatac gaagagcacg ttctacgacg 2161 ccgtatggct taccgtcacc ggcgataaga acgcggtcta ctgctcctct gtcaaacaga 2221 cgaagagcga actgatcgac aacgtgcccg caggaaagag cctcgtctac gtgtccgcgc 2281 ccgcaggctg gggcacgccc caggtcaagg tccagggcgc gctgggcgcg agcagcgcgg 2341 aattcatcaa ggtcaa // LOCUS sequence193 2354 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence193 VERSION sequence193 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2354 /mol_type="genomic DNA" /organism="" /note="sequence193" misc_feature <1..1510 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010966446.1:biosynthetic-type acetolactate synthase large subunit" /note="WP_010966446.1 biosynthetic-type acetolactate synthase large subunit (Clostridium) [pid:49.7%, q_cov:98.8%, s_cov:89.7%, Eval:2.4e-128]" /note="MGA_831" /locus_tag="LOCUS_5710" CDS 1510..2040 /product="acetolactate synthase small subunit" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010896015.1" /transl_table=11 /codon_start=1 /translation="MADTYFNPTVIVMIVEDNPNVLSRISLMFGQRGFNIDTITASHTH DPKFTRITITTHGDQTVIDRIVRQTHKLVEVHKVAVQTAGTHIERELILVKVEVKEDQR SQIREICEIYHGMIVEMTRTSMILEMTGKPPRIDAFLEVLEPYPIIEMTRTGVTAIDRG PEPLDYDKERAYA" /locus_tag="LOCUS_5720" /gene="ilvN" /EC_number="2.2.1.6" /note="WP_010896015.1 acetolactate synthase small subunit (Buchnera aphidicola) [pid:39.4%, q_cov:87.5%, s_cov:98.1%, Eval:9.9e-31]" /note="MGA_832" ORIGIN 1 cgcagcagac ggctatgccc gttccaccgg aaaagtcggt gtctgcatct ctaccagcgg 61 accgggtgca acgaacctgg tcaccggcat tgccaccgca tacatggaca gcattcccat 121 gatcgccatc acctgcaatg tcgcccagag cctcatcggc aaagacagtt tccaggaggt 181 ctttattacc ggtgtcacca tgccgatcac caagtacaac gttggcatcc ggagcgtcaa 241 cgatctggcc gacaccatcc gggaatgctt ccgcatcgcc aagagcggcc gtaagggacc 301 tgtcctgatc gacattccca aggacgtcct gctggcaaag tgcgagtaca ctcccgccga 361 gcccatcaag acggagatgc cggccaagcc cgatcccgct ctcatcatgg aagcggcaaa 421 gatgatcaat gcggcggaac gccccgttct ctgcttcggc ggcggcgcca tcagcgccga 481 tgcctccaaa cagatcgcct ccctcattgc cgacggacat atccccgcct gccataccat 541 catgggcacg ggcgtggtga gtttcggtga tgagcacgat ctcggcatgg tgggcatgca 601 cggaagtctc atcgccaacg aggctattgc cgaagccgat ctgctcatcg cagcaggcat 661 ccgattcagc gaccgtgtcg ctctgaacac cggcaagttc gcgcccaatg ccaagatcct 721 gcagttcgat atcgacccca gtgagaacag caagaacatc aacgttacca gtttcgtgta 781 cggcgatctg aaggactgcc tcaacgagct gcttcctctc atcgagaaga aggaacgtac 841 cgagtggttt gaccgtctga acggtctgcg cgagaaggac tattatccca catccatccc 901 cggccagctg cgtcctcatg agatcatgga gatcatcggc gaagtcgtgg gcgaagacgc 961 agtcatcgtt accgacgtcg gccagcatca gatgtgggct gcccagtact gcaaggccac 1021 ccgtccccgc ggattcatta ccagcggagg actgggaacc atgggctttg gctacggtgc 1081 cgccatcggg accaagttcg gtgttccgga ggccaaggtc atccacatca ccggcgacgg 1141 ctccttccac atgaacatga acgaagcctg cacggcagtg tccaatgatc ttcaggtcat 1201 caccgtgatc atggacaaca aggtcctcgg catggtgcat cagtggcaga atctgttctt 1261 caatcagcac tacatggaga ccgagcccgg acgccgtacc gattacgtca aggtcattga 1321 aggttttggc ggacacggtt ttgagggcga tactcccgaa cacttccgca aggctctgga 1381 agaggccctg acgatccagg gtcccagctg gatccgctgc cccatcgatc cggatgaatt 1441 cgttcttccc atgatccccg cgggcaagac cgtggaagac atcgttgtca gcgaggagga 1501 tttgtactaa tggcagatac ctatttcaac cccactgtca tcgttatgat cgtggaagac 1561 aatcccaatg tgctctcccg catctctctg atgttcggac agcgcgggtt caacatcgat 1621 accatcaccg cgtcccatac gcatgatccg aagttcaccc gcatcaccat caccacccac 1681 ggtgatcaga cggtcattga ccgcatcgta cgccagactc acaagctggt ggaggtccac 1741 aaggtggcag ttcagaccgc cggcacgcac atcgagcgcg aactgatcct ggtgaaagtc 1801 gaagtcaagg aagatcagcg ctcccagatc cgtgagatct gcgagatcta tcacgggatg 1861 atcgtggaga tgacccgcac cagcatgatc ctggagatga cgggcaaacc gccccgcatc 1921 gacgcattcc tggaggtgct ggagccgtac cccatcatcg agatgacccg taccggcgtc 1981 accgccatcg accgcggtcc ggagcctctg gattatgaca aggaacgtgc ctacgcataa 2041 gaagttaacc aaacgaagat aaataaggag tgtttcaaat gatcaaaaag tattatgaca 2101 aagactgtga tctgagcctg ttcgaaggca agaccgtagc gatcctgggt tatggctccc 2161 agggccacgc acatgcacag aacctgaagg aatccggcgt caacgtgatc gtcggtctgc 2221 gcgagacctc ctccagcgtt cagaaggcca aggatgtcgg cctggaagta ttcagcatcg 2281 aagaagctgc cgagaagggc gacatcgtca tgatgctcgt tcccgacgag atgcaggctg 2341 acgtttacaa gaac // LOCUS sequence194 2341 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence194 VERSION sequence194 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2341 /mol_type="genomic DNA" /organism="" /note="sequence194" CDS 1390..1566 /product="zinc-ribbon domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003387504.1" /transl_table=11 /codon_start=1 /translation="MEDKTLVCQDCGKEFIFTVGEQQFYKEKGFDNEPKRCKECRDKRK QARRAMRETGSAE" /locus_tag="LOCUS_5730" /note="WP_003387504.1 zinc-ribbon domain-containing protein (Clostridium) [pid:71.2%, q_cov:89.7%, s_cov:92.9%, Eval:4.3e-17]" /note="MGA_835" CDS complement(1628..2113) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPVHMLALWRSGRCPFLVPASFWETPDGLRIRLDAEGLVQVASYA AVCPDGLEKGFCLLLTSLASAARAFASLQQWLADPAYISLDPSLLFFDRDKGSSLLMFS DSPDSRPFLARFSDLCRGLGPSGALIAERLEEAGRSVRMEEQGTARFLEKWLLQILA" /locus_tag="LOCUS_5740" /note="MGA_836" CDS complement(2113..2340) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEAVLTEQLKRRYAACKTCRPSSLPYGSLVFLFSDGSRVYHRKEC PCITKYYVSMPKGEAVAEGYTPCLFCQEGL" /locus_tag="LOCUS_5750" /note="MGA_837" ORIGIN 1 acttccttgt atgctgcgat aacgccgccc ttgacttcct tcaggacggt aacgttgagt 61 acttccttgc tgtccagtgc tgcggtgatc tcttcccagt tttcgccgga ctgaagcttt 121 ttcttggaaa ggaggatgtt gccgtcgccg tcatcggtct tgatgacttt cgcctgcact 181 tcgtcgcctt ccttaaatgc tgcagtaaga tcctgaccgt cttcgagagt gacctcttcc 241 ttcggcagca tgccgtcctt cttgcagccc aggtttacta cgacgtaatc gttcgtgacc 301 tgcactaccg ttccggtaac tacttctcct ctaccgggaa gcttaagaga cttctcgatc 361 tcgtccatat aggcgagcat ttcgttcatt tctgtgttct gatctttgag tacttcactc 421 atgttagcaa taacctccaa aataatttgt tgcggtgcgg atgcactcgc tgcaacgcct 481 attttattat attttgaaat ttcttgcaac ggtaaatcgt cgaatttttc gataaaaact 541 gtaaatatgc aattctgtga acagatgtcg aatagcttgc gggagttaga gctcgtttta 601 tcgccgatca ccaccatcgc atcggagttt gccgcaagtt ttgcggccgc gtcctgccgc 661 tgtttcgtgg cgttgcagat ggtatcctcg atctgaaggt cgccgcagat cttcttcaat 721 tcgtcgcagc aggcatcgaa ttttgcccgg gtgagcgtcg tctgggccag tgccgtgacc 781 ggtccaccct tgagaatctc tgcataatat gcaatgcggg agggatcgtc gcaggcacct 841 accgcccggt ccgttgaccc gaggatacct ttcacctccg gatgatccgg gtcaccgatg 901 acgaagacga gccgcccggc ttctcctgct tttctcgccg cgtcgtggat gcggtatacg 961 aacggacagg tctcgtccag gatctcgatc cccgcggctt ccgcagcccg atacgtgctg 1021 tccggttccc cgtgggcccg gatgagcacc cggctgccgg gatccgcctc ttcgatcgaa 1081 cggatcgtga tgagcccctt ctccgccaga tcttccgtaa cggctttgtt gtggatgagg 1141 gaaccgaggc aatacagttt gacgccgtct gccttcgccc gtttcagctc ctgctccgct 1201 gcgtctaccg cgcgctttac accaaagcaa aagcctgcat gttctgcaac tgaaataata 1261 taattcataa cctttttcct tcttatgaaa attgcgatat gaatgtaaaa aactgtttac 1321 aaatccgaaa aagcattata tgattaacta tctcatattc tactacataa ttgccaagga 1381 gttaaagcaa tggaagacaa gacattagta tgtcaggact gtggtaagga atttattttc 1441 acagtaggtg aacagcaatt ctacaaggaa aaaggcttcg acaacgagcc caagagatgc 1501 aaggaatgca gagacaagcg gaaacaggca agaagagcca tgagagaaac gggatctgct 1561 gaataaattc gaagaatcag gaagacatag aaaaggaccg gaagcgctcc ggtccttttc 1621 tcttgtgtta cgccaggatc tgaagcagcc atttttcgag aaagcgtgca gtaccctgct 1681 cttccatccg gacggaccgg ccggcttctt ccagccgttc tgcgatcagc gcaccgcttg 1741 gccccagtcc ccggcacaga tccgaaaagc gcgccaaaaa cggcctgctg tccgggctgt 1801 ccgaaaacat cagcaggctg cttcccttat cccggtcaaa aaacagcagc gagggatcca 1861 gcgagatata agcgggatcg gcaagccact gctgcagcga ggcgaatgcg cgggcagctg 1921 acgcaagaga agtcaggagc agacagaacc ctttctccag tccatccggg cagacggccg 1981 cataggaagc gacctgcacc agtccttccg catccaggcg gatccgcagc ccgtccgggg 2041 tttcccagaa ggaggcgggg acgagaaacg gacaacgccc gctcctccag agcgcgagca 2101 tgtggaccgg catcacagtc cctcctggca gaacaggcaa ggcgtatacc cttccgcgac 2161 ggcttcgcct ttcggcatgc tcacgtagta cttcgtaatg caggggcatt cttttctgtg 2221 atagacccgc gatccgtccg agaacagaaa gaccaggctg ccgtacggca gcgaggaagg 2281 tctgcaggtc ttgcaggctg cgtagcggcg cttcaactgt tccgtgagga ccgcctccac 2341 g // LOCUS sequence195 2341 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence195 VERSION sequence195 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2341 /mol_type="genomic DNA" /organism="" /note="sequence195" CDS complement(381..1340) /product="bifunctional oligoribonuclease/PAP phosphatase NrnA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005808862.1" /transl_table=11 /codon_start=1 /translation="MQNWNDIQKAIAKAQKILIFTHVNMDGDAAGSSCALCRSLRAMGK DCFILLEDDCPRYLQFLDDRGMFIKQAPWTPDLSIAVDCGDDSRIEKRKDVFHAAPVTM CIDHHMKSGPFAQLEAIDPAAPAAGSLIFELLQAMNAPIDKDAAEALYVAIATDTGSFK HGNTTAEAHLDAAKLYGYGIDAVKLNNFVYGSYPLPQLKLEAMAVERVQLFADGKAAVS WCTQEDLRRFGALDEHTECCIDRIRSIEGVEAAAFLKEKADGRIKVSLRSKSYADVNAV ARQFDGGGHLRASGCTFYCSIEEALEQIRPALEASVAP" /locus_tag="LOCUS_5760" /note="WP_005808862.1 bifunctional oligoribonuclease/PAP phosphatase NrnA (Desulfitobacterium) [pid:35.7%, q_cov:95.3%, s_cov:93.6%, Eval:5.3e-53]" /note="MGA_839" CDS complement(1340..1786) /product="30S ribosome-binding factor RbfA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011144020.1" /transl_table=11 /codon_start=1 /translation="MGKSHRPQRMGEEMRKILSDMLMRGQLKDPRFSGAMISVNAVEVT NDGSYATLYVTALPFGSGPLTAEQKKEILAAFERSKGHIRTEIGKNLKARHVPELIFKY DESLEYGAKMDAILDKIEIPADDYDYGLPQEESTAPDDEEYFDD" /locus_tag="LOCUS_5770" /gene="rbfA" /note="WP_011144020.1 30S ribosome-binding factor RbfA (Gloeobacter violaceus) [pid:38.7%, q_cov:95.9%, s_cov:97.7%, Eval:8.7e-20]" /note="MGA_840" misc_feature complement(1786..>2341) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_130864481.1:translation initiation factor IF-2" /note="WP_130864481.1 translation initiation factor IF-2 (Bacilliculturomica massiliensis) [pid:74.5%, q_cov:100.0%, s_cov:19.6%, Eval:1.0e-76, partial hit]" /note="MGA_841" /locus_tag="LOCUS_5780" ORIGIN 1 cttttttccg tttactttga tggccgaaaa aacgggcggt ttctgttcga tctcaccctc 61 gagggtacgg agtacctctt cgacgttttc tcgcgttaaa tcggctgttt cgggccttct 121 gtcgcaaagc acggtgcccc atatatcccg ggtgtccgtc gtcagaccga gctggcagtc 181 cgcgacatag gtcttggggg cttcgtccat gtattccagc agacgcgtgg cttttccgat 241 acacagcggg agcacgccgg tcgcctgggg atccagggtg ccggtatgtc cgatcttgcg 301 ttctcccgtc agtctgcgca ggatggcgac gcagtcgaag ctggtgtatc ccgccggttt 361 gttcagattt aagatgccgt tcatggcgca acgctcgctt ccagcgcagg gcggatctgc 421 tccagcgcct cttcgatgct gcaatagaag gtgcacccgc tggcgcgcag gtgaccgccg 481 ccatcaaact gccttgccac ggcgtttaca tccgcgtagg acttggagcg cagagagact 541 tttatccttc cgtctgcttt ctccttcagg aaagctgccg cctccacgcc ttcgatgctg 601 cggattcgat cgatgcagca ttccgtatgt tcatccagcg caccgaatct cctcaggtct 661 tcctgcgtgc accaggagac cgcggccttg ccgtccgcga acagctgcac tctttccacc 721 gccatcgcct ccagcttgag ctggggaagc ggatagctgc catagacgaa gttgttcagc 781 tttacggcat cgatgccgta gccgtatagc ttggcagcgt ccagatgcgc ttccgccgtc 841 gtattcccgt gtttaaacga accggtgtct gtggcgatcg ctacgtagag cgcttccgca 901 gcatccttat cgatgggtgc gttcatcgcc tgcagcagtt cgaatatcaa agaacctgcc 961 gccggagccg ccggatcgat ggcttccagc tgtgcaaaag ggccgctctt catgtgatgg 1021 tcgatgcaca tcgtcaccgg tgctgcatga aacacgtcct tgcgcttttc gatgcggctg 1081 tcgtcgccgc agtccaccgc gatgctcaga tcgggcgtcc aaggcgcctg ctttataaac 1141 atgccgcggt cgtccagaaa ctgcagatac cggggacaat cgtcctccag caggataaag 1201 cagtcctttc ccatcgcgcg gagacttctg cataacgcac aggaagaccc tgcggcatct 1261 ccatccatgt tcacatgggt gaagatgagg atcttctgcg cttttgctat tgctttttga 1321 atgtcgttcc aattctgcat cagtcgtcga aatactcctc gtcgtcggga gctgtgctct 1381 cttcctgggg cagaccgtaa tcatagtcgt ccgcggggat ctcgatctta tccaggatgg 1441 cgtccatctt cgcgccgtat tccaggctct cgtcgtattt gaagatgagc tcgggcacgt 1501 ggcgcgcctt cagattcttg ccgatctcgg tgcggatgtg acccttggag cgttcgaatg 1561 ccgccaggat ctctttcttc tgttccgccg taagcggacc ggagccgaac ggcagagcgg 1621 taacgtacag ggtggcgtaa ctgccgtcgt tcgttacttc gacggcgttt acgctgatca 1681 tggcgccgga gaaacgcggg tccttcagct gaccgcgcat cagcatgtcg ctgaggatct 1741 tccgcatctc ctcgcccatc ctctggggtc tgtgagactt gcccattatc tctccacctc 1801 ttgcatgacg aaggcttcga tcacgtcgcc ttccttgatg tcgttatact tttcgatgcc 1861 gataccgcat tcgaagccgc tggccacttc tctcgcgtcg tccttgaaac gcttcagcga 1921 ggagatgacg ccctcgtgga tgacgatgcc gtcgcgcagc aggcggacct gtgcgtttct 1981 ggtgaccttg ccttccatga cgtaagcacc tgcgaccgtg ccgacaccgg gaaccttgaa 2041 agtattgcgg acttccacct tgcccaggat gacttccttg aacacggggt ccagcatacc 2101 cttcatggcc gcttcgatat cgtcgatgat ctcgtagatg atgcggtagg tacggatctc 2161 cacaccgtct ctgtctgcca tagcctggac agcggagctg ggacgcacgt tgaagccaat 2221 gatgacggca tcggaagtgc tggccagcat gacgtcggat tcggtaacgg taccgacgcc 2281 ggtgtggatg atcttaacgc ggacgttctc gttatgcagc ttttcgaggg atgcttccag 2341 c // LOCUS sequence196 2334 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence196 VERSION sequence196 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2334 /mol_type="genomic DNA" /organism="" /note="sequence196" CDS complement(366..635) /product="ACT domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_007053740.1" /transl_table=11 /codon_start=1 /translation="MKAIVSVLGKDRVGITAAVCTKLAENNINILDISQTIMDGNFSMV MIVDMDKATCSIKEMSGVLEDLGKEIGQIIRIQREDIFDAMHRI" /locus_tag="LOCUS_5790" /note="WP_007053740.1 ACT domain-containing protein (Bifidobacterium) [pid:59.1%, q_cov:98.9%, s_cov:97.8%, Eval:5.8e-22]" /note="MGA_843" CDS complement(648..1028) /product="large-conductance mechanosensitive channel protein MscL" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003701438.1" /transl_table=11 /codon_start=1 /translation="MMKEFKEFISRGNVMDMAVGIIIGGAFTAIVSSLVADIITPIIGM LMGGVDFSSLAVTVGSANLTYGNFIQAIINFLLVAWVLFMIVKAMNKMKRKEEEKPAEP EAPAEPPEDIVLLREIRDSLKK" /locus_tag="LOCUS_5800" /gene="mscL" /note="WP_003701438.1 large-conductance mechanosensitive channel protein MscL (Ligilactobacillus) [pid:54.0%, q_cov:100.0%, s_cov:97.6%, Eval:1.4e-31]" /note="MGA_844" CDS complement(1060..2007) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKEMPVYLFTGFLEAGKTQFIQTTLEDPNFNAGEKTLVIQCEEG IEEFRHERFWEDNVVVEVLDDPDQINNKFLLELEKKHAPERIMIEYNGMWMLDHLFQEM PEHWIIYQEYSFYDANTFLAYNQNMRQLVYDKLKSADCVVFNRYREGMDRLPLHKVVRG VSRRPDIFYELPSGDAIVDDIEDPLPFDKEAPVIEIKDEDYALWYRDLSEDMPSYEGKT VRVKGITGASGVLQGSDFIFGRQVMTCCVEDIQMAGLVCEWHGVKPAKRSWVTVTAKIR VGKSKAYGSKTGPILVVSKIEGATEPEQPVATFY" /locus_tag="LOCUS_5810" /note="MGA_845" ORIGIN 1 accagggcgg aatagccgcc gatgaagttg acgccgcagg tcttcgccgc ttcgtccatc 61 gccttcgcga aggggacgta gtcctccgta tcgctggcag cagcgatgag tgccatcggg 121 gtcaccgaga tgcgcttgtt gacgatgggg atgccgaact cggattcgat gtcttctccc 181 acctgcacca ggttctgcgc gtagcggcag atcttgtcgt agatcttttg gcaggccttg 241 gccggatctt cgtccgcgca cgaaaacagg gagatgccca tggtgatcgt acggatgtcc 301 agatgctgct gatcgatcat ctgcagcgtg gacaggatct ctttctgatt gagcatggca 361 gcctcctaga tgcggtgcat cgcgtcgaag atatcttcgc gctggatgcg gatgatctgc 421 ccgatctcct tgccgagatc ctccaaaacg ccgctcatct ccttgatgga gcaggtcgcc 481 ttatccatgt ctacgatcat gaccatgctg aagttgccgt ccatgatcgt ctgcgaaatg 541 tccaggatgt tgatattgtt ttcagccagt ttcgtacaga cggccgccgt gatgcctact 601 ctgtccttgc ccagcacgga tacgatcgct ttcatgttcg tctttcccta tttctttaag 661 ctgtcgcgga tctcacgcag cagaacgata tcctcggggg gttctgcggg cgcttcgggt 721 tctgcgggct tctcctcttc ctttctcttc atcttgttca tcgccttgac gatcatgaag 781 agcacccagg cgaccagcag gaagttgatg atggcctgga taaagttgcc gtaggtgaga 841 tttgcgctgc cgacggtgac cgccagagag ctgaagtcga cgccgcccat cagcatgccg 901 atgatcggcg tgatgatgtc tgccaccagg gagctgacga tcgcggtgaa cgcgccgccg 961 atgataatgc ctacggccat gtccatgacg ttgccgcggg agatgaattc cttaaattcc 1021 ttcatcattg tagtattccg cctttcttgt tatatatgac taataaaatg ttgccacagg 1081 ttgttcgggt tcggtcgcac cctcgatctt gctgacgacc aggatggggc cggtcttgct 1141 gccgtaggcc ttgctcttgc cgacgcggat cttcgcggtc acggtgaccc aggagcgctt 1201 cgcgggctta acgccgtgcc attcgcacac gagccccgcc atctggatgt cctccacgca 1261 gcaggtcatc acctgccggc cgaagatgaa gtcggagccc tgcagtacgc cggacgcgcc 1321 ggtgatgccc tttacgcgca cggtcttgcc ttcgtaggag ggcatgtcct cggagaggtc 1381 gcggtaccac agcgcgtagt cttcgtcctt gatctcgatg acgggcgctt ccttatcgaa 1441 cggaagcgga tcttcgatat cgtccacgat ggcgtcgccc gaaggcagct cgtagaagat 1501 gtccggccgc cgggatacgc cccgcacgac tttgtgcagc ggcaggcggt ccatgccttc 1561 ccggtagcgg ttgaatacga cgcagtccgc gctcttcagc ttgtcgtaga ccagctggcg 1621 catgttctga ttgtacgcga ggaacgtgtt cgcatcgtag aagctgtact cctggtagat 1681 gatccaatgc tccggcatct cctggaacag atggtccagc atccacatgc cgttgtattc 1741 gatcatgatg cgctcgggag cgtgcttttt ctccagttcc agcaggaact tgttgttgat 1801 ctggtccggg tcatccagga cttcgaccac cacgttgtct tcccagaaac gctcgtggcg 1861 gaactcctcg atcccctctt cgcactggat gacgagagtc ttctcccccg cgttgaaatt 1921 cgggtcttcc agggtcgtct gtataaactg ggtcttgcct gcttccagaa aaccggtgaa 1981 caggtagacg ggcatctctt ttgccatgtt acgctactcc aaacagatgc ttgacttcgt 2041 cttccttcat ctgggcgccg atgacgcaca gcatgcctgt ggcggctgcg ggacccttgc 2101 ggacgttgat ctcgcccggc gtgtagtcga aatggatcca gccctcggtc ttgtcctgca 2161 cgatgccctt ggctctgagc acgaaaccgt aggtccaggt gtcgtccagc gcggccagct 2221 tctcgcggat ctcgtcttcg gtgaaccggg cagcggtcgt ttcgccccag ctcgtgaaca 2281 cttcgtccgc gtcgtgctcg ccgtcgtgat gatggtgatg atgatggtgg tgat // LOCUS sequence197 2319 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence197 VERSION sequence197 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2319 /mol_type="genomic DNA" /organism="" /note="sequence197" ORIGIN 1 cgggcggcgg agatggcgtc ggcggcctgc accaggcagg cgatgacggt cttggcctcc 61 acgtcgccgt ggtgggcctc gatggcgtgg atgacctcgg gggattcctt gtacttccgg 121 gccagctcca cgcccagctg gacgtggctg ccctccatct cgtggtccac gctcttgccc 181 aggtcatgca gcaggccggc ccgcttggca agggtgacgt cctcgcccag ctcggaggcc 241 aggagccccg cgatgtgggc gacctccatg gagtggttga gcacgttctg gccgtaggag 301 gtgcggtact tctggcggcc caggagcttg atcagctcgg ggtgcagacc ctggacgccg 361 gtctcgaaga cggcgcgctc gccctcgcgc ttgatggtct gctcgacctc gcggcgggcc 421 ttctccacca tgtcctcgat gcgggtggga tggatgcggc cgtcggcgat gagcttctcc 481 agggcaaccc gggcgatctc gcggcggacg gggtcgaagg aggagaccgt gatggcctcg 541 ggggtgtcgt cgatgatgag atcgacgccg gtgatggtct cgagggtccg gatgttgcgg 601 ccctcgcggc cgatgatgcg gcccttcatc tcgtcgttgg gcagaggcac cacggaaacg 661 gtagtctctg cgacgtgatc ggcagcgcag cgctgaatgg caccggtaat gatctccttc 721 gctctgcggt ccgcttcttc ctttgccttg acctcgatat ccttgatcat gatggaagcg 781 tcgcggcgta cgtccttttc gatactctcc agcagctggt tcttagcatc ttccgccgtg 841 catccggaga tccgttccag ttccgcgatc tgcttttcga tgaagccgtc cagttccttt 901 tccttctcgg ccagagctct ctgcttcttc gaaatgccct cttccttctg ctcgatgttt 961 tcgatttttc tgtccaggga ttcttccttc tgaacaagtc ttctttctgt cttttttacc 1021 tcttctctgc gttcgcgaat atctctttcc gcatcttgtt ttatagaatg agcttccgct 1081 ctggcatctg ccagcgtttc tttgcggata gcttcggagc ggttttccgc atccagaata 1141 aggtttttgg cctgtgtttc ggcacttccg atgatctttt cagccttatt cttgcggatg 1201 atataaccta caagtattcc gatggcgaga aaggcaattg caataagtgc ttttacaagc 1261 atgttgcgcc tcctctgcgt atttaaaaat aagcattaca aaaataccaa tacattgtac 1321 tatattatgc gcataaatgt aaagggatac tttccgtttc acatacaaaa aagcggttgc 1381 acttgcacaa aaataaagaa tggatatata ctctaatttg ttagaccgca ataggaacgc 1441 atcggaaagg aggtgccgga aaatgactgc aaaggagata aaacttacga cccttgcagg 1501 ctgcgccgga tgaggggcga agctgggagc aggagttctt gctgaagtat tggacggcat 1561 ttccatgcag agcgatcccg cccttctggt ggggttcgac aaaagcgacg atgcctgtgt 1621 ctataaagtg aacgacgaac tggcgctggt gcagacggtg gactttttcc cgcccgtggt 1681 ggatgacccc tataccttcg gccaggtggc ggcagccaac gccctttccg acgtctacgc 1741 catgggcggt gtgcccaaga cctgcctcaa cgtgatgggc atccccagag attttccgaa 1801 ggaagtaacg agggagatcc tgcggggcgg ctacgataaa gtctacgaag caggcgctgt 1861 cgtggcagga ggccacacca tcctcgacga agagcccaaa tacggactgt ccgtaacggg 1921 ctacgtccat ccggacaagt tctaccgcaa ctgcggcgca aagccgggag acgttctcat 1981 cctcacgaag cctttgggta cgggcatcct tacgaccgca gccaaggcag gaatgctggg 2041 tgcagaagac gagcggacca tgatccgcat catgacggaa ttgaataaaa atgcacgcga 2101 cgcattcgtg cagtgcgaag tccacgcctg caccgacgta acgggcttcg gcctgatagg 2161 ccatctgttc gagatggtga acggcaccga ctgcgaagcg ctggtggaga cggcaagcgt 2221 cgacatcctt tccgccgccc tcgaatttgc gaacatgggc cttcttgcgg aacgcatgta 2281 ccgcaaccgg gactactgcg gcgcacaggt ggaggaaaa // LOCUS sequence198 2317 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence198 VERSION sequence198 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2317 /mol_type="genomic DNA" /organism="" /note="sequence198" CDS 378..1241 /product="peptide chain release factor 2" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_177451831.1" /transl_table=11 /codon_start=1 /translation="MEMAEEAEDEDSAKEAMATFEAFREKAEEVNIRALLSDEYDQNNA LVNIHPGAGGVDAQDWAEMLLRMYTRWAEKKGYKVKILDYQNDTEGGIKNVEILVEGPL AYGYLKTESGVHRLVRISPFNAAGKRQTSFALVDVMPELPEDIQVDIDPGDLRIDTYRS SGAGGQHVNKTDSAVRITHIPTNIVVSCQNERSQHQNKEYAMRMLYAKLYALARQEHKE KISELHGDYGQIAWGSQIRSYVFQPYTMVKDHRTGQETSNVNAVMDGAIDDFIYASLNA LQKGEL" /locus_tag="LOCUS_5820" /gene="prfB" /note="WP_177451831.1 peptide chain release factor 2 (Clostridioides difficile) [pid:63.7%, q_cov:95.8%, s_cov:75.5%, Eval:1.2e-98]" /note="frameshifted, insertion/deletion at around 202" /note="MGA_850" ORIGIN 1 cgcgggcgac gcgaagccgg tgcctttccg cgccgaaaag cggccgggaa gaaacgatcc 61 ctgcccctgc ggcagcggca agaaatacaa gaactgccac ggcagaaacg cgtaaaggtt 121 ggaaaccatg ctcatcttag acaatctgaa aaactccata ccgcaggcag aggagaccct 181 ggggaaactc agggagagcc tttgacgtcg acaagaagcg ggcaagactg gaagaactga 241 attacgaatc cggacttccg gggttctggg acgaccagga gagagcacag aagaccatca 301 aggaacgggg ctctctggag tcggatctgg gcgaatacga cgcctgcagc cggctgcttt 361 ccgacgccca ggtcctgatg gagatggcgg aggaggcgga ggacgaggat tcggccaagg 421 aagcgatggc gacctttgaa gcattccggg agaaggcgga agaggtgaat atccgggcgc 481 tgctctcgga cgagtacgac cagaacaacg ccctcgtcaa catccatccc ggcgccggcg 541 gcgtggacgc ccaggactgg gcggagatgc tgctgcgcat gtacacgcgc tgggcggaga 601 agaagggcta taaagtcaag atcctggact accagaatga caccgaaggc ggcatcaaga 661 acgtggagat cctggtggaa ggccctctgg cctacggtta tctgaagacc gagagcggcg 721 tgcaccggct ggtgcgcatc agccccttca acgcggcggg caagcggcag acgagcttcg 781 cgctcgtgga cgtgatgccc gagctgcccg aggacatcca ggtggacatc gaccccggcg 841 atctgcgcat cgacacctac cgctccagcg gtgcgggcgg tcagcacgtc aacaagacgg 901 actccgctgt gcggatcacc catatcccga ccaatatcgt ggtgagctgc cagaacgagc 961 gcagccagca ccagaacaag gaatatgcca tgcgcatgct gtacgcgaag ctgtacgcat 1021 tggcgcggca ggaacataag gaaaagatct ccgaactgca cggcgactat ggacagatcg 1081 cctggggcag ccagatccgc tcctacgtct tccagcccta cacgatggta aaggaccacc 1141 gcacggggca ggagaccagc aacgtgaacg ccgtcatgga cggcgccatc gacgacttta 1201 tctacgcttc tctgaacgcg ctgcaaaagg gggaattgta gtggaagagc tggaacgcaa 1261 aagaagattt ctcatcaatc tgacctatgc cgttgcggtg ggcatcgtgt attacgtgtt 1321 ggtgcgttac gtgctgtacg cgcttatgcc ctttacgatc gcgttgctgg taacgttcat 1381 gttaaagcgg ccggtagatg ccacgtcccg gctgctgcat atcccgagaa gaggcatcgc 1441 ggcgttctgg gtcatcctgt tctacgggct tatcggagcg ctgctcaccc acgctgttat 1501 ccagctgatc tttacggtgc tcagctggtt cggctccctc acgacgatct atgcgacgca 1561 catcgagccc gccgtgcagc gggtgctgca gtggtacgag gagcttgtgg cggatattga 1621 ccctgccagg gtcagccagg cggaggccat cgccaacaac atcctgggca gcctggccag 1681 cggcgtaacg tccctgtccc gctccctcgt gggatacgcc cagcgtctcg ccgtgggtac 1741 gccgaagttc tttatctccc tgatcttctg catcgtatcc acggtattcc tgtccatgga 1801 ctaccccaac atcaactact tcttcctggc gcagttcaag gagaagtccc agcagaccat 1861 cctggaggcc aaaaactacc tggtcggtac catcggcggc atgctcaagt cctacgggct 1921 catcatgatg atcacctgga tcgaactgac gatcggctta aagatcatcg gactcgagga 1981 ttacatgacg gtggccctta tcatcgcgat cttcgacatc ctgccggcac tcggcaccgg 2041 cggcgtcatg atcccctggg tcatcatcga agtcgtccag ggcaactatt ccatgggcgt 2101 aaagctcctg ctgctctacg ttatcatcac ggtggtgcgc aacgtcctgg aaccgaagat 2161 cgtaggcgaa tccatcggcc tgcacccggt gctgctgctc atctccatct acgtgggcgg 2221 caccatcctg ggacccatgg gcatcgtcat catgcccttt accctcatcg tcatcaagaa 2281 gctgaacgat gcggggcaca tccaggtctt ccgcagc // LOCUS sequence199 2309 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence199 VERSION sequence199 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2309 /mol_type="genomic DNA" /organism="" /note="sequence199" misc_feature <1..1534 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000251368.1:beta-N-acetylhexosaminidase" /note="WP_000251368.1 beta-N-acetylhexosaminidase (Streptococcus mitis) [pid:34.2%, q_cov:99.2%, s_cov:81.5%, Eval:5.4e-83]" /note="MGA_852" /locus_tag="LOCUS_5830" CDS 1703..2140 /product="PrgI family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011861115.1" /transl_table=11 /codon_start=1 /translation="MAYVPVPKDLTAVKTKVLFNLTKRQLICFGSGALVGIPLFFLIKG SVGNTTAALCMMLVMLPFFLFAMYEKNGQPLEKILWNIILVCFIRPKKRPYETNNFYAV LERQNKLDKEVGRIVYGKAHPSRQTGHRGSDRPSQETRQTI" /locus_tag="LOCUS_5840" /note="WP_011861115.1 PrgI family protein (Clostridioides difficile) [pid:66.4%, q_cov:82.1%, s_cov:88.8%, Eval:5.0e-41]" /note="MGA_853" ORIGIN 1 gggcctcaat atgctgatgc tgtactgtga agacagctac gacgtgcccg gagagccgta 61 cttcggctac atgcgctccc gctactccga ggacgacatg cgtgcgctgg acgactatgc 121 ggacatgttc ggtattgaga tgatcccctg tatccagacg ctggcgcatc tggaaaacgt 181 cctgcgctgg ccggcgttcg gggagatccg cgagtacggc gagtgcctgc tcgtcgggga 241 ggagaagacc tatgacttca tccgcgaact gctgatcgcg gcatccaggc cgttccggtc 301 aaggcgcatc cacatcggca tggacgaggc catggagttg gggcggcaca agtatctgga 361 tcgccacggg ctcgtcccgc gcacgcagat catgcgggag cacctggcac gcgtgacgca 421 gatcacgcgc gagctgggac tgcagccgat gatgtggagc gacatgttct tccgggcggt 481 caaccctagc ggcgggtatt acagcgagaa cgtccgattc gaccctgcct tccttgagac 541 cgtgccgaag gatgtgcaga tggtctactg ggattactat cattgggaca gcgaagactt 601 ctaccggaag tacatcgaca tccaccgcag cttcggcgag ccgattttcg caggcggcat 661 ctggacctgg ctgagcttcg gcgccaacta caccaagacc ctgcgcacca cgaatcccgc 721 gctgatggcc tgcaagcgga agggcgtgcg ggaagtcttc gccacggtct ggggcgacta 781 cggaacggag tgcagcgtct acgcgacgct gctggggctc tcgctgtttg cggagcacgg 841 atacacctgg gagctgtccg aagagaagct ccggcggcgt tttgagttct gctgcggtgc 901 gaaatacgac gacttcatga acctgcgata cttcgacgag acccccggcg tggagaagga 961 caatcttctg cagaagaacc cgtcgaagcc gctgatgtgg caggatatcc tgacgggtct 1021 ctttgacaaa aacatcgaag gtctgccgat ggatgcgcac tacgcaaagc tcgccgggat 1081 gctctccccc gcctgcgagc gcagcggcga atgcaacagc atgttcgcct tctgccgcga 1141 ggcggcgcgg gtgctggccg tgaagtcgga gatgggcctg cggctgaccg ccgcttacaa 1201 ggcaggcgac cgcgaagcgc ttcgccgctt cgccgcagac gagctgccct ctcttgccga 1261 acgagtaaaa gagctgcggc gggtacacat ggcgcactgg tacgagattt acaagcccat 1321 cggctgggac atcatcgaca tgcgctacgg tgcactgctg gcccgcattc agagtgctgc 1381 cgacgtcgtc gggatgtatc tcgacgggaa gctcgacgcc attcaggagc tggacgagcc 1441 gcgcctcccc tacaacggcg aggaaggcgt cgcgacttac gccggcttct acaaccgcat 1501 cgtttccgcc agccgcatcg ccgtttacta ctaaagaatg gcaggcttac gacgccatct 1561 cgggacgacc gggcagcggc tatgttttct tggctgactg aacctcagat aaacatcacg 1621 cagttatttc catctgcagg aaaaccgtca tccgaaatag ggtggcggtt tttcaaaccc 1681 caaaaccaga aagggtgaca caatggccta tgtacccgta ccgaaggacc tgacggcagt 1741 caagacgaag gtccttttca atctgacaaa aagacagctc atctgtttcg gcagcggtgc 1801 cctggttggc ataccgctgt tttttcttat caaaggcagc gtgggaaaca cgacggcagc 1861 gctctgcatg atgctggtca tgctgccgtt cttcctgttt gccatgtatg aaaagaacgg 1921 gcagccgctg gaaaagatct tatggaatat cattctggtc tgctttatac ggcccaagaa 1981 gcggccctat gaaaccaaca acttctatgc cgtattggaa cggcaaaaca aactggataa 2041 ggaggtaggc agaattgtct atggcaaggc tcacccgagc cgacaaacgg gccatcgcgg 2101 aagcgatcgc ccgagccagg agacaagaca gacgatataa gacagcacag gaaagcatcc 2161 cctttgagag aatgtatccc gacggcatct gcagggtaac ggatacctta tataccaaga 2221 ccatacgctt tgaagacatc aactaccagc tgaatcagaa cgaggacaag acggcgattt 2281 tcgacggatg gtgcgacttc ctcaattac // LOCUS sequence200 2282 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence200 VERSION sequence200 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2282 /mol_type="genomic DNA" /organism="" /note="sequence200" CDS complement(728..2227) /product="carboxypeptidase M32" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011016113.1" /transl_table=11 /codon_start=1 /translation="MTVFEAKEKLTALQRKMAAYEHAQSLLYYDGCTSAPKGSAGTRAN SLSILSEESYKLYTGEETVQLLEFLDAHKDELNEKEQRIVYLLLKDIREMAKIPMDEYV AYQELLVKADDVWHTAKETSDFALFEPYLQQIFDTNRKFAGYVAPEKDPYDHYLNEYEE GLSREVCDRFFDTLKARLVPLIRKVGEMPQVDTSCIKGHFIAQDQEKLAHWVMRVMCLD PAHIALSTTEHPFTTSLGSHEDVRITTHYYEENVSYSMFSVIHEGGHALYDSGSAEDMA FTALDGGISMGIHESQSRFYENILGRSKAFCGYVLPAMKALFPQMLGVTEDEFFKAINV VEPSLIRTEADEVTYCLHVLIRYEIEKRVMAGELAVHDIPAEWNRLYKEYLGIDVPDDK HGCLQDSHWSGGLIGYFPSYAIGSAYGAQFLQKMKQDLDVDALMAKGDFAPVNAWLKDK IWQYGRLYTPAQILDNVLGEPFDPNYYLDYLEEKCKAVYGF" /locus_tag="LOCUS_5850" /note="WP_011016113.1 carboxypeptidase M32 (Fusobacterium nucleatum) [pid:41.0%, q_cov:98.4%, s_cov:99.4%, Eval:3.5e-103]" /note="MGA_856" ORIGIN 1 gttctcccgg aacttctcca cgtcttcctt cgtgtagcag ttgcggctca tgcggtagta 61 acccagggtc gtgtagcctt cataacccag tttcttcccc atttcgtcgc gcaggtgcac 121 cagtttgtcg tagtgggcgt ccagagcttc ctggttatct ttataccact gtccttccgc 181 tttccaggca gcgaggcgtc tcgcgtcgtc cgggtcgttc ttgaatgggg tcatctgaga 241 cagcgtatag atgccgccct cgaaggggat ctgcgcggaa gccagcagct tttcgtaagc 301 atccgcctcg tcattctctg cctgcagcat cgggatgatc tccgggctga aggtcttgag 361 agccatgtcg ccgttgatga acatcagttc gccgtattcc gcggcaaacg ccttgcggaa 421 cgggctcgcc agcatggcgg ccgtccaggc ctggttgtat tcctgcagtt ccgggcccag 481 cgcgttccac cacttctgtt cgtcgtcgta gaacttgtcg cgggtatcga tggaatggcg 541 gatggagacg agctgcgcca gcgtgttcac gtggttgccc agctcttcgt tctccagaaa 601 gacggttttc gcctcttcgt aggtcttcgc ggccttcagt ctttcggtga acgccgcgat 661 ctgcttctta atgccgtccg cgtcgggccg gctgtagggc atttctgaaa acttcatgca 721 aattctccta aaagccgtag acggctttgc acttttcttc gagatagtcg agataatagt 781 tcgggtcaaa cggctcgccc agcacgttgt ccaggatctg cgccggcgta tacagtctgc 841 cgtactgcca gatcttatcc ttcagccagg cgttgaccgg agcaaaatcg cccttcgcca 901 tgagcgcgtc cacatccaga tcctgcttca tcttctgcag gaactgggca ccgtaggcgc 961 ttccgatggc gtagctgggg aaatagccga tcaggccgcc gctccagtgg gaatcctgca 1021 ggcagccgtg cttgtcgtcg ggcacgtcga tgcccagata ttccttgtac aggcggttcc 1081 actccgcggg gatgtcgtga acagccagtt ctcccgccat gacgcgtttt tcgatctcgt 1141 agcggatgag gacgtgcagg cagtacgtga cttcgtccgc ttccgtgcgg atgagggacg 1201 gctccacgac gttgatcgcc ttgaagaatt cgtcctccgt aacgcccagc atctgcggga 1261 acagcgcctt catcgccggc agcacgtagc cgcagaacgc cttactgcgc cccaggatat 1321 tttcgtagaa acggctctgg ctctcgtgga tgcccatgga gataccgccg tccagcgcgg 1381 taaacgccat gtcttcggcg gagccggaat cgtacagcgc gtgaccgcct tcatggataa 1441 cggagaacat ggagtagctg acattctcct cgtaatagtg ggtcgtgatg cgcacatctt 1501 cgtggcttcc gaggctggtg gtaaagggat gctccgtcgt ggacagcgcg atgtgagccg 1561 gatccaggca catgacgcgc atcacccaat gcgccagttt ttcctggtcc tgggcgatga 1621 agtgaccctt gatgcagctc gtatccacct ggggcatctc gccaaccttg cggatgagcg 1681 gcacgagcct tgccttcagc gtgtcgaaga aacggtcgca cacttctctg gacaggccct 1741 cttcgtattc gttgaggtag tggtcgtagg gatccttttc cggtgcgacg tagcccgcga 1801 atttgcggtt cgtgtcgaag atctgctgca gatagggctc gaacagcgcg aaatcgctgg 1861 tctccttcgc cgtgtgccag acgtcgtccg cctttaccag cagttcctgg taagctacgt 1921 attcgtccat ggggatcttt gccatctcgc ggatatcctt cagcagcagg tagacgatgc 1981 gctgttcctt ttcgttcagc tcgtccttat gcgcgtccag gaactccagg agctgaacgg 2041 tctcttcgcc cgtatacagc ttgtagctct cctcggagag gatggacagg gaattcgcgc 2101 gggtgccggc gctccccttc ggcgccgagg tgcatccgtc gtaatacagc aggctctgcg 2161 catgctcgta agcagccatc ttgcgctgaa gcgctgtcag tttctctttt gcttcgaaaa 2221 cggtcataga taaaactcct ttgatacgtt gggatcgcag cctgccaagg caagctgccc 2281 ta // LOCUS sequence201 2268 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence201 VERSION sequence201 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2268 /mol_type="genomic DNA" /organism="" /note="sequence201" CDS complement(194..979) /product="5'/3'-nucleotidase SurE" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000698379.1" /transl_table=11 /codon_start=1 /translation="MNILISNDDGVFKYGLKVLANALASMEDVNVYVFAPSQERSCAGH GLFLHEEQVVTPYSTEGFDRVEGVWACSGTPADCVKTGVSILRSKGIPINMVCTGVNHG SNLGRDIHYSGTISAAMEGLFLGIPSIAFSLCSHEALHFEAFPHLIPQVVKAAKGNVPR DTILSVNVPDIPADQLKGVRVCPIGPRDYTDGIEFVRKEGDSEVWLYVSKATYRDDPDP EWDVTAWQEGWVTITPVQMMHENARMMDLVRSWGISLEK" /locus_tag="LOCUS_5860" /gene="surE" /EC_number="3.1.3.6" /note="WP_000698379.1 5'/3'-nucleotidase SurE (Vibrio) [pid:36.9%, q_cov:95.8%, s_cov:96.4%, Eval:2.3e-37]" /note="MGA_858" ORIGIN 1 agcctcttcg acagcagtct taccaagggt gacggcgggg gtgttcttca gggtgccgcc 61 gaagctgccg atgggtgttc tggctgcgct ggcgattact acttctctca tgtgttttat 121 cctcctagat atgtgaatag tcccgcattt gcgggtaagt tataaccaat ttaatattgt 181 ataccgaaaa tgttcacttt tcaagggata tgccccagct gcgcaccaga tccatcatcc 241 tcgcattctc gtgcatcatc tgcaccgggg tgatggttac ccagccctcc tgccaggccg 301 ttacatccca ttccgggtcc ggatcgtccc ggtaggtagc cttggaaacg tagagccaga 361 cttcgctgtc cccttccttg cggacgaatt cgatgccgtc ggtgtagtcc cgcggaccga 421 tgggacagac gcggacgccc ttcagctgat ccgccgggat gtccggcacg ttgaccgaga 481 ggatggtgtc tctgggcacg ttgcccttcg ccgccttaac gacctggggg atgagatgcg 541 gaaacgcctc gaaatgcagg gcttcgtggc tgcataggct aaaggcgatg gacggaatgc 601 cgaggaaaag cccctccatg gccgcggaga tggtgccgga ataatggatg tcgcggccca 661 ggttcgagcc gtggttgacc ccggtgcaga ccatgttgat ggggatgccc ttcgaacgca 721 ggatcgaaac gccggtcttg acgcagtccg ccggcgtgcc gctgcaggcc cacacgccct 781 cgacgcggtc gaagccttcg gtgctgtagg gagtcaccac ctgctcctcg tgcagaaaca 841 gcccgtgacc cgcgcaggag cgctcctgcg acggagcgaa gacgtatacg tttacgtctt 901 ccatggaagc gagtgcgttc gccaggacct tcagtccgta tttgaagacg ccgtcatcgt 961 tgctgatcag tatgttcata acctttttcc ttttcaaagt atttcgcaaa ccattgtatc 1021 atattttgtt gttgaacata tgttctcttt cgaagtataa ttggattatg cagaacttcg 1081 aatccattat ggaaaaactg aagatcctta ccgatgccgc aaaatacgac gtctcctgca 1141 gcagctccgg ccacgagcgc cgggggcagg acggtcatct gggcagcagc gccgccatgg 1201 gcatctgcca cacctggacg gcggacggcc gctgcgtgtc gctgctgaaa gttttgtata 1261 ccaataaatg cgtctacgac tgtgcgtact gcatcaatag acggagcaac gatgtaccgc 1321 gggcagcttt tacgccccgg gaactggcgg acctcaccat ggaattctat cgccgcaact 1381 acatcgaagg gctgtttttg agctctgcgg tggacggcag tccggaccgc accctggagg 1441 agatctgcga agcgctgcgc attctgcgct cggactacgg ctttttaggc tacatccacg 1501 cgaaactcat ccccggcgcg agccctgaga tggtgcagcg catcggcatg ctggcagacc 1561 gggtgagcat caacatcgag ctgccctccc gggaaagcct ggctgccctg gcgcctcaga 1621 agacggcagc gggcatctta acgcccatgc ggcagatcac ggatacgatg gcggagcagc 1681 gttccctcac cggcgcgggc aataaatact cgaagtaccg ctaccgtccg aagcagctgc 1741 cggacagcaa tttcgcgcta ttgggcgaag aagcgccccg cgaaggccgc tattccacgg 1801 cgaagatggt gttccgcggc gccggcaaaa accttaccgt gcggcagatc gatgcgaaga 1861 tggcggtcaa ggaagaccgg tttgcgccgg cgggtcagac gacgcagctg atggtgggcg 1921 cctccggcga gagtgaccgc cagatcctcg ccctgtccca cgcgctgtac aagaatttct 1981 tcctcaagcg ggtctacttc tccgcctaca tcccgctgat gagctcccct ctgctgccgc 2041 aggtcgggtc ggctgtgccc ctcacccggg aacaccggct gtatcaggcc gactggttga 2101 tgcgcttcta cggtttcgac gcttcggaga tcctggacgg aaaggatccg aatctggatc 2161 tgcaactcga cccgaagatc gcctgggcgc tgcgccatcc ggaatacttc cccatggaga 2221 tcaaccgggc gagccccgaa gagatcctgc gcatccccgg catcggca // LOCUS sequence202 2268 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence202 VERSION sequence202 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2268 /mol_type="genomic DNA" /organism="" /note="sequence202" CDS complement(668..1768) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNKKSILAILLALAMIFSLAACSKDDAAEDESGSESTAAQSYSAG LDENGFFEGITAKDYVTLGQYEGLTVPADQLAITQAEIETEIDGLVSNYTDTKEVTDRA AQLGDTVNIDYEGFMDGEQFEGGTGNNPSLVLGSGSFIAGFEDGIVGHEVGDNFDLELT FPDPYPNNEELSGKPVTFVVTLNSISEEVEPELNDAFVKENFEENYGWTTVAEMRSGVE ETLKENAMYDYLFTQIEDFEVSEVPEALFQYQANNMKAYYEQMATMYGMTLDDFVSGMG IGTMDDIVETAREQLTASARSMLIYQAIAEDAGLSVTDEDIKAEFADMEESEYQDIVDH YGMPYIKCILLNNKVADFIYDSAIVE" /locus_tag="LOCUS_5870" /note="WP_003229611.1 trigger factor (Bacillus) [pid:33.7%, q_cov:83.3%, s_cov:73.3%, Eval:1.8e-39, partial hit]" /note="MGA_861" ORIGIN 1 ctttcttggc gatgaccaca gccatgccgg aggggcccat gttcttctgg gcgccggcgt 61 agatcaggtc gtgatcctcg accttgatgt tcgcgcccag aatggcggaa gaccagtcgg 121 cgacgaaggg aacggcgcct gtctggggtt ttctccacca ggtggtgccg taaatcgtat 181 tgttggcgca gatgtggaaa tatgccgccg tctggggcac catatctgcg gtgatgtcgg 241 gaatgtagga gaaattctcg tcggaagagt ccgcaacctt tacagcgtcc gtccagcgct 301 tgccttcggc gaacgccttc ttagagaact gtccggtgac cgcatacgcc gacttctgcc 361 cctgctttgc caggttcatc gccacagcgg agaactgcag cgtagcaccg ccctgcataa 421 acaggaccgc gtagtcctcg gggatgttca tgatgcggcg cagcgtggct tccgcattgt 481 cgatgatctc ctggaagctg gcgcttctgt ggctcatctc cagcacggaa cagccggctc 541 cgggatagtt gaacagatcc ttctgggcct tcagcagcac gtcctcgggt atcgccgaag 601 gaccggccga aaagttgaat actctttcca tgatgcctcc taaaaagaat gggttaaaac 661 aggtgggtta ttctacgatc gcgctgtcgt agatgaagtc tgcgacttta ttgttcagca 721 ggatgcactt gatatagggc atgccgtagt ggtccacgat gtcctgatat tcggattcct 781 ccatatcggc gaattccgct ttgatgtctt catccgttac ggacaagccg gcatcttctg 841 cgatggcctg atagatgagc atggaacggg cagaagccgt cagctgttcg cgcgcggtct 901 ccacgatgtc gtccatggtg ccgatgccca tgccggagac gaagtcgtcc agggtcatgc 961 cgtacatggt ggccatctgt tcgtagtaag ccttcatgtt gttggcctga tactggaaca 1021 gcgcttcggg cacttcagag acttcgaagt cctcgatctg ggtgaagaga taatcgtaca 1081 ttgcgttttc cttcagggtc tcctccacgc cgctgcgcat ctcggcaacg gtggtccagc 1141 cgtaattctc ctcgaagttt tccttgacga acgcatcgtt cagctcgggc tccacttctt 1201 cggagatgct gttgagggtg acgacaaagg tgacaggctt gccggaaagc tcctcattgt 1261 tgggatacgg atccgggaaa gtcagctcca gatcgaagtt gtcgcccact tcgtgaccga 1321 cgatgccgtc ttcgaaacct gcgataaagc tgccgcttcc caatacgagg ctcgggttgt 1381 tgccggtgcc gccttcgaac tgttcgccgt ccataaatcc ttcgtaatcg atgttgacgg 1441 tatcgcccaa ctgtgcggct ctgtccgtta cttccttggt atcggtataa ttgctcacca 1501 gaccgtcgat ctcagtctcg atctctgcct gagtaatggc gagctggtcc gcgggaacgg 1561 taaggccttc atactggccc agcgttacgt aatccttcgc ggtgatccct tcaaagaatc 1621 cgttctcgtc aagaccggcg gaataggact gggcagcagt gctttcgctg ccggattcgt 1681 cttccgctgc gtcgtctttg gagcatgctg cgaggctgaa gatcatagcc agcgccagca 1741 ggatggcaag gatgcttttc ttattcattg gttggttcaa atcctttctt tgcaaagttg 1801 taaaaacgat ttattatacc atattttagg gaaccggcgt atataattca tgaagatttg 1861 gtgatacaat aaagccatga aactcacttt caacctgaca tcctccgcgg aggaatgcgt 1921 attcctcgcg gacgcaaacg aaacaagaag acagttggaa ggctatgacg gactggagct 1981 gcaggtgatc gaggagccgc ccgaaggatt gatcgacccg catctcgtca tcgggctcca 2041 catgacctgc atcccctgct ggtatgcgct gtggacggga aatgaaaagg ccctgatcgg 2101 cgagtttggc gatcttgcca cggcggaagc gtattacggc ggactccgcc gcgagaccct 2161 tctggacaag ttccggcggg atcttttcta tgcgaagaaa ttcggtgcgg agtacctggt 2221 gttccacatc gcggaatgca acgttctgga gacttacacg gagaacta // LOCUS sequence203 2259 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence203 VERSION sequence203 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2259 /mol_type="genomic DNA" /organism="" /note="sequence203" misc_feature <1..1264 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011986938.1:V-type ATP synthase subunit I" /note="WP_011986938.1 V-type ATP synthase subunit I (Clostridium botulinum) [pid:33.3%, q_cov:91.7%, s_cov:59.4%, Eval:5.2e-57, partial hit]" /note="MGA_863" /locus_tag="LOCUS_5880" CDS 1286..1774 /product="V-type ATP synthase subunit K" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012869602.1" /transl_table=11 /codon_start=1 /translation="MLEFIESYNGLFFAFLGAALAVGLSCVGSAKGTGIVGEAAAGLLS QAPEHFSKCLILQVLPGTQGLYGIVVWFFALYTMGAFSGGIVPLTVTQGLAIFSACMPM ALGGLLSAIAQGRVAASSINIVAKKPNDWFKGTIMCGIVEFYAILSLLASVILLMRAL" /locus_tag="LOCUS_5890" /EC_number="7.1.2.2" /note="WP_012869602.1 V-type ATP synthase subunit K (Thermanaerovibrio acidaminovorans) [pid:46.2%, q_cov:97.5%, s_cov:94.6%, Eval:8.8e-33]" /note="MGA_864" ORIGIN 1 cgcggagcgg atcgataacg agatcgaata cgacgagatc aagatcgagc gcgcgaaggg 61 caaactgatg agcgaaacgg cttaccgcca gtacatccag cagagctggg acagcctcgc 121 cacgaagctg tacgagacgg aaagccgcag ccgcatgctg aattcggaga gttcctttgc 181 tatggaaggc tgggtgccgg aggaagacgt ccccggactg gaagctgtcc tcggcaacta 241 tatcgttcat gcggagttcg aagatccggc gccggaagaa tatccggacg tgccggtcaa 301 actgaagaac aacatcctca cccgctgcat gaacatgatc acgaacatgt actccctgcc 361 ggcctacgac ggtgtggacc ccaaccccct catggcgccg ttcttcatta tattctacgg 421 tatgatgatg gcggacatgg ggtacggcat cctgatgttc gcggcaggac tgttaatggt 481 caagaagatg aaggcccggg gcggcatgag agacttcggc gagctgctcc tctggtgcgg 541 cctctccacc ttcttgtggg gcgccgcgac cggcggcttt ttcggagact ttatcccgca 601 ggccatcaag atctttgacc ccgagagcac ctttaccatg ccggcgctgt ttacgccgct 661 ggaagacacc atcgccatcc tgttcggatc gctggcgctg ggcatcctcc agatctttac 721 cggcatgatc gtcagcgtca aagagaagtt taagagaggg gagttcaaga gcgccctgtt 781 cgacgaattc gcctggtggg cgatcctgtt cggcgtcgca ggcgccgtta ccggcgtcgg 841 caacgtggcc ggaaagcctg tgcttctcat cgcaggtgtt gtgctcctca tcgcaggctg 901 cgtcctgcag aacaaagggg ctgccagggt cacatccatc gtcggcaccg tctacaacgg 961 cgtaacgggc tacttctccg acatcctgtc ctacgcccgc cttatggccc tgatgctggc 1021 aggcagcgtc atctcccagg tgttcaatac cctgggcggc gttacgggga acatcgtgtt 1081 cttcgtcatc atctcgatgg tgggcaacct gctgaacttt gcgctcaacc tgcttgggtg 1141 ctacgtacac gatctgagac tgcagtgtct ggaattcttc aacagatttt ataaggacgg 1201 gggcaaaccc ttccgtcccc tggacgtgca gacgagatat tacaacgtta ctgaacgcga 1261 atagcgtatt taaggaggta aaatcatgct tgagttcatc gaatcctaca acggattgtt 1321 cttcgccttc ctgggcgcag cgctggctgt aggtctgtcc tgcgtcggtt ccgccaaggg 1381 caccggcatc gtcggtgaag ccgctgcggg ccttctgtcc caggctcccg aacatttctc 1441 caagtgcctc atcctgcagg tgctccccgg cacccagggc ctgtacggca tcgttgtatg 1501 gttcttcgcg ctgtatacca tgggcgcctt ctccggcggc atcgttcccc ttacggtgac 1561 ccagggattg gccattttct ccgcctgcat gccgatggcg ctgggcggcc tgctctccgc 1621 gatcgcccag ggcagagtgg cggcgtcctc catcaacatc gtggcaaaga agcccaacga 1681 ctggttcaag ggcaccatca tgtgcggtat cgttgaattc tacgccatcc tttccctgct 1741 ggcttccgtc atcctgctga tgagagcgct gtaggaagaa cccgtaggac gaaaggcaag 1801 cgaaatggct atcaatggag tagaacggat cgccgagcgc atcctgaggg acgcgcagac 1861 cgaagcggcg ggcattaaga aggtcgcgga cgaaaactgc gctgtcatcg atgcccaata 1921 cgagaaacag gccaaagacg cggccgcatc catcctggaa gcagcggaaa aggaagccgg 1981 cgaactgatc aagcgcatga agggcgaagc ggacatgcgg gcccgcagcg cgctgctgga 2041 ggaaaagcag tctttaatgc cgaaggcttt cgaggctgcg cagcaggaac tgttgaacat 2101 ggacgaacag acttaccggg catttctcgt aaaactggcc agcaaggcca gcgtttccgg 2161 aaaagaagaa ctggtgctga acgcgaagga tctggcccgc tacggccagg gactgtgcga 2221 tgagatcaac gaggcgctgg ccaaagcagg gaagacggc // LOCUS sequence204 2254 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence204 VERSION sequence204 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2254 /mol_type="genomic DNA" /organism="" /note="sequence204" CDS complement(446..1735) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKWFAIFLAAAMVFGLAACTSSENGPEGAQEPEVVRSDVPAEDQ IDVIVANKDLWLEPAENYATFYAVTDLNNNGRLEVIRCAQTGEWWSEDAFFEMSQDGKT LEALTFPFGDEHSHPDLVDHDEFPLYTGPEGRYLVATDNIFMGPVQQSDYQNYHVLDSL MIAEGTVEAGDIAWCQAMSEDANGDGLEENHIWYYGPEDEGMDRDGEWYVNAPAERFAG YNESVCSIAWWTPDTSETPEDDYTDEALNVGLHYSWDGFGVREDAEVFASLIEDPYYSF YAAGAGGAHIYRADEEVPYFPSFLDLYGTWYIQYAWNDDGITYMGAGLSASELEILSNG LLYASYSNENDPRGAYLFTEMRMVSDAKADGTDADDWVVVYESDDGLWQMQLRPDPENQ MLYVTWYEWTEADHSDEPTGMNLVYSRTAG" /locus_tag="LOCUS_5900" /note="MGA_867" ORIGIN 1 ctggaaacga tcacgatcct ttgggtctgc cagtcctctc cgcagtcctg tgcgatgaga 61 tcgcaggaaa agcggaggtt ttcccgggtg tcggaggcgg cttcctccgc gatgacccgt 121 tcaggatcca cgcccttctc gagaagccag ttacgcatgc actggccttc gctctccggt 181 tcatccgggc cctgcccgcc ggtaacgacg gccttggcat ccggatagtt ttccagatag 241 gccagcgctg cccgcaggcg gtcgtccagc gcgcgggacg gtccccaggg gtcgaccttc 301 gcgccgagaa cgataatata atccgcgtct tcgtagttct gccccttgct ggcccggatc 361 accaggcttt ccgaaacgca gaacgtaatg gcgccgatcg cgataacggc gaggaggatg 421 cccagaacga tcttcaaggc ttttctcatc ctgcggtcct cgaatagacc agattcatgc 481 cggtgggttc atcggaatgg tctgcctcgg tccattcgta ccaggtgacg tacagcatct 541 gattctccgg atcgggccgc agctgcatct gccacaggcc gtcgtcggat tcgtagacga 601 ccacccagtc gtctgcgtcc gtgccgtccg ccttggcatc ggagaccatc cgcatctccg 661 taaacagata ggcgcctctg gggtcatttt cgttgctgta acttgcatag agcagtccgt 721 tgctgaggat ctccagctcg cttgcggaca ggccggctcc catataggtg atgccgtcgt 781 cgttccaagc atactggata taccaggtgc cgtagagatc cagaaagctg gggaagtaag 841 gcacttcctc gtctgcgcgg tagatgtggg cgccgcccgc gcctgccgca tagaagctgt 901 agtacggatc ttcgatgagg gaagcgaaga cctccgcgtc ttcccggacg ccgaagccgt 961 cccagctgta atgcagcccc acgttcaggg cttcgtccgt atagtcgtct tccggcgtct 1021 ctgaggtgtc cggggtccac caggcgatgc tgcagacgct ctcattatag ccggcaaagc 1081 gctcggcggg ggcgtttacg taccactccc cgtcccggtc catgccttca tcctccggac 1141 cgtaatacca gatatggttc tcttccagcc cgtcgccgtt ggcgtcctcc gacatggcct 1201 ggcaccaagc gatatcgccg gcttccaccg tgccttcggc gatcatcaga gaatccagca 1261 cgtgatagtt ctggtaatcg gactgctgca ccggacccat aaagatgttg tccgtcgcaa 1321 cgagatagcg gccttccggt ccggtatata gcgggaattc atcgtggtcc accagatccg 1381 ggtgggaatg ctcgtctccg aaggggaacg tcagcgcttc cagcgtcttt ccgtcctggc 1441 tcatctcgaa gaacgcgtcc tccgaccacc attcacccgt ctgggcgcag cggatgacct 1501 ccagccggcc gttgttgttc aggtccgtga ccgcatagaa cgtagcgtag ttctccgcgg 1561 gttcgagcca cagatcctta ttggcgacga tcacatcgat ctggtcctct gcgggcacgt 1621 cgctgcggac gacttccggt tcctgcgccc cttccggacc gttttcggaa gacgtgcagg 1681 ccgcaagacc gaataccatt gccgccgcaa ggaaaatcgc aaaccatttc ttcatggagc 1741 acctcccccg gtgttacgcg acaccgttcg taaacgttaa cttcatgatc tgcggatccg 1801 cgccgggatc ctcttcgctc caccaatacc aggtgacgta cagtctgccg tcgtcagcgc 1861 cgatggtggc ttcgaaacgg ttgaggccgt cttcgctgtt gaacacgacc atccagcccg 1921 ccgcatccac aggcgcgtcc gtcacttcgg ggtctgcggc ttccgccggt tcctccgcag 1981 catgacccat gccgtcctcc gccatggaga tgggcatgcc ttcgaggctg atctcgcccc 2041 gggcatctgc cggatcgttc caatagaaat ccgccttgcc gtcctgaccg atgatcaggt 2101 ggcagtccag ctcgccgaag tcttccgccg tgcggacttc cagttccgtg gcggcctcga 2161 ccagctgcca gtagtccgcc aggctctcca tgccgtaggt gatgtcggcc ttttcgccgt 2221 tttcatagag ttcttcgtaa taagacgatg gagc // LOCUS sequence205 2252 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence205 VERSION sequence205 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2252 /mol_type="genomic DNA" /organism="" /note="sequence205" misc_feature <1..1476 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010966446.1:biosynthetic-type acetolactate synthase large subunit" /note="WP_010966446.1 biosynthetic-type acetolactate synthase large subunit (Clostridium) [pid:43.1%, q_cov:98.4%, s_cov:86.6%, Eval:2.6e-103]" /note="MGA_869" /locus_tag="LOCUS_5910" CDS 1486..1980 /product="acetolactate synthase small subunit" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012545180.1" /transl_table=11 /codon_start=1 /translation="MRSVVAIYVENNFGVLTRVAGLFMRKGFNIDTLSVGETEDPRYSR ITVVFDGDEYGRGFLIKQVGKLHEVKKIKLMETDNNIEREHMLVKVRNTTESRAELKSA ADLYHASIVDFNPDVICVEVSGEPKIMEEFLNKMKPLGIVEMCRSGIICIDCAGNIFDA V" /locus_tag="LOCUS_5920" /gene="ilvN" /EC_number="2.2.1.6" /note="WP_012545180.1 acetolactate synthase small subunit (Thermodesulfovibrio) [pid:40.9%, q_cov:93.9%, s_cov:94.5%, Eval:1.3e-28]" /note="MGA_870" ORIGIN 1 gcgacttccg gtcccggtgc cacgaacctg acgacgggtc ttgctgccgc catgatggat 61 tccgttccgg tggtcgcgat caccggcaat gtgccgacct atttcatcgg caaggactct 121 ttccaggaga tcaacactat cggcatcacc atgccgatca ccaaacacaa tttctacgtc 181 accgacgtta caaagcttgc ggagatcatc cgcgaagctt tccgcatcgc gaaatccggc 241 cgtcccggcc ccgtcctcgt ggacatcccc agcgacgttc aggcggcgga aacggatttt 301 acaaagtggt acgaggtaca gccttatcag gaagaccagg cgcccgagag cgagatctgg 361 aaagccgtgg agctgatcaa caaggcgaag cggccctaca tctacgtggg cggcggagca 421 gccagccgga acctgggcaa ggcggtcatg gcgctggcag ataagatcga cgcctgcatc 481 ggcagcacgt ttatgggcct ttcctgtgtt cctggcagct gcgaacgcta cctgggcatg 541 cagggcatgc acggccgcta cgcctccacg aaggccaact gggaggcgga cctgatcatc 601 ggcatcggcg tgcgcttttc cgaccgggct acgggcgatc agaaagccta tagagacagc 661 aggagcatca tccagatcga tccggacttc tctgagatca acaagaatat caacgtggat 721 gtggggctca tcggcgacat cgtcttcgcg gtcgaccgca tcctgaagaa cgtaaataaa 781 gcggagcatc cggaatggat gagccgcatc gcagaactca aaaaggaagc gaaagccatc 841 cgcgaccatg cggaggagac ggcggaagat ccctttacga gcattaaact gttcgacgcc 901 atcaacgagc tgaagaccga cgatacgatc atcacgacgg acgtgggcca gcaccagatg 961 tgggcgggtc agttcctgga attcgaaaag ccgcgcaaat tcctgtcttc cggcggcctg 1021 ggcgccatgg gctacggcct gggcgccgcc atcggcgcaa accttgccac gggggaaaga 1081 actgtaatga tcacgggcga cgccagtttc tccatgaacc ttatcgaact ggcgacggcg 1141 gtctcctata agacgcccat cgttatcgtg ttgctcaaca acaactcgct gggcatggtg 1201 cggcagctgc aggccgtgta ctgcgacagc cgctattccg ctacgcttcc ggacagaaag 1261 accgatttct gcatggtggc gcaggggttc ggcgcggcag cgaagcgggt cacagacatc 1321 gatgctttta agtctacttt tgcagaagcc cttgtctcgg atagacctta cgtgatcgag 1381 gccatgatcg acacctggga gatggtgctc ccgatgctgc ccaacggcgg aacgatagac 1441 gatcttatta ccgaaaaacg gcagaagaca gagtaggagg atgccatgcg aagcgttgta 1501 gcgatctatg tggaaaataa tttcggcgtc ctcaccagag tcgccggcct gttcatgaga 1561 aagggcttca acatcgatac cctgagcgtc ggcgagaccg aagacccccg gtattcccgc 1621 atcaccgtcg tcttcgacgg cgacgagtac gggcggggct ttctcatcaa gcaggtggga 1681 aaactccacg aggtaaaaaa gatcaaactg atggagaccg acaacaacat cgaacgcgag 1741 cacatgctcg tcaaggtgcg caatacgacg gagagccggg cggaactgaa atccgcagcg 1801 gacctctacc acgccagcat cgtggatttc aacccggacg tcatctgcgt cgaggtgtcg 1861 ggtgaaccca agatcatgga ggaattcctc aacaagatga agcctctggg catcgtggag 1921 atgtgccgct cgggcatcat ctgcatcgac tgcgccggca atatcttcga tgcggtatag 1981 attctgttat cacttatttg tcatatacat agttctttta taacaaggag agtaaacatg 2041 cagagaattt tctatcagca ggactgcaat ctggacaagc tcaaggataa gacagttgcg 2101 atcatcggtt acggttctca gggtcacgcg cacgcgctca acctgatgga atccggcatc 2161 aaggtcatcg ttggcctgta cgaaggcagc aagagctggg aaaaggccga acagcagggc 2221 tgcacggtca tgaccgcagc agacgcagcc aa // LOCUS sequence206 2252 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence206 VERSION sequence206 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2252 /mol_type="genomic DNA" /organism="" /note="sequence206" misc_feature <1..609 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000008568.1:M3 family oligoendopeptidase" /note="WP_000008568.1 M3 family oligoendopeptidase (Bacillus) [pid:44.8%, q_cov:95.0%, s_cov:33.9%, Eval:1.0e-46, partial hit]" /note="MGA_872" /locus_tag="LOCUS_5930" CDS 609..1178 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAFGDRKKKKYAEFIETASGEVVYVGKYYVYMPDNPLPYNRYRIA LALCCTGAAALVAAAGLYRAPGMDRTLYVLLPYVILLGFTALMCYRGAKVVRAGNPLRA FDYRNALGPMQHWALASAVFAAILLVCYFVHLVRAGAEGCSMAAVVSFPLMIALIAVSD LGLLYVVRKNGWREAEETPDSGENEE" /locus_tag="LOCUS_5940" /note="MGA_873" misc_feature complement(1235..>2252) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011087584.1:FAD-binding oxidoreductase" /note="WP_011087584.1 FAD-binding oxidoreductase (Bradyrhizobium diazoefficiens) [pid:28.4%, q_cov:95.6%, s_cov:51.6%, Eval:7.1e-27, partial hit]" /note="MGA_874" /locus_tag="LOCUS_5950" ORIGIN 1 accatcgcgg acaaccgcta tgtggtggag ctcaacgtgg gcggcatgga gacggcggag 61 actcactcca tgagcatgga gttcttcgcc tggccctggg aagagggctt cttcggagag 121 gatacccgca agttctacta cagccacctg gcaggtgcgc tgcagtttat cccctacggc 181 acgctggtgg accacttcca gcacgaagtc tacgccaacc cggactggac tccggcgcaa 241 agacacgcct gctggaagca gctgcagcag atctatatgc cctgggtaaa gctggatgga 301 gacatcccgt tctacagcga aggcatggcc tggcagagac agcaccacat ctactccagt 361 ccgttctact acatcgatta ctgcttggcg cagaccgtat cgctggaatt ctgggcgctc 421 attcagaagg atttcaaggc ggcctggaag acctatatgg actacaccgt gcagggcggc 481 agcgacacgt ttaccaatat gctgaagaaa gccggcctgg atacgccgtt cgacgaagcg 541 tgcctcaaga acgcttccgc cgcggcgaag aaatggctgg atgagttcga cctgaccgga 601 atagagtaat ggcgttcgga gacagaaaga aaaagaaata cgcggagttt atcgaaacgg 661 catccggcga agtggtgtac gtaggtaagt attacgtcta catgccggac aacccgcttc 721 cttacaaccg ctatcgcatc gcgctggcac tgtgctgcac cggcgctgct gctctcgtgg 781 cggcagcagg tctgtaccgg gctccgggca tggaccgcac gctctacgtg ctgctgccct 841 atgtcatcct gctgggattt acggcgctca tgtgttaccg cggggcaaaa gtcgtgcggg 901 cgggcaatcc gctgcgcgct ttcgactacc gcaacgccct gggacccatg cagcactggg 961 cgctggcatc cgccgtgttc gccgcgatcc tgctggtgtg ctatttcgtt cacctcgtcc 1021 gggccggagc cgaaggttgt tccatggccg ccgtcgtcag ctttccgctg atgatcgcgc 1081 tcatcgccgt atcggatctg ggactgctgt acgtggtccg caaaaacgga tggcgcgaag 1141 cagaagagac gccggacagc ggggaaaacg aagaataaaa gaacgtaaaa aagtcccggg 1201 ccgtatggtc cgggactttt gtatgttcga aacgttattc gatggggatg cgcaccctgc 1261 agtcggagag gggataggca gcgcaggcgt ggatgtaacc gaagtcctta tccgcagccc 1321 gtcttccgtc gttctccggg cagatgaata cgttgccggc gaggagcttg ctgcggcaga 1381 acccgcattc gccgctgcgg cagcccgttt cgatgcggat gccggcgcgt tcgagcgcca 1441 cgacgatgct ctccgtcgct tttgccggga tcctgtcttc gtggatgccc cggacgaccg 1501 tcagttcgaa cgtcttatcc gccatgcctt cgggataacc ggcaaactgg gtgatatcct 1561 tcgcctggcc gaatacctcg aaacggatcc ggcgggcggg aatgcccatt ttgtccagtt 1621 ccccgtgcag gaagcggtac atcacctggg gtccgcagat aaagaacgtg cagtcgccct 1681 cagcatattt gcggatgagc tccgcggaga ggaatcctct ttcgcccggc cagtccggtt 1741 cgtcgccgga caggacgtgg acgatccgca ggcggtcgct cttcagctgc tccagttcct 1801 ccttcagggc gatatcgtcc gaggagacgg aaccgaacag gatcgtcaga tccatatcga 1861 gcgtgccgtg ggccacttcc ttcgccatgg acgcgaaggg ggtgatgccg acgccgccgg 1921 ccagcgccac gacgtgcttc gcatctctca gcggttcgta gtagaactgc cccagaccca 1981 tctgtccccg gaacgtatcg ccgggcttca cgttgtcgtt gatgtgatcg cagataaacc 2041 cgtcaccctt ggaacgccgc accgtgatct ccacgaaggg gtgatcgtcc agacgcgctt 2101 cgaacggcgc ggaggagatg gaataggggc gggagatgag gctgtctccg atggggaaat 2161 ccagcacgat atactgaccc gcgtagaacg ggggcagctt ctttccgtcc ggccgctcaa 2221 agcgcagcgt gacgctggtc ttgctggtgg ga // LOCUS sequence207 2243 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence207 VERSION sequence207 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2243 /mol_type="genomic DNA" /organism="" /note="sequence207" CDS complement(273..740) /product="Na+/H+ antiporter subunit E" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011024441.1" /transl_table=11 /codon_start=1 /translation="MFLFLFALWLVFNGRVTAETVLLGLLFAAAIFAFMCRFMDYSLEK DRKAIRLAPLVVRYFFVLLAEIVKSTFTACRFIVSPTLPHDPLLVKFRTPLSTDVARVT LANSITLTPGTITVSLDDGTYTVHCLDKSMAEGIESSRFVQLLLRMEEVTR" /locus_tag="LOCUS_5960" /note="WP_011024441.1 Na+/H+ antiporter subunit E (Methanosarcina acetivorans) [pid:25.7%, q_cov:90.3%, s_cov:87.3%, Eval:5.8e-12]" /note="MGA_876" CDS 912..1403 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAMFGSKKETPAPVVKAAPAPVVEEPVAPAVPEVKRPRTLIGPGI KFTGNIEASEDIEINGRVEGNISSGNTITVTEGGSIKGDIAAENYILDGVSEGNAKVQK FCKIGKAGSFTGELFASTLVTEDGSEFEGTLHLKKAKAPVFVQPEEPAPEEAPAEEPAF " /locus_tag="LOCUS_5970" /note="MGA_877" ORIGIN 1 gtagatgcgg gaaaagacca cgaccgcaag aaagctgatc atggcgtaga gcagcccgat 61 gtcgatcagg ctgggatctt taaggatggc ggacataaag acgatggcgg agatgaccat 121 cgtgccggcc atgttgatgg acaggatgcg gtccgcgatg cgcgggcccc ggatgctgcg 181 gatgatgcaa aacagaagaa gcagcgccaa cagggcgatg ccgccgatga ggatatagcg 241 ggagaacaat gcgagacggg ggtcggtaaa catcagcggg tcacctcctc catgcgcagc 301 agcagctgta cgaagcggct cgattcgatc ccctccgcca tgcttttatc caggcagtgc 361 accgtgtagg tgccgtcgtc cagcgatacg gtgatggtgc ccggcgtaag cgtgatggaa 421 ttggccaggg tcacccgggc gacgtccgtc gaaagcggcg tgcggaattt gaccagcagc 481 gggtcgtggg gcagcgtggg acttacgata aagcggcagg ccgtaaaggt ggactttacg 541 atctccgcga gaagtacgaa gaaatagcgg acgaccagcg gtgcgagccg gatcgccttg 601 cggtcctttt cgaggctgta gtccataaaa cggcacatga atgcgaaaat ggcagcagca 661 aaaagcagcc ccagaaggac tgtctcggcg gtgacccgcc cattgaatac gagccagagt 721 gcaaacagga aaaggaacat aggacctcaa aataccgata ttctctcaat tttattatcc 781 cataaactgc cttgtgctgg caaggggaaa tcccctcccg tctcgggctt gtgccgaccg 841 ttttcttgtt gtaaaataga aaggacatag agatcgtatc ctcaatttcg tatagaaagg 901 cagtatatac catggcaatg tttggttcaa agaaagaaac tcccgctcct gtcgttaagg 961 cagcgccggc tcccgtcgtc gaagaaccgg tcgcgcccgc ggttcccgaa gtcaaaagac 1021 cgcgcaccct catcggcccg ggcatcaaat tcacgggtaa catcgaggcg tccgaagaca 1081 tcgagatcaa cggcagagtg gaaggcaata tcagctccgg caacaccatc accgtaacgg 1141 aaggcggctc catcaagggc gatatcgcag cggagaacta cattctggat ggcgtatccg 1201 aaggaaatgc gaaagtccag aagttctgca agatcggcaa agccggcagc tttaccggcg 1261 aactgttcgc ttccaccctc gttacggagg acggttccga attcgaaggc acgctgcatc 1321 tgaagaaggc aaaggcaccg gtcttcgtac agccggaaga gcccgccccg gaagaggctc 1381 cggcggaaga accggccttc taaacccgca accctgaggg cgagcaagtc tcgccctttt 1441 ttataccgtc ggttggagtg tttttatgaa tatctttaat gtgatctcac tattgggcgg 1501 tctggccatg ttcctgtacg gcatgcgcat gatgggcgac ggactgaagg aaagctcgtc 1561 cggcaccctg aagatcgcca tggagcaggt gacgaacaat ccctttaagg cgtttctgct 1621 cggcgttctc gtaacggcca tcatccagtc atccaccgcc accatcgtca taacgtccgg 1681 tctggtgggc gccggcatca ttacgctcaa acagtcgctg ggcatcgtca tcggcgccaa 1741 cgtcggcacc acggtgacgg gccagatcat ccggctgctg gacgtcgacg attccgccac 1801 ctcctggctg cagttcttta aaccttccac gctggcaccc ctcgccctca tcatcggcat 1861 ggtgctcatc atgggcttta agtttaagaa ctccagccga atcggcacca tcgccatcgg 1921 cttcggcatc ctgttctccg gcctcatgaa catgacgggg tctgtcacga gcctgtcgga 1981 cagcgggctt ttcgaaaaca tgttctcccg cctgggagac aatccggtcc tgggatacct 2041 caccggcgcc ggcatcgcgt tcctgctgca gagctcgtcc gcgaccatcg gtatcctgca 2101 ggctttctcc atgacggggc tgctgtcctg gaacgccatc tacgctgtca tcgtcggcat 2161 ctatctcggc gactgcgtga ccaccgccat cgtctgttcc atcggggcaa agcccgaagc 2221 gaagcgggtg ggcgtggtca aca // LOCUS sequence208 2236 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence208 VERSION sequence208 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2236 /mol_type="genomic DNA" /organism="" /note="sequence208" misc_feature <1..1081 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005814361.1:TetM/TetW/TetO/TetS family tetracycline resistance ribosomal protection protein" /note="WP_005814361.1 TetM/TetW/TetO/TetS family tetracycline resistance ribosomal protection protein (Desulfitobacterium hafniense) [pid:41.1%, q_cov:96.4%, s_cov:40.0%, Eval:1.4e-71, partial hit]" /note="MGA_879" /locus_tag="LOCUS_5980" CDS 1082..1825 /product="RNA-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003232140.1" /transl_table=11 /codon_start=1 /translation="MEKEEKLLLAQAEDKARQRNNRNILTHTGFLSMAEQALLEHTHPD GTFYGGYEDAERCMLVFLPDWLTDIPAEDGPVCVLRVTLPKGASKLTHRDYLGSLLALG VERSVIGDILVQENGADILVSADMADYLVQNYVQAGRTSLSCTILPLSALRPGVFTVET RRDTVASLRLDSVLASMFSMSRGKAQEAIHMGLAAVNNRIVDKPDHFLSEGDKVSLRGK GKAVLKEVGGKSRKDRDCIVFERYL" /locus_tag="LOCUS_5990" /note="WP_003232140.1 RNA-binding protein (Bacillus) [pid:37.2%, q_cov:88.3%, s_cov:86.0%, Eval:4.1e-33]" /note="MGA_880" ORIGIN 1 cgcggtgcgc cagggcctga tgtgcgcgaa aaacgtactg ctggaaccct ggtaccgctt 61 ccgcctcgag gtgccgcccg aatgcatcgg cagagccatc ggcgacgtaa aggccatgca 121 cgcggaattc gaaggcccca tcgacagtgt ggacagcctg ctccttaccg gcacggctcc 181 cgtatcggag atgcaggact accagaagga actgctctcg tacacgaaag gccgcggcaa 241 gctgacttgc cgcttcgagg ggtatttccc ctgccacaac acggcgaagg tgatcgaaga 301 gaccggttac gacgcagagc gggacgccga taatccagcg gactccgtgt tctgctccca 361 cggtgccggg gtcaacgtaa aatgggacaa agtccgggac tttatgcacg tggacagcgg 421 cctgcgggta gcggacggcg aggtcgtaga ggcatcttcg cccaaggtgc gcaccgccgg 481 cagcctcgat ctggacgagc gggcgctgga agagatcatg gcgcgggagt tcgggcccat 541 caagcggccc gtctacagtg cggtgacccg gggagaaaag gccgcgaaag acgccaaacg 601 gcaggagatc cgcaaagact acctgatcgt ggacggttac aatgtgatct tcgcctggga 661 cgaactaaag gagctggcaa aaggcagttt cgcgggcgcc agagaacgtc tcgtcgaaat 721 gctcgtaaat taccacggct accggggcgg cgagctggtc ttggtcttcg acggttacaa 781 agtaaaggga aatcccggca cacgggaaga gaccggcggc atccatgtag tctacacgaa 841 ggaaaacgaa agcgccgaca actatatcga gaaactggtg cacgagatcg gaaagaacta 901 tcacgtgcgg gtggcgacct ccgacggact catccagctg acggctctgc gcatgggcgt 961 gcagcgaatg tcttcccgcg aactggagtt cgaggtgcgg caggcgctct cggagatcga 1021 cgacgtgctg gcgtcccagg acaggagcgc gtataagctg ggcgacctgg tggaactata 1081 gatggaaaaa gaagaaaaac tgctgctggc acaggcagaa gacaaggccc gccagcggaa 1141 caacagaaat attctcaccc acaccggttt tctctccatg gcggagcaag cgcttttgga 1201 acatacccat ccggacggaa cgttctatgg cggctacgaa gatgccgaac gatgcatgct 1261 ggtatttctg ccggactggc tgacagacat accggccgaa gacggcccgg tctgcgtgct 1321 gcgggtgacc cttccaaaag gcgcctcaaa actcacccac cgggactatc tgggctccct 1381 gctggcgctg ggcgtagagc gttccgtgat cggcgacatt ttggtgcagg aaaacggcgc 1441 ggacatcctg gtttccgcag acatggcgga ttacctggtg cagaattacg tgcaggcagg 1501 cagaacgtct ctatcctgca cgatcctgcc gctttccgcg ctgcgcccgg gggtttttac 1561 cgtggagacc cggcgggata cggtagcgtc tctccgcctg gacagcgtgc tggccagcat 1621 gttttcgatg tcccggggaa aggcgcagga ggcgatccat atgggactgg cggcggtcaa 1681 caaccgcatc gtggataaac cggaccattt cctctccgaa ggcgacaaag taagcctgcg 1741 gggcaaagga aaagcagtcc ttaaagaagt cggcggcaag agccgcaagg accgggactg 1801 catcgtgttt gagcgctatc tgtgatcaac aaaataagta aataaaagcc gaaccatacg 1861 gttcggcttt tttcatgctt tcgctgcact atttgcaggt ttccacgaag gccttgaaga 1921 tcttcttcat gtcttcgttg tcgtacatct tccttgccaa ggttgtcttt ttgtgggtac 1981 aaacctattt tatttcttca gcaatctcgg tgcaagcaga actgccagcg ccagaccgca 2041 gatgcccgcc gtaagcttcg cggcgatcat ggggacggaa acttccgggg cggcagccgc 2101 cagataggca agatggtcgc cgaacacgaa gcaggcggac gtagcaaacg caacattcag 2161 catgcggcct ttctcgtcca tcaggggcag atccgccagc gtcggcagcg aactggccag 2221 cgtggtcagg aaatcc // LOCUS sequence209 2235 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence209 VERSION sequence209 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2235 /mol_type="genomic DNA" /organism="" /note="sequence209" misc_feature complement(826..>2235) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012047966.1:M20 family metallopeptidase" /note="WP_012047966.1 M20 family metallopeptidase (Clostridium botulinum) [pid:30.7%, q_cov:95.1%, s_cov:80.8%, Eval:2.1e-57]" /note="MGA_883" /locus_tag="LOCUS_6000" ORIGIN 1 gttggacacg ggacaagtgg cgaccgtcgc ccccttctcc cggatgatat ccatatcgct 61 ctcctcgatc cacacgcagt gggccagggt agcgggcaca tccagcaggc cgcagtccgc 121 cagatattcg atgtcggtgc ggccgtttct gcgcaccttg cactccgccg cttcgctctt 181 cgtctccgcc gcgtggatat gcagatgcac gccctgctct ttcgccagcg ccgcgaggcc 241 cttcgccacc ttctcggtgg aggtgtactc gccgtgcagc gccagatccg tcaggatgcg 301 gccgtctgcc gccccgtgcc attgtttata ggcatcgcag gcgatcttat aagccggcag 361 atcttcgaat gcagaatcgt cgaagcacag cacggcgttg ctcatgttca tcttgcagcc 421 ggcttcggcc accgccctgc ccgcatcatc aagccagtaa tacatgtccg tggagctcac 481 gatgccgctg cggatagact ccgccatggc cagcttcacg cccgtgtaga tgtcgctgcc 541 caccatcttc gcctcgaagg ggaagatctt ggtgttgagc cagtcctgca gattcatgtt 601 ttcggcgtag ccccgcagga gggtcatggc gctgtgggtg tgggcgttgt agaaagccgg 661 catcaacagc tttccctgcc ccctataaac agagccgaag tcttccttcg gctctgcagc 721 tcccacatac gcgacgcgtc cgtcctttac gcccacgaac tggtgctcgc ggaccgcaaa 781 gttctcgtct aagatcgtaa tgtcggaaaa tatcatgttt tgtccctact tccaaagaga 841 ttcgatcagt tcctgggtca cggcgggcag ttcttccagc aggctcttct tgagcgcgcg 901 ctcggtccac tggtgatatt ccttcgtgat gggtccgtac aggataaacg gaatgttgtt 961 cgcttcgatg gtcttgaagt ccacggtgta cagctggccg tagcacggcg tattcaggga 1021 gaacttgtcg taatcgaagg ggtgacccac cgcagtatag gaaccgtcgg aaatacccat 1081 gaagtagtgt tcgttgaagg attctctgcc gaacttttcc ttggcagcct tctccacgac 1141 ttcgtaagcc ttgagggcgg cgttttcctt gcccttgacg gcgtcgccgt tgacagccgg 1201 ataataggga ggcgcgaagc ccagcagcac ggtgggctgc ttgaggtctg cgtagtccat 1261 gaccttctgc atgatctcta ccgtggcatc ggggaagttg atgcggcctg cttcgatgtc 1321 gtccttaatg ccgttgtaga cttccgcgaa gaacttctcg aaaccttctc tgtcggtctg 1381 cttgatctta gcgaccagtt cctcgaaggt gtagacctcg ggatagtaga ccaggtggtc 1441 cttatcggcg gacttgtcga tcttcttgta ttcctgatag gtagcgtcga tcttggcgca 1501 ctcttccttc aggacctcca tggagatctc cttgaggcgt gcgatgatct ggtccggcgt 1561 tctgtcgaag tgcagcagcg taaagtagcc gtaagcccgg agaggaatgg ttacgtcgta 1621 cagttccttg ttgtcgcgga acttctgcca ggtgggcggg caggctgcct cgccgtcgta 1681 ggaatcggag aattccagcg cgttgttggt tctctgatag atgcctgcca ggaagttcat 1741 gggggagatg ccgttgaagc agtgacccac gtgagcggtg acgccctggg ccatgacgac 1801 gggcatcagc ttgccgacgg tacctctgga gaaggactgc ttgccgccta cccagttgga 1861 gggttcgggg atgatcatca gctgaacgtc cagctgatac tgctcgacca gtctgcggat 1921 gatcttggcg ccctctctca taccgacgga gaagctttcc tcgtcaggta cgggcagata 1981 catgtagcag ccgggcagtt cgcccttctg cgccatctcg gcgtattctt cgaacagtgc 2041 cagatgaacg gcatgtccgc ccttcatatc gcctacgccg cggccccaga tccattcgcc 2101 gctgttcatg tcgaaacggg cttccgcatc cagatttctg gttgccagag ccttttcgag 2161 ctcttcgcct acgtggaagg ccatgtcctt taagggaccg tagttatcgg tgccgactac 2221 gtcgaagtga cccga // LOCUS sequence210 2234 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence210 VERSION sequence210 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2234 /mol_type="genomic DNA" /organism="" /note="sequence210" misc_feature <1..1138 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012582490.1:M20 family metallopeptidase" /note="WP_012582490.1 M20 family metallopeptidase (Dictyoglomus turgidum) [pid:36.1%, q_cov:99.5%, s_cov:96.9%, Eval:3.0e-61]" /note="MGA_884" /locus_tag="LOCUS_6010" ORIGIN 1 cccggagatc gtcgcgatcc gcagagatat ccatcagcat gcggagaccg gttttcagga 61 attccgcaca tcgaagatca tcaaggaata tttaaaggag ctgaacctgg acagcattca 121 ggaatgcgcc gggaccggtg tgatcgcgac cctcaaaggc ggaaagccgg gaaagcgcat 181 catgctgctg gcggacatcg acgcgctgcc catggaggag aagagcggag aaccgtttgc 241 atcggaaagc aagacggcgg gtcactgctg cggtcacgat gcgcatactg cgatccagct 301 gggcgttgcc aaagttctgg cgaagcaccg ggacgaaatc cccggcagtg tcgtcttcct 361 gttccagccc aacgaggagg atgccggcgc acagatcatg atcgacaacg gtgcggtgga 421 gatggcgggt cacccggatg cgatcttcgg cagccacaac agcccagccc tgcggcttgg 481 ccagttcggc gtcgttcccg ggcctgcgat ggcttccagc tattattata agatcgtgat 541 ccgcggcaag ggcggccacg gaggcagacc ccacctggcg gtgaacccgg tggatgccag 601 cgctttcgtg ctgctggcga tcaagaacat gatcacggcg gagcagtcgg cgctggaacc 661 caccgttatt acgaactgca tgatccacgg tggggagaag gagatcacga tcccggagac 721 ctgcgagatg caggggtcca tccggtgcct gcatgcgggt cacgaagcgg tgcacgcccg 781 gtttaaggaa gtcgtggcgg cagcctgcgc catcaacggc tgcacctgcg agatcgagct 841 gaagtgcggc aattcgctgc tgtacaacga tccggatctg gcggaactgt gcgccgagac 901 catcaaggag gctttcggcg aggactgcat cgtaacggag ggcgtaaagg ctatgggcgg 961 cgacgattat gcagaattcc tgccctacat gcccggcaat tacatctggt atggaacggc 1021 ggatgacacc ggggagtggc cggggctgca taatccggcc taccgcttta acgaaaaggc 1081 gatcccgctg tttatggaag cacagatccg ctgcgtcatg aagtatttgg agcagtaatc 1141 gaataggact attaacaaag tgtagttgta aaatgtgatg caaactacac tttgtttctt 1201 gttgagcctc ttttgttcct gtaaagtata agtgcaaaaa cctgttcaaa catttccatc 1261 catatacgaa aaggagcaaa accatgagtt tcaagaccga tcttcttcac gacaaccaag 1321 tccatcagaa gctgtggggc gactacaaga gcatcgcagc cacccatacc agcccgatct 1381 accagaccac gaccttcatc ctggacgact tcgacagcgc cgtctacctg aaccagcacg 1441 tggaccaggg cttcgtctac agccgtttcg gcggtccgtc cagcgacgaa ctggagagaa 1501 aagtagctca tctggagcac gcagaagcgg cgttggcgct ggcttccggc ctgggcgcca 1561 tctccacggc agctctgtcc tgcctgaagg ccggcgatca cgtggtcttc ggcgacgtca 1621 tctacggatg cacgtttacg ctgttcgcca aggtcctgac caatttcggg gtcacctaca 1681 ccagagtcga caccacggat ccccagaatg ttgcagacgc catccagccc aatacgacgc 1741 tggtctacgt ggagaccccg gccaacccga ccctgaagat ctccgacatc gaagcgatcg 1801 ccaagatcgt tcacgagcat gaaggcatga agctgatcgt agacagcacc ttcgcttctc 1861 cctatctgca gaaccccatc gatctgggtg cggatatggt cgttcacagc gcgacgaaat 1921 atctgtgcgg tcacggcacc gcaacggcag gcgtgatcgc cggccgcaaa gaactgatcg 1981 accgctgcag gatgcccttt atgcagtgct tcggcgctgt gcttggaccg ttcgaagcct 2041 ggctcgtcat gcagggcatg aagacgctgg ccgcccgcat ggacgttacc tgcgccaatg 2101 ccatgaaggt cgcgaagttc ctggagaacc atcccaagat cgaccgcgtg tactatcccg 2161 gtctggagag ccatcccacc cacgccatcg ccaagaagca gatgcacaac ggtttcggcg 2221 gcatgatgag cgcc // LOCUS sequence211 2233 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence211 VERSION sequence211 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2233 /mol_type="genomic DNA" /organism="" /note="sequence211" CDS 109..1587 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGRHTRKKKRVKIHYGRFCLFLGVVAAVIFAGILFWPLPAEAEPE VFDVDPLEEETVQEPVHLSIRAVGDVMCHPAQYQSAYNASTGEYDFSGNYIYLKKYIQD ADLALCNVETTFKGDGNYVGYPIFNSPDSLATAIKDAGFDVAWFANNHMIDTGRTGVMR TVELMRGEGMTVAGARLETSEPRSPIVDVKGVKIGIVAYTYETTTGERRLINGNPIWDG GTDYINSFRCESGLAYAVEADRAAIAAEIKGCKDRGADLVICYFHWGNEYQREYNAGEE KMAQFAADAGADMIFASHPHLLQGVDCFEYQVKYPEPEPEIVEPEPEPEEEKEPWIIRV RKHFGLIKEEEPVEEPEPVEEEPKPEFWTKKVPVFYSMGNLVSNQRVETMSDYIPAKAR FTEQGMVAWVDFDYDQETGEISNLQMQCLPTWVEKYKKNGHVEYYIIPLDKDLNSNPEL ANSGHLSRAQQALQDVKDLIEDPENPVCKVIDGY" /locus_tag="LOCUS_6020" /note="WP_005808454.1 CapA family protein (Desulfitobacterium hafniense) [pid:29.9%, q_cov:60.0%, s_cov:64.8%, Eval:7.9e-31, partial hit]" /note="MGA_887" CDS 1577..2095 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDIRFDLVKKLTKPLPKAKGITLRSLRTSEDGQSASAILMAGGYQ QIREEVENYRMLTGLPLNARSKGRSLELTSECGDGSALVLMDFLKWISFNSEDVMETIE FFDRYLGKDADSDIRVLSMDMSAEDLRIACALEAGEGETPESIFAYVSSLLDRYDMGII KEETAEETE" /locus_tag="LOCUS_6030" /note="MGA_888" ORIGIN 1 ccgttaagaa cggcatcgaa tccttcctga aggaaaactt tgcggaagtt aaggcagtag 61 aagctgtcaa catgtatcag ttctaaagag accggttaaa ttcagggtat gggaagacat 121 acgagaaaaa agaaacgcgt aaagatccac tacggcaggt tctgtctgtt cctgggcgtc 181 gtggcggcgg tcatcttcgc cggcatcctg ttctggcccc ttcctgcgga agcggaaccg 241 gaagtgttcg acgtggatcc tctcgaagag gagaccgtcc aggaaccggt gcatctgtcc 301 atccgcgcgg tgggcgacgt gatgtgccat ccggcgcagt accagtccgc ctataacgca 361 tcgacggggg agtacgattt ctccggaaac tatatctatc tgaaaaagta catccaggat 421 gcggacctgg ccctctgcaa cgtggagacc acctttaagg gcgacggcaa ttacgtgggc 481 tatccgatct tcaactcgcc ggattctctg gcgaccgcca tcaaggacgc cggtttcgac 541 gtggcgtggt ttgccaacaa ccacatgatc gataccggcc gcaccggcgt catgcgcacg 601 gtggaactga tgcgcggcga aggaatgacg gtggcaggcg cgcgcctgga gaccagtgag 661 ccccgcagcc ccatcgtgga tgtgaagggc gtcaagatcg gcatcgtcgc ctatacctac 721 gagacgacga ccggcgaaag acggctcatc aacggcaatc ccatctggga cggcggcacg 781 gattacatca actcgttccg ctgcgagtcc gggcttgctt atgccgtgga agcggaccgg 841 gcggcgatcg ctgcggagat caagggctgc aaggacagag gcgcagacct ggtgatctgc 901 tatttccact ggggcaacga ataccagcgg gaatacaacg ccggggaaga gaaaatggcg 961 cagttcgcgg cggacgccgg cgcagacatg atcttcgcct cccatccgca cctgctgcag 1021 ggcgtggact gcttcgagta tcaggtgaaa tatcccgagc ccgagccgga gatcgtggag 1081 ccggaacccg aacccgaaga ggagaaggag ccctggatca tccgggtgag aaagcacttc 1141 ggcctcatca aggaggagga accggtggag gagcccgaac ctgtcgagga agagcccaag 1201 cccgagttct ggacgaagaa ggtgcccgtg ttctattcca tgggcaacct ggtgtccaac 1261 cagcgcgtgg agaccatgag cgactacatc cccgccaaag cccgctttac ggagcagggc 1321 atggtggcct gggtcgactt cgactacgac caggagaccg gcgagatctc caacctgcag 1381 atgcagtgcc tccccacgtg ggtggaaaaa tacaagaaga acggccacgt ggaatactac 1441 atcattccgc tggataagga cctcaacagc aatccggagc ttgcgaacag cggccatctg 1501 agccgcgcgc agcaggcgct gcaggacgta aaggacctga tcgaagatcc ggaaaacccc 1561 gtctgcaagg tgatcgatgg atattagatt cgacctggtg aaaaaactca cgaaaccgct 1621 gccgaaggcg aagggcatta cgcttcgcag tctgcgcacg tcggaggacg ggcagagcgc 1681 ttccgctatc ctgatggcgg gaggttacca gcagatccgg gaagaggtgg agaattaccg 1741 catgctgacg ggtctgcctt taaacgcccg ctcgaagggc cgcagcctgg aactcacgtc 1801 tgaatgcggc gacggctccg ctctcgtgct gatggatttc ctcaagtgga tctccttcaa 1861 cagcgaagat gtgatggaaa cgatcgagtt cttcgaccgc tacctcggaa aagacgcgga 1921 cagcgacatc cgggtgcttt ccatggacat gtccgcggag gatctgcgca tcgcctgcgc 1981 cttggaagcg ggggagggcg agacgccgga gagcatcttt gcctatgtat catccctgct 2041 ggaccggtac gacatgggca tcatcaagga agagacggcg gaagaaactg aataaaacgc 2101 aagatgtggt gggttcaccg gaaggtgacc ccctatctat agaaagatgt gaaacacccg 2161 gatgagttgt cgtgaaatcg aagatatgca ttcgctgcat aaaccccgga aagccttaaa 2221 ataagcgctt ttc // LOCUS sequence212 2227 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence212 VERSION sequence212 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2227 /mol_type="genomic DNA" /organism="" /note="sequence212" CDS 321..1232 /product="transketolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010875269.1" /transl_table=11 /codon_start=1 /translation="MAKKTYTNEEIQQTANKIRKQVLKFAIERGGCYITQTNSSAEILA TLYLDVMNLGDSLGDPDGIPFPGVPGPDNMDFPRGSLYNGPTQAPYDRFFLSPAHYACT LYCTLFAVGRISETGIERFNKDGWIFEQIGAEHSPGFETTAGSLAQTISVACGTAHARK LKGEEGTIWCFMSDGELEEGQLWEAIQAAAFYKLDNFVLVCDINGQQIEGPTKEIMNTQ PLYDRFTAFGAKTVEIDGHDIQAIKDACHTAHPGQPLVVLCNTKPTHGMPFLDHRTERL HFVNVKTPEQIAEAKAFYDSME" /locus_tag="LOCUS_6040" /note="WP_010875269.1 transketolase (Sinorhizobium fredii) [pid:35.1%, q_cov:97.0%, s_cov:96.4%, Eval:3.1e-39]" /note="MGA_890" ORIGIN 1 gacgcggaag tcgtcgcgtt ctgcacggag atggtcgcgc gcatgctggt ggacggcaag 61 ctgcagtacg gagaggatct gcgccccgac gtggagaatc cgtactacaa atccccgaac 121 accctgaaga agatcgcagc ccgcgaggag cgcatccgtg caagaaaaca acagtgaccg 181 cagcgatgcg gacaggcctc cggcgctgcc gggggctttt gctattgatg gaagtttatg 241 atataattaa tcggttaaag ttttcgttga atcttggggc ataaacccat ttccggtata 301 gaaaagcaag gaggaaaagc atggcgaaga aaacgtacac caacgaagag atccagcaga 361 cagccaacaa gatccgcaag caggttctca agtttgccat tgagagaggc gggtgctaca 421 tcacgcagac gaattcgtcc gcggagatcc tggcaacgct gtatctcgac gtgatgaatc 481 tgggcgacag cctcggcgat cccgacggca tcccgttccc cggcgttccc ggtcccgaca 541 atatggactt cccgagagga agcctgtata acggccccac gcaggcgccc tacgacagat 601 tcttcctgtc tccggctcac tacgcctgca ccctgtactg cacactgttt gccgtcggcc 661 ggatctccga gaccggtatc gaacggttca acaaggacgg ctggatcttc gaacagatcg 721 gcgcggaaca ctcccccggt ttcgagacca ccgcgggctc gctggcgcag accatctccg 781 tcgcgtgcgg cacggctcac gccagaaagc tgaagggcga agaaggcacg atctggtgct 841 tcatgtccga cggcgaactg gaagaaggtc agctgtggga agccattcag gccgcagcct 901 tctataagct tgacaacttc gtcctcgtct gcgacatcaa cggccagcag atcgaaggac 961 cgacaaagga gatcatgaac acgcagccgc tgtacgaccg gttcaccgcc ttcggcgcca 1021 agaccgtgga gatcgacggc cacgacattc aggcgatcaa ggacgcctgc cataccgctc 1081 acccgggtca gcccctcgtc gtgctctgca acaccaaacc cacgcacggc atgccgttcc 1141 tggatcacag aacggagaga ctgcacttcg tgaacgtcaa gacacccgaa cagatcgcag 1201 aagccaaggc tttctacgac agcatggaat aggaggaaag cgctattatg atcatggaaa 1261 ccaacgtata ctccaagagc atcacagaat ggggcgcaaa acacccggag accgtcgttc 1321 tttctgcgga cctgggtacc tcctgcgaga tcatggattt taagaagaac tatcccgacc 1381 gttatttctc cctgggcatc gccgaacaga acatgatcgg ctgggctgcc ggtcttgcca 1441 gagaaggctt cctgccctat ctgcattcct tcggcgtctt cctgtacaga cgcgttctgg 1501 accaggtgga gatgtccgtg gcatacggca atctgcccgt aggcctcgtg ggcttcgttc 1561 ccggcctcac cacccccggc ggtgtatccc accagtccac caacgacatc ggcacgctgc 1621 gcagcgtacc caacatgcgc atctactcca tcgccgacgc gacggatatc gaaggcttcc 1681 tgcccatggc atacgaagcc ggcggtccgt tctacgtaag aatgctgcgt aagtctgttc 1741 ccagactgtt cccggcggat cagacgatcc agttcaacca cgcccgtatc gctgcagaag 1801 gctccgacgt ggcgctgttc acagaaaaca tcgcgaccga agaaggtctc aaggcggtca 1861 aggtgctgca gaaccacggc gtatccgtgc agatgctgtc cgtttccacc ctcaagccct 1921 tcaccgatcc gcaggtcgtc gacgccctga agaaggcgaa gtacggcgcg gtcacttacg 1981 agaaccacaa catcatcggc ggcctgggca cctgcgtggc ggaagtcatg gcggagaacg 2041 gcatcggcaa gccgctcatc aaggtcggcg tggacgatct gtacacccac ggcgcatcga 2101 agatgttcct gctgaagaaa tacaacgtgg acgccatgag ctgcatcaag gcagtcgaaa 2161 agctgatcgg caaagacctc ggcatcgaag aatccgagat cgaggccgtc cgcttcgaag 2221 atttcaa // LOCUS sequence213 2199 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence213 VERSION sequence213 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2199 /mol_type="genomic DNA" /organism="" /note="sequence213" CDS complement(367..1905) /product="DUF5597 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010920642.1" /transl_table=11 /codon_start=1 /translation="MARLIVEDRPFLSIAGESSNSASGSLAYMESIWPALRQIHLNTLL VPLCWDMVEPREGEFDFTVVDGIISQARREGVKLSFLWFGSWKNMVSSYAPSWVKLNPR RFPLLQDKNGGQIQMLSVFSDNNVKADAGAFAALMRHIRSVDAAEQTVIMMQVENEVGY TGGERDWADAARKAWRSAVPKELTDYLRTHRESLIPEFRAHWERFGARTSGSWSELFGD TPEGNEIFMSYHYAKYIGAVVAAGKREYAIPMFANAAIGRQDRKIASYPCGGPLPFVMD VWQCAAPQLDAISPDIYYGDFEGHCRAYTQNGNPLIIPETRGDDVGLGKALLAYAEHGA LCFSPFGIEGYAGRSIGSFYADLQQLAPMILSRIPGKTMRAVMVGSDTPVQTLEIGKYH VFCEYGHRGNQPAGETVGYALILQDEDDSFYVYGRNISLQFSLVERGAKNLVTGILDCE EGSFENGVWKPFRRINGDQIMNDYSFAAAYLDGRSGNGLRFGQAGVQYVRLYHY" /locus_tag="LOCUS_6050" /note="WP_010920642.1 DUF5597 domain-containing protein (Caulobacter vibrioides) [pid:35.9%, q_cov:99.6%, s_cov:78.5%, Eval:8.4e-84]" /note="frameshifted, insertion/deletion at around 705,654" /note="MGA_893" ORIGIN 1 aggtccagca aacgcaggtg ttcgttctgc cgcagattgc ccagcgtgtc cgtcagttcg 61 gcatcccaca tatgcaccct gtatgccttg agccccaggc gggtcagatg atagacatcc 121 tgccggatcc cttcttcgaa atcaagcccg agatcctggt aattcgcgta tgccgttgag 181 aacggcaggg cataatgcac gccgaactcc gcgatttcct gccgccctgc agtccagcgc 241 agaacgccgt tccggtccac gaaagcactc gggcgtcttt gcgcaaaaac agttgtttgg 301 ccggacagca gcaggaaaga aaggacaatg gatactaacg gtaatggttt catttttacc 361 tctgtctcaa taatgataca gtctcacgta ttgcacacct gcctggccga aacggagtcc 421 gtttccggag cggccgtcca gatatgccgc ggcaaaggag tagtcgttca tgatctggtc 481 gccgttgatc cggcggaagg gcttccagac gccattctcg aacgaccctt cctcgcagtc 541 caggatgccg gtgaccaggt tcttcgcacc acgttcgacc agggagaact gcaggctgat 601 gttacggcca tagacataga acgaatcatc ttcatcctgc aggatcaggg catatccgac 661 cgtctcgcct gccggctggt tgccacggtg gccatattcg cagaacacat ggtatttccc 721 gatctccagc gtctgcacgg gcgtgtcgga gcccaccata acggcccgca tcgtcttgcc 781 cggaatccgg gagaggatca tcggagcgag ttgctgcaga tccgcataga acgatccgat 841 ggagcggccg gcataccctt ctatcccgaa aggagagaag cagagggcac cgtgctcggc 901 atacgcgagc agggcctttc ccagaccgac gtcatcgccc cgcgtctccg ggatgatgag 961 cggattaccg ttctgcgtat aggcgcggca atgtccctcg aaatcaccgt aataaatatc 1021 cgggcttatg gcgtccaact gcggcgcggc gcactgccac acatccatca cgaagggaag 1081 cggacccccg caggggtaac ttgcaatctt gcggtcctgc cggccgatcg cggcatttgc 1141 gaacatcggg atggcgtatt cgcgcttacc ggcagccacg acggccccga tgtacttcgc 1201 ataatggtac gacatgaata tctcgttgcc ttcgggcgtg tctccgaaaa gttccgacca 1261 ggacccggaa gtcctggcgc cgaagcgctc ccaatgggcg cggaactccg ggatcaggga 1321 ctccctgtgc gtccggagat agtccgtcag ctctttcgga acggcggaac gccaagcctt 1381 cctggcggcg tcggcccagt cccgctctcc gccggtgtag ccgacctcgt tctcaacctg 1441 catcatgatg acggtctgct ccgccgcgtc caccgagcgg atgtgccgca tcagcgcggc 1501 gaaagcacct gcatccgctt ttacattgtt gtctgaaaag acggaaagca tctgtatctg 1561 gcctccattc ttgtcctgca ggagcgggaa acggcgggga ttcagtttca cccaggaggg 1621 cgcataggac gagaccatat tcttccagct gccgaaccac aggaacgaga gtttcacccc 1681 ctcgcgccgc gcctggctga tgatgccgtc cacgactgta aaatcaaact ccccttcccg 1741 gggctcgacc atatcccagc agagcggcac cagcaaggtg ttcagatgga tctgccggag 1801 cgccggccag atggattcca tataggcgag gctgccggac gcggagttcg acgattcacc 1861 ggctatggac aggaacggac ggtcctccac gatcaggcgt gccaccccat ccgtcttttc 1921 gatatgcgga gcgctctgcg cggccgcgaa gcttgctgga agcagaacgg ctgcagcaag 1981 gaaagcaaaa aaggcccctc tcataatgcg aagcgttgtt ccttcccgaa gggatcgaaa 2041 gtcagcaggc gcgtgcggcc gtccaccgtc acttcggcgg tcaacagctc gcggtagagc 2101 gccggatcga ggtcgcagga aggcttgata ccgatgcact tgcggtactt gcgcacccgg 2161 atcgtgcagt gctcgcgctc cgcacggtag gatgcgatg // LOCUS sequence214 2172 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence214 VERSION sequence214 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2172 /mol_type="genomic DNA" /organism="" /note="sequence214" misc_feature <1..1150 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002680089.1:methylaspartate ammonia-lyase" /note="WP_002680089.1 methylaspartate ammonia-lyase (Treponema denticola) [pid:66.9%, q_cov:98.4%, s_cov:90.8%, Eval:1.0e-141]" /note="MGA_895" /locus_tag="LOCUS_6060" CDS 1234..1512 /product="citrate lyase acyl carrier protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000691461.1" /transl_table=11 /codon_start=1 /translation="MNTLKKASCGTMESSDAYMELEPIEAGTQIELQSVVEHQFGDSIR ALAAEMLKEEGVENVKLSIVDRGALECTLRARLETLIGRAREEAAHA" /locus_tag="LOCUS_6070" /gene="citD" /EC_number="4.1.3.6" /note="WP_000691461.1 citrate lyase acyl carrier protein (Salmonella) [pid:43.8%, q_cov:95.7%, s_cov:91.8%, Eval:3.9e-13]" /note="MGA_896" ORIGIN 1 cgtaacggaa ggcttcacct ccgtcagaat gcccggcgaa tccatctccg tgcagatcat 61 tctggaagac ggccaggtcg cattcggcga ctgcgcggcc gttcagtact ccggcgcagg 121 cggcagagat cctctgttcc tggcgaagga cttcatcccc gtcatcgaca agtacatcaa 181 gcccatgctc gtaggcagag aagcggacaa cttccgtcag ctggccgctg agatggaagc 241 tatccaggtc gaaggcaaga gactgcacac cgccatccgc tacggcgttt cccaggccat 301 tctggacgct gttgccaagg caaagcacaa gatgatgtgc gaagtcgtcg ccgaagaata 361 cggctgcgaa gtttccgaca agcccatcga catcttcacc cagtccggcg atgaccgcta 421 cgataactcc gacaagatga tcatcaagca ggcgcaggtt ctgccccacg ctctgatcaa 481 caacgtcgag accaagctgg gtccccatgg cgaactgctc gaaaagtacg tcgcatggct 541 gagagaccgg atcctcaaca acagagcgga cgagaactat aagcccattt tccacatcga 601 cgtatacggc accatcggcg ctgccttcgg caacaccaac ttcaaggcta tggccgacta 661 cctcgaaaag ctggccgaga ccgctaagcc cttccacctc cgcatcgaag gacccatgga 721 ctgcgatacc gacagagaga ctcagatgct ggctctgaag ggcctcaccg aagagatcga 781 ccgcagaggc atcgacgtcg agctggttgc cgacgaatgg tgcaacaccc tcgaagacgt 841 caagtacttc accgataacc acgccggtca catggtccag atcaagactc cggacctcgg 901 cggcgtcaac aacaccatcg aagctgttct gtactgcaag gaacacggca tgggcgctta 961 ccagggcggt acctgcaacg agaccgaccg cagcgctcag gtctgcaccc agtgcgcaat 1021 ggcaactcag cccgctcaga tcctggccaa gccgggcatg ggcgtagacg aaggctacat 1081 gatcgtttac aacgaaatgc agagagttct ggcgctgaga gctgccaaga aggcctgcgg 1141 ctgcaagtaa gctgtgcaat gtgaccctat agggtcatcc cataagcccg aagcaacgcc 1201 ttcgggcttt ttccaaacga aaggaaatcc gttatgaata cactgaaaaa ggcttcctgc 1261 ggcaccatgg aatccagcga cgcctacatg gaactggaac ccatcgaggc gggtacgcag 1321 atcgagctgc agtccgtggt ggagcaccag ttcggcgatt ccatccgcgc gctggcggca 1381 gagatgctga aagaggaagg cgtagagaac gttaagctga gcatcgtcga cagaggcgct 1441 ctggagtgta cgctccgggc acgcctcgag accctcatcg gcagagcgag agaggaggca 1501 gcccatgcgt agatccatgc tgttcctgcc gggcaatgcc ccgaacatga tcttaagcgg 1561 cgactgcctc ggcgcggacg ccatcatcct tgacctggaa gacgcggtcg ctcctgacca 1621 gaaggacgcg gccagagtgc tggtccgcaa tgccatcaag tacctgcagt tccccggtgt 1681 ggagaagatc atccgcatca actccctgga tacgccgtac tggaagaagg atctggacga 1741 gatggtcccc ttaaagccgg agctcatcat gaccccgaag acctcctgcg cagcggacgt 1801 gctggaattc gacgcctaca tgtccgaact ggaggataaa ctgggattcg aaagaaatat 1861 cgttaagctg ctgcccctca tcgagacggc cctgggcgtg gagaacgcat tcgccatcgc 1921 ctccgccagc aagagagtcg cagccatctt cctcggcgcg gaagacctgt ccgccgacct 1981 gcactgcaag cgcacgaagg aaggcaagga gatcctgtac gccagaggcc gcatggtaat 2041 ggcggcaaga gcggcaaacg tggacgtcta cgacaccccg ttcaccgacg tgaacgacga 2101 cgaaggcatc cgcatcgacg cagaattcgc caagggtctc gggttcaccg gcaaggccag 2161 catctccccc ag // LOCUS sequence215 2159 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence215 VERSION sequence215 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2159 /mol_type="genomic DNA" /organism="" /note="sequence215" CDS complement(1521..2126) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAGFSAAYGLDIQTLIKIGKNAEKAMYAATKGVNAHKGAIFAFSL YLAAAADCLMRGGDPVEKVKELAAEKVAKAAPAPPTHGDAVRAVYTGYGKEGALAEACK GFPMALLTAQTICETQDPLLALCRVMSQLTDSNLLYRGGVKGLNWVKAEAAKLCAMEAP QRLDALRRMDEECIARNLSPGGAADMLALGMFLAELPL" /locus_tag="LOCUS_6080" /note="WP_015704364.1 triphosphoribosyl-dephospho-CoA synthase CitG (Klebsiella aerogenes) [pid:37.0%, q_cov:94.0%, s_cov:68.5%, Eval:3.2e-21, partial hit]" /note="MGA_899" ORIGIN 1 cgagacgcct gcggcggtca tccattggtc gacagaatcc gcaattctgg taattccggc 61 atccagcagg tcctgtaaat acggaccgat caggaaaaac gtcaggtaga acacgacgcc 121 catgatggcg ataaagccgg gaaatgccgt ccattttccg gtcaggatgc ggtcgatgcg 181 ctcgctgcgc tcccgctcct tgctctcccg gggctttacg acgctctgcg ccaccaggtt 241 ctggataaag ccaaagcgca tgtccgcgat ggcggcagcc cggtccaggc ctctctcctc 301 ttccatcgtc aggatgatgt gctcgatggt ctccttttcg ttctgcgtaa ggcccaggcg 361 gtccatcagc gcattgtcgc cctcgatgat cttcgtggcg gcgaatcttg caggaacgcc 421 tgcggctgcc gcgtggtcgt cgatcaggtg aacgatgccg tggatggccc ggtgcacggc 481 cccgccgttt tcgtcctcgc tgcagaagtc gttgcgggcg ggcggctcct gatatttcgc 541 cacatgcagc gcgtggtcca ccagttcctc gatgccctct cctttcgagg cggagatcgg 601 aacgacgggg atgccgagca gcgattccat cctgttgatg tcgacggatc cgccgttgcc 661 ccgcatctcg tccatcatgt tgagggccag caccatgggg acgttgagtt ccatcagctg 721 catcgtcaga tacaggccgc gttcgatgct ggtagcgtcc aggatgttga tgacgccttt 781 cggcttttct tccaggatga attcccggga aacgatctcc tcgctggtgt acggggaaag 841 cgagtagata ccgggcagat ccgtgatgag ggtctgggga tgtcctttga tgacgccgtc 901 ctttctgtcc accgtgaccc cgggaaagtt gccgacatgc tggttggcac cggtgagctg 961 attgaacagc gtagtctttc cgctgttctg attgcccgca agggcaaagg tgagcgtttc 1021 ggaatccggc agcggatgct ccgtctttct ttcatgggac ttgccgtatt cgccgagacc 1081 cggatgttcg atgtctttat agacgccgca ggcagtcttc cagaccggcg cgtccgccgc 1141 ttcgatctcg atctgctccg cgtccgccag gcgcagcgtc agctcgtagc cgtgcaggcg 1201 cagttccatg ggatcgccca tgggcgccag ttttatcatt tccaggacgg tgcccggggt 1261 cacgcccatg tccaggaagt gctggcgcag cgcgccctct cctccgactt tcgtgacccg 1321 gccgaactcg cccggcttta attcatttaa gcggatagaa tgattcatgg atttgtttcc 1381 aacctttcct tggagttagc ctcagcaaac aagattataa attagcaagc gctaacttgt 1441 caatatcaaa acacaataaa aagcggcctc gccgttttca aacagcgtca ccgctttttt 1501 ctcatatttt aaaataaaat ctacaacggc agttctgcga ggaacatgcc cagagccagc 1561 atatccgcgg ccccgccggg ggacaggttg cgggcgatgc actcttcgtc catgcggcgc 1621 agcgcatcca aacgctgcgg cgcctccatc gcgcacagtt tggcggcttc tgcctttacc 1681 cagttgagcc cttttacgcc gccccggtac agcagattgc tgtcggtcag ctgagacatc 1741 acccggcata aggccagcag cggatcttgc gtctcgcaga tggtctgagc ggtgagcagc 1801 gccataggaa aacccttgca ggcctccgcc agagcgcctt ctttgccgta acctgtgtat 1861 acggcgcgta cggcgtctcc gtgggtgggc ggcgcgggcg ccgctttggc caccttttcc 1921 gcagccagtt ccttcacctt ttccacgggg tcaccgcctc gcatcaggca gtccgccgcg 1981 gcagccaaat acagcgaaaa cgcgaagatc gcacccttgt gggcattgac tcccttcgtt 2041 gcagcgtaca tggctttttc ggcgttttta ccgattttta tgagcgtttg gatatccaac 2101 ccgtaagccg cggaaaagcc cgccatttgg gcgaaaaacg gccttatcgc ggatgctga // LOCUS sequence216 2150 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence216 VERSION sequence216 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2150 /mol_type="genomic DNA" /organism="" /note="sequence216" misc_feature <1..630 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010965929.1:trigger factor" /note="WP_010965929.1 trigger factor (Clostridium) [pid:34.9%, q_cov:78.9%, s_cov:38.5%, Eval:1.5e-24, partial hit]" /note="MGA_900" /locus_tag="LOCUS_6090" CDS 694..1278 /product="ATP-dependent Clp endopeptidase proteolytic subunit ClpP" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003417102.1" /transl_table=11 /codon_start=1 /translation="MSNLIPYVVEQTSRGERSYDIYSRLLKDRIIFLDGEVNSDTASLV VAQLLFLESEDPDKDINLYINSPGGVITAGMAIYDTMQYVKPDVSTICVGMAASMGAFL LAAGAKGKRYALPNAEIMIHQPLGGAQGQATDIKIQADHIIRIKEKLNRILAEKTGQPL EKIAADTERDNYMTAEEAAAYGLIDKVVEKR" /locus_tag="LOCUS_6100" /gene="clpP" /EC_number="3.4.21.92" /note="WP_003417102.1 ATP-dependent Clp endopeptidase proteolytic subunit ClpP (Clostridioides difficile) [pid:78.0%, q_cov:98.5%, s_cov:98.5%, Eval:1.7e-80]" /note="MGA_901" ORIGIN 1 gacgtttccg agttcgatac cctggaagaa gtaaagaagg acatccggga aaagctggag 61 aagaccgtca aggacgccat ggaatacgaa ggcaaggata aggtcctgca gcaggtctac 121 gaagccaacc ccatcgagct tccccaggcc atgatcgaca gcgaagctgc caacatgctg 181 aatgaattcg gctatcagct gcagtcccag ggcatgaacc tcgacatgta ctgcaagtac 241 ctcaataaga cccaggaaca gatgatcgac gaggtcaagc ccgacgccga gaagagagtc 301 aagagcagac tcatcgtcga agccgtcgcc aagcaggaag ccgtcgaagt caccgaggcg 361 gacatcgaga aggaactggc cgcaatggcg ctgcagtacg gcatggcgca gtcccagatc 421 aaatccatct tcggcgaaga gaacatggat tacctgaaga aggacatctt aagccgcaag 481 gccatcgatc tgatgtacga agccgcggag atcaccgagg tcgaagaaaa gaaggaagag 541 cccaaggagg ctcccaagaa agccgccaag aagaagtctt ccaagaaggc cgaagaaaag 601 ctggctgaag aagcgaaaga cgaagaataa acgatcaagt caggcggaac caaaagttcc 661 gcctgaagtt tccaacaaga aaggatgcaa tcgatgagca accttatccc gtacgtcgtg 721 gagcagacct cccggggaga gcgttcctac gacatctatt cccggcttct caaagaccgg 781 atcatcttcc tggacggaga ggtgaacagc gacacagcca gcctcgtggt ggcccagctg 841 ctgtttctgg aatccgaaga cccggacaag gacatcaatc tgtatatcaa cagccccggc 901 ggcgttatta cggccggcat ggcgatctac gacaccatgc agtacgtaaa gccggacgta 961 tccaccatct gcgtcggcat ggcagcctcc atgggggcgt tcctgctggc ggcaggcgcc 1021 aagggcaagc gctacgcgct gcccaacgcg gagatcatga tccatcagcc tctgggcggt 1081 gcccagggtc aggcgacgga catcaagatc caggcagacc acattatccg catcaaggaa 1141 aagctcaacc gcatcctggc ggagaagacg ggccagcccc tggagaagat cgccgcggat 1201 acggaacgcg acaactatat gaccgcggaa gaagcggcag cctacggcct catcgataag 1261 gtcgtggaaa aacgctaatc gaaacattac ggagaaagta tggctaaatt tgacagctca 1321 aaagaattaa cgtgcagttt ctgcggaaag ccccagagcc aggtgagacg gctcattgcg 1381 ggtccggacg tctatatctg cgacgagtgc gtcaagctgt gcgatgagat cctggcggag 1441 gagttccccg agatcaaaga gatggcgtct ctggatttcg gcggggaatt gcccaaaccc 1501 aaggagatcg atgcgacgct ggcggattac gtcatcgacc aggacagagc caagaagatg 1561 ctggccgtgg ccgtctacaa tcattataag aggataagca atctgccggc gaagcccgcg 1621 aagaagggca tcaaggctgc tcagaccgac gatggcgtcg agatccagaa gagcaatatc 1681 gtcatgatcg gaccgaccgg ttccggcaag accctgctgg cccagaccct ggccaagatc 1741 ctggacgttc cctttgccat cgccgatgcg acgaccctca cagaagccgg ctacgtaggc 1801 gaagacgtgg agaacatcct gctgcgcctc atccaggctg cggacggcga cgtggagcgg 1861 gcccagaagg gcatcatcta cgtggacgag atcgataagc tcgccagaaa gagcgaaaat 1921 ccctccatta cgagagacgt atccggcgaa ggcgtgcagc aggcgctgct gaagatcgtg 1981 gaaggcacgg tctccaacgt accgccccag ggtggccgca agcacccgat gcaggagttc 2041 atccagttcg atacgacgaa cgtgctgttc atctgcggtg gtgctttcga cggtctggat 2101 aagatcatcc agaaccgcat cggcgagaag accatcggct tcaactccga // LOCUS sequence217 2143 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence217 VERSION sequence217 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2143 /mol_type="genomic DNA" /organism="" /note="sequence217" misc_feature <1..1586 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005810415.1:dimethyl sulfoxide reductase subunit A" /note="WP_005810415.1 dimethyl sulfoxide reductase subunit A (Desulfitobacterium hafniense) [pid:43.8%, q_cov:99.2%, s_cov:66.6%, Eval:1.4e-118, partial hit]" /note="MGA_903" /locus_tag="LOCUS_6110" CDS complement(1640..2053) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGIKRIWKTEEVFHLPDGDLRYYGHLGIPHYEEMDDGIVQASMPV THALLNGHGTVQGGAVASLCDIAGAAYMRILVGDEVTLNSSMQFYRPGKEGSVLTARVT PRKLGKTICTLVCEVTDETGTLIADSVQTFYRI" /locus_tag="LOCUS_6120" /note="MGA_904" ORIGIN 1 ccctggcgga tgagtggatc cccatccggc cgtcttccga cggcgccatg gcggatgcca 61 tgtgctacgt catatggaaa aacggcctgc aggaccaggc attcatggac aagttctgca 121 tcggattcga cgaagcgcac atgcccgaag gcgtaccggc gggcgagtcg tatcattcct 181 acctgttcgg gaaaaaggac ggcgtggaaa agacgccgga atgggcggag gcgatctgcg 241 gcgtgccggc gaagacgatc gaagatctgg cgatccgctt tgcgaaggca aagcccgcct 301 gtctgctttc cggccttgcg ccccagcgca ccggtaacgg cgaacagacg gcccgctgct 361 tcatggcgct ggcctgcctg tgcggctacg tgggcgttcc cggcggcaac agcggcggca 421 cgggctggca ggcgaaccgc accgcatccc ccgacgtgtg cgaatacgag aacccctacg 481 ggaaaagcat cccgtccttc ctgtggacga gagccgtcat ggagccggag atcttctcgc 541 ccgagatgca gctctggggc ggtgaccgcc tggataccgg ggtcaaactg gtgttctccc 601 tggccaacgg ccagacgctc tcccagcatt ccaacatcaa cgagaccatc gagatgtaca 661 agacgccggg caagctggag atgctggtgt tctccaacct gttcatgacc cccgcagccc 721 tctacgccga cgtggtgctg ccggcgccgt cgttcttcga gcaggacaac atcgtgccct 781 cctgggacaa caactactat ttcctgtaca acaaccactg catgcagccc ctgttcggct 841 gccgcttcga acacgactgg atccgggact gcgcggatct gctgggatac ggcgaagcct 901 tccgggacgg caaggagacg acggaggact ggctgagaca cgtatacgaa aagatggcgg 961 cggatttccc ggaccgcccg gaactggtgc ctttcgagga attccagaag aacggcatcc 1021 acgtgtggaa actgccggag cgcaacatca gtttcgagga gaacatcaaa gacggcgtac 1081 cctttaagac ccccagcggc aagatcgaga tcttcagcaa gaagctgtgg gatatgaact 1141 ggaaggacgt gccggcgatt ccgggcttcc tggactgcta cgaagggccg cgcgacccga 1201 aacaggcgga ctaccccctg cagctcatcg cataccacac gaagcgccgg gcccattcca 1261 tccacgacaa caacgtgctg atggaggagt tggatccgcc ccggatctgg atctcacaga 1321 aagacgcagc cgcacgcggc atcgcggatg gagaccgggt ggaggtgttc aacgaccgcg 1381 gcgtatgccg caccacggcg ttcgtgaccg accgcatcat ctccggggtc gtcgccatga 1441 gcgaaggcgt ctggtataaa ccgggcgagg acggcgtcga cgaacgggga agcatcaacg 1501 tgctcaccca taccgtgccc acgccctatt cccgggccaa tccccagcac acgaacctgg 1561 cggacgtaag gaaatataac ggataaggac tgcagcaaaa agccggaagg gatcttccct 1621 tccggctcgt ttttttgatt cagatccggt agaacgtctg cacggaatcc gcgatgagcg 1681 tgccggtctc gtccgtcact tcgcagacca gcgtgcagat ggtctttcca agtttgcggg 1741 gcgtcacccg ggccgtcagg acggaccctt ccttccccgg acggtagaac tgcatggaac 1801 tgttcagggt cacctcgtcg cccaccagga tgcgcatgta tgcagcccct gcgatgtcgc 1861 acagagaagc gaccgccccg ccctgcaccg tgccgtggcc gttcagcagc gcgtgggtga 1921 cgggcatgga agcctgcacg atgccgtcat ccatctcctc ataatggggg atgcccagat 1981 gcccgtaata gcgcaggtcg ccgtccggca gatgaaagac ctcttccgtt ttccagattc 2041 gcttgatgcc cataggttac ctcagaaaca gctttacgag ccgctgcatg ctctttttgt 2101 agggttgata ccgcatattc agatcgatcc acgtcttttt gtc // LOCUS sequence218 2129 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence218 VERSION sequence218 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2129 /mol_type="genomic DNA" /organism="" /note="sequence218" CDS complement(255..941) /product="response regulator transcription factor" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986772.1" /transl_table=11 /codon_start=1 /translation="MKSNILIIEDEAKIARFVELELSHEGYVCDKAEDGRKGLEMAESG AYDLVLLDIMLPELNGLEVLRRLRKTSDVPVIVLTARDAVMDKVSGLDMGADDYVTKPF AIEELLARIRLALRRGGASKMKEDLLVCGSLSLSVPRHEVRWDGSEIDLTSREFSLLQT LLENKNVVLSRDSLLEKVWGYDYMGETNVVDVYVRYLRNKIAAAGGENVIQTVRGVGYV IREEHE" /locus_tag="LOCUS_6130" /note="WP_011986772.1 response regulator transcription factor (Clostridium botulinum) [pid:65.0%, q_cov:97.4%, s_cov:98.7%, Eval:9.1e-77]" /note="MGA_907" CDS complement(944..1627) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEPREMENLEKVEQLVEKAGCTYAEAKDALEYSDWNLLDAIIRLE HEGKAVKSSAAYKTADPQEAPKTGSYVEPEVIHAEEAEHIKPDEFKKESRSGYGNGSFG EDARHYGQQAAGAAKGFFGRAKEALTQNYMTVFGRAGNQILRLPMWVLLILLLCWFWGI LMIALVLMVFGCRFHFEGKDFGKTNVNNTFDRWSEYTYNAGQKVKQEFTAKEEPKAEED PNREE" /locus_tag="LOCUS_6140" /note="MGA_908" ORIGIN 1 aaacgatgac cccctcgatc tgcagcacga tgtcgaaccg gcggctcgta acgacgtctt 61 tgcaggcgga aaacgcgctt cgcagcactg ccgcggggtc tgcccccgtc tcgatctggg 121 gccaggcctc cacgatcatg acggcgatgt ccaccacgag aaacgccagc agcagataca 181 acgcggaccc caaagcgatg cgaagcgcga tggagcccgt ttttattctc ttatctttcg 241 ttttgttttc ggtgttactc atgttcctcg cggatgacgt accctacgcc ccgcacggtc 301 tggatcacat tttctccacc ggccgctgcg atcttgttgc gcaggtagcg gacgtacacg 361 tccaccacgt tcgtctcgcc catgtagtcg tagccccaga ccttttccag caggctgtcc 421 cgggacagca ccacgttctt gttctccagc agcgtctgca ggagagagaa ttcccggctg 481 gtgaggtcga tctccgaacc gtcccagcgc acctcgtggc ggggaacgga gagggagagc 541 gatccgcaga cgagcagatc ttccttcatt ttggaagcgc cgccccgccg cagcgccagg 601 cggatgcggg ccagcagctc ttcgatggcg aagggtttcg tcacgtagtc gtccgcgccc 661 atatccaggc ccgacacctt atccatcacg gcgtcccgtg ccgttaaaac gatcacggga 721 acgtcgctgg tctttctcag cctcctgagc acctccaggc cgttgagctc cgggagcatg 781 atgtccagca gcaccaggtc gtaggcgccg ctctccgcca tctccagccc cttccgtccg 841 tcttccgcct tgtcgcagac atatccctcg tgggacagct ccagttcgac gaaccgggcg 901 atctttgcct catcttcgat gatcaggatg ttgcttttca taattactct tctctgttcg 961 gatcttcttc cgccttaggc tcttccttgg cggtgaattc ctgctttacc ttctggcctg 1021 cgttatatgt atattccgac cagcggtcga aggtgttgtt gacgttggtc ttgccgaaat 1081 cctttccttc gaagtggaag cggcagccga agaccatcag caccagggcg atcatgagaa 1141 tgccccagaa ccagcacagc agcaggatga gcagcaccca catgggcagg cgcaggatct 1201 gattgccggc gcggccgaag acggtcatgt aattctgggt cagcgcctct ttggcccggc 1261 cgaagaagcc cttggcagcc cccgctgcct gctggccgta gtggcgggca tcttctccga 1321 agctgccgtt gccgtaaccg cttctgcttt ccttcttgaa ttcatcgggc ttgatgtgct 1381 ccgcttcctc cgcatggatg acttccggtt ccacgtaact gccggtcttc ggcgcttcct 1441 gcggatccgc cgtcttatac gctgcggaag attttacggc cttgccttcg tgctccagcc 1501 ggatgatcgc atccagcaga ttccagtcgc tgtactccaa cgcgtctttc gcctctgcat 1561 aggtgcagcc ggccttctcc actaactgtt caactttctc cagattttcc atttctctcg 1621 gttccatgtt cgttcctcct gtatgatgaa tacctctttt gatggtccca tcataccgcg 1681 gcaaaatgaa agccccatag gagaaaaatg agaaaacgat gagaattgcg ttttcttttc 1741 tatagttcgc tcttgcccgc ggccttcagg ccgatgttga tccgttcttt ataggcggca 1801 tcgagagcct gctgcgcgcc taccagcgag tcgcacagct gctttcccgt attgttgacg 1861 aagatcgtcg tggggatgta ctgcacgtcg ttcaccagcg tggcgagatc ccctgttgca 1921 ctgatgatgc agcggccttc gaagccggct tcgtccagga tggcctgaca ctcttccgta 1981 tgggtcggcg catccacgca gaacagcatg agctgcacgt tgtccggcag cgtcttttcg 2041 aattccgcca gttcgtccat ctcgtccagg cagggcgggc accaggtggc ccagatgttg 2101 atggcggtca cgtcgcattc cccgaacag // LOCUS sequence219 2124 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence219 VERSION sequence219 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2124 /mol_type="genomic DNA" /organism="" /note="sequence219" CDS complement(943..1149) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAELSFERTFEALLEEKKYSTIKDVLVTMNPADIAAIFEDVDEER LPLLFRLLPKELAAETFVEMEPE" /locus_tag="LOCUS_6150" /note="MGA_911" ORIGIN 1 gaggatcatc ttgtccacga tcatcagttt tgcgaagcag gcagccgcca gggaaatgcc 61 gcacagcacg gcggtccgga tatccttcca gatgaccacc ggcagatctt cgaattcgat 121 gtcatccagg gacagcgcac ggatgaccgt aacagaggcc tgcgagcccg agttgccgcc 181 cgtatccatc agcatgggga tgaatgcggt gagcacgacc tgcgccgcca gtgcgttctc 241 gaaatgggta atgatgatgc cggtgaacgt ggcggagacc atcagcagaa gcagccaggg 301 aatgcggtgt ttaaacagtt cccaggggga ggaccggtag tacgtctttt ccgaaggcgt 361 aatacctgcc atgatctcca tgtcttccgt ggtctcttct tccagaacgt ccatagcgtc 421 gtcgaacgtt acgataccga ccatcctcag gtcgctgtcc acgacgggca gcgccaggaa 481 gctgtatttc gtaaacatgt tggcgacttc ttcctggtcg tccagggtat tgacggagat 541 gacgttcgtc tccatcaggt cgcccacctt cacctcgtcc ttcgccgtaa gcaattccct 601 tacggtgacc gtgcccagca gttttctctc gtcggtcacg taacaggtgt agatggtctc 661 tttatccaca cctgtgcggc ggatgcgctc gatggcgtcc cctaccgtca tggacgggtg 721 cagattgacg tactccgtcg tcatgatgga ccctgccgaa tcctcgggat agcggaggat 781 ctcgttgatc tcccgccgca tcttcgggtc ggcctgggcc aggatgcgct tgaccacgtt 841 agcgggcatc tcctccacca ggtctaccgc atcgtccacg aacagttcgt ccataacttc 901 gtgaagttct cggtcggaga acccttccac cagaatctcc tgctattcgg gctccatctc 961 gacgaaggtc tccgccgcca gctctttcgg gagcagacgg aacagaagag gcagacgttc 1021 ttcgtccaca tcttcgaaga tcgcggcgat gtccgcggga ttcatggtga ccagcacatc 1081 tttgatggtg gaatatttct tttcttccag aagcgcttcg aaagtgcgct caaatgataa 1141 ttctgccata acttatcctc tccattaaag ggaaataata agatattggc aggtctggat 1201 aagtctatcg ggatcagaag gcagccacgg acgatcgcgg cggctctgct agactttggc 1261 ctgccgataa acctatcgta cttccgctat ccatggtctt tcctcctttt ctgattcaaa 1321 aaatactcac gaaaacaaac gcatactgcg caataatatc ttaccacgcg aagaagacca 1381 tcgtcaaaca cggcgcggtt tttatgatat acttttttgc atgtgggact atctggcgaa 1441 gaccgaaaag aacatcctga tctacggccg cggcaacgcc gcagaggcca tcgtttccga 1501 gctggcaaag cggggcaagc gccccgccgg ctttttcgcg tccgacggat tcgtacgggc 1561 gaaggagttc ctgggctatc cggtcacctc attcgaagaa gcgctgcaga agttcggagc 1621 ggaaagcatc gtgctgctgg ccttcggctc ccacagggag gacgtgctgg atcagatcca 1681 aaatgtcgcc gcaaagaccg aattctttgc tccggacctt cccgtcgtgg gcagcgggct 1741 gttcgataaa gcgtattaca ccgctcatga accgcagctg caggctgcgt tcgaactgct 1801 ggcggacgat cagagccgca aagttttccg gaacgtcgtc tcctacaaac tcagcggaaa 1861 aatagacttt ctgcaggact gcgagacctc ttcagaggag aattgggcgt tgctctcccc 1921 ttctgcagac aagatttacg tcgacctggg cgcctatacc ggggacaccg tgctggaatt 1981 cctcggtgcc tgcggcggtc ccgccgaccc gcccatcctg gccgtcgagc cggagccccg 2041 caacttccga aagctgcagg agacggttgc ggcagccggt cttacccgct gccgctgcgt 2101 gcaggcagcg atcggagacc gcac // LOCUS sequence220 2120 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence220 VERSION sequence220 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2120 /mol_type="genomic DNA" /organism="" /note="sequence220" CDS complement(780..1421) /product="cytidylate kinase-like family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008766580.1" /transl_table=11 /codon_start=1 /translation="MEAKHVITIAREFGSGGREIGIKLSEILGIPFYDKELLRLASEQG GLNEEFMAANEEKAPVVNAASFGRRTLNAFYQPSLSDTIFLEQSKIIRSLAEKGPCVIV GRAADYVLRDMGSVDVFISASMPYKIARKHKVAPEKADYTDAQMEKYIKDIDKHRQKYY EHYTGRRWGMIGNYHLCIWADNVGSDGAVQVILNYLEQMDKFQPEQKTEK" /locus_tag="LOCUS_6160" /note="WP_008766580.1 cytidylate kinase-like family protein (Bacteroides) [pid:39.5%, q_cov:93.4%, s_cov:96.2%, Eval:2.9e-31]" /note="MGA_914" CDS 1502..1660 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MADLIVIAILAAAVCAVIYKMRKDKKAGKHSCGGNCAGCAFSCDQ RKEEYDL" /locus_tag="LOCUS_6170" /note="MGA_915" ORIGIN 1 ggtgccgccg aagccgtagt cgttgcagag gaacgtggtc tcttccggca gcatgtcgag 61 gccgcagtgg cacatctgca tggcgatgga cgtcgcggag cagatgaccc cgccatagtc 121 cggatctctt ctcttctggg aaatgacagg agtatccaga tgtacgctcg ttggcatttc 181 cttcagccct tcacggcact gcggatcttc gctcttctct tgccaatccg gggcgtttgt 241 gttcttccac gtcgccccca gcagggtgag ggagggaaga tcgcccgcat ccgcggtccg 301 cagcaccgcc ttcagttgga atgcgtccgc cgtttttccg tcttttacgt tgacggagct 361 gtcgccccag tcccggtagg tgttggccca tacgagaccg tcctcctggt cgggacaata 421 cctctttata tgggcacccc agacgcccca gctcatccag gcgctccaga cgccgtccac 481 ccgcaggcga gcgtagattt ccgcttcgct cttgcccggg gtctgcgcgt tccaggatgc 541 gacgagatcg ttgaaaggtt cctccgtctc gaaaggctcc gcaagaaaca ccccttcgta 601 aggcgcgtcc agggtaagcg ctctcttcgt ttcgttatag gtaagattgt tcacgcggcc 661 gcggagcaga ccgctgtttt tccataagac tgtgttcatg cagtttcact ctcccggctc 721 attgtagcac agacaacaca aaaacgctcc cttttagggg agcgttttgc ggtttttcgc 781 tatttttctg tcttttgttc gggctggaac ttgtccatct gctccagata gttgaggatg 841 acctgcaccg caccgtcgga acccacgttg tcggcccaga tgcagaggtg atagttgccg 901 atcatgcccc agcgtctgcc ggtgtagtgc tcgtagtatt tctggcggtg cttgtcgatg 961 tccttgatgt atttttccat ctgggcatcg gtgtagtccg ccttctccgg cgccaccttg 1021 tgttttctgg cgatcttata gggcatgctg gcggagataa agacgtccac gctgcccatg 1081 tcccggagca cgtagtccgc ggcgcggcct acgatgacgc agggaccttt ttccgcgagg 1141 ctgcggatga tcttggactg ctccaggaag attgtatcgg aaagggaagg ctgatagaag 1201 gcattgagcg ttcttctgcc gaaagatgcg gcgttgacca ccggagcctt ttcctcgttg 1261 gcagccataa actcctcgtt taagccgccc tgttcggacg cgaggcgcag taattcttta 1321 tcgtaaaaag gaatgccgag gatctcggat aatttgatcc cgatctctct gccgccgctg 1381 ccgaactctc ttgcgatcgt aatgacatgt tttgcttcca tagttgtcgt ctcctttaac 1441 gcattaatct taccacactg tggtttttta tggtaaactt tttatgcatc aggaggtgtc 1501 tatggcagat ctgatcgtca tcgcgatact ggctgcggcc gtatgcgcgg tgatctacaa 1561 gatgagaaaa gacaaaaaag caggaaagca cagctgcggc ggcaactgcg cgggctgcgc 1621 tttttcgtgt gaccagagaa aagaggaata cgacttatga tcatgttcaa ttgcgactat 1681 aacgaaggat gctgtccgga gatcatggag gcgctcaccc gcaccaacat ggagcagcac 1741 gagggctaca gcgaggataa gatcacggcg cacgccaagg aacttatcaa gaaggcctgc 1801 gaacggaacg acgtggatgt acatattatg gtaggcggca cccagaccaa catgacggtg 1861 atcgcagcca cgctgcgtcc gtatcagggc gttatcgctc ctgcgacggg tcacatcgcg 1921 cggcacgaga ccggcgccat cgaagcccac ggccacaagg tgctggcgct gccggagacg 1981 gacggcaaga tctcggcaga gcagatcgag gcattctgcg cggatcatta ccgggacgaa 2041 tccttcgagc acatcgtgca gccgggcatg gtctacatct ccagccccac ggaactgggc 2101 acggtctata agagagcgga // LOCUS sequence221 2101 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence221 VERSION sequence221 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2101 /mol_type="genomic DNA" /organism="" /note="sequence221" CDS complement(1081..1527) /product="D-aminoacyl-tRNA deacylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003547036.1" /transl_table=11 /codon_start=1 /translation="MIFVIQRVSEARVDIEGECRGKIGKGFMTLIGVADTDTKEIADKM VRKMCNMRIFEDENGKTNLSLADVDGSLLLISQFTLYADCKKGNRPSFIGAGAPDMANE MYEYIIEQAKTYCPRVERGEFGADMKVSLTNDGPFTIVLNSKDL" /locus_tag="LOCUS_6180" /gene="dtd" /EC_number="3.1.1.96" /note="WP_003547036.1 D-aminoacyl-tRNA deacylase (Lactobacillus acidophilus) [pid:56.2%, q_cov:97.3%, s_cov:99.3%, Eval:1.4e-38]" /note="MGA_918" misc_feature complement(1543..>2101) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010964851.1:D-isomer specific 2-hydroxyacid dehydrogenase family protein" /note="WP_010964851.1 D-isomer specific 2-hydroxyacid dehydrogenase family protein (Clostridium) [pid:42.1%, q_cov:98.4%, s_cov:56.1%, Eval:4.9e-39, partial hit]" /note="MGA_919" /locus_tag="LOCUS_6190" ORIGIN 1 caggtgaaca ggccgccgtc gggaacggtc cacttcgtgc ccttcgggaa gtattcctcg 61 atgcactcca tcatcttctg gcagcgttct ctgtacaggc tgcagatcat ctcgtgatgt 121 tcgggatagt aacctctctt gaagaactca gcgcacagca cctgcggcag catggaggtg 181 tgggagttca tggcggtctt tacatcctgc agcggctgca tcatctcggg caggcctacg 241 atgtagccca gacggctgcc tgcggagaag atcttggaga aggagttgcc caggatgacc 301 ttgccggcct tgtcgaagct cttgatggga gccaggtcgt gtccggtaaa gcggatgtct 361 ctgtaggggt catcctcgaa gaccagcacg tcgtactttt cggccagttc cgcgatcttc 421 tttctcctct ccagcgtgag cgttctgccg gaggggttct ggaaggtggg gatgacgtag 481 atcatcttcg gattgtattt ctggatcttg gcttccagat cgtccattct catgccgtct 541 tcgtccatct cgacgccgat gcacttcgct tcgaacatct cgaaggtctc caccgcgtgg 601 acgaaggtcg gtctctcgac gagcaccaca tcgccgggat cgatgtagat ctcgcaggtg 661 agggagatgg tctccaggcc gccggtggtg atcatgatgt ggtccgcgtc ggtcttgacg 721 cccttgggag ccagcagctg gtcgacgatg acttctctta agtccttgac gccgagcagg 781 ggtccgtact gcagggcttc cacgcctctg ctgtcccgtc tcagcacgtc gtttgcgatc 841 tcgcgcaccc gctctacggg gagcgcttcc ttagcggggg cgccgatgct cagggagatg 901 agctcgggat ctgccaggga attgaacagg ccgcgtacga cttccgctga gcctgccatg 961 gtgtgtattc tctttgcgaa tttattgctg ctatccatac cgattacctc ctgttcggaa 1021 tttccatttt tatcttatca caaaacaaat ccatcgagat atcgatggat ttgatggaac 1081 ctataaatct tttgaattaa gaacgatggt aaagggaccg tcgttggtaa ggctcacctt 1141 catgtcggcg ccgaactccc ctctttccac ccgggggcag taggtcttcg cctgttcgat 1201 gatgtattcg tacatctcgt tggccatatc cggggcgccg gcaccgataa aggaaggccg 1261 gttgcccttc ttgcagtcgg cgtagagcgt aaattgggag atgaggagca gcgagccgtc 1321 cacgtccgcc agagacaggt tcgtcttgcc gttttcgtcc tcgaagatgc gcatgttgca 1381 catcttgcgg accatcttgt ccgcgatctc cttcgtgtcc gtatccgcga cgccgatgag 1441 ggtcataaat cctttgccga tcttgccgcg gcattcgcct tcgatatcga cgcgggcttc 1501 gctcacccgc tgaatgacaa atatcatcgc tctctccgtt ctttacttga tctcgtaggg 1561 gttgggtttt ccgctcagcg ccaggtaaga cgcctcgatg gcggtcttca gctgttcgtt 1621 ggcggacagg taggtgcaga aggccatatg ctgcagcagg gtcacctcgg gcagttcctc 1681 cagggccgcg atgtgttcgg gcaccggttt ctgccgcgca tcggtgtagt agtagccgga 1741 ctcgtcctcg atgacgtcca gcaccgcgcc gcccagcttc ttcgcccgca gggcgtcgat 1801 gagggcccag gtgtcgatga ggtcgccccg agctgtattg acgatgtagg cgccgggctt 1861 catgagggcc agtttttccg cgttgatcag gtgatggttc tccgggctgg cgaaggcgtg 1921 cagcgtaacg atgtcgcagc gctgcagcag ttcctccatg gatacgtatt cgcagaattc 1981 cttcagaccg tcgttttcgt agatatcata gcaaaggatc ttgcattcga aggggcgcag 2041 gcgcttcgcc acgcactggc cgatcttgcc ggtgccgatg atgcccaccg tgagctcgga 2101 c // LOCUS sequence222 2096 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence222 VERSION sequence222 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2096 /mol_type="genomic DNA" /organism="" /note="sequence222" CDS 1..600 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MGYAVAAERLQKQLADEGVTVDEAHPLFVTIPCGVGGAPGGVAFG LKQIYGDNVHVLFAEPVQACCMVLGMATGLHNQICVQDIGLSGKTHADGLAVGRASSLV GKIMEPLLTGEVTLEDYKIYDYMRDLRDSEGLFIEPSSCAGFEGPVQFAKNAAFAPYIE KYGLSEALQNASHIVWATGGKLVPEQVRQAFYETYL" /locus_tag="LOCUS_6200" /note="WP_000658347.1 D-serine ammonia-lyase (Bacillus cereus group) [pid:53.8%, q_cov:99.0%, s_cov:43.5%, Eval:5.5e-58, partial hit]" /note="MGA_920" CDS 620..1480 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKYSTRAATMADVPRLREIEMAAMPHSKWYSTECAPLFIEQKGQQ GEMVVAEIPELPAGDPNKTIGMGQYSVMPDGSGWLECLRILPEYQRTGAGRQIYERYQE LWTETDAPHVAMFTGRKNVASKALSEVYGFEYTGAYDEYSLPLEGIEAACPAGFERVTD LETVAKALDAREGVGNHIVFNRTYLHYSEPIYRWLIGRGMVWSDGKTLLVLGARMLQER GWYLAFWSDDPDKCLAFAIAKTKEAGLPALTVNFPPEREDLKAYFERKGFHYVYSNIVM ELNRR" /locus_tag="LOCUS_6210" /note="MGA_921" ORIGIN 1 atgggctatg ccgtggcggc ggagcggctg cagaagcagc tggcggatga aggggtcacc 61 gtggacgaag cgcaccccct gttcgtaacg atcccctgcg gcgtgggcgg cgcccccggc 121 ggcgtggcct tcggattaaa gcagatctac ggcgacaacg tgcacgtgct gttcgcagag 181 cctgtccagg cctgctgcat ggtgctgggc atggcgacgg gtctacacaa ccagatctgc 241 gtgcaggata tcgggctttc cggcaagacc catgcggatg ggctggcggt gggccgggcc 301 tccagtctgg tcgggaagat catggaaccc cttctgactg gcgaggtgac cctggaagac 361 tataagatct acgactacat gagggatctg agagattcgg aaggactgtt catagagccc 421 agttcctgcg cgggtttcga gggacccgta caatttgcca agaacgcagc tttcgccccg 481 tatatcgaaa aatacggcct ctcagaggca ttacaaaacg cctcccatat cgtctgggcg 541 accggcggca aactggttcc cgaacaggtg cggcaggcgt tttacgagac gtatctgtag 601 gtaagaaagg atcaagtcca tgaaatacag cacaagagca gccaccatgg cggacgtgcc 661 ccggctgcgg gagatcgaaa tggcagccat gccccattcc aagtggtaca gcacggaatg 721 cgcgcccctg ttcatcgaac agaagggcca gcagggcgag atggtcgtgg cggagatccc 781 ggagcttccc gcgggtgacc cgaacaaaac cataggcatg ggccagtatt ccgtcatgcc 841 cgacggctcc ggctggctgg aatgcctgcg catcctgccg gaataccaga ggaccggcgc 901 ggggcggcag atctacgaaa gatatcagga gctgtggacc gaaacggatg cgccccacgt 961 ggcgatgttc accggccgca agaacgtggc cagcaaggcc ctgtctgagg tgtacggctt 1021 cgaatacacc ggcgcctacg acgagtacag cctgccgctg gaagggatag aggcggcttg 1081 cccggcgggg tttgaacggg tcacggatct ggagaccgtt gcgaaagccc tggatgcccg 1141 ggaaggggtg ggaaaccaca tcgtcttcaa ccgcacctac ctgcactaca gcgagcccat 1201 ctaccgctgg ctcatcgggc gcggcatggt ctggtccgac ggaaagacgc tgctggtgct 1261 gggcgcccgc atgctgcagg aaagaggctg gtacctggca ttctggtccg atgacccgga 1321 caagtgcctg gccttcgcca tcgcgaagac gaaggaggcc ggcctgcctg cgctgaccgt 1381 gaatttcccg ccggagcgcg aagacttaaa agcatatttt gagagaaaag gcttccatta 1441 cgtctattcc aacatcgtaa tggagctgaa cagacgctga ttttcgtaaa gaaagcgtca 1501 aaatcgaaga taggcctgcg ggcatctgct gattaagata aagacacaac agatcccgac 1561 aggcctttcc gtttcctgat tgaattttgg agatccatca aaaagtttga tggatcacat 1621 aaaaactaaa aaatgggaaa atgcatttaa gaggtggcaa agcgccgcaa aggacttata 1681 ataaaaatag tttatccgtc aacccgattg cagttcagta aaggagatgc agcatggaat 1741 ataagaccga tatccagatc gcacaggagt gcgaaaagaa aaagatcacc gagatcgcaa 1801 aggtggcagg cgtagacgag aagtatctcg agcagtacgg caactacaaa gccaaggtag 1861 attatcagct gctgagagac aaggcagacc agcccgatgg caagctcatc ctcgtaacgg 1921 ccattacgcc gactccggcc ggcgaaggca agaccaccac gtccgtaggc ctcaccgacg 1981 gtctgagaaa gatcggaaag aacgccatcg tggcactgag agaaccctcc ttaggtcctg 2041 tgttcggggt caagggcggc gctgccggcg gcggctatgc ccaggtcgtt cccatg // LOCUS sequence223 2090 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence223 VERSION sequence223 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2090 /mol_type="genomic DNA" /organism="" /note="sequence223" CDS 316..1158 /product="DMT family transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948436.1" /transl_table=11 /codon_start=1 /translation="MVMLIASMAIWGSLGLFRRAIPLPSSVLAFVRGVAGSLFLILFVK ARGGRVNAGMTRKQIAWFGTAGAIMAFNWILLFDAYNYTSVAVATLCYYMMPVFVTLAS ALLFGEKLTARKLLCVAVCVAGMLLVTGVAEGDAPTGSEIRGIVMGLAAAVLYSTVVLM NKKMPGMDAYEKTIVQLIGAAVIMVPYILVTEDVTALSLDGRGALMLFIVAAVHTGIAY ALYFGCMDDLKAQTVAIFSYVDPIVAVLLSAFVLGEPLSALGVLGVVLVLGAAVVSEL" /locus_tag="LOCUS_6220" /note="WP_011948436.1 DMT family transporter (Clostridium botulinum) [pid:36.9%, q_cov:92.9%, s_cov:88.1%, Eval:1.5e-48]" /note="MGA_924" ORIGIN 1 ggctgcggct actgcatgcc ctgcaccgtc ggcatccaga tcaaccagtg cgcgcgcatg 61 tcccagatgg tgagaagagc gccttccgcc tcctggctca acgactattg gcagaaagag 121 atggcgaaga tcgacgaatg cgtggaatgc ggcctctgca agacccgctg cccgtatgag 181 ctggatacgc ccaacctgct gagaaagaac ctggcggact acagagagat cctggcagga 241 aaggtgtccg tctgatcgta agaccggagc atttgcagat catccatgga agacagacaa 301 aaagaaaaac ggtcgatggt catgctcatc gcctccatgg cgatctgggg cagcctcggc 361 ctgttccggc gggccattcc gcttccgtcc tccgtcctcg cattcgtgcg gggcgtggcg 421 gggtcgctgt tcctcatcct gttcgtcaag gcgaggggcg gcagggtaaa cgccggcatg 481 acccgaaaac agatcgcctg gttcggcaca gcgggggcca tcatggcctt caactggatc 541 ctgctgttcg atgcatataa ctatacgtcg gtggcggtcg ccacgctgtg ttattacatg 601 atgccggtgt tcgtaacgct ggcgtcggcg ctgctgttcg gcgagaagct gactgcgaga 661 aaactgctct gcgtcgccgt gtgcgtcgcc ggcatgctgc tggtgacggg cgtcgcggaa 721 ggggatgcgc ccaccggctc cgagatccgg ggcatcgtga tgggactggc tgccgcggtc 781 ctttactcga cggtcgtgct catgaataag aagatgcccg gcatggacgc ctacgaaaag 841 accatcgtgc agctgatcgg tgcggcggtc atcatggtgc cgtacatcct tgtaacggaa 901 gacgtaacgg cgctaagcct ggacggccga ggcgcgctga tgctctttat cgtggcggcc 961 gttcacaccg gtatcgccta cgctctatac tttggctgca tggacgatct gaaggcgcag 1021 accgtcgcca tcttcagtta cgtagacccc atcgtcgcgg tgctgctctc cgccttcgtg 1081 ctgggagaac cgctctccgc cttaggcgta ttgggcgtcg tcctcgtatt gggcgccgcc 1141 gtggtaagcg aactatgaaa gcactcatcg ccatgagcgg cggcgtggat tcctccgtcg 1201 cggctctgct tacaaaagaa tccgggtacg actgcatcgg ctgcaccatg aagctctggg 1261 atctgccgga ggaggatgtg ggtgcggtaa agccttccaa gacctgctgc agcctggacg 1321 atacggagga tgcaagaagc gtcgcctacc ggctgggcat gccgttctat gcgttcaact 1381 acaaggacga attcatggaa aaggtcatct gcccgttcgc cgaaagctac gaacagggca 1441 ggacgcccaa tccctgcgtc gagtgcaacc gcttcttaaa gttcggcaaa ctctacgcaa 1501 gggcgaagga gctgggctgc gaaaagatcg tcacgggtca ctatgcccgg atcgaacagg 1561 gtccggacgg aaaatatctg ctgaagaagg ggctcgatcc ctccaaggat cagagctacg 1621 tactgcattg ccttacccag gagcagctgg cgcatacgct gtttcccctg ggggactata 1681 cgaaggagca ggcgaggagc atcgcggcgg agcacggctt cgtaaacgcg aataagcccg 1741 acagccagga tatctgcttc gtaccggacg gcgactacgc gaaggtcgtg cagcactacg 1801 gaagcggagc agggacggag cctggcgcct ttgtggacct gcagggaaag cccatcggca 1861 cccataaggg cctgatccac tataccatcg gacagcgcaa gggtctgggc aacacctggg 1921 gaaaacctgt atttgtctgc gccatcgacg cggcggccaa taccgtgacc atcggagaca 1981 gcgaagacct gtttgagacc cgggtggaag tgaaggactt caactggatc gcaggcgaag 2041 cgcccaaaga gtccatccgc tgcacggcga agctgcgcta ccggcagaaa // LOCUS sequence224 2082 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence224 VERSION sequence224 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2082 /mol_type="genomic DNA" /organism="" /note="sequence224" misc_feature <1..562 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011389229.1:citrate:proton symporter" /note="WP_011389229.1 citrate:proton symporter (Rhodospirillum rubrum) [pid:50.6%, q_cov:94.6%, s_cov:40.6%, Eval:8.2e-50, partial hit]" /note="MGA_926" /locus_tag="LOCUS_6230" CDS 604..1950 /product="DUF1446 domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011389228.1" /transl_table=11 /codon_start=1 /translation="MRTIRIGSGAGYAGDRLEPSLELIEKGNLDYISYECLAERTIAIG QEAKLKDPKKGYNGLLEYRMEKALPLCWEHKVKLITNMGSANPEAAAEKCVEIAKKHGL TGMKIACVTGDDILPIIGKYDEVEVWENHKPLRELDGKVVSANAYMGVEGIIKALKAGA DVVITGRVADPAIFMAPAIFEFGWDLEDWDKLGKGTAMGHLLECGGQATGGYFMEPGKK DIPDPAHLGFPIAEISEDGSLVITKVEGSGGMVTRDTLKEQICYEIHDPENYITPDVVA NFKHIQFTQEGKDRVRVTGATGKPKTATFKCSIGYKDCFIGDGEISYGGEGCLERAKLA LEIIKERLELVAPGAFDEMKYDIIGCNSLYWNPDNQLPSAPSEVRVRVAGRAKTKAIAD LVPNEVEALYTNGPAGGCGAVKRTRDIVSVASILINRNDVKPEIAVYTV" /locus_tag="LOCUS_6240" /note="WP_011389228.1 DUF1446 domain-containing protein (Rhodospirillum rubrum) [pid:56.5%, q_cov:100.0%, s_cov:100.0%, Eval:1.3e-141]" /note="MGA_927" ORIGIN 1 gaagtccggc ttcgcacccg ctgtcgtctt catggtcttc tacgtcatcg cgaccgtcgt 61 caactatccc gacgttaaga cttccaaggc cagagttgac gcccacgcaa aatcctgcct 121 catgatgtgc tccgtgctgt tcgccgcagg ctgctttacg ggcatcatga agggcaccgg 181 catgatcacc gccatgtccg aagcgctggt ctctatcatc cccgcttctc tgggtaagtt 241 cttcccgctc atcatcggcg tcatctccat gcccgcatcc ctgctgttcg acccggattc 301 cttctactac ggcgttctgc ccgttctggc gaacaccgca gccggcttcg gcgttgccgc 361 tgcagacgta ggccgcgccg ccatcctggg ccagatgacc gtcggtttcc cgatctcccc 421 cctcaccgca tccaccttcc tgctgatcgg tctggccggc gtagacttcg gcgaacacca 481 gaagaagacc atccccgttg cctgggcagt cagtttggta atgctgctcg tcgcactcgt 541 taccggcggc gtacacctgt aacctctgcg cagcttgagt tatagaacga aaggaaatcc 601 atcatgagaa cgatccgcat cggttccggc gccggctatg caggcgacag actggaaccc 661 tccctggaac ttatcgaaaa gggaaatctc gattacatca gctacgagtg cctcgcagag 721 cgcaccatcg ccatcggtca ggaagccaag ctgaaggacc cgaagaaggg ttacaacggc 781 ctgctggaat accgcatgga aaaggctctg cccctgtgct gggagcacaa ggtcaagctc 841 atcaccaaca tgggctccgc taaccccgaa gctgccgctg aaaagtgcgt ggagatcgcc 901 aagaagcacg gtctcaccgg catgaagatc gcctgcgtca ccggcgacga catcctgccc 961 atcatcggca agtacgacga agtcgaagta tgggaaaacc acaagccctt aagagaactg 1021 gacggcaaag tcgtctccgc caacgcctac atgggcgtcg aaggcatcat caaggccctg 1081 aaggcaggcg ccgacgtggt catcaccggc cgcgtcgcag accccgccat cttcatggct 1141 cccgccatct tcgaattcgg ctgggatctg gaagactggg ataagctggg caagggcact 1201 gccatgggcc acctgctgga atgcggcggc caggcgaccg gcggctactt catggagccg 1261 ggcaagaagg acatccccga tcccgcacat ctgggcttcc ccatcgccga gatctccgag 1321 gacggttccc tcgtcatcac caaggtcgaa ggctccggcg gcatggtcac cagagacacc 1381 ctgaaggaac agatctgcta cgagatccac gatcccgaaa actacatcac ccccgacgtc 1441 gtcgcaaact ttaagcacat ccagtttacc caggagggta aggaccgtgt acgggtcacc 1501 ggcgctaccg gcaagcccaa gacggccacc ttcaagtgct ccatcggcta caaggactgc 1561 tttatcggtg acggcgagat ctcttacggc ggcgaaggct gcctcgaaag agccaagctg 1621 gccctggaga tcatcaagga aagactcgaa ctggtcgctc ccggcgcgtt cgacgagatg 1681 aagtacgaca tcatcggctg caactccctc tactggaatc ccgacaacca gctgcccagc 1741 gcacccagcg aagtccgcgt aagagtcgca ggcagagcca agacgaaggc catcgcggat 1801 ctggtaccca acgaagtgga agctctgtac accaacggtc ctgcaggcgg ctgcggcgcg 1861 gtcaagcgca cccgcgacat cgtctccgtt gcatccatcc tgatcaacag aaacgacgtt 1921 aagcccgaga tcgcagtata taccgtctaa ggaaaggagg acgcagaaca atgaaacttt 1981 atgagatcgc acattcccgc acaggcgata agggaaatat ctccaacctg tccctcattc 2041 cctacgatga gaaggacttc gaaatgctca aggagaaggt ga // LOCUS sequence225 2078 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence225 VERSION sequence225 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2078 /mol_type="genomic DNA" /organism="" /note="sequence225" CDS 215..694 /product="pantetheine-phosphate adenylyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003728846.1" /transl_table=11 /codon_start=1 /translation="MRTAIFAGSFDPIHNGHLDIITRAAKMYDEFTVAVTVNLSKKSLF TPEERMALIEELTADLPNVKVVRIDGLRADYVNAHAFTADVRSLRNTADFNYEMPIAQG SAYLYNNTETVFLFTDPKWSFLSSTMIKEVASLGGDISAWVPANVLHSILEKYRK" /locus_tag="LOCUS_6250" /gene="coaD" /EC_number="2.7.7.3" /note="WP_003728846.1 pantetheine-phosphate adenylyltransferase (Listeria monocytogenes) [pid:51.0%, q_cov:98.7%, s_cov:98.1%, Eval:3.1e-35]" /note="MGA_930" CDS 705..1232 /product="vacuolar-type H+-ATPase subunit H" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011392454.1" /transl_table=11 /codon_start=1 /translation="MKVLELLDELDEIIEVASSVPVVRKVMVDPNEVTEIVKEIRLELP DEIQQAQWIKNERQRILDEAKAEYESILNEARQKADALVENDEITVKAKARADEILRIA QENSQVMKMSILDYTDSMLYNLQEKVDQMYATYFTDMYDDLQATFDKINTNIATSRNEV KEQIYKSQVEKD" /locus_tag="LOCUS_6260" /note="WP_011392454.1 vacuolar-type H+-ATPase subunit H (Moorella thermoacetica) [pid:30.4%, q_cov:77.1%, s_cov:79.4%, Eval:1.3e-19]" /note="MGA_931" ORIGIN 1 atatcttctt cctggatccg ccctatgcgg acaagtccat ccccgatgcg ctgaaggcca 61 tcgacgaagc cggaaactgc cggccgggca cggtcgtagt ctgcgaacac cgtcataaag 121 atgttctccc ggaacagatg cacggcttta cctgcatcaa ggacagacgc tacggtgcta 181 ccggggtcac catttacgaa agagacaaag aggaatgaga acagccatat ttgccggatc 241 cttcgatccg atccacaacg gccatctgga catcattacc cgggctgcga agatgtacga 301 cgaatttacg gtagccgtta ccgtcaatct gtctaaaaaa tcgcttttta cgcccgaaga 361 gaggatggct ctcatcgagg aactgacggc ggatctgccc aacgtaaagg tcgtccgcat 421 cgacggtctg cgggcggact acgtgaacgc ccatgccttt acggcggacg tgcgcagcct 481 gcgcaacacg gcggatttta attacgaaat gcctatagcg cagggaagcg cttatttgta 541 taataatacg gagactgtgt tcctgttcac cgacccgaag tggtcgttcc tgagcagcac 601 catgataaag gaagtggcca gcctgggcgg cgacatcagc gcctgggtgc cggccaacgt 661 tttgcatagc attttggaaa aataccggaa gtagggggta acacatgaaa gttttggaat 721 tactggacga actggacgag atcatcgaag tcgcatcttc cgttcccgtc gtacgcaagg 781 ttatggtcga tcccaacgaa gtaacggaga tcgtcaagga gatccgtctg gagcttcccg 841 atgagatcca gcaggcgcag tggatcaaga acgagagaca gcgcatcctg gacgaagcca 901 aggccgagta cgaatccatc ttaaacgaag cgcgccaaaa ggcagacgct ctggtggaaa 961 acgacgagat caccgtaaag gcaaaggcaa gagccgacga gatcctgcgc atcgcacagg 1021 aaaactccca ggtgatgaag atgtccatcc tggactacac cgactccatg ctgtacaacc 1081 tgcaggagaa ggtagaccag atgtacgcca cgtactttac cgacatgtac gacgatctgc 1141 aggcgacgtt cgacaagatc aacaccaaca tcgccacctc cagaaacgag gtcaaggagc 1201 agatctacaa gtcccaggtg gagaaggact gatatgtccg tcgcaggcat catcgccgaa 1261 ttcgacccgt tccacaacgg gcaccaatat ctgatcgata cggtccgcag agaactttct 1321 ccccgggccg ttgtttgcgt gatgagcgga aactttacgc agcggggcga accggctatc 1381 ctggacaagt ttacgagggc gcagctggcc ataaagggcg gcgccgacct cgtcgtggaa 1441 ctgccggtgt gctgcgcggt gaacgctgcc agggaattcg ccttcggcgg cgtgcgcacg 1501 ctgcatctgc tgggctttgt gacccacctc gccttcggct cggaaacagg ggacgttaaa 1561 ctgctggaac atgccgctga actggctcta aaagaaaacg atgcgttccg caaagcgctg 1621 aaggggcaga tggaagctgg gcggccctac ggcactgcct atgcccgggc tctgaaagcc 1681 gttctgggac ccgagatcgc cgatttccag gactttccgg catcgaacga tatcctggcc 1741 ctcgaatacg taaaacagct gaaacagggc atttcggata tgcagcccta cgccgtaaag 1801 cgagccggag cagggcataa ggacacggag atcggcaagg tctattccag cggcgaggcg 1861 atccgcatga tgcttaccta cgagacagat ccggaagaga tccgggacga aatgcccggt 1921 tttacggtcg aagcgctgga aaacttcaat ttcctgccgg acatggaaga ccgtatgctg 1981 gatctgctgc gctaccgcat tccgcagctg ccgcttgccg ccatcatgag tgcccccggc 2041 gtgtccgaag ggctggagaa cgtcgtaaag cgggagat // LOCUS sequence226 2077 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence226 VERSION sequence226 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2077 /mol_type="genomic DNA" /organism="" /note="sequence226" misc_feature <1..990 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005816469.1:tRNA (N(6)-L-threonylcarbamoyladenosine(37)-C(2))-methylthiotran sferase MtaB" /note="WP_005816469.1 tRNA (N(6)-L-threonylcarbamoyladenosine(37)-C(2))-methylthiotran sferase MtaB (Desulfitobacterium hafniense) [pid:43.1%, q_cov:83.3%, s_cov:60.1%, Eval:1.4e-56, partial hit]" /note="MGA_933" /locus_tag="LOCUS_6270" CDS 1019..1360 /product="HIT domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010964599.1" /transl_table=11 /codon_start=1 /translation="MSDCLFCKIIAGEIPSNKVYEDDEILAFNDVAPQAPVHFLIVPKK HMASLDDTTDEDAALLAHIMLKIKDIAKDLGLENGYRVVINTGEDGMQSVKHLHVHVLG KRRLLWPPG" /locus_tag="LOCUS_6280" /note="WP_010964599.1 HIT domain-containing protein (Clostridium) [pid:54.4%, q_cov:100.0%, s_cov:100.0%, Eval:3.6e-35]" /note="MGA_934" ORIGIN 1 gatcccgtcg tgcatcagac cgcatacgag cagcacgagg gcattaccgg catggagacg 61 aagacgcgcg ccctcatcaa gatccaggag ggctgcaacc ggttctgctc ctactgcgtc 121 atcccccacg ccagaggaca ggtgcgcagc cgcagcgccg ccgccatcaa aaaagaggcg 181 gaatcgctcg tttccgcagg ttataaggaa attaccctta cgggcatcaa tacggcgctc 241 tacggggcgg aaaagggctt tacagacgat ctgaacacgg gactggacgg tgtggagatc 301 atcgtaaagg cgctgagcga cattcccggc gatttcctca tccggctggg atccatggag 361 ccgaccgtca ttgacgcgga ctatatacag cggctgttcc gctacgaaaa actggcgcat 421 cacgtgcacc tgtccatcca gagcggatcc gatgccgtca tcgcgcggat gaaccgccat 481 tataccgccg cagactatct ggagatcgtc cggcgctgcc gggacttcga tcctctctac 541 ggcattacga cggatatcat tacgggtttt cccggagaga cggaggctga tttcgaagcc 601 agcaaggaga tcgtaaggca ggtaaactat ctgcatgtcc attgcttccc ctacagccgc 661 aggatgtata cgccggcggc ggacatgccg gatcagatcg caccgcccgt caagaaacag 721 cgtaacaagg acctcatcgc tgttgccgaa gatgtctcga aacagttccg ttcttccatg 781 atcggctccg tgcagcgcgt gctggcggag gaggccgggg aaacggagca gggcaggctc 841 tggaagggtc actgcagcaa tttctgcacc gtctatttcc gcgatccgtc catgaccgat 901 ccgtcccgcg ccgcttccct ggaaaaccag tggatcgacg taaaagtcga agcggtctac 961 gaggacggcg ttatgggaaa tatgctataa tagatcatta ctgaaaggag gagatcctat 1021 gtccgattgc ttattctgta agatcatagc gggggagatc ccatccaata aggtctacga 1081 agacgacgag atcctggcct tcaacgacgt tgcgccccag gcgcccgtgc atttcctcat 1141 cgttcccaag aagcacatgg cttccctgga cgacacgacg gacgaagacg cggcgctgct 1201 ggctcacatc atgctgaaga tcaaggatat cgccaaagac cttggcctgg agaacggata 1261 ccgcgtggtc atcaacaccg gcgaggacgg catgcagtcc gtcaagcatc tgcacgtcca 1321 cgtcctcggc aagagaagac ttctctggcc tcccggctga tgcattttca ttgacaacca 1381 caggcagtag tatataattt tccttgtatg tcactttgta tctgacatgc aaaaggagag 1441 aaagattatg gcagaagaaa tcaaagtcaa caaattcgac gacgaagaat acagacagac 1501 ttattggcat tcctgctccc acgtcatggc gcaggcagtc aagagactgt ggcctgaagt 1561 aaagctggcc atcggtcctt ccatcaagga aggctggtac tacgacatgc tggctccgtt 1621 tgcgtttacg ccggaacacc tggaaaagat cgaagcggag atgaagaaga tctgcaagga 1681 gaacctgaag atcgagcgtt tcgaactgcc cagagacgaa gctatcaaat tcatggaaga 1741 aaaggaagag ccgttcaagg tagagctcat caacgacctg cctgagggcg aacccatctc 1801 tttctataag cagggcgaat tcaccgacct gtgtgccggt ccccatctgg acttcaccgg 1861 ccgtatcaag ggcaacgcca ttaagctgct tacggcaaat gccgcctact ggagaggaga 1921 ctccaacaga gagactctgc agcgcatcta cggcatagct ttcccgaaaa aggatgagct 1981 tgacgcctac cttcagcgca ttgaggaggc gaaacgccgc gaccacagaa agctcggccg 2041 cgatctcggc ctgttcgctt tccgcgatga agctccc // LOCUS sequence227 2068 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence227 VERSION sequence227 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2068 /mol_type="genomic DNA" /organism="" /note="sequence227" ORIGIN 1 aaagcggaat gaaggcgttg aacacgttgg agccgaaggc cacccattcc aggatgcgga 61 tggcttcgtg gcggtccgga cggatctggg tgagcgaaag gaaattgttc cggttgaccc 121 cgatgggccg cagttcgccc ttgtgcaggg gttcgctgct ggaggcgtag ggatcataca 181 tggtgccctg atagtgggaa gacagcacgt actttacgtc ttctaccgtg atcttgcgct 241 ccggcgccat gcagaagggg atgttgtcgg agaagggcgt aaagtccgca tccgggccgt 301 cccagaaata tgtgttcttg ttgaaatagc gctcaatgta ccaggcgcgg ggcgtgttgt 361 agacgtggtc cgcatcgctg tggctgccga aagccgtgcg ggcgtcgaag ggcatgcctt 421 cgaaactgag gtccaggtgg ttttctgcaa taaactcgcg gatgtctgcg ctggccatgt 481 gctccttttg ttctccgagg gcatcgtcca ggtcgaattc gtccaggttg aagtagttgg 541 gtgctaccgc atagcagtcg tcgggcaccc ggcgggcgat ccagtgatgg ccgccgatgg 601 tctccagcca ccagacttca tcgatgtcgg agaaggcgat gccgttcatc tcgtaggtgc 661 cgtaggtctc cagcagcatc cccagccgct ttacgccttc ccgggcgctg cggatatagg 721 gcagggtgat cgttacgata tcctcctcgc cgatgccttc ctttaccatc ggatcgccgg 781 agagcacccg ctcgttggag gtgagggtct ctgtggcggt catcgaaacg cctgcggtgt 841 tgaccccggc agcgtaccag ttgccttcgg agggatctcc gttgggcatg gcggtgtagc 901 gcatgggatc gtccgggaga tcgatcttta ccttagagat gacggattcg taatgccggg 961 gctggtccgc cggctgtacg acgatatgtt tcttggaatt gaacgagagt ccgccggaat 1021 cttcgtttct tgcgatcatg gtggacccgt cgaaggttgc tttctttcct actaaaagtg 1081 tggtgcaggg catggtcttc ctccttttac ttctgatgat tttagtgtag cacaaatttt 1141 ttaaaaatat tttccgtgac cccaaaaatc ccaaaacgtc ctccgaaata gatagtgcaa 1201 gaggggatgg gaccccgaag agatcggaag ataatcagaa gataaggaga aataccatga 1261 ataagatcgt aaagaaagca gccaccataa cactcgcggc cagcatgatc gctgcacccg 1321 taagcgtctt cgcagacgac gcgcagcaag cgcagagcgg cagctccagc tggatctcct 1381 ggttcggaca aaagatccag cagatcctgc agggcggaat gcccagccag caagctccga 1441 tgggaacggc gcaaaacgca agcgaggcgt ccgagatcaa gaccagcacg ctggcgagca 1501 acacagcgga agccctgacg gtcgatacca agaacgccga gaccatcgtg atgagcgatt 1561 ccaataatca agtgaccatc agcgaggcgg gcacctatat catcaccggc acctgcagcg 1621 acggcaacat caaggtaaag aaagggaccc aggacgtggt cctcgtgctg aaagatctta 1681 cactctccag caccaccggc gcaacgcttt ccgtcaacaa gggggccgag gccaagatcg 1741 tggtcgaagg caccgttacg ctcaacgata acgaagatac cgcagacgaa gaactggata 1801 cctacgatgg cgcggtcatc aaggcgaagg ccggcagcgc agtggtcctc accggcaccg 1861 gtaccctgaa cgtcaacggc aacgccgagc acggcatcaa ggtgagcagc accgatgcag 1921 acgatatcgc agacggctac agcgacgctt ccttcatcgt cgacggttcc ctgaagatca 1981 acatcacctc ggtggacgac ggcatgaatt ccggtacgga tctgaccatc aagagcggaa 2041 ccattaccgt aagcgcaggc gatgacgg // LOCUS sequence228 2068 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence228 VERSION sequence228 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2068 /mol_type="genomic DNA" /organism="" /note="sequence228" misc_feature complement(755..>2068) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002680008.1:FAD-dependent oxidoreductase" /note="WP_002680008.1 FAD-dependent oxidoreductase (Treponema denticola) [pid:51.5%, q_cov:97.5%, s_cov:46.5%, Eval:1.7e-122, partial hit]" /note="MGA_939" /locus_tag="LOCUS_6290" ORIGIN 1 agtcggcgaa gtcgcccacg ccgatgcacc agtactgctc gatgtcgccg gagccctcgc 61 cccggatgcg ctgctgcttc cggcaggagc agatgcctac gccgatctgg ccctcgtact 121 ttttcagcca gtggctcagg tgctcgatat ccagggattc gcactcggcg gggatggcct 181 gctccacggg gatcacgtgc atgccgatgc cgccaccgcc gggaggcacc atctgggtga 241 tgcccgccag gggcagatag gtcatccgct cgaaaaagtc cgtcacatgg ggcgtgaccg 301 gggagatctc cggccgcatg accatgatct ccgcgctgcc gggcacgaac atatccagca 361 cccagcgctt ctcatggttg gggttcttgc cgtccagatt ttcgaaatgc cactccacca 421 gactggcctg gcacagggcc tccagcacca gcgcaaggcg ctcgtcatcc agaccggaca 481 gggccttcaa ctgggcgaag gtcttgggct tgcgcttgcc catttgcagg gccacgtcca 541 gacagtcgtc cgccacgtcc ttgccgtagc ggcgctcggc gtactggagg ccgcagtcga 601 tgccccaata ctcgggggac tcggtggaca tcttctccag gccaaggaga atctccttgc 661 ggtcggtgat gattttacct aatttgaaaa ttttttcgtc gcgggtcatt tggtgctctc 721 ctttcaaaat ggggaaattt ggctcgggaa aaaattactg ctccgtggga taatcggact 781 tgccggtgat ctttttcttg agaatcttca tgccgcgttt cagggcgtag ggggccacca 841 ccttcatcat ctcctcggcg gtgtgcatgt cgctggcggc gggcaagtca cgggtgaggt 901 ggatggcgtc gaactggcag cgggtggtgc acaggccgca gccgacgcac tggttgaggt 961 cgacggtagt agcgccgcat tttaagcagc ggccagcttc gatgcgcacc tgctcttccg 1021 tgaggggcag gcgcagatcg tcgaacgtcg cggctgcttc gccgggctta aggccgggca 1081 tctggcgctg ggcgttgtcg tagctctcca cccggatgtc gtctctgtcc agttcgatga 1141 attcccgcag gtcgcgtccg atggtgaggg actggccggg atggacgaac cggttgatgg 1201 agaccgcgcc ctggcggcct gccgcgatgg cgtcgatgac gaacttctga ccggtgtagg 1261 cgtcgccgcc gacgaagata tcgggctcgc cggtctgata ggtgacgggg tctgccttca 1321 cggtaccgtt tttgttgaat tccacgttcg tgccttcgag cagcttgccc caatcgggct 1381 tctgtccgat gcagtacagc acgttttcgc atgcggcggt ctcggtgacc gcgtcgtcga 1441 actgcggatc gaagcggcct tccgcgttct ttacggacag gcacttgcgg aagcggatgg 1501 ctttgcattt tccgtcttct gcgacgatct ccgtctggcc ccagccggca tggatgcgga 1561 tgccttcttc ttcgcattct ctgcggtcat ccggccccat gggcatgtcg tcgtaactct 1621 ccaggcagta gagatccacg ctttctgcgc cggctctcag cgccgttctt gcgatatccg 1681 ccgcgatgtt gccgccaccg ataacgacgg tcttgcccgc gatgcggatg ctctcgtcct 1741 ggttgatttc ccgggcgaat tcgatgccgg cgcgaacgcc ctgcgcgtct tctccgggga 1801 tgcccatcct gccgccgctc tgcagaccgg tggcgagata gaaggcttta tagccctgtt 1861 ctctcagctg ctgaatggta atgtccttgc cgatctccac gccgcagcgg atctcgacgc 1921 ccatcttctc gatgatgtcg atctcgcctt ggatgacttt cttttccagg cggaagttgg 1981 ggatgccgtt catcatcatg ccgccgggcc gcttctcgcg gtcgaacacc gtaacggggt 2041 agccttcctt gcgcagataa tacgcggc // LOCUS sequence229 2066 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence229 VERSION sequence229 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2066 /mol_type="genomic DNA" /organism="" /note="sequence229" CDS 946..1545 /product="TetR/AcrR family transcriptional regulator" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010965893.1" /transl_table=11 /codon_start=1 /translation="MKRSQNNTKGKIVSAAWKLFYEQGYDKTTVDDIVEASGTSKGSFY HYFESKESLPASLSYLFDEKYEELTETMDPSLGVIEKLVFINQELFLMIENTVSIDILS RLFASQLVSGSERSLLDPTRTYYKLLRQIVIEGQQQGLFREEFTTLDVTRAYAVFERGL MYDWCISGGNYSLAQYSAQLLPQFLMGFCKESVDSK" /locus_tag="LOCUS_6300" /note="WP_010965893.1 TetR/AcrR family transcriptional regulator (Clostridium acetobutylicum) [pid:29.1%, q_cov:89.4%, s_cov:88.7%, Eval:6.2e-17]" /note="MGA_941" ORIGIN 1 aaggggacgt tgttcttgac gcagctgtag atgatgccgt tgctgatgcc ttcgcccttg 61 attaacgcgg ggatggatcc gtaggtgttg atggcgttga tggtctccag atggttgtag 121 tgacccatgt agtggagctt ctggttgcgg atgtcgcagc ccagcgccgt gcccagatag 181 gcgccttcca aatcgtgggt ggcaagcgca ttgccggcca gcagcgcctg gcagtagcct 241 tctgcgatga gcttagacat gatctccctt gccgttacgt cgaaactgca ggcggggccg 301 agcacccaga ccacgtagcc gccgtgttct ttttcgtatt tcagcaggtt caccaggcgc 361 tcgtagtcgt aggtaaaact ggtctcccgg ttgcggctgc ggcggaagga gaagacgttc 421 tcggcgcttt cctcctcgtc gctggtaaag cagtccgcat gcacgtagat gccttcgctg 481 ccgtcctcgc tgcggccggt gaccacgaga tcgttctctt tgatgttgcg gaattccacg 541 actttgatct ccccgtccag ccagaccgcc acggcgtcca tgcgggtatc cttggccagg 601 tgccaggtgc cgtttatctt aaagtattca gggtagatgg acgtggcgtg gaagcctttc 661 ggcgccgcct tggcgtgggg cgcctttacc agcgtgcagt ccggtgcctc cgcgagaaat 721 ttctgtgtga aatcgggttc gatgtaggtg ttgagttgaa acatgatgcg attcctttcc 781 gtaattgtac tgcattctaa catggaaaga gaaagaacaa aatacggaat agagtttaga 841 ctaaaaaata gaattgtccg gtattgaatt tcaaaaacaa ttgaaaattc aatcttttat 901 tgttaaacta aattatagac tgagataagg acgaaaaaat aaactttgaa aagatcgcag 961 aacaatacaa aagggaagat cgtttccgcc gcgtggaagc tgttttacga acagggctac 1021 gacaaaacga cggtggatga catcgtagag gcctcgggca catccaaggg ctccttttat 1081 cattacttcg agagcaagga atcgctgcct gcctcccttt cgtatctgtt cgacgagaag 1141 tacgaggaac tgacggagac gatggacccc tctttagggg tcatcgaaaa actggtgttc 1201 atcaaccagg aactgttcct gatgatcgaa aacacggtct ccatcgacat cctcagccgc 1261 ctgttcgcct cccagctggt gtccggcagc gaacgcagcc tgctggatcc gacgcgcacc 1321 tactataagc tgctgcggca gatcgtcatc gaaggccagc agcaggggct gttccgggag 1381 gaatttacga cgctggacgt cacccgggcc tacgccgtct tcgagcgggg cctgatgtac 1441 gactggtgca tctccggcgg caattattcg ctggcccagt attcggccca gctgttaccg 1501 cagttcttaa tgggattctg caaagaatcg gtcgatagca agtaaaggag taccccatga 1561 gtgaatttgg cttaagaaaa gtcaaaatgc gcaagttcga gcacgaggtc aaggaaaagg 1621 acatcatcgc cgccatcctg gatacggcgc ccttcgtggt cgtgtccgcg acggatgagg 1681 acggcctgcc ttattccgtg cctctctgtt acggtgcggt ctgcgatgag gaaggcgtca 1741 agatctacat ccactccgcc agagaaggca gaaaggtgga tctgtggcgc aaggagccca 1801 tcgtcacctg cgtcgccgcc tatctctaca acaacacgga cccggaattc tattaccgcg 1861 acgtgttcca cgactaccgc tgcgttatgc tgcgcggccg gctgacccag gtaaagcggg 1921 aagagttccg cagcaagcac ggcgaagcgg tgcaggccat gctgcgccac tacggcagag 1981 gcccctccca tttctccgtg cctcactacg gctggatgga cgtgttcgtg gtcacctgcc 2041 cctgggagga cgtctcctgc aaggcc // LOCUS sequence230 2061 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence230 VERSION sequence230 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2061 /mol_type="genomic DNA" /organism="" /note="sequence230" misc_feature <1..664 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003384686.1:tRNA (guanosine(37)-N1)-methyltransferase TrmD" /note="WP_003384686.1 tRNA (guanosine(37)-N1)-methyltransferase TrmD (Clostridium botulinum) [pid:52.1%, q_cov:95.5%, s_cov:85.4%, Eval:2.9e-61]" /note="MGA_943" /locus_tag="LOCUS_6310" CDS 693..1829 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MNRRGKRTAGVAAGIVFLAVCAALYAYIYVVPSVTGALTPTAIAQ YGEMQTLNPASCIVFRSEKVVKAEQSGNAGYYVDEGAKTRLGVKVADIYPADGSGTGYF METTGIVSYWCDGYEETFTPETTENITLDSFPSEEEGAEPPAQPESVRTGTKQEGDPLY KIVTGDTWYFAFRIEDQYMDRYAMGQRVDVVLPNGTVDATVTRMTQYEDYWVVIAYTNR YYEGFDQLRYCDVTIVTESNDGLIIPTTARAMQEQEDGSMLEGVYVKNIRGDYVFRRIL VLAEDENTGETLVEPDSFYEKDETGESVLVGSIGVYDEVLRDAGGLSDVTVTDEIEEPE EEEIVFEWEKNKEETPEEPVEEPQETIPEGPEEETPQD" /locus_tag="LOCUS_6320" /note="MGA_944" ORIGIN 1 gctggagctg gacatcgtca atatccggga ctatacgctg gacaaacaca gaaagaccga 61 cgacacgccc ttcggcggcg gcgccggcat ggtgatgaca ccgcagcctg cgttcgacgc 121 actgcgcagc ctcggggcgc agggtaagcg catcctgtac atgtccccca gaggccccat 181 cctggaccag aacctggccg aagacctggc gtcggaggag gagtttttca ttctgtgcgg 241 tcattacgaa ggggtggatg aacgcatcct caaagcctgg aacatggagg aggtctccat 301 aggcgattat atcctgacgg gcggcgaact ggctgccatg gtcctcgtcg actgcgtgtc 361 gcggctcgtt cccggcgtgt tgggaagcgg cgattcgctg tccgaggaat ccatctacag 421 cggcctgctg gaatatcccc agtacacgaa gccccgcagc tacgagggga tggacgtgcc 481 cgaggtgctt ttcaacggca atcacaagct catccacctg tggcagtacg aacagtccct 541 gttgctgacc gcaaagagga ggccggatct gttcgcgcgt tacgtgcagt cgggcccgga 601 cctgacgaag gacgaaaaaa agatcctgga aaaagttatg cgcgaaacac aaagtattga 661 atagagcatt gaaagatgct acaatatttt gtatgaatag aaggggcaaa aggactgcgg 721 gcgtcgcggc gggcatcgtt ttcctcgccg tctgcgccgc attatatgca tatatctacg 781 tcgttccctc tgtcaccggg gcgctcaccc cgacagccat cgcgcagtat ggggagatgc 841 agacgctcaa tccggccagc tgcatcgtgt tccgcagcga aaaggtggta aaagccgaac 901 agagcgggaa cgccggttat tatgttgacg aaggggcgaa gacccgtctc ggggtcaaag 961 tcgccgatat ctacccggca gacggttccg gtaccggcta tttcatggag accaccggca 1021 tcgtaagcta ctggtgcgac ggatacgagg agacgtttac gccggaaacg accgaaaaca 1081 tcacgctgga ttcgttcccg tccgaagagg agggcgcgga gccgccggct cagccggaat 1141 cggtgcgcac cggaacgaag caggaaggcg atcccttata taagatcgtc accggcgaca 1201 cctggtattt cgcattccgc atcgaagacc agtacatgga ccgctatgcc atgggtcagc 1261 gggtcgatgt cgtgctgccg aacggtaccg tcgatgcgac ggtcacccgc atgacccaat 1321 acgaagacta ttgggtggtg atcgcttaca cgaaccgcta ttacgaaggc ttcgaccagc 1381 tccgttactg cgacgttacg atcgttacgg agtccaacga cggcctcatc atcccgacga 1441 cagccagggc catgcaggaa caggaagacg gctcgatgct ggagggtgtc tacgtcaaga 1501 atatccgcgg cgattacgtc ttccggcgca ttctggtgct ggcggaggac gagaacaccg 1561 gcgagaccct ggtggaaccg gacagcttct acgagaagga cgagacaggg gagagcgttc 1621 tcgtcggctc catcggcgta tacgacgaag tgcttcgcga cgccggcgga ctgagcgacg 1681 ttaccgtaac ggacgagatc gaagagcccg aagaggaaga gatcgtgttc gagtgggaaa 1741 agaacaaaga ggagacgccc gaagagcccg tggaagagcc tcaggaaacg attccggaag 1801 gacccgaaga agagacgcct caggattaga ccgggaggga tctatgagca ttactcagaa 1861 tatcgcggag atccgcagca gaatggctgc agccgccgtc cgcagcggca gaaagccgga 1921 ggacatcctg ctgatcgccg ttacgaagct gcacgagccg gacgagatcg aagaagcgct 1981 ggcagcaggg ataacggata ttgcagaaaa taaggtgcag gagatccaga agaaattcga 2041 ccagatccac agccctgcga a // LOCUS sequence231 2050 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence231 VERSION sequence231 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2050 /mol_type="genomic DNA" /organism="" /note="sequence231" CDS complement(179..982) /product="MBL fold metallo-hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003435698.1" /transl_table=11 /codon_start=1 /translation="MNLAICSLASGSSGNCYVIRGGDTFVLVDAGISGKQIRERLSAIG LEPSRLSAILLTHSHSDHVKGLAAVLKTTDACLFTNEATAADACAGLPAERVKFFETGD GFDLGELQVHTFPVSHDTADPVGFTFLRGGKQISIVTDTGIVTRPIYEQIRGADILVLE SNHDENILRMGRYPWFLKQRILGEEGHLSNEAAAKALAAALEEERDAQAERQHTVLLAH LSQENNFPEMALTTVNNILEERGLLRSDLKIRVLPRTQQSPVYTV" /locus_tag="LOCUS_6330" /note="WP_003435698.1 MBL fold metallo-hydrolase (Clostridioides difficile) [pid:38.4%, q_cov:98.5%, s_cov:98.5%, Eval:2.2e-46]" /note="MGA_947" CDS complement(1064..1597) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDWSKAKNIIIAVLVAANLLMGINLLSRSAGARQQIAQASEESIA FLEQQGMSFETDVPKKTEKLPVLFLRLQRAGELSAPEEYKGYPIVVQGSQIGFEIAGSG QQAAETMPAAEALLKLYAQLSGTESVKGRTVEAIDLVYLLSPDDTSYAAQDTASPAWRI RLSGHTYYIDAYEE" /locus_tag="LOCUS_6340" /note="MGA_948" CDS complement(1607..2050) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLCSAVESGSGRSKVYTFGFAQMLGGVKLLSEDGPAIIVTVSGGE VSYYRRAVAKAATATAETQPAAEAANVIAGNSHLIYSVLTGNVLSANSDEEFAYVADHL KDAYIAYVVTEDSLRPAWVVATKEDALFFFGLYDALPLGFTRE" /locus_tag="LOCUS_6350" /note="MGA_949" ORIGIN 1 gcttccgagg tcctgccgct gccagccgcc gcctcgatcc agcccttatc taccggaaag 61 ttgtaggcgt aggctccccc gaacccgcag acgaatgcga tcgccgcgac cagaaggatc 121 gcgaccagct gtccaattcc ctttttcatg tttgtccctt ctttcctctg atgtctttct 181 agaccgtata gaccgggctc tgctgcgttc tcggcagcac ccggatcttc aggtcggagc 241 ggagcaggcc ccgctcttcc agaatgttgt tgactgtggt gagcgccatt tccggaaaat 301 tgttctcctg gctgaggtga gccagcagca ccgtgtgctg ccgttccgcc tgcgcatctc 361 tctcttcctc cagcgccgcg gccagcgctt tcgccgccgc ctcgttggac agatggccct 421 cttctcccag gatcctctgc ttgaggaacc aggggtagcg gcccatgcgc aggatgttct 481 catcgtggtt gctttccagc accagaatat ccgcgccccg gatctgttcg tagatgggcc 541 gggtcacgat gccggtgtcc gtgacgatgg agatctgctt tccccctctc aaaaaagtga 601 accccacagg gtccgccgtg tcgtgagata ccgggaatgt gtgcacctgc agttcgccca 661 gatcgaagcc gtcgcccgtc tcaaagaact ttacgcgttc cgcaggcaga cctgcgcagg 721 catccgccgc tgtagcttcg ttggtgaaca ggcaggcgtc cgtcgtcttg aggaccgccg 781 ccagtccttt tacgtgatcg ctgtggctgt gggtgagcag gatggccgac agccgggagg 841 gttcgagccc tatggccgat aagcgttccc ggatctgttt gccggagatc cctgcgtcca 901 cgaggacaaa ggtgtcgccg ccgcggatca cgtaacagtt tccgctgctc ccgcttgcca 961 gggagcatat ggctaaattc attctttctg attactcctg gataatagtc gggaaatgtg 1021 acaaaactgt gtcgattccc gcacgaaaat ttgtaaattt tatctattct tcgtaggcgt 1081 ctatgtaata cgtgtgcccg gacagccgga tgcgccaggc agggctcgcc gtatcctggg 1141 ccgcatagga cgtgtcgtcc ggggacagca gatacacgag gtcgatggcc tccaccgttc 1201 tgccctttac gctttccgtt ccgctcagct gggcgtacag cttgagcagc gcttccgccg 1261 caggcatcgt ttccgccgcc tgctggccgg accctgcgat ctcaaaaccg atctggctgc 1321 cctgcaccac gatgggatag cccttgtatt cttcgggggc gctcagttcg cctgcccgct 1381 gcaggcgcag gaacagaacg ggcagtttct ccgtcttttt gggaacgtcc gtctcaaacg 1441 acatgccctg ctgctcgagg aaggcgatgg attcctccga cgcctgggcg atctgctgcc 1501 gggcgcccgc cgaacgggac agaaggttga tccccatcag cagattcgcc gccaccagca 1561 ctgcgataat gatgttcttc gctttcgacc agtccatgcc gcacctctac tctctcgtaa 1621 agcccagcgg cagcgcgtcg tacagcccga agaagaacag cgcgtcctcc ttcgtcgcga 1681 cgacccatgc cggccttaaa ctgtcttccg ttacgacgta ggcgatgtac gcgtccttca 1741 ggtgatccgc cacataggcg aattcctcgt cggagtttgc agaaagcacg ttgcccgtca 1801 gcacgctgta gatcagatgg ctgttgcccg cgatcacgtt agccgcttcc gccgccggct 1861 gcgtttccgc cgttgccgtt gcggcttttg ccacagcgcg tctgtaatag ctgacttcgc 1921 cgccggacac cgttacgatg atggccggcc cgtcttcgct gaggagcttg acgccgccca 1981 gcatctgcgc gaacccgaag gtatagacct tgcttctgcc gctgccggat tccacggcgc 2041 tgcagagcac // LOCUS sequence232 2040 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence232 VERSION sequence232 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2040 /mol_type="genomic DNA" /organism="" /note="sequence232" ORIGIN 1 ctgctgcccg acaacccggg ctataaactg ttcgactact ttgtcgacaa ctgcagatga 61 tcgcaaggcc cgctgcggcg ggtctttttc tatggttgaa tcgaaggcct aaatactata 121 taatgtggtt gagtgttttt gcgtgcacaa aatcagggat tttaccatat attaaaagga 181 gagggaaaca tgagcactgt catcaaacgg aacggtcagg aagtcgtctt cgacccgtcc 241 aagatccaga tcgccatcga gaaggcgatg caggagaccc gtttaggggt agacgttgga 301 ctgtccgcgg acatcgcgca gcggatcgcc gcgcaggtgg agcggtcgca gcagaacgtc 361 cacgtggaag atctgcagga cctggtggag gacttcctga tggccagcga acgcaaggac 421 gtcgccaaaa agttcatcat ctaccgctac gaaagagaga agactcgggt ggaccgtagc 481 gcggattccg gccggctcat cagcgaggct ttcatcagcc agtataagca cgcgcccagc 541 cccatgaacc agctgggcag cttcgtgtac taccgcacct attcccgctg gcttccgacg 601 gaatccagaa gagagtactg gtgggagacc gtccgcagag ccgtggaata caactgcagc 661 ctcgtgccga cgtcccggga cgaagcggag agactgttcc gcaacgtgtt ctcgctcaaa 721 cagttcctgt ccggcagaac gttctgggtg ggttccaccg acgtctccaa attctatccc 781 atgagcaatt tcaactgctc gttccaggtg ttggacagct tttccagctt ccacgacgtg 841 ttctacctgc tgatggtggg ctccggcgta ggcgtgcgca tcttaaagtc cgatgtggcg 901 aagctgcctc cgatccgcaa ggacgtggaa ctcatccacg agtcctacac gccgctgctc 961 aaggcgctgc ggcaggacaa cacctccctg gaattcaccc ataacgatac tgtcaagatc 1021 accatcggcg actcgaagga gggctgggtg cagtccctgg attactatct caaggtgctg 1081 tacagctccg aataccgcaa gatcaagacc gtcatcctca actacgacaa cgtgcgcgaa 1141 agaggcgaaa agctcatgac cttcggcggc acggcttccg gccacgccag catgaagaat 1201 atgtttacaa agatcaaccg cgtggtggaa aaggccgcga cgagagatgc aggtgaacgc 1261 atcaaactgc gccccatcga ctgcatggat atcgcgaaca tcatcggcga gaacgtcgtc 1321 gtgggcggcg tccgcagaac agcggagatc gtgctcatcg acgcggacga taaagagtgc 1381 atcgaggcga agagcaatct gtacaagaaa gtcgatgaaa aatgggtcat cgaccaggag 1441 atcgcccacc gccagatgtc caacaactcc atctactatc tgcacaagcc cacccgcgaa 1501 cagctgcact ggcacctcac ccagatgcgc tattccggcg aaccgggcta tgtaaacgcg 1561 gaagaagggc agagaagacg gccgaacttt aacggggtca acccctgcgc cgagatcctg 1621 ctggattcca agggactgtg caacctgacg actgtcaact gcatgggctt cgtggacgaa 1681 aacggcgtgc tggataaggc ggctcttctg gaggcccagc gcctgtccgc ccgggccggc 1741 taccgcatga cctgcacaga gctggagatc ccggaatgga acaccgtgca gcagagagac 1801 aagctcatcg gctgctccct caccggctgg caggacatgg tgaacgccac ccatatgacg 1861 aaggacgaac aggcagcgct gctttccgaa ctgcgcgccg ccgccagaga agcagcacgc 1921 agctatgcgg aggaactggg catgccggtg cctctgctgg tgaccacggt caagcccgaa 1981 ggcaccctgt cgctgctgcc cgtcgtatcc tccggcgtgc acttcagcca cgcgccgtac // LOCUS sequence233 2038 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence233 VERSION sequence233 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2038 /mol_type="genomic DNA" /organism="" /note="sequence233" misc_feature <1..1857 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011947903.1:UPF0182 family protein" /note="WP_011947903.1 UPF0182 family protein (Clostridium botulinum) [pid:48.7%, q_cov:84.0%, s_cov:58.1%, Eval:3.3e-146, partial hit]" /note="MGA_952" /locus_tag="LOCUS_6360" ORIGIN 1 aacatcgatt acacccgcat ggcctacgat ctgcaggaca tcgcggtgcg ggatttcgtg 61 ccccagaaca acctgtccat gaaggacgtg ctgctcaaca tgggcacgtt ctccaacatc 121 cggatcaacg atttcgagcc tgcccagcag ttctataatc agacccagtc catccgtacg 181 tactacgaat tcaacgacgt ggacgtggac cgctacaacg tgaacggcga atacacccag 241 gtcttcctgt ccgccagaga gatcaaccag gcccggatcg aggatcagtg gctcatccgc 301 cacctgaagt atacccacgg ctacggcatt acgctgtcgc gtgtcgacaa ggtgacggcc 361 tccggccagc cggacatgct catcgacagc attccgccgg tgtccgaagt gcccgagatc 421 tcgatcgacc ggcccgagat ctatttcggc gaatccacga acgattacgt cattacgaac 481 acgtccgaaa cggagttcga ctatcccagc ggcgaatcca acgtgtattg cgagtacgaa 541 gggacaggcg gcattccgct caatttcttc aaccgcatcc tgttcgccat ccgggaacgc 601 tccctcaaga tgctcgtctc cacgaacatc aaatcggatt cgaagatcct catctaccgc 661 aacatcacgg agagagtctc caagatcgcg ccgttcctga tgctggacga cgatccttat 721 gtggtcgtcg cggacggcaa ggtctattgg atgatcaacg cctacaccgg cagcgaatac 781 tatccgtatt ccgagcccta tgcaaaggat tcggccatca attacatccg caactccgtc 841 aagatcgtgg tggacgccta taatggcgac acggacttct acatctgcga cggaagcgat 901 cctgtggtgc agaccctgca gaagatctat ccgaaactgt tccagagctt cgagtacatg 961 ccggacgccc tcaaggaaca cgtgcagtac cccaacgcca tgttcggcat ccaggcggac 1021 gtcttccaga agtaccacat gacggatgtg gcggtcttct accagaacga agacctgtgg 1081 gacatcgccc gggaaagcta cggccagacc gaggtcgaga tgaccccgaa ctacttcatc 1141 atgaagctgc ccggcgagga gaacgtggaa ttcgtaagct ccattcccta tacgcccagc 1201 ggcaagaaca acatgaccgg catcctcacc gcccgttccg acggcgagaa ttacggcgag 1261 atcatcctgt accggctgcc caaggaccgc atcatctacg gcccggcgca gatcgaggcg 1321 cagatcaacc aggatgcgga gatctccaag gagttctccc tgtggaacaa ctccggctcc 1381 acctacagcc ggggcaatct gtacgtgctg cccgtggaag ggtcactcct ctacgcggaa 1441 cccatctatc tggaggcttc cagcggcagc ctgccggagg tgaagcgggt catcatgtac 1501 tacggcgaca aggtggctta cgaaccgacg ctggcagaat gcctggatca gttgttcggc 1561 aaaggcgccg gaacgcccct cacgaccgcc tatcccatcg aggaaggacg cctgatggcg 1621 gaggccatcg aaaagggcga ggtcgatcct tcgaaaccgc cgcagacgga gcccggtggc 1681 gaacctgccg aaccgggcga agagacggct cccgactatc tggagctggc gactgaggcc 1741 tacgagaagg ctttggaata tttgcagcag atgaaggaat acctggacat ggccggcggc 1801 gtgtccgaag aaccgcagga gccggtccag gacctggaca ccagtgagga caactagtta 1861 tgctcgacaa aatgcttttt accatcccga aagataaaca cgacgcagag gctgtaagag 1921 cgctgctttc cgaacacccc gagatccgtt tcgtgagcct ggcagccgcg gacatcttcg 1981 gcaacgacac cgacgagaag atccccatcc gcatcatgct caaggatgtg gacaagtt // LOCUS sequence234 2035 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence234 VERSION sequence234 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2035 /mol_type="genomic DNA" /organism="" /note="sequence234" misc_feature <1..750 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003420541.1:replicative DNA helicase" /note="WP_003420541.1 replicative DNA helicase (Clostridioides difficile) [pid:55.8%, q_cov:96.4%, s_cov:53.8%, Eval:2.9e-71, partial hit]" /note="MGA_954" /locus_tag="LOCUS_6370" CDS 757..2007 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDYSKQNVSNYYLYDTQVENLFLSEYMASAPGEYVKAYLLALMYA QLNKPADDRMIARSVGMAPEKMAECWAYWESRGVVRRIYADPEDSASFRVEFVNLREEV FGSRTPAAPEAKASARLDDKALAKLYRDVEAVTGRMMEAREPEEIASWLSEYGMSPEFI LCGYRFCTAKRRSNRCRYVATVLKDWKSKGFSSPAQVEEYLEGMDRHFDLQKQIFKALG FSRNATEEEKRIMNKWFDDYGFDLEKIKEACSKTSGISNPNINYVDSILTSWYRESGRT PEDNAQLLIARIEKSYEDDRKRNAARMEQIREEVFTRIPRIKSIMEELRSCSFNVSRYL LMGENGKEAAARERKTIESLRSERARLLTEAGYGTDALDPVYTCSKCKDTGMLEDGGRC SCYKEKVRLFTQQEGSK" /locus_tag="LOCUS_6380" /note="WP_014519082.1 ATP-binding protein (Clostridium) [pid:35.1%, q_cov:27.2%, s_cov:34.6%, Eval:1.5e-11, partial hit]" /note="MGA_955" ORIGIN 1 tccgacctca tcatcatcgc ggcccgtccg tccatgggaa agaccgcgtt tgccctcaac 61 atcgcgcaga acgtggcgtt aaaagaggac aaacgcgtgg tcatcttctc gttggaaatg 121 gcgaaagaag cgctgggcat gcgtctcatc tccatggatt cgcgggtgga cagcaagcgc 181 ctggagatcg gcgacctgtc cgacgaggac ttaaacgacg tgctggattc catcggccgc 241 atgtccgaaa aagatatcat catcgacgcg acgcccggta tcggggtcat ggagatgcgc 301 aacaagtgcc gccgcatcaa cgcggagcgc aagatcgacc tcatcgtcgt ggactacctg 361 cagatcatga gcgcggacat ccagagcgaa agccgccagc aggaagtgtc caatatctcg 421 cgttacttaa agcagctggc cagagagatg gagtgccccg tcatcgtgct ttcccagctt 481 tcccgtgctt cggaaaagcg gcagggcagc cacaggccca tgctttcgga tctgcgcgac 541 tccggtgcca tcgaacagga cgccgacgtc gtcatgttcc tgcacagaga agactactac 601 cgcacggcgg aggaagagcc cgacaacatc tgcgaagtca tcatcgcgaa gcagagaaac 661 ggcgagaccg gcacggtgcg cctcacctgg atcccccggt tcaccaagtt cgtggaccgc 721 tacgtggagg gcagcagccc cctggattaa acggcaatgg attacagcaa acagaacgtc 781 tccaattact atctgtacga tacgcaggtg gagaacctgt ttttatcgga atatatggca 841 tcggctcccg gcgaatacgt aaaggcgtat ctgctggcct tgatgtacgc acagctgaac 901 aagcccgcag acgaccggat gatcgcccgc agcgtcggga tggcgccgga aaagatggcg 961 gaatgctggg cgtactggga aagccgaggc gtcgtgcggc gcatctacgc tgacccggag 1021 gacagcgctt cttttcgtgt ggaattcgta aacctgcgcg aagaggtgtt cgggtcacgg 1081 acccccgccg cgccggaggc aaaggcctcg gcccgtctgg acgacaaagc cctggcgaag 1141 ctgtaccgcg acgtggaagc cgttacgggc cgcatgatgg aagccagaga gccggaggag 1201 atcgcctcct ggctgtccga gtacggcatg agcccggaat tcatcctctg cgggtaccgg 1261 ttctgcaccg caaagcgcag aagcaaccgc tgccgctacg tggcgacggt cttaaaagat 1321 tggaaatcca agggattcag cagccccgcc caggtggagg aatacctgga gggcatggac 1381 agacatttcg atctgcagaa gcagatcttt aaagcgctcg gcttctcccg gaacgccacc 1441 gaggaggaga agcgcatcat gaacaagtgg ttcgacgatt acggcttcga tcttgagaag 1501 ataaaagaag cctgcagcaa gacctccggc atctcgaacc ccaacatcaa ctacgtggac 1561 agcatcctta cgtcctggta ccgggagagc ggcagaacac cggaagacaa cgcgcagctg 1621 cttatcgcga ggatcgagaa gtcctacgaa gacgaccgga agagaaatgc tgcccgcatg 1681 gagcagatcc gggaagaggt cttcacaaga attccaagaa tcaagagtat tatggaggaa 1741 cttcgttcct gcagttttaa cgtttcccgc tatctgctga tgggggagaa cggcaaggaa 1801 gctgccgcca gggaacggaa gaccatagaa tcgctgcgca gcgaacgcgc ccgcctgctt 1861 acggaagcgg gatacggcac ggacgccctg gatccggtct atacctgcag caaatgcaag 1921 gataccggta tgctggaaga cggcggccgc tgctcctgct ataaggagaa agtgcgcctg 1981 tttacgcagc aggaaggaag caaatgacgg acaaaagcgc cgacaatata aataa // LOCUS sequence235 2029 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence235 VERSION sequence235 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2029 /mol_type="genomic DNA" /organism="" /note="sequence235" CDS complement(425..1165) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSDRVLEVNNMSVVYQDSTVFGKKSNFQALTDVSFHIDHGEIVGL VGESGCGKSTLSKAILGMLDDAKVTGEIRHYTKRPQMVFQDPHGSLNPARTVGWILEEP LRIFGKYDAPERKRRVLDMMTRVGLDHELVTHKPRELSGGQKQRVSIATALIQRPRFVV ADEPVSALDVSIQGQILQLLLNLRDELDLSYLFITHDLNLCYSICDRVLVMYKGQIVEQ GPVDEVYEHPQHEYTKALLDAVLK" /locus_tag="LOCUS_6390" /note="WP_013384738.1 ATP-binding cassette domain-containing protein (Ketogulonicigenium vulgare) [pid:42.2%, q_cov:99.2%, s_cov:71.7%, Eval:6.7e-52, partial hit]" /note="MGA_957" CDS complement(1162..1950) /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004081442.1" /transl_table=11 /codon_start=1 /translation="MGDMLTVKDLRVTFLDNNKEAIHGISFSMQEGERLGLVGESGSGK TVTAMAISGLIERSRVTISGDVFFEDTDLRRCSRSELRSLQGPGIGVVFQEPMNSLNPL IKVGYQVEETLRIHTKKTPEERRKMAIDALDRVGLPNPDEIYSKYPHQLSGGQRQRAMI AAAMVIHPKLLICDEPTTALDVSVQAKILKLLKELSDEYKVGILLISHDLMVVKQLCEN VAVMYKGNIVEQGKTLDIFNAPKDEYTQQLMAAIPKRRRK" /locus_tag="LOCUS_6400" /note="WP_004081442.1 ABC transporter ATP-binding protein (Thermotoga) [pid:47.1%, q_cov:97.3%, s_cov:76.9%, Eval:2.2e-64]" /note="MGA_958" ORIGIN 1 ctgcctcgtg ctcatcaacc tgcattttct ctggaagatg agccgcatgg acagggattt 61 cgatctggtg aagacgggga agggcgacgc gttcctgcgc tatttcatcg acaaccgcag 121 ggaggatatc cgggcgtgtt tccccggcat ctcgctggac ttctccgatg ccacggacgc 181 ctacatcgtc tgctgcaagg ggctgcctgt gggggtcacc gtaggcgaag cgagcggcga 241 cgccctgaac cttgtgctgg actacaccat tccggagtac cgggatttct ccgtgggccg 301 cttcctgaac gcggaattaa aaaaacaggg catccgcaaa ctgtgttacg gaggccctgt 361 ggaacatcat ctgccctatc tgcagaagct cggctacgtg aagaacgggg agctgtacga 421 aaaattactt tagcaccgca tccagcagcg ctttcgtgta ttcgtgctgc ggatgctcgt 481 agacttcgtc caccggtccc tgctccacga tctgaccctt gtacatgacc agcacgcggt 541 cgcagatgga atagcagagg ttcaggtcgt gggtgatgaa cagatagctc agatccagct 601 cgtcgcgcag gttcaaaagc agctgcagga tctgcccctg gatagaaaca tccagggcgg 661 agacgggttc gtccgccacg acgaagcggg gcctctggat gagggccgtc gcgatggaga 721 cgcgctgctt ctgaccgccg gacagctccc gcggcttgtg ggtgaccagc tcgtggtcca 781 atcctacgcg ggtcatcata tccagcaccc ggcgcttgcg ctcgggtgcg tcgtattttc 841 cgaagatgcg cagcggttcc tccaggatcc agcccaccgt cctggcgggg tttaagctgc 901 cgtgggggtc ctgaaatacc atctggggac gcttcgtgta atgccggatc tctccggtga 961 cctttgcatc gtccagcatg ccgaggatcg ccttggacag cgtggatttg ccgcagccgg 1021 attcgcccac cagtccgacg atctcgccgt ggtcgatgtg gaacgaaaca tccgtaagcg 1081 cctggaaatt gctcttcttt ccgaataccg tcgaatcctg atagacgacg gacatgttat 1141 tcacttcgag aacgcggtca ctcatttgcg tctcctcttg ggaatggcag ccatcagctg 1201 ctgcgtgtat tcgtccttgg gagcgttgaa gatgtccagc gtctttccct gctccacgat 1261 atttcctttg tacatgacgg cgacgttctc gcacagctgc tttacgacca tcaggtcgtg 1321 gctgatcagc aggatgccga ctttgtattc gtcgctcagt tccttcagca gttttaagat 1381 ctttgcctgt acgctcacgt ccagggctgt ggtcggctca tcgcagatga gcagcttcgg 1441 atggatgacc atcgcagccg cgatcatggc gcgctgccgc tgacccccgg acagctggtg 1501 cgggtatttg ctgtagatct cgtccggatt gggcaggcca acgcggtcga gggcatcgat 1561 cgccattttc ctgcgctctt cgggcgtctt tttcgtatgg atgcgcagcg tttcttccac 1621 ctgatacccc actttgatga gggggttgag ggagttcatc ggctcctgga acacgacgcc 1681 gatgcccggc ccctggaggg aacgcagctc gctgcggctg cagcggcgca gatccgtatc 1741 ttcaaagaag acgtcgccgc ttatcgtaac gcggcttctt tcgatgagcc cggagatggc 1801 catggccgtt acggtcttgc cggagccgga ttcgcccacg aggcccagcc gttcgccctc 1861 ctgcatggag aaactgatgc cgtggatcgc ttctttgttg ttgtcgagga atgtgaccct 1921 cagatctttt acggtaagca tatcgcccat gctattcacc tcccatgcct tcggacagca 1981 gtccgaatcc caggatgagc aggatgatgg caagacccgt gcagatcgc // LOCUS sequence236 2012 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence236 VERSION sequence236 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2012 /mol_type="genomic DNA" /organism="" /note="sequence236" CDS 569..1159 /product="chromate transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005802804.1" /transl_table=11 /codon_start=1 /translation="MLLQIFITFFKVGLFTIGGGYAMLPIIQDAVCKEKGWLTDEEFLD SISLTNSLPGPLATNCATFIGYRLKRVPGSIAAILGTICPSIIIILLIAMVFNTAMDNA YVQAFFRGVGPAVFALIVSAVYKLATKANIMKDKLTLVVAVASFALIAFAGVTPILIVI AAAVIALVADSVKKSKTAAGAEEKGGSNDGSHS" /locus_tag="LOCUS_6410" /note="WP_005802804.1 chromate transporter (Bacteroides fragilis) [pid:38.8%, q_cov:84.2%, s_cov:90.6%, Eval:1.8e-29]" /note="MGA_961" CDS 1143..1676 /product="chromate transporter" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008761975.1" /transl_table=11 /codon_start=1 /translation="MDLILRMCLAFIKIGAFCFGGGYAAVGLIENEVVKTMGWLTPDQY INIIAIAEMTPGPIAVNTSTFAGYLMSGPIAGILCTLSVILIPSCLALLTAFFFEKVKN NQKVQVAVKGIRPGAIGIIAAAGISIAKNGFHDYFSVVLFAVAAFIIFKLKKSPILALL SCGALGVIVYGFIL" /locus_tag="LOCUS_6420" /note="WP_008761975.1 chromate transporter (Bacteroides) [pid:36.4%, q_cov:96.6%, s_cov:99.4%, Eval:1.8e-27]" /note="MGA_962" ORIGIN 1 cattctgctc gtctgctcct acgtactgct gtacaagacg agactgggcc tccgcctgca 61 ggcctgcggc gaacatcccc aggcagcggc ttccgtcggt atctccgtct acaagatgcg 121 ctacatcggc gtcatcatct ccggcttcct cggagggctg ggcggcatcg tctacatcac 181 gtccggcgta tccgagtgga agttcgagaa cggcgtagcg ggcttcggct tcctggctct 241 ggctgttatg atcttcggcc agtggaaacc ccacaggatc gcggtctccg cgctgctgtt 301 cggtttgttc cgggctctgt ccaacgtcta tatgggattc aatttcctgg cgacgttaaa 361 tatccccagc ggcatctaca acatgctgcc gtacatcatc tgcctcatcg tactggcctt 421 cacttccaag aagtccagag cgccgaaggc ggaaggcatt ccctacgaca agggtatgcg 481 gtaagatcgg tataacgggg cggcaatccc gccgcccctg gatatacgcg gaatccggga 541 tcggacaaaa actcagaaaa gaggaaaatt gcttctacag atctttatca cattctttaa 601 ggtgggattg ttcaccatcg gcgggggcta cgccatgctc cccatcatcc aggatgcagt 661 ctgcaaggag aagggctggc tgacggatga ggagtttctg gactccatct cccttaccaa 721 ctcgctgcct ggcccgctgg ccacgaactg tgcgacgttt atcggctacc ggttgaagcg 781 ggtgccgggg tccattgcgg ccattttagg cacgatctgc ccgtcgatca tcatcatcct 841 gctcatcgcg atggtgttca atacggcgat ggacaacgcc tacgtgcagg cgttcttccg 901 gggcgtaggc ccggcggtgt tcgcgctcat cgtaagcgcc gtctacaagc tggctacgaa 961 ggccaacatc atgaaggata agctgacgct cgtcgtcgct gttgcatcct tcgctctgat 1021 cgcctttgcc ggggtcaccc cgatcctgat cgtgatcgca gcggccgtga tcgctctggt 1081 cgccgacagc gtaaagaaga gcaagacggc tgccggcgcg gaagagaaag gaggttcgaa 1141 cgatggatct cattcttagg atgtgcctgg ccttcatcaa gatcggtgcc ttctgcttcg 1201 gcggaggcta cgcggcggta ggcctcatcg aaaacgaggt cgtcaagacc atgggctggc 1261 tgacgccgga ccaatacatc aacatcatcg ccatcgcgga gatgaccccg ggaccgatcg 1321 cggtcaacac gtccaccttc gcgggctatc tgatgagcgg acccattgcg ggcatcctgt 1381 gcacgctcag cgtcatcctc atccccagct gcctggcgct cctcacagcg ttcttcttcg 1441 aaaaggtgaa gaacaaccag aaggtgcagg tggcggtaaa gggcatccgc ccgggtgcca 1501 tcggcatcat cgcggcggcg ggcatctcca tcgcgaagaa cggttttcat gattatttct 1561 ccgtggtgct gttcgcggtg gctgccttca tcatctttaa attaaaaaag agtcccatcc 1621 tggcgctgct ttcctgcggt gccctggggg taatcgtcta tggattcatc ctgtaaggtc 1681 cactttggag acaaccttgc atacatgaag actcttgcgg acgggtcgat cgattttatc 1741 tacgtcgacc cgcctttttt ctctgcggcg gattactaca cccgcaaggg aaagcaggcc 1801 tacggtgacc gctggagcgg cggtctggac cagtatctgg ccatgctgaa gccccggctc 1861 gaggagatgc accgtctgct gaaggacagc ggcaccatcg ccgtacatct ggactggcac 1921 gcggtacatt acgtgaaggt gatgatggac ggcatcttcg gcatgaacaa tttcctgaac 1981 gagatcatct gggcgtataa gtccggcggc gc // LOCUS sequence237 2004 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence237 VERSION sequence237 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..2004 /mol_type="genomic DNA" /organism="" /note="sequence237" CDS complement(2..961) /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000534165.1" /transl_table=11 /codon_start=1 /translation="MRTFKYVVKRLLFLAITFLIILTITFCLIKMLQAEVPLGKQGQTE LARRKALGWDKPILVQYGIYLRNLFTKFDIGTSLKVSYMTPVAEVIASRMPPTILVNVL SILLGLPLGIVLGIFAALKKNTWIDHLVSVVIVIFISVPSFVLAFFLQYFLSFKAGWFP LVMFSKSEAGGLFTWKMVYSLMLPIMASAFYEIAYFARTVRAELTEALTSDYMLLARTK GLTQSKAVIHHALKNAMVPILPVVIGTFLGVMGGSMVLERIFAIPGVGDLTLKALSTLD YDLFVGTAMFYTLIGLLAGIVTDLSYGFLDPRIKMGER" /locus_tag="LOCUS_6430" /note="WP_000534165.1 ABC transporter permease (Bacillus) [pid:36.1%, q_cov:97.8%, s_cov:97.7%, Eval:1.8e-53]" /note="MGA_964" ORIGIN 1 cttacctctc ccccatcttg atgcgcggat ccaggaatcc gtagctcagg tcggtgacga 61 tgccggcgag caggccgatc agggtgtaga acatggccgt accgacgaac aggtcgtagt 121 caagcgtaga cagggctttg agcgtcagat cgccgacgcc cgggatcgcg aagattcttt 181 ccaaaaccat ggagccgccc atgacgccca ggaaggtgcc gatgaccacg ggaaggatgg 241 ggaccatggc gttcttcagg gcgtggtgga tgaccgcttt ggactgagtc aggcccttgg 301 tcctggccag cagcatatag tcgctggtca gcgcctccgt cagctccgcg cggacggtac 361 gggcaaaata cgcgatctca tagaaggcgc tggccatgat cggcagcatc agcgaataga 421 ccatcttcca cgtgaacaat ccgcctgctt ccgacttgga gaacatgacc agtgggaacc 481 atccggcctt aaaggacagg aaatactgca ggaagaatgc cagaacgaac gatggcacgg 541 agatgaagat gacgatcacg acggaaacca ggtggtcgat ccacgtgttc tttttcaacg 601 ccgcgaatat gccaagcacg atgcctaacg gcaggcccag caggatcgac agcacgttca 661 ccaggatcgt cgggggcata cggctcgcga tgacctcggc aacgggcgtc atataggaaa 721 ctttcaatga agtgccgata tcgaatttag tgaaaagatt gcggagatag atcccgtatt 781 ggaccaggat cggtttgtcc cagccaaggg ccttgcgtct tgccagctcc gtttgaccct 841 gcttgccaag ggggacttcc gcctgtagca tcttgatcag gcagaacgtg atcgtcagga 901 tgatcaaaaa cgttatggcc agaaagagca aacgctttac aacgtatttg aatgtgcgca 961 tagtgctatt ccctcttctg tgttatttcg cgccttgcgg catgaagatc agagttccca 1021 ttaacacagt ctcgaagccg gagaccggct tcgagactgg ttttcctctt aacgggtttt 1081 cattgcccga tcgctagatt acttgtagtc gatcgtgccg ttctggctgg caacgaactc 1141 tgcccactct gcgtcgttgt agttgaactt catcagacgg atgccgccgt agccatacat 1201 gatgttgtaa tcctcggtgg cgtactcgat cttcttggag aacagcgtgc actcgcactc 1261 gcagccgaag gggatgcact gataggaacc gaggaccgcg gtctcgatgt agctcaagat 1321 gttgagcctg gtctcggcat actcgtcacc accgaacttg ccggcaggct ggatggcctt 1381 ggcccagttc tggatggtat cggtcacttc ctcgccatcc agggggatgg tgatggtctc 1441 cacggtggga tcccaaccgc aggactcatg gatcttggtc atgccgccca tgtagtcggg 1501 ctcgcagtag acgcggatcg tggagaaggg atagaacgcc gcaccgcccc atgcgccgcg 1561 gatcatctcg atcttgccca gggccacgtc ttcgtaccgg ttggcgatgt tgccgaggaa 1621 ctcgaagtcg acgaggcctt cgaaaccggt gcccttggtg gcttcagcaa cgtagtcgtt 1681 caggtactcc tgctgacggg tatcctcagc cgcgatggcg gaagccttgg cttcgcagcg 1741 gatgtggacc ttctggcctt cggtgtagtt gccgtcggcg atggcctgct catagacctt 1801 ctggaacaga gcgcgagcct gctcaatatc gtagccattg acggaatcgt aggcagccac 1861 gtcgtcggca aaagccttgc cctcgccgta ctctacgcca tagagacgga gcaccgcatc 1921 acggccggcc ttggtgttac gatactggga ctcggtgttg ttctcgatgt cacagtcgta 1981 caggctgttg agcagatagt acgc // LOCUS sequence238 1989 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence238 VERSION sequence238 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1989 /mol_type="genomic DNA" /organism="" /note="sequence238" CDS complement(875..1987) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAEAVERTGLFSRISWGIIRLFRPDFKGIALSLFAVGLLFAPLIP SATAKAVLGAALAESLSDAMGYDPHSEGRCGLFVASFVGFSVSTAAFSTGSVFTYTLQG MLPAEVLATVSWGRWLLSSLPWLVLTLGICYAGICLLYGRNAHTQLDASHTQDMHASHG PMTRKEKIAAALLAGCVLLWIFERQTGIPAAATSMTAGVLCFACGLLKPEDLKTAFPWG LFLYLGVILNLGTMFAAYGINDMLQTELQPLIRLMHSPVSAVLLVGILTILVRFLLVSQ TVTVAILMAVLLPAAGQTGTSPFLLGFVILATEQIWFASYENTVFSPALACMKGTLDHR KTVKASFVYAGAALLACLVSIPWWRMLGYL" /locus_tag="LOCUS_6440" /note="WP_000804912.1 L-tartrate/succinate antiporter (Enterobacteriaceae) [pid:22.8%, q_cov:78.6%, s_cov:60.8%, Eval:1.3e-08, partial hit]" /note="MGA_967" ORIGIN 1 catctcctgt acgtagtcct gcggtccggt gagggcttcc agcgcaccca tctgaatggc 61 gcccgccacg ctggaggtga cgctgctctg gatcttcgtc atctgcaggc acatgtccgc 121 cggcgccacg caccagccga cccgcaggcc cgccatggcg taggtcttgg agcaggaatt 181 gcaggtgaca gtccgttcct tcatgccggg caggctgccg atgctcatct gcaccgcgcc 241 gtcgtacaga agcgcctcgt agggctcgtc ggagatgacc cacagatcgt gcttcttcgc 301 gaattccgcg atctccttca ggtcttccgg cggcgtcacg gaccccagag gattggaggg 361 gctgttgatg aggaccgccc gggtcttcgg cgtcaggcat ttctccaggt ttgccgcctt 421 tacgtggaaa tgatcttcct cgtagaccgg cacgtccacg atattcacct ccgccacgtc 481 cgccatgccg atataggcgg cgtagtacgg gcaggggatg agaatatcct ctcccgggtt 541 gagcacgcac agcatcgtca tcagcagggc gtgggtagcg ccgacgaaca cgtgcacgtt 601 ggaggcgtcg cagtccagcc cgttcagcgt ccgggaccgc tctgcgatgg cttcccgcag 661 ggcgggaatg ccggcgttgg acacgtattt cgtgtaaccg ttgttcaggg cccaggcggt 721 cttatcgatc acgttctgac ccgtccggaa cccgggttcg ccgatgccga aattgatggt 781 attttcgtac ttcgccgcgg cttcgaacac ggcgcggatg ccggaaaacg catacttttt 841 cgaacgttca ctcaattcca ttcttcaatc acctctataa ataaccgagc attctccacc 901 aggggatgga gacgaggcag gccagcagcg ccgcgcctgc gtagacaaaa ctggctttta 961 ccgtttttct gtggtccagc gtgcccttca tgcaggccag cgccgggctg aataccgtat 1021 tctcgtagga tgcgaaccag atctgttccg tcgccaggat cacgaagccc aggaggaagg 1081 gagacgtgcc ggtctggccc gctgcaggca gcagcaccgc catcaggatg gccacggtca 1141 cggtctggga caccagcagg aagcgcacga ggatcgtcag gatgccgacc agcagcaccg 1201 ccgacacggg actgtgcatc agccggatga ggggctgcag ctccgtctgc agcatgtcgt 1261 tgatgccgta ggccgcgaac atcgtcccca gattcaggat gacccccaga tacaggaaca 1321 gtccccaggg aaacgccgtc ttcagatcct ccggcttcag caagccgcag gcaaagcaga 1381 gcacgcccgc cgtcatggac gttgcagcgg ccgggatgcc ggtctgccgc tcgaagatcc 1441 agagcagcac gcagcccgcc agcaaagcgg ctgcgatctt ttccttgcgg gtcatcgggc 1501 cgtgggacgc gtgcatgtcc tgcgtatgcg aagcatccag ctgcgtatgg gcgtttctgc 1561 cgtacagcag acagatgccg gcgtagcaga tgcccagggt gaggacgagc cagggcagag 1621 acgacagcaa ccatcttccc cagcttaccg tcgccaggac ctccgccggc agcatgccct 1681 gcagcgtgta ggtaaagacg ctgcccgtgg aaaaagccgc cgtggacacg gaaaatccca 1741 cgaaggaagc cacgaacagg ccgcagcgac cttcgctgtg cggatcatac cccatggcgt 1801 cggacaggct ctccgccaac gcagcgccca acaccgcctt cgccgtcgcg ctggggatga 1861 ggggcgcaaa cagcaggccc accgcgaaca gagacagcgc gatgcccttg aaatccgggc 1921 ggaacagccg aatgatgccc caggagatcc gggagaacag gccggtgcgc tccaccgctt 1981 ccgccatgc // LOCUS sequence239 1987 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence239 VERSION sequence239 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1987 /mol_type="genomic DNA" /organism="" /note="sequence239" CDS 211..1125 /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010973851.1" /transl_table=11 /codon_start=1 /translation="MLIISLILISLLAFLAFQIIPGDPTTKILGTDYTPERAEALREQL GLNDPLPARYLGWLKGLLQGDPGISYSYFIPVKEVMSGKIQVTAALSLLSWVLVMLFSI PLGILLARFEGGHFERAGIVLNQVFMAVPPFFLGMLFTYLFGLVLHWFMPGGYIPFSQS VPGALGYMFFPALAIAIPKAAKTAKLLRSSILNEMNKDYVRTAYSRGNSRWAVLRDHVL RNAMLPVITYLAMSLADTVAGSIIVEQVFALPGLGRLLLSAIGNRDFPVAQCIVVIIAF IVVFMNYLADIITQYVDPRVRLS" /locus_tag="LOCUS_6450" /note="WP_010973851.1 ABC transporter permease (Agrobacterium tumefaciens complex) [pid:36.5%, q_cov:96.4%, s_cov:92.7%, Eval:1.2e-54]" /note="MGA_969" CDS 1127..1924 /product="ABC transporter permease" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012583225.1" /transl_table=11 /codon_start=1 /translation="MKQYLKDKNFRAGLLITGIMLCVILIGLLWTPYDPNAMSGSEKLL KPSAAHLFGTDNFGRDIFSRVIQGAGATFLIAAAAVAIGLVIGLIIGGLTGYYGGVLDE ILMRIADTILAFPSILLALVMIAILGKGKYNIIIALGILFIPSFARIVRSEVAKQKNTD YVRNARLMGASNMRILFLHIMPNIVPVLLSSVAIGFNNAVLSEASMSYLGVGVQPPDPS LGRLLSEAQGYLFQAPWYAICTGLAIILLILGFGLLSEGMGGE" /locus_tag="LOCUS_6460" /note="WP_012583225.1 ABC transporter permease (Dictyoglomus turgidum) [pid:37.5%, q_cov:98.5%, s_cov:90.9%, Eval:1.6e-49]" /note="MGA_970" ORIGIN 1 cagacgagac tgttcaagga atgcgagacc atcctcgcgg aagaggcagc caacgtctac 61 atccaggacg gcgcatcctt caccgccatg gcaacggatc tggaaggcat ggagttctat 121 ccgctctacg tcctcgatct atctacgatc tacagaacga agtaatccca ccgggaaaaa 181 gcagtgacgt acgtattaaa gaagaccgga gtgctgatca tctccctgat cctcatttcc 241 ctgcttgcat tcctggcatt tcagatcatt cccggcgacc ccacgacgaa gatcctgggg 301 accgactata cgcccgaaag ggcggaagcg ctgcgcgagc agctgggcct caacgacccg 361 ttgcccgccc gctatctcgg ctggctgaag gggctcctgc agggggaccc cggcatcagt 421 tacagctact ttatccccgt caaagaagtt atgagcggca agatccaggt aacggcagcc 481 ctttcgctgc tgtcctgggt ccttgttatg ctgttctcca tccctttggg catcctgctc 541 gcccgcttcg aaggcggcca tttcgagcgc gccggcatcg tgctcaacca ggtgtttatg 601 gcggtgccgc ccttcttcct gggcatgctg tttacgtatc tgttcgggct ggtgctgcac 661 tggttcatgc cgggcggcta catccccttc tcccagagcg tgcccggcgc cctcggctac 721 atgttcttcc cggcgcttgc catcgccatt cccaaagcag caaagaccgc aaaactgctg 781 cgttcctcca tcctcaacga gatgaataag gactacgtgc gcacggccta cagccgcggc 841 aactcccgct gggccgtcct gcgcgaccac gtgctgcgca acgccatgct gccggtcatc 901 acctatctgg ccatgagcct ggcggatacg gtggcgggct ccatcatcgt ggagcaggta 961 ttcgcgctgc ccggtctggg cagactgctg ctgtccgcca tcggcaaccg cgatttcccc 1021 gtggcgcagt gcatcgtcgt catcatcgcg ttcatcgtcg tgttcatgaa ctatctggcg 1081 gacatcatca cccagtacgt cgatccgaga gtgaggctga gctgacatga aacagtatct 1141 gaaagacaag aacttcagag ccggcctgct cattacgggg atcatgctgt gcgtcatcct 1201 catcggcctc ctctggacgc cttacgaccc caatgccatg agcggatcgg aaaagctgct 1261 gaagcccagc gccgcccacc tgttcggcac ggacaacttc ggaagagaca tcttctcgcg 1321 ggtcatccag ggcgcgggcg ccacgttcct catcgcggcg gcagcggtcg ccatcggcct 1381 cgtcatcggg ctcatcatcg gcgggcttac gggctattac ggcggcgtgc tggacgagat 1441 cctgatgcgc atcgccgaca ccatcctggc atttcccagc atcctgctcg ccctcgtgat 1501 gatcgccatc ttaggcaagg gcaaatacaa tatcatcatc gctttgggca tcctgttcat 1561 tcccagcttc gcgcgcatcg tgcgttcgga ggtggcaaag cagaagaata cggactacgt 1621 gcgcaacgca cgcctgatgg gcgccagcaa catgcgcatc ctgttccttc acatcatgcc 1681 caatatcgtt ccggtgctcc tgtcttccgt cgccatcggc tttaacaacg ccgtgctgtc 1741 ggaggcttcc atgagctatc tgggcgttgg cgtgcagccc cccgatccga gcctcggaag 1801 actgctgtcc gaagcccagg gctacctgtt ccaggcgccc tggtacgcga tctgcacggg 1861 tcttgccatc atcctgctca tcctgggatt cggactgctg tccgaaggca tgggaggtga 1921 atagcatggg cgatatgctt accgtaaaag atctgagggt cacattcctc gacaacaaca 1981 aagaagc // LOCUS sequence240 1986 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence240 VERSION sequence240 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1986 /mol_type="genomic DNA" /organism="" /note="sequence240" CDS complement(10..471) /product="glycine/sarcosine/betaine reductase complex selenoprotein A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011345262.1" /transl_table=11 /codon_start=1 /translation="MAILKDKKVIIIGDRDGIPGPAIAACAESAGAEVVFASTECFVUT AAGAMDLENQKRVKEFAEQYGADNVVVLLGAAEGEAAGLAAETVTLGDPTFAGPLAGVS LGLTCYHVCEPEVKAEFDPDVYDEQISMMEMVLDVDDICSEMHAIRDQL" /transl_except=(pos:complement(340..342),aa:Sec) /note="codon on position 44 is selenocysteine opal codon." /note="PseudoGeneDetection:WP_011345262.1 glycine/sarcosine/betaine reductase complex selenoprotein A (Carboxydothermus) [pid:72.4%, q_cov:99.3%, s_cov:97.4%, Eval:1.4e-80]" /note="MGA_973" /locus_tag="LOCUS_6470" /gene="grdA" CDS complement(537..854) /product="thioredoxin domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003356487.1" /transl_table=11 /codon_start=1 /translation="MLEVDKTTFEEEVLKAEGYVLVDFYGDGCVPCAALMPHVHALADE YGDKMKFCSINTSKARRLAIGQKVLGLPTITVYKDGEKVEELVKDDATAENVAAMVQKY I" /locus_tag="LOCUS_6480" /note="WP_003356487.1 thioredoxin domain-containing protein (Clostridium botulinum) [pid:71.2%, q_cov:99.0%, s_cov:98.1%, Eval:1.8e-39]" /note="MGA_974" CDS complement(864..1802) /product="thioredoxin-disulfide reductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003416869.1" /transl_table=11 /codon_start=1 /translation="MAKQYDIVIIGAGPAGLAAGLYAGRARMSTLIIEKEKDGGQIVQT AEIENYPGGLLEDSGPSLVARFSAQAEKFGCEKELDTVQEVELDGPVKKIVCNKETYEA KAVIIASGASPSHIGCPGEAEFTGKGVSYCATCDAAFFEDFEVYVVGGGDAAVEEAMYL TKFARKVTIIHRRDELRAAKSIQEKAFKNEKLAFMWNSVIKEIRGEGLVNSMIVENTKT GEQTEIVADEEDGIFGIFVFIGFKPATAVFEGKVNMEKGYIVTDQEMRTNVPGVYAAGD CRVKDLRQVITAASDGAIAAWQAARYIDEMN" /locus_tag="LOCUS_6490" /gene="trxB" /EC_number="1.8.1.9" /note="WP_003416869.1 thioredoxin-disulfide reductase (Clostridioides) [pid:57.9%, q_cov:99.4%, s_cov:98.7%, Eval:2.1e-99]" /note="MGA_975" CDS complement(1805..1984) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MPISLTVGANRIVPTVAIPHPLGNPALSHEEEHDLRKKLVGRALK ALETPVDGQTVFEE" /locus_tag="LOCUS_6500" /note="WP_011196985.1 glycine reductase complex selenoprotein B (Symbiobacterium thermophilum) [pid:77.6%, q_cov:98.3%, s_cov:13.5%, Eval:6.2e-19, partial hit]" /note="MGA_976" ORIGIN 1 caggatcgat taaagctggt ctctgatggc gtgcatctcg ctgcagatat catccacatc 61 gagtaccatc tccatcatcg agatctgttc gtcatagacg tccggatcga attcagcttt 121 gacttcgggt tcacatacgt gataacaagt gagtcccaac gagactcccg ccagaggacc 181 ggcaaacgtc ggatcgccaa gcgttacggt ttctgctgcc agacctgccg cttctccttc 241 ggctgcgcct aagagaacga cgacgttatc tgcgccgtac tgttccgcaa actccttgac 301 tctcttctga ttttccagat ccatggcacc tgcggccgtt cagacgaagc actctgtcga 361 agcgaagacg acttctgctc cggcagattc agcgcaagcg gcgatcgcag gacccggaat 421 gccatcgcgg tctccgatga tgatgacctt cttatctttt aagattgcca tgctacattc 481 ctccttttcg attcgttaca ggtactattt acaagggcga tcgccctgtg caaatcctag 541 atatacttct ggaccatcgc agcgacattc tctgcggtgg catcgtcctt tacgagctct 601 tccaccttct cgccgtcctt gtaaacggtg atggtgggca ggcccaggac cttctggccg 661 atggcaagtc ttctcgcctt ggacgtgttg atggagcaga acttcatctt gtcgccgtat 721 tcatccgcca gagcgtgtac gtggggcatc agcgcggcgc agggcacgca gccgtctccg 781 tagaagtcta cgagcacgta gccttccgcc ttcagcactt cttcttcgaa tgtagtctta 841 tctacttcca gcataatttc ctcctagttc atctcgtcga tataacgggc tgcctgccag 901 gcggcgatgg cgccgtcgga agcggccgtg atgacctgac gcagatcctt gactctgcag 961 tcgcctgcgg cgtagacgcc gggcacgttc gtgcgcatct cctgatccgt cacgatatag 1021 cccttctcca tgttcacctt gccttcgaat acggcggtgg ccggcttgaa gccgatgaac 1081 acgaagatgc cgaagatgcc gtcttcctcg tccgccacga tctcggtctg ttcgccggtc 1141 ttggtgtttt ccacgatcat ggagttcacc aggccttcgc cccggatctc cttgatgacg 1201 ctgttccaca taaaggccag cttttcgttc ttgaacgcct tctcctggat ggacttggcg 1261 gcgcgcagtt cgtctcttct atggatgata gtgacctttc tcgcgaactt tgtcaagtac 1321 attgcttctt ctaccgcagc atctccgccg cctaccacgt agacttcgaa atcctcgaag 1381 aacgcggcgt cgcaggtggc gcagtaggat acgcccttgc cggtgaattc cgcttcgccg 1441 gggcatccga tatgggaggg agatgccccg gacgcgatga tgacggcctt cgcctcgtag 1501 gtctctttat tgcagacgat cttcttgaca ggaccgtcca gctccacttc ctgaacggtg 1561 tccagctcct tttcgcagcc gaacttctcc gcctgggcgg aaaatctggc gacgagagac 1621 ggaccggaat cttccagcag accgccggga tagttctcga tctccgcggt ctggacgatc 1681 tgtccgccgt ccttctcctt ttcgatgatg agggtggaca tacgagctct gcctgcgtac 1741 agtccggcgg ccagacctgc ggggccggcg ccgatgatca cgatgtcata ctgttttgcc 1801 atacttactc ctcaaatact gtctgtccgt ccaccggggt ctccagagcc ttgagcgctc 1861 tgccgaccag ttttttacgc agatcgtgct cctcttcgtg agagagtgcg gggttgccca 1921 gcggatgggg aattgcgacc gtcggaacga tcctgttggc gccgacggta agagagatgg 1981 gcacga // LOCUS sequence241 1979 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence241 VERSION sequence241 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1979 /mol_type="genomic DNA" /organism="" /note="sequence241" CDS complement(178..1026) /product="energy-coupling factor transporter ATPase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012048350.1" /transl_table=11 /codon_start=1 /translation="MQIEVRELGYTYSEGLPFATTALEDVNFTIPSGEFAAIIGHTGSG KSTLLMHLNGLMKPTKGCVLADGIDINEKTKEAREARRKIGLVFQYPEYQLFEETVLKD VCFAPKNYGFTPEECEEKAIAALKLVGIDPDAKRDVSPFELSGGEKRRVAIAGVLAMEP QVLILDEPTAGLDPKGHKDILDMVEKVRRDRNLTILLVSHNMDDAARMADRVLVLDKGH LAMNGTPREVFSHHKELHEIGLGAPSSSELLYLLKEKGLNVRTDIFDEDEAAREIVNAL R" /locus_tag="LOCUS_6510" /EC_number="3.6.3.-" /note="WP_012048350.1 energy-coupling factor transporter ATPase (Clostridium) [pid:49.6%, q_cov:100.0%, s_cov:97.9%, Eval:3.3e-80]" /note="MGA_978" CDS complement(1017..1898) /product="energy-coupling factor transporter ATPase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966383.1" /transl_table=11 /codon_start=1 /translation="MSKETVIQLKNVTFSYYVEDAEGNVTTNNDVDVKHSEKRMALDGV TLDIEKGSFVAIVGSNGSGKSTLAKHLNALLLPSSGEVLVCGMSTADPDNTWEIRRRCG MVFQNPDNQLVSSVVEDDVAFGPENLGVDPAEIRQRVDNALNAVGMYEFRKKGPHLLSG GQKQRIAIAGVLAMQPECIVFDEPTAMLDPSGRAEILKIIRGLHEEGKTVILITHFMEE AAQADRIIVMDKGRPILDETPAALFAHGEKLQELNLQMPFGASMAAKLRDLGVDLPEGI ITAERLAECLCR" /locus_tag="LOCUS_6520" /note="WP_010966383.1 energy-coupling factor transporter ATPase (Clostridium) [pid:52.9%, q_cov:98.3%, s_cov:97.9%, Eval:4.4e-83]" /note="MGA_979" ORIGIN 1 aattttgacg agaatggcga gacagatgcc gcagaacaga aatcccgtaa aattctttac 61 gacaaacagc gacacgagga aaaggatcgt gccgatgagc ttggtccggg gatccagctt 121 gtggaccacg gaatcgccgg gataatattg tccgagtgtg atgtctttga tcgccattta 181 tcttaaagcg tttacgatct ctcgtgccgc ctcgtcttcg tcgaagatgt ccgtgcggac 241 attgagtcct ttttctttta ggaggtaaag gagttcggag gaagatggtg caccgagacc 301 gatctcgtgg agttctttgt ggtgggagaa gacttcccgg ggcgtgccgt tcatggccag 361 atgacccttg tccagcacca gaacgcggtc cgccatgcgg gcggcgtcgt ccatgttgtg 421 ggagaccagc agaatggtga ggttgcggtc gcgccgcacc ttctccacca tgtccaggat 481 gtccttatgg cctttgggat ccaggcctgc cgtcggctca tccaggatga gcacctgggg 541 ctccatggcc agaacgcccg cgatggccac gcggcgcttt tcgccgccgg acagttcgaa 601 gggagaaaca tcccgcttcg catccggatc gatgcccacg agttttaggg ccgcgatcgc 661 cttttcctcg cattcttccg gcgtaaaccc gtagtttttc ggcgcgaaac agacgtcctt 721 cagaacggtc tcctcaaaca gctgatattc cggatactgg aacaccaggc cgatcttccg 781 gcgggcttcc cgggcttcct tcgttttctc gttgatatcg atgccgtccg ccagcacgca 841 gcccttcgtg ggcttcatca ggccgttcag atgcatcaga agcgtggact tgccgctgcc 901 ggtgtggccg atgatggccg caaactcgcc gctggggatc gtaaaattca cgtcttccag 961 cgccgtggtg gcaaagggca ggccctcgct gtaggtatat cccaattctc tgacttctat 1021 ctgcataggc actctgccag cctttccgcg gtaatgatgc cttccggcag atcgacgccg 1081 aggtctctca gcttggctgc catggaagcg ccgaagggca tctgcaggtt gagttcctgc 1141 agtttttcgc cgtgcgcgaa cagcgcggcc ggcgtctcat ccaggatggg tctccccttg 1201 tccatcacga tgatgcggtc cgcctgggcg gcttcttcca tgaaatgcgt aattaaaata 1261 acagtctttc cctcttcgtg caggccgcgg atgatcttca ggatctccgc tctgccggaa 1321 ggatcgagca tggccgtggg ttcgtcgaac acgatgcatt ccggctgcat ggccagcacg 1381 ccggcgatgg cgatgcgctg tttctgaccg ccggacaaca gatgcgggcc ctttttacgg 1441 aactcgtaca tgccgacggc gtttaaggcg ttatccaccc tttgacggat ctccgccggg 1501 tcgacgccca gattctccgg gccgaaggcc acgtcgtcct ccacgacgga agagaccagc 1561 tggttgtccg gattctggaa caccatgccg cagcggcggc ggatctccca ggtattgtcc 1621 gggtctgccg tagacatgcc gcacaccagc acttcgccgg aggacggcag cagcagggcg 1681 ttcaggtgct tcgccagcgt ggacttgccg cttccgttgc tgccgacgat ggcgacgaag 1741 ctaccctttt cgatgtccag ggtgaccccg tccagcgcca tgcgcttttc ggaatgcttt 1801 acatccacgt cgttgttcgt ggtcacgttg ccttccgcat cctccacgta gtaggaaaac 1861 gttacgtttt tcagttgtat gaccgtttct ttgctcataa ccaaatcagt ataacataaa 1921 aggccccgga aatggggcct tcctgcgctt attctttcgt tatttcaaag cgatcgtgg // LOCUS sequence242 1977 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence242 VERSION sequence242 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1977 /mol_type="genomic DNA" /organism="" /note="sequence242" misc_feature <1..501 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003416419.1:leucine--tRNA ligase" /note="WP_003416419.1 leucine--tRNA ligase (Clostridioides difficile) [pid:47.9%, q_cov:98.2%, s_cov:20.2%, Eval:8.9e-44, partial hit]" /note="MGA_980" /locus_tag="LOCUS_6530" ORIGIN 1 aaggacgacc ggcagctcgc ctatattctg aacaacacca tcaagagagt ttccgaggat 61 atcgagaagc gattcaactt caacacggcg ctcgccgcca tcatggagct ggtcaacgag 121 atgtaccgct ataaggaact ggaagatatc aacctcggcc tgctggcaga cgctaccgaa 181 aaactggtgc tgatgctggc tccgtttgtg ccccatatcg gagaagagat gtgggaaggc 241 atcggcgggg aaggcctggt ctacgacgcc aagtggccgg aagtggacga atccatgctg 301 gtaaaagact ccgtggagat cgtcgtacag atcaacggca aagtccgcga aaaggcggaa 361 gttcccgcag gtctggataa ggcaggactg gaagagaccg tgcttgccat ggacagcgta 421 aaagcgctca tggaaggcaa gaatgtggtc aaggtcatcg cggttcccgg aaaactcgtc 481 aatatcgtag taaaaggata acgtatgaca gaaagcaaaa gaccgaaggt ctataagagc 541 agaaagctcc gggtcatccc cctcgggggc ttgcacgaga tcggcaagaa catgaccgtg 601 ctggaatacg gaaacgacat tatgatcatc gactgcggca tggctttccc cgatgacgaa 661 atgctgggga tcgacgtggt catccccgac ttcagttatc tcgtcgccaa cagcgacaag 721 atccggggcc tcgtcatcac ccatgcccac gaggatcata tcggtgccat tccgtatctg 781 ctccaaaagc tcaacgtgcc catttacagc acgcggctga ccctcggatt tatcaaaaat 841 aaattgaaag aacacaaggt ggaggccgac ctgcacgaga tctccccggg ggatgagatc 901 cgcctgggcg tcttccgggt cgaagccatc cacaccaccc acagcgtcgc ggattcgctg 961 gcgctgtgca tcgatacgcc ggtgggcaag gtcttccaca cgggagactt taagatcgac 1021 tacacgccgg tggacggcga gcctctcgac cttaaccgcc tggcggctct gggcgacgaa 1081 ggcgtgctgc tgctgatggc ggacagcacc aacgcagccc gcaagggata tacgccctcc 1141 gaaaagcagg tgggcatcgc cctcaacaac atcttcgcct ccacgaagaa gcgcatcatc 1201 atcgcgatct tcgcctccaa cgtgcaccgt gcccagcgca tcatcgacat ggcggtggcc 1261 aacgggcgga aggtggccat ctccggccga agcatggaga acatggtgcg gatcgcggag 1321 gaactgggct acctggacat ccccgacggt acgctggtgg agatgaacaa gatcaagaat 1381 atccccgacg acaaactggt gatcatgacc accggcagcc agggagaacc catgagcgcg 1441 ctggcccgca tggccaacag catgcaccgg caggtgcaga tccggccggg agacatggtc 1501 atcctgtctt ccaccgccgt tcccggaaac gagaagatgg tgtccaacgt cgtcaactcc 1561 ctgatggaga agggggcgga ggtcatctac aacgatatcg ccgagaccca tgtttcgggt 1621 cacgcatcca gcgaagagct aaagctcatc cacacgctgc tgcgtcccag cttctttatg 1681 ccggtccacg gcgagatgaa gcatctgatg gctcacgccc agatcgcgga gagcctgggg 1741 ctcgataaga gccgcatcct gctgggcgcc aacggcgatg tgttcgagct gacccgcgga 1801 aaggccaaaa aggcgaagga aacggtccac gccggcgctg tgatggtgga cggcctgggc 1861 atcggagatg tcggaagttc cgtgctgaag gagcgttcct acctgtccga agccggcctc 1921 atcgtgatgg ccgcctgctt cgagaacggc aggctggtga gcggcccgca gctggaa // LOCUS sequence243 1975 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence243 VERSION sequence243 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1975 /mol_type="genomic DNA" /organism="" /note="sequence243" CDS complement(515..922) /product="ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009871913.1" /transl_table=11 /codon_start=1 /translation="MDNLIVTAEVKNLDAVTDFVLQRPEIAACPKNTQLQLRLAVEEVF VNIASYAYDPAIGPAEVRCEVLDDPLRVVIQFLDHGKPFDPLAREDADTSEEALMERIG GLGILLVKETMDEVSYSYEEGKNILSILKKL" /locus_tag="LOCUS_6540" /note="WP_009871913.1 ATP-binding protein (Chlamydia trachomatis) [pid:27.1%, q_cov:94.1%, s_cov:88.4%, Eval:2.2e-08]" /note="MGA_983" CDS complement(939..1244) /product="anti-sigma factor antagonist" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009871778.1" /transl_table=11 /codon_start=1 /translation="MSMNMDLIKHGNDAELKLDGYIDATNAPEVEKILLDVASKFDNLT LDMEKLEYVSSAGLRTFKLVYMELHRKSGVLFAKNTGKSVMEVLEVTGFTRLFKFI" /locus_tag="LOCUS_6550" /note="WP_009871778.1 anti-sigma factor antagonist (Chlamydia trachomatis) [pid:32.0%, q_cov:95.0%, s_cov:83.6%, Eval:1.8e-07]" /note="MGA_984" misc_feature complement(1341..>1975) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012047993.1:pyruvate, phosphate dikinase" /note="WP_012047993.1 pyruvate, phosphate dikinase (Clostridium botulinum) [pid:71.5%, q_cov:98.6%, s_cov:23.5%, Eval:4.0e-81, partial hit]" /note="MGA_985" /locus_tag="LOCUS_6560" ORIGIN 1 cggtcgccgg gcaggaatcc ggattcttcc gattcgtccg gatccgcgat cattaccaga 61 gaactcgtag ccgcgtcgta agtcgcgacg tacaggtcgt ttacgtcgct ggtcttgagg 121 aattcgccca ggacctcttt cagatactga taatcttccc tttcttcgat ctcagcaaaa 181 tgcgcccggt actcttcggt gcgggtcatc tccagttctt cccggtacag ccccttatag 241 atcgttaaaa tgtcgcctgt cagatcttcc acgtccacga tgttctccac gaccatcgcg 301 gtgctgcggc aaagcccgaa agcttcgccc gtatactggc cgaccaacgc gtaggcaaac 361 agaccgagcc cgatcagaaa ggcaacgagc cccacgatga ccgagccgat gacgcttccc 421 caaaacgtgc gggcttccag agaatacatc ctccgttccc gccagctcat ttctcttacg 481 cttttttccg gcatgattcc cccgtttgtt tcgtttacag tttctttaag atcgataaga 541 tattcttgcc ttcctcatag gaataggaca cttcatccat ggtctccttc acgagaagga 601 tacccagacc gccgatgcgc tccatcagcg cttcctcgga cgtgtcggcg tcttccctcg 661 ccaaggggtc gaagggtttt ccgtggtcca ggaactggat gaccacccgc agcggatcgt 721 ccagcacctc gcagcgcact tccgcagggc cgatggccgg gtcatacgcg tagctcgcga 781 tattgacgaa gacctcctcg acggcgaggc gcagctgcag ctgcgtgttt ttggggcagg 841 cggcgatctc gggacgctgc aggacgaaat ccgtgaccgc gtcgagattc ttcacctccg 901 ccgttacgat cagattatcc atgaccggta cctccccatc agataaattt gaaaaggcgg 961 gtaaagcctg ttacttccag aacttccatg acggatttac cggtattctt cgcaaacaga 1021 acgccgcttt tgcggtgcag ttccatatag acgagcttaa acgtgcgcag accggcgctg 1081 gagacgtact ccagtttctc catgtccagc gtaaggttgt cgaacttgga cgccacgtcc 1141 agaaggatct tctccacttc cggtgcgttc gtcgcgtcga tgtagccgtc cagcttcagc 1201 tcggcatcat tgccgtgttt gatcagatcc atattcatgc tcatggtcct catcctcctt 1261 atgtgtatgt agtatacacc ctgaaggaat aaaaatgaac agacctccgg ccgggaccgg 1321 aggtctgaaa cagtttgttc ttatgcgttt tccttgatgg ctgcctgagc tgctgccaat 1381 ctcgcgatgg gtacgcggaa cgggctgcag gagacgtagt cgagacccac cttgtggaag 1441 aattccacgc tggaggggtc tccgccgtgc tcgccgcaga cgcccaggtg caggtcgggt 1501 ctggtggctc tgcccagctt gcaggccatg tcgaccagct tgcctacgcc cttctggtct 1561 atcttcgcga acggatcgtt ctcgtagatc ttggtgtcgt agtaagcgga gaggaacttg 1621 cctgcgtcgt ctctggagaa gccgaaggtc atctgggtga ggtcgttggt gccgaaggag 1681 aagaactcgg cttcggtcgc gatctcgtcc gccgtgagcg cggctctggg gatctcgatc 1741 atggtgccga cgagatactt catctcgatg ccggaggctg cgataagttc gtccgcgacc 1801 tttacgacga tatccttaac atacttgagt tccttaactt cgccaacgag cgggatcatg 1861 atctcggggg ccatggtcca ctcgggatgt ctcttctgaa cggccagcgc tgccttgatg 1921 acggctctgg tctgcatctc tgcgatctcc ggataggtaa cggtaaggcg gcagc // LOCUS sequence244 1963 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence244 VERSION sequence244 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1963 /mol_type="genomic DNA" /organism="" /note="sequence244" CDS complement(256..1386) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFKISKKIIIIAVAVFALATVGLTLLRGGEDGGVLDIPIFEQSDT KLSKDMTPIVVDESSPFYEVFQSKDRVNLLLLGVNQGMTDVIMVCSYDMENQYVNLISV PRDTFYYRPGWEANYAGNKINAIYHSEGIVPLAEAVSKTLYGMPLHYYAIVEYADIEKV MDVIGGVQVDVPFDMIYDDPTDDPPLHIRIYAGEQTIDSSNVMEYLRYRKGYRNGDIGR IQVHQELVKKVIKECLKAGNILDVAKVAVENVESDITYSMAISVATKAFKLSGDSINSY VLPGTDAMIQGFSFWQPNEDGVFQMLEEIYRIGSGEEGDLSIPTTIRLLEKPTLNRNYL PKGDGTVIDIEFDSQGNVITDPEPVEGSEEGSETGE" /locus_tag="LOCUS_6570" /note="WP_012582789.1 LCP family protein (Dictyoglomus turgidum) [pid:28.6%, q_cov:70.5%, s_cov:86.0%, Eval:1.8e-29, partial hit]" /note="MGA_986" CDS complement(1390..1962) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MQARAAAALSRGSSTEFCAVRFGNVLGSNGSVIPIFRRQIAAGGP VTVTHKDITRYFMTIPEAVQLVIQAGAMASGGEIFILDMGEPVKIMDLAEKMIRLSGLE VGKDIDIQVTGLRPGEKLYEELLLSEEGIKQTQHGKIFVGHPIEFSDGFIRLQDVGLEE SLAALTDKGDEEVRKFIKEIVPNYTGG" /locus_tag="LOCUS_6580" /note="WP_009897930.1 nucleoside-diphosphate sugar epimerase/dehydratase (Clostridioides difficile) [pid:59.1%, q_cov:92.1%, s_cov:27.0%, Eval:6.0e-51, partial hit]" /note="MGA_987" ORIGIN 1 ctctgccgcg ggtcttactg tgatgtttgt tgctgttgct gtcattttct gcacctttct 61 gccggggtca tttatctatg atggtgctat tttagtccct tctgcggggc gtgtcaaggc 121 aaaaattgtg gccgcaggca cgggtttttg ttatattttt gttgaccctg cacaaattca 181 gccccgatct gccctgcact cccccgcttt agtcaataaa agtgcaggca ttttgttgcc 241 tgcaccaaat tgcttttatt ctcctgtttc tgagccttct tcggacccct cgacaggctc 301 gggatccgtg atcacgttgc cctggctgtc gaactcgatg tcgatgacgg tgccgtcccc 361 cttgggcaga tagttgcggt tgagggtcgg cttttccagc aggcggatgg tggtggggat 421 ggagaggtca ccctcctcgc ccgaaccgat gcggtagatc tcctcgagca tctggaacac 481 gccgtcttcg ttgggctgcc agaacgagaa gccctggatc atggcgtcgg tgccgggcag 541 cacgtaggaa ttgatggaat ccccggagag cttaaacgcc ttcgtcgcca cggagatcgc 601 catgctgtag gtgatgtccg actccacgtt ctccaccgcg accttcgcga cgtccaggat 661 gttgcccgcc ttgaggcatt ccttgatgac cttcttgact aactcctgat gcacctggat 721 gcggccgatg tcgccgttgc ggtagccctt gcggtagcgc aggtactcca tgacgttgga 781 agaatcgatg gtctgctcgc ccgcatagat gcggatgtgc agcggagggt catcggtggg 841 gtcgtcgtag atcatgtcga agggaacgtc cacctgcacg ccgccgatga cgtccatcac 901 cttctcgatg tccgcgtact ccacgatggc gtagtagtgc agcggcatgc cgtacagggt 961 cttggaaacg gcctccgcca gcggcacgat accttcgctg tggtagatgg cattgatctt 1021 gttgcccgcg tagttggctt cccagccggg gcggtaatag aaggtgtcgc ggggcacgga 1081 gatgaggttg acgtactggt tctccatgtc gtagctgcac accatgataa cgtcggtcat 1141 gccctggttt acaccgagca gcagcagatt tacgcggtcc ttgctctgaa agacctcgta 1201 aaacgggctg gattcgtcca ccacgatggg ggtcatatcc ttggacagct tggtatcgga 1261 ctgttcgaag atggggatgt cgagcacgcc cccgtcctcg ccgccgcgca gcagcgtgag 1321 ccccacggtc gccagcgcga acacggccac cgcgattatg atgattttct tactgatctt 1381 aaacatgcac tatcccccgg tgtaattggg tacgatctct ttgataaact tgcggacctc 1441 ttcgtccccc ttgtccgtga gggccgccag gctttcttcc aggcccacat cctgcaggcg 1501 gataaatccg tcggagaatt cgatggggtg acccacgaag atcttcccgt gctgcgtctg 1561 cttaatgcct tcctccgaca gcagcagctc ctcgtagagc ttttcgccgg gccgcaggcc 1621 cgtcacctgg atatcgatgt ccttgccgac ctccaggccg gaaaggcgta tcatcttttc 1681 cgccaggtcc atgatcttga cgggctcacc catgtcgagg atgaagatct cgcctccgga 1741 tgccatggcg ccggcctgga tgaccagctg caccgcctcc ggaatggtca tgaagtagcg 1801 ggtaatgtct ttgtgtgtga ccgtcacagg acccccggcc gcgatctggc ggcggaagat 1861 gggaatgacg gatccgttgg accccagcac gttgccgaaa cgcacggcac agaactccgt 1921 ggagctgccg cgggaaagcg ccgcagccgc tctggcctgc atc // LOCUS sequence245 1950 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence245 VERSION sequence245 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1950 /mol_type="genomic DNA" /organism="" /note="sequence245" CDS 36..251 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSLFSKPKHPYWIQHSHLFGDPEYICSECGCKVEFPQPECPGCGA QMGSSRDDANWVDEAEILDILFGEDK" /locus_tag="LOCUS_6590" /note="MGA_988" CDS 263..1417 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSPKAKHEAKRNILALPKLAEKEKKPGLLDPEKLNVLVLGAPGSG KSTLIEAIRPYVEADGALELIDAPESSAKLKALRKEPVSIVWYCLDGMQRSILEEDLDG LRQAAKLWPDLPLIAVFTRSLGTDERDVANILMLQDAFAEYRPAKDLALRTKDIICVLA HEFETPLGIVPVRGLDRLMERTRECIPEAQQAASERKVRSVVWDLKRKEANATVAASSA LAATIGAVPVSFPDATLLVPVQTAMLAKITRLYDLKDKNAASQISDAALKAGATTIVGR SLLVALKGIPVVGTIGGSVLNAAVAAAVTAAVGETTVAVYDRIHRGELVIDESTDFGRI VNEIFSGRVPDIVSVVARTFAGKKASDIPKNLAKLVYEMVAKGK" /locus_tag="LOCUS_6600" /note="WP_002384134.1 YcjF family protein (Enterococcus) [pid:28.7%, q_cov:33.3%, s_cov:50.4%, Eval:5.7e-07, partial hit]" /note="MGA_989" ORIGIN 1 acgttgaaat aattgagccc ggaaggagta gagccatgtc tttattcagc aaacccaaac 61 atccttattg gatccagcac agtcatctgt tcggcgatcc cgaatatatc tgctccgagt 121 gcggttgcaa ggtggaattt cctcagccgg agtgtccagg ctgcggcgca cagatgggct 181 cttcccggga cgacgcaaac tgggtggatg aagccgagat cctggatatt ctgttcggag 241 aagacaagta aggagctgac ccatgtctcc caaagcaaaa cacgaagcaa aacggaatat 301 actcgctctg ccgaagctgg cggagaagga aaagaaaccc ggcctgctgg atccggagaa 361 gctcaacgtc ctggtgctgg gcgcgccggg atcgggcaag agcacgctca tcgaggccat 421 ccggccttac gtggaagcag acggcgcatt ggagctcatc gacgcgccgg aatcttctgc 481 aaagctgaaa gcgctgcgta aagaacctgt gagcatcgtc tggtactgcc tggacggcat 541 gcagcgcagc atcctggagg aagatctcga cggtctgcgg caggctgcca agctgtggcc 601 ggatctgccg ctgatcgcgg tgttcacccg ttcgctgggt acggacgagc gcgacgtagc 661 caacatttta atgttgcagg acgccttcgc cgaataccgg cccgcgaagg atctggcgct 721 gcgcacgaaa gacatcatct gcgtgctggc tcatgaattc gaaacgccgc tgggcatcgt 781 gcctgtgcgg ggcctggacc gcctgatgga gcgcacccgg gaatgcatcc ccgaagcgca 841 gcaggctgcg tcggagcgca aggtgcggag cgtggtctgg gacttaaagc gcaaggaggc 901 gaacgcaacg gtagcggcgt cttctgcttt ggctgcgacg atcggtgctg tgccggtcag 961 ctttccggat gccacgctgc tggtgccggt gcagaccgcc atgctggcga agatcacccg 1021 gctgtacgac ttaaaagaca agaatgcggc atcgcagata agcgatgcgg ctttaaaggc 1081 aggcgccacg accatcgtgg gccgttcgct gctggtggcg ctcaaaggca tccccgtggt 1141 gggcaccatc gggggcagcg tgctgaatgc agccgtagcc gccgcggtga ccgccgcagt 1201 aggcgagacc accgtagcag tctacgacag gatccaccgc ggggagctcg tgatcgacga 1261 gtccacggac ttcgggcgca tcgtaaacga gatcttttcg ggccgcgtgc cggacatcgt 1321 gtccgtggtg gccaggacgt tcgccggcaa aaaagcctcc gatatcccga agaacctcgc 1381 caagctcgtg tacgagatgg tggcgaaggg gaaataggtc ttttttaacc gcttaaccct 1441 ttaacgcgtt aaacttttat gctacaataa aacacgtaaa tcggccggcc cggtttcggg 1501 ccggtctttt gttttcgttt taacggtaat aggtatggac aacagagaga gttttaaatc 1561 gagacttggt ttcctgctgg tgagcgcggg ctgcgccatc ggcatcggaa acgtttggaa 1621 attcccctac gtaacagggg cgaacggcgg cggcatcttc gtcgtctggt atctcatctt 1681 cctgatcatt atgggcatcc ccgtcatgac catggagctg gcgatcggcc ggagcagccg 1741 caagagcatg atccgcggct acgaagctct ggaaaaaccg ggcgccaaat ggcacatcca 1801 cggctggctt tgcatgatag gcaactacct gctgatgatg tactacacca ccgtatccgg 1861 ctggatgttc tgctacttct ggaaattcct caccggcggc tttacagccg gtatgaccgc 1921 agacgaagtg agcagcgtgt tcggcggcat // LOCUS sequence246 1948 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence246 VERSION sequence246 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1948 /mol_type="genomic DNA" /organism="" /note="sequence246" misc_feature complement(750..>1948) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003113524.1:dipeptidase" /note="WP_003113524.1 dipeptidase (Pseudomonas) [pid:39.7%, q_cov:59.3%, s_cov:56.1%, Eval:8.1e-36, partial hit]" /note="MGA_992" /locus_tag="LOCUS_6610" ORIGIN 1 acgccgcgct tcagatggaa atccagatac ttcagcatgt cgttgatggt ggaattgatg 61 ccgccggcag gagcgctcac gtcggagttc cagtgagcca ccttgaaggg accgtcttcg 121 ccgggccagt agccgctgca gacgttttcg ctttcgttca gatatttgac gagggtgctg 181 ctgcgggtca tgcccagggg cttaaagatg cggtcgttga ccatatcatc ccaggacttg 241 cccgtcacct tttcggcgac gtgggccgcc atgtccacca tgtagttgtt gtactgggcc 301 ttataccgga acggcagatt cggctttaaa tactgcagcc tccgccacag ctcagagcgc 361 tctttgatgg tatcgtcgga ccagaccgcg tcgtaggaag cgaggcccgt gcggtgacac 421 atcatgtcgc gcagggtgca ttccgccgtt gcgaatgcgt cgtacatctt aaagtcgggc 481 aggtattcct tgatgggccg gtcgaaatcc agcacgccgt cgtccacgag catgcccagc 541 agcgttccgg taaagctctt gctgcaggat gcgatcgccc acatggtgtc tgcgtcgatc 601 cgctccttcg tctccagatc cttatagccg aaaccgccgg caaacagcac ttcgccgttc 661 cggatgaccc ccacacccat gcccggggtc ttgtatctcg ctaattcttt ttctacgtat 721 tctttgctga tgacttccat ggaaacctcc tagacgggaa taggcagccc ggtcttctcg 781 ataaaggcca gatggttctt gacccggaac acgtccgtgc cgttttcttt aatatccgcc 841 tcgatctttt cgatcagcat gtccatggag gcgctggcct tctcgaagca ttcgtccgtg 901 cagcctctca gcagttcttc cgcagacttt tcgttgccct gcgccagcag catgtccgct 961 gcctgcagcg cccgttcgga tgcctgatgg aacagcgcgt ccagatagcg gcgctcgtcc 1021 ttgatccact ggctgtactt ggggtgatcc gcttctacgt ccacctgcag tctcttggcc 1081 ttccaccaga aggaatcttc ggagtacttg ttggtgcctc tgcccatggc ttcggggatg 1141 tagccgatgt tgaagaacgg catcgcgaag ctgctgcagg gaggcgccat gctggcccag 1201 tagacgaact tggtcatctt gaagtccggc tttctgtatt cggtcaccat ggtagccgcg 1261 gactggcagg gtcccggttc gcagccgtgc atgcagatgc cagccgccag cgttgcagca 1321 gcgccccagc ggggctccag catggagcct tcgaagtggt cgcgcaggat ggtccacatg 1381 tcttcgcccg tgtacttgcg gttgccgaag ctgcggatga tctcgtgggc tctctgctct 1441 ctgggataac ccgacagcgt gcgggtattc agcagcacga agctcttgga gaagtcgaag 1501 gcccttctcg ggtcatgcag accgttggcc acggcgtagt ccgccagccc ctcggaacat 1561 tcgtcgaaat ccgtgccgat ggtgtacagg ttggagatgg gatagatgcc ggtgagccgc 1621 ttggcagccc agtggcggtc cacggtctcc agcagccaca tggcttcgga gtcggcgatc 1681 ataaaggtgt tgtggtagtt atcgtcggga ttctgatagg cgcatccgcc gccctggccg 1741 tacttttcca ggtggtcgat gatgacgtgc atggcctgat aagccgtgcg gccccgttcc 1801 agacccaggc gcagcagatc catgcccagc agcgcttctt ctttctgcgc cgggatctcg 1861 gaccagtccg cctcgttgcc gatgcagacg ccgtgctcgt tgatgcccat ctcaaatccc 1921 cagatccacc agggctggga accgatca // LOCUS sequence247 1937 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence247 VERSION sequence247 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1937 /mol_type="genomic DNA" /organism="" /note="sequence247" CDS complement(291..1121) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKKKGCLFLSLLLLMGLAACSGGAGDLQDFQGKWFDVNGETVLEF SGDQLTVSFRNWSDVYTVHLESDGSLRYINSDKDYEFGAMSKLQILDDGTLSAYEQILD AEGHDYHFVREEALAAEREIRDKSKDLPKTIASREIETFSLTLKIDGVSYGLDEDWPHG NFSWALERLEDGSYQNDVDIMGDSYIAARYNGTEDASYAEGLADLIQELELPSLNGYYK TNNVRSHSYYLYVKYASGEKLEIGASGDAANTCPFDVNALMAYVKDKVQEGPYF" /locus_tag="LOCUS_6620" /note="MGA_994" tRNA complement(1210..1285) /product="tRNA-Arg" /inference="COORDINATES:profile:Aragorn:1.2.38" /locus_tag="LOCUS_t0120" /note="Aragorn_12" CDS complement(1314..1748) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTFEEAKTVLGTDGITCIVLKEGNDPLISRVRGVKPIVGWIEEGA DLKDAAVFDTIVGRAAAMMYILAGVGFVYGRVMSRGGAAELEKAGISYEAGEYTDRIVN RQGTGMCPMEETVLEITDPEEAFSALKAKIAALQSARPAV" /locus_tag="LOCUS_6630" /note="MGA_995" ORIGIN 1 tcaacggatc ggacgcgacg ttcagtccca tctgcttcat ggtgaccagc acgcggctgc 61 ccgcataagc ggcgccagct gccacttcca tggcggtctt ttcgttgatg gaccattcca 121 cataacaatc ctgcggtctg tgcttcgcca ccgtttcgag cacctccgtc gaaggtgtgc 181 cggggtagcc gcataccagg tcgaccccgg cagcgatcgc acccatggcg atggcttcgt 241 tgcccattaa aaattcttta tgcaagatat cacctcgctg tattgaccgc ctaaaagtac 301 ggaccttcct gcaccttatc cttgacgtat gccatcaggg cgtttacgtc gaacgggcag 361 gtattcgcag cgtcgccgct ggcaccgatc tccagttttt caccggaagc gtatttcacg 421 tacagataat agctgtgact gcgcacgtta ttcgttttat agtagccgtt gagagacggc 481 agttccagtt cctggatgag atccgccaga ccctccgcgt aagaggcatc ttccgtgccg 541 ttgtatctgg cagcaatata ggagtcgccc atgatgtcga catcgttctg atacgagccg 601 tcctccagac gttccagggc ccaggagaaa ttgccgtgtg gccagtcctc atccaatccg 661 taggaaacgc cgtcgatctt cagggtcagc gaaaacgttt cgatctcccg ggatgcgatc 721 gtcttgggca gatccttgga tttgtcgcgg atctctcttt ccgctgccag cgcctcttcc 781 cgtacgaaat gatagtcgtg cccttctgcg tccaagatct gctcgtaggc ggacaacgta 841 ccgtcgtcga ggatctgcag ttttgacatc gcgccgaatt catagtcctt atcgctgttg 901 atatagcgca ggcttccgtc gctctccagg tgcactgtgt acacatccga ccagtttctg 961 aaggagaccg tcagctgatc gccggagaat tccagcacag tttcgccgtt gacatcgaac 1021 catttgccct gaaagtcctg cagatcgccg gctccgccgg aacaggctgc aagccccatc 1081 agcagcagga ggcttaagaa caggcatcct tttttcttca tgaccggtat cctccttgtt 1141 taatttatta ttttacaaca attcgtttgt gatagcaaaa caaagacccc ggacaagccg 1201 gggtcttgct ggtgcgccac gcgggattcg aacccacaac ctactgattc gtagtcaggc 1261 actctatccg ttgagctagt ggcgcgtatg cgcttttcag aacgcaacaa agattatacc 1321 gcaggtcttg cggattgtaa agcggcaatt ttcgctttca atgcggaaaa tgcttcttcc 1381 ggatccgtga tctccagaac ggtctcctcc atggggcaca tgccggtgcc ctgccggttg 1441 acgatgcggt ccgtatattc cccggcttcg taggaaatgc ccgctttttc gagttcagcg 1501 gcgcctcccc ggctcatgac ccgtccatag acgaagccaa caccggccag gatgtacatc 1561 atggcggcag ccctgcccac gatggtgtcg aacacggcgg cgtccttcag atccgcaccc 1621 tcctcgatcc agcccacgat gggctttacg ccccgcacgc gggagatcag agggtcgttt 1681 ccctccttca gcacgatgca tgtaatgccg tccgttccca atactgtctt tgcttcttcg 1741 aatgtcatgg aactgcccct ttctgtttgg atggaactca ttttatcacc ttgagaaagc 1801 ctgctcaacg gggtaaaata aattgttagg catttttgcc gaaaggagaa ccgttttatg 1861 aaaaattatt ccgaatgcac ccacgaagaa ctgcagcagg agaaagaact gcttctgaaa 1921 aaatacaagg aatatca // LOCUS sequence248 1927 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence248 VERSION sequence248 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1927 /mol_type="genomic DNA" /organism="" /note="sequence248" ORIGIN 1 gtccgtactg ggaaatgttc tccaccgcga cacggatcat ggttccgtcg tcggtgacga 61 tcagaatatc ctgacctgga cgaaccagct tgacagaggc aacaggaccg gtcttttcgg 121 tgactttgtg gttggtcacg ccaaaaccgc cgcggctctg gtagcggtac tcgccaacat 181 ccgtccgttt gccgaagccc ttctccgtga tgctgaggat ctcttcacct tcggaactgc 241 ttcccgcacc gacgaccacg tcgtcttcac ggagcctgat gccgcgaaca ccgactgccg 301 tacggcccat gacacgcacg tcactctccg ggaagcgaat ggcaagaccg ttgcgggtgg 361 cgatcatgat gttctcatcg ccctctgtcg gtatgacggt gatgagctcg tcgccctcgt 421 cgagggtgat cgcccggatg ccgatgttgc gcaggttctt cagagaggcc tggctgatgc 481 gcttgaccgt gccgtttttg gtgacgaaga acaggtactt gtcctcctca tagcctctgc 541 cgctgatcat ggcgctgacc ttttcgttct catcgccgat ctcgatgggc aggatgttca 601 cgatgttcgt gccgcgggca ttccgtcccg cttcggggat ctggtagccc ttgcgcacga 661 agacgcggcc cttcgaggta aagaacagga tgtggtcatg tgtggaggcg gtgaagaccg 721 tctggacgta gtcctcttcc ttcgtcgcca tggcgcgcac gcccttgccg ccgcggccct 781 gggcacggta ctcgctgacc ggcagacgct tgatatagcc gccgtgggtc agggtaaaga 841 cgcactgttc ttcttcgatc agatcctcaa tgtcgatctc atccgcgatg tcctggatct 901 cggtcttgcg ttcgtcgccg aacttgtcgc ggatggcgat gagctcatcc ttcaggacgc 961 ccttgatctt ctcgggatcg gccagcagtt ccttataata cgcgatcttc tcttccagct 1021 gcctgtattc ttcttccagc ttttcccggt tgagtccctg cagctgaatg agacgcatgt 1081 cgcagatggc ctgggcctgg acgtcggaga agccgaaccg ctccatcagg ttctgctttg 1141 cgttgtcgta gctggaacga atgatgcgga tgacttcgtc gatgttgtcc tgtgcgagca 1201 gcaggccctg cagcagatgt gcccgctctt ccgccttttt cagatcatag cgggttctgc 1261 ggacgatcag gtcctcctgg aaggtcagat attcgtccag aatgttccgc agtgtcagaa 1321 tcttcggctg ggtctggttc ttgaccaggg ccagcatgtt gatggagaag ctggactgca 1381 gcgccgtctg ggcaaagagg cggttcagga ccacctgggg attggcgtcg cgcttgagtt 1441 cgatgacgat gcgcatgccg ttgcggtcgg tctcatcgcg caggtccgag atgccctcca 1501 ggcgcttttc gtggacctgg tcggcaatgt tgcggatgag ctgccgcttg ttgacctgat 1561 agggaagctc cgtcacgatg atgcgggtgc ggttctggcc gtgctcctca aactccgttc 1621 tagcccgcag cacaaccttg ccgcggcccg ttaaataggc ctggcggatg ccgctgcggc 1681 ccatgatgat gcctttggtc ggaaaatccg gtccggtgat gtactgcatc agatcgctca 1741 gctcggcatc cggattctcc agaacacaga cgcaggcgtt gatgacttcc ttcaggttgt 1801 ggggcgggat gtttgtcgcc atgccgaccg cgatgccgct ggagccgttg accagaaggt 1861 tcgggaaacg ggagggcaga acgcggggct ctttccggct ctcgtcgaag ttcggatccc 1921 agtccac // LOCUS sequence249 1924 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence249 VERSION sequence249 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1924 /mol_type="genomic DNA" /organism="" /note="sequence249" CDS complement(390..1361) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MQERIAEIQKQIRSQKVGQYGMFPIDGSLVADGEYPIQVESSSPF FRIIEATLTVKNGQMTADITISSLSYQWVYSGTGEQADADTEDHYIGYWDDGGHGVFTI PVEALNKPIPCAAYSKKRKRWYDRDILFLASTLPAGALQVELPDYEAIETALKAYEVKD LEELAARPHKIPEPISVPKSDGEYSIEVNMTGGSGRASISSPTLLTVRDGKAYATLIWS STYYDYMILEEEYYLNLTEDGGPSRFEIPITAMDTPIPVIADTTAMGDPVEIHYELTFY EESIGEKGQIPQEAAKKVLMIAAAIIVLGGILNYFVKKKRAA" /locus_tag="LOCUS_6640" /note="MGA_999" ORIGIN 1 cccaggctgg atacggcgac gaccgttctc ccctgtctgt ggaccgcggg gaagatcgcc 61 gttccgtcgt ccaccttgca ggcgctgtta aagggcacgt tctgccgttt gcacgcgccg 121 gataagagtt tctgcgcttc ttcgttgccg gtggcatcga tcaccagggc tttgcccaat 181 acatcttcct ctgtgaccct gcgcaatacc ggggtcaccg gaagagccag gatctcttcg 241 cagatcttgg gcgccacgac ggtaacggct gcgccctgct ccgttaaaag cgccgctttg 301 tgcagcgcca gacggcctcc gccggccacc aggcaagaca gaccgtccca gtcgatcagg 361 accggaaaaa atgccatagt atctcctcct tacgccgcac gctttttctt tacgaaatag 421 ttcaggatgc cgccgagcac gatgatcgca gcggctatca tcagcacttt cttggctgcc 481 tcctggggga tctgtccttt ttctccgatg gattcctcat agaacgtcag ctcgtaatgg 541 atctccacgg gatcgcccat ggcagtcgta tccgcaatga cggggatcgg cgtatccatg 601 gccgtaatgg ggatctcgaa ccgggatggg cctccgtctt ccgtcaggtt gaggtaatat 661 tcctcttcca ggatcatgta gtcgtaatac gtgctgctcc agatgagggt ggcgtaggcc 721 ttgccgtccc ttacggtgag cagcgtgggc gaactgatgc tggcccggcc gctgccgccg 781 gtcatgttga cctcgatgga atactctcca tcggacttcg gcacgcttat cggttcgggg 841 atcttatgcg gtcttgctgc caactcctcc agatctttga cttcgtacgc ctttaacgcc 901 gtttcgatcg cttcgtaatc cggaagttct acctgaaggg ctcctgcggg aagcgtcgaa 961 gcaagaaaca gaatgtcccg gtcgtaccag cgcttgcgct ttttgctgta agccgcgcag 1021 ggaatgggct tgtttaacgc ctccacaggg atcgtaaaca cgccgtgacc accatcgtcc 1081 cagtaaccga tatagtggtc ttcggtgtcc gcatccgcct gttctcccgt gccgctgtac 1141 acccattgat agcttaagct ggagatggtg atgtcggcgg tcatctgtcc gttctttact 1201 gttaaggtcg cctcgatgat gcggaagaac ggggagctgg actccacctg gatgggatat 1261 tctccatcgg cgacgagaga gccgtcgatc gggaacatgc cgtactgacc gaccttctgc 1321 gagcggatct gcttctggat ctccgcgatc ctctcctgca cggacaactc ttcttctccg 1381 tccgcgtaaa ctgcatccca acagtctgtc agaacaagaa gcaggcagaa cagcagggca 1441 agcagcctct ttccccggcc tattctattt tggaataata agttcctcat aaaacctctg 1501 cttcttgcgc gtgttcgcag taaagcttcc gcacaccggc gatctgccca agtccctgca 1561 gcaggcattc cgtacagaac ccttccgcct tcagcctgct gttccaggaa tcttcagctt 1621 ctcctgccat gtcggtcacc gcatggtcgc ctgcgaccac catcagcggt gctagccaga 1681 tctttgcggg tctttttgct ttcgcggcct gcaggacagg ctcaaatcct ggctcgaact 1741 ccacggtgcc gacacagaag cgtccgggaa cgatctgttc cagggcagtc tgcagtttcc 1801 ggtagggatt ttccatggga aattcgctcc cgtgacccat cagagcaacc agatcctcct 1861 tctgggcaaa ggagaatgcc tctgcaagca cctgtgccag cgcctcgata tcgcggtcct 1921 ccgc // LOCUS sequence250 1922 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence250 VERSION sequence250 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1922 /mol_type="genomic DNA" /organism="" /note="sequence250" misc_feature complement(776..>1922) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011861409.1:DNA mismatch repair endonuclease MutL" /note="WP_011861409.1 DNA mismatch repair endonuclease MutL (Clostridioides difficile) [pid:31.4%, q_cov:99.5%, s_cov:62.4%, Eval:2.8e-54, partial hit]" /note="MGA_1002" /locus_tag="LOCUS_6650" ORIGIN 1 ccgcagcttc ttcgatggga cggccttcgg aaaggcagtc gatcacttct ttatacccga 61 tgcccttcat ggcgatgtcc ttgctcgtaa agcccttcgc catcaggctt cggacctcgt 121 cctccagccc tgcctccagg atcttgtcca ccctgcggtc gatgcggtcg tacaattcgc 181 tgcgatcccg gtccagaccg atcaacaggc tgtcgtagtc cgggtacggc gtctcgatat 241 cggtgaacgc cgccagtttc gcttcgccgt gctccaggcg ctcgatggct cgcagcatgc 301 gctttacatt gttgggatgg atggcttcgg cggcgtccgg atccagagaa cgcaggcgtt 361 cgtggacttt ctgcgggtca tgcccgcatt cgtcccacac ccgctgccag aaaccgtcgt 421 ctcccttggg cgccgaaaag tccatgtcgt acagcaacgc gttgatatac agccccgtgc 481 cgccgcttac gatgggcagt ttgccgcgcg ctgcgatctc cgcgatatag gagcgggcca 541 gtttctgata gtccgagacg ttgaaaggcg tcttcggatc gatctcgtcc acgagccagt 601 gcttcgcctg gtcgcgctct tccggcgtgg gcttggcgct gccgatatcc atgtacttat 661 agagctgcat ggaatcggcg gagacgatct ctccgccgca gtcccgggcg atccggatgg 721 cgtattctgt tttgccgcag gccgtcggac ccgttaaaaa cagaactttc atcggttatt 781 ttctcttgaa ctggcgttcg atatcgcttt ggctgaagga gatcagggta ggccgtccgt 841 gggggcagct gaagggattt tcgcagcggt ccagccgcac gaacaattcc ttcatctcgg 901 acagatccag cttatcgttg gctttgatgg ccgccttgca ggcgttgctc gtcagctctt 961 ctctcttgag ctggatatcc tgcgcgcgga tgctgtcctg ctcgaggatg tggatggcga 1021 aatcctccgc ttcctgcaga tacatgcagg acgggatctc cttaatgacg acgtctccca 1081 tgccgaactc ctcgatgcgg tagccgagat ctgcgagcat cttcagtttt tccgccgctc 1141 cgctgcggga ggcggatccg agctgaagca gcaccggagc caggatgggc tgggatacct 1201 tttccgcgcc attgaagatc ttcagcagct gttcgtacag gatgcgctcg tgggccgcgt 1261 gctggtcgat catgtagaca tgggtctcat ccttcgcaat gatgtacgtg gcgaaggctt 1321 cgccgatgat ctgcaacgag gagaacagga agcggggctt tgcgtcttcc ggttccgcag 1381 gcgatgcgcc gtaaggacgg atctcctcct gcacctgcat gctgcggtcc gattcctccc 1441 gcagctttgc gaaaacattc ttcgcatagg atgcttcttg agtagacggt aaaggattta 1501 tgtctacaat attcagatat tccgacggat ctgacggagt ttctatctct tccaaaccgc 1561 cgaacccctt ggagatctcg ctttcataag gtttcgcata caccgtctcc gcttcccggc 1621 tcacaggtct tgcgatctcg gaggattccg cgatgccctc ctgcttcagc aggctgcggc 1681 ggatggcgcg gatcatgaat tcggatacgc cccgctcgtc gtagaacttg atctccgttt 1741 tatggggatg gatgttcaca tcgacgctgc gggggtcaac gtccaggaac aggaacgccg 1801 ccgggtgcct tccctcgaac agtttatcgg agaacgcctc ctccagcgca tcttccatca 1861 ccttgctctt gacccagcgc ccgttgacga agaagacctg catccgtttg ttgttgcggg 1921 aa // LOCUS sequence251 1903 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence251 VERSION sequence251 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1903 /mol_type="genomic DNA" /organism="" /note="sequence251" CDS 236..763 /product="HD domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010966865.1" /transl_table=11 /codon_start=1 /translation="MEDKLKQLYLAMWKWDEGDAQLIQHFAKVHSFARLIGTCEGLDAG TLYLLETEALLHDIGIIPARKEFGQGSGKFQEKVSDPLVRDMLGKLGFDPAIIDRAAYV VSHHHTYKGIDGPDYQILVEADFLVNLFEEDSPKEAVEAACRNIFKTETGKELLEQMFL KEPPAFVKKVRT" /locus_tag="LOCUS_6660" /note="WP_010966865.1 HD domain-containing protein (Clostridium) [pid:37.0%, q_cov:92.6%, s_cov:99.4%, Eval:1.1e-29]" /note="MGA_1004" ORIGIN 1 aagcgctata tgagcccggt ggcgggccag gcggatatcc tggtggcccc ggacatccag 61 gcgggcaacc tcctggtaaa gagcctgatg tacacggcga aagcggtgct ggcgggcctg 121 gtggtggggg catctgtccc cgtcatcctc acgtcgcgct cctcccccgt cgtggacaaa 181 tccctgtcca tcgccatcgc agcggcgctg gatccgacag ttttgaggta acggtatgga 241 agacaaatta aaacagctgt atctggcgat gtggaagtgg gacgaaggcg acgcacagct 301 catccagcac ttcgcgaaag tgcacagttt tgcgcggctc atcggcacct gcgaaggcct 361 ggatgcgggc accctgtacc tgctcgagac cgaggcgctg ctccacgaca tcggcatcat 421 ccccgcccgc aaggaattcg gccaggggag cggtaagttc caggaaaagg tgagcgatcc 481 cctcgtccgg gacatgctgg gcaagctggg gtttgacccc gccatcatcg accgggctgc 541 ctacgtcgtg agccatcacc acacctacaa agggatcgac ggaccggatt atcagatcct 601 ggtggaagcg gatttcctcg taaatctgtt cgaagaggac tcgccgaaag aggcggtcga 661 ggccgcctgc cggaatatct ttaagaccga aacgggcaaa gaactgctgg agcagatgtt 721 cctgaaggag cctcctgcgt tcgtaaagaa ggtgcgcacc tgatcgttca aaaccgataa 781 accataagtt ttcaatgact gccggaaacg gcagtcattt ttttcatcaa ctgttgaatt 841 gttatattat taccgtgtgt agtaattctt ttaagtatat gataaaataa tttttatctt 901 aactgtgtaa tttcttgaat gcctcatagt gaaggagacg ggatatgaaa acgatcgcag 961 tacccgaact gaaaccgatc agagaggtac ctttatatag cgatttccgg gcgttgatca 1021 acggctgcgc cgaccgcttc ggagacgata tcgcatttca gatcaagacc cgcaaagaga 1081 cgaagacggc gccggcggaa taccgcaccc gctcgtttat cgaagtaaag aaggacgtcg 1141 acgccctggg cgccgcatgg ctgcgccgcg gcatggccgg caagcgcctg gccatcatcg 1201 gcaagaaccg ctacgagtgg atcctgggtt attgggctca cctgtgcggc ctcggcatcg 1261 ccgtgcccct ggataaggat ctgcctcagg aagaactgga gcagtctctg cgcaaggcga 1321 aggcggatgc gctgtatttc gaccttgccc atatgccttt ggtggatgcc ttaaagcaaa 1381 aaccggaatt tgcgcacctg cagtatttct gcatggacga tgtggcgggg ttcgacagca 1441 cggagaagct gctggcggaa ggggcggaag acagcgcggc gcagacggaa taccgcagcc 1501 tgcccgtgga tggcaaagct ctggcggtca tcctgtttac gtccggcacc tccggcctgg 1561 ccaaggcggt gcagctctcc cagttcaaca tgacccataa catctggtcc gtcctttccg 1621 cggaggatct gcgccacggc gacgtcaata tggcgttcct gccctatcac cacacgttcg 1681 gttccaccgg ccagaccatg atgtacgcgg ccggcatgaa gtctgtctac tgcgacggct 1741 taaaatacat ccagaagaac atcgtggaat acaaggtgag cgtgttcatc tgcgtgccgc 1801 tcctgatcga agccatctac aagcgcatca tggcggaggt cgaaaagcag ggcaagatga 1861 agaagctgaa gaccggcctt aagatctcca acgcgctgcg caa // LOCUS sequence252 1897 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence252 VERSION sequence252 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1897 /mol_type="genomic DNA" /organism="" /note="sequence252" CDS 1..372 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDWLTPNETELSRLTGMPCEEPSEIGEAAAKLQTMGVKNVLVTVG SRGAYLCTAEGAELIPTEKVKAVDTTAAGDCFNGAFAVGLSEGLAPEEAVRFANKAASL SVTREGAQASLPGREEIAG" /locus_tag="LOCUS_6670" /note="WP_004080602.1 ribokinase (Thermotoga) [pid:54.5%, q_cov:98.4%, s_cov:40.9%, Eval:9.3e-28, partial hit]" /note="MGA_1006" CDS complement(369..824) /product="divergent PAP2 family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003130996.1" /transl_table=11 /codon_start=1 /translation="MSDFAMILQNKILVTALIGWACSQILKPFTFMIVNKRFDVSRFTG DGGMPSSHSTFVTSAAVAAGLNCGWDSPAFAIMTVIAFIVMHDAMNVRYETGKQSQVLN ELIEKFNMISDHDVTLEKKLEEFVGHTPIQVAAGFVLGVVVALIVNL" /locus_tag="LOCUS_6680" /note="WP_003130996.1 divergent PAP2 family protein (Lactococcus) [pid:39.6%, q_cov:88.7%, s_cov:89.1%, Eval:9.6e-25]" /note="MGA_1007" ORIGIN 1 gtggactggc ttacgcccaa cgagacggag ctgtcgcggc ttactggaat gccctgcgaa 61 gaaccgtcgg agatcggaga agccgcagca aagctgcaga ccatgggcgt aaagaatgtg 121 ctggtgaccg tgggcagcag aggggcgtac ctctgtactg cggaaggcgc cgaactcatc 181 cccacggaaa aagtaaaagc cgtggatacc acggctgcgg gagactgttt taacggtgcg 241 tttgcggtcg gcttatccga agggctcgcc ccggaggagg ccgtccgttt tgccaacaag 301 gcagcatctc tttccgttac gcgggaaggt gcgcaggcat ctttacccgg ccgggaagag 361 atcgccggtt aaaggtttac gatcagcgcg accacgacgc ccaggacgaa gcctgcggcg 421 acctggatcg gcgtatggcc cacgaactcc tcgagtttct tctccagggt cacgtcgtga 481 tcggagatca tgttgaactt ctcgatgagt tcgttcaaga cctgggactg tttgccggtc 541 tcgtagcgca cgttcatggc gtcgtgcatc acgataaagg cgatgacggt catgatggcg 601 aaggcggggg agtcccagcc gcagttgagc cctgctgcta cggcagccga cgttacgaag 661 gtggagtggc tgctgggcat gccgccgtcc ccggtaaagc gggaaacgtc gaagcgcttg 721 ttgacgatca taaacgtgaa aggcttgagg atctgggaac aggcccagcc gatgagagcg 781 gtcacgagga tcttattttg taaaatcatt gcaaagtcac tcataacgta tttattgtag 841 caccatttcg cgaaaatggc gctttgcgga aaaagaaaaa agaggggttc ttaccccctc 901 cgtacgttta agcgaccggc ttgctgggcg gcagccgcct aaagtcacaa gatggttgat 961 attatatctt ccgcggatcg ggaaatcaac ccaggatagc cgaaaaatat ctggaaatac 1021 gtaaaaatac ggaaatttgc gtcatgcttt ttcggaggaa gagaacatgc ggtacagaaa 1081 attaggaaac accggactcg aagtgagcga gatcggattc ggcggcgagt ggctggagcg 1141 ccacgagttc gaggaatccg tggaactcat ccggtacgcg caggaaaagg gcatcaacat 1201 catcgattgc tggatgtccg atccgaagtc ccgggacatc atcggcaaag ccctcgaggg 1261 caaccgggaa aagtggtttg tgcagggtca catcggctcc acccatcaga acggccaata 1321 tgtgcgcacc cgggacatgc aattcgtaaa gcttgccttt gaggacctgc tgcagcgcct 1381 cggtacggac tatatcgacc tcggcatgat ccactacgtg gacgcacagg aggactggga 1441 tctgtgcatg aacagcccct acatcgaata cgttaaagaa ctgaaggcgg cgggtaccat 1501 ccgccacatc ggcctttcta cccacaatcc ccgcatcgcg aagacggcca tcgaatccgg 1561 tatcgtggag atgatcctct tctccatcaa tcccgccttc gacatgcatc cggcgacaga 1621 ggtgctggac gagatgttcg aaaactatgc gaacgagatg tccggcatcg atgaggagcg 1681 cgctgcgctg taccggctgt gcgaggagaa gggcgtgggg atcaccgtca tgaagcccta 1741 cttcggcggc cgtctgtttg acccggccag atctcctttc ggctccgtct ttaccccggt 1801 gcagtgcatc cactatgtgc tcacccggcc cggcgtgtcc tccgtgctct gcggctacga 1861 cacgaaggag cagatcgacg ctgccgtcgc gtacgaa // LOCUS sequence253 1891 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence253 VERSION sequence253 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1891 /mol_type="genomic DNA" /organism="" /note="sequence253" CDS complement(209..1138) /product="cysteine synthase A" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004117534.1" /transl_table=11 /codon_start=1 /translation="MSNIYTSAEQLIGGTPLLELVHTEEKEGLNAKIYGKLEYLNPAGS VKDRIARAIIADYEAAGKLKPGDTIIEPTSGNTGIGLAAVAAAKGYKLILVMPDSMSVE RRKIVAAYGAELVLTEGAKGMKGAIAKADELLKEIPGAVLAGQFVNPSNPKAHYETTGP EIWNDTDGQVDIFVASFGTGGTVSGTGKYLKEQNPAVKVVGVEPAASPFISEGKAGPHK IQGIGAGFAPDTLDLNVLDEVIAISNEDAYAAGAAIGRNEGVLVGISAGAAVAAAIQLA KRPENAGKNIVVILPDTGDRYLSTEGYF" /locus_tag="LOCUS_6690" /gene="cysK" /EC_number="2.5.1.47" /note="WP_004117534.1 cysteine synthase A (Gardnerella vaginalis) [pid:60.7%, q_cov:98.7%, s_cov:98.4%, Eval:5.4e-103]" /note="MGA_1010" ORIGIN 1 agcacgtaca gcagcgcttt cgtcagcgcc tgggcggcca ggtccatctc gatgcgggac 61 ttctcctcca gcccatcccc gctgaaagaa gaaggttctc ctccgaagaa gcggggaaac 121 agggcggaga aaaagcggtc gacagcttcc cggatcctct ccgaaagacc gatgtaattg 181 ggttccatat agttttcctt tatagacgct agaaataccc ttccgtggac aggtagcggt 241 ctccggtatc gggcaggatg acaacgatgt tcttgccggc gttctccgga cgctttgcca 301 gctggatcgc agcggcaact gcagcgccgg cggagatgcc caccaggacg ccctcgtttc 361 tgccgatagc agcgccggcg gcataggcgt cctcgttcga gattgcgatg acctcatcca 421 gcacattcag gtccagcgta tccggtgcga atccggcacc gatgccctgg atcttgtgag 481 gacctgcttt gccttcggag atgaagggag aagcggcagg ttccacacct acgactttta 541 cagccgggtt ctgctccttc agatacttgc ctgtaccgga gactgtgccg ccggtgccga 601 agctggccac gaagatgtct acctggccat ccgtatcgtt ccagatctcc ggacccgtcg 661 tctcgtaatg cgccttcgga ttggaggggt tcacgaactg acctgccagc acggcccccg 721 ggatctcctt cagcagctca tccgctttgg cgatagcgcc tttcataccc ttcgctcctt 781 ccgtcagcac cagttctgcg ccgtaggctg ccacgatctt gcggcgttcc acggacatgg 841 aatccggcat caccaggatg agtttgtagc cctttgcggc agcgaccgca gccaggccga 901 tgccggtgtt gcccgaagtg ggttctatga tggtgtcgcc gggcttcagt ttgccggcgg 961 cttcgtaatc cgcgatgatc gctcgggcga tgcggtcctt tacgctgccc gccggattca 1021 gatactccag ctttccgtag atctttgcgt tcagtccttc cttttcctcc gtgtggacca 1081 gttccagcag cggggtgccg ccgatcagct gttctgccga tgtgtagatg ttagacatgc 1141 ttttttgcct cctttttccg gtaaaataaa aagcgcaggc cattcctgac ccgcgccgca 1201 tgcagagaag aaaaacttgc tcagatgaag caggagccac ggaaaatgcc agcacaaata 1261 cagcacatgc ataccatgcg cgctgcggtt tccatcatgc tcctgtgttc gattctgatc 1321 ttgttcatgg taatatttta ttcctactta cctactatgt caataggtta tataaaaaat 1381 gcacccacgc ctaaatccat ttatggtatg atggtgccat ggcaagaatc gaactgaccg 1441 ccacagctac cttcgggctg gaggctgtcg taaaacgaga gatcgaagga ctcggatacg 1501 ccgttaccgg atcgcaggac ggccgtatct cctatatggc cgacgagcgg ggcatcgtcc 1561 gctctaacct ttggctgcgc agcgcagacc gcgtctatgt aaagctggcg gaattcgagg 1621 cgaagacctt cgaagagctg ttccagaacg tcgccggcat cccctgggag gagtggatcc 1681 cctacgaagg aaaattcacc gttgtcggca cttctgtcaa atcccagctg cattccgtgc 1741 ccggttgcca gtccattacg aagaaagcga tcgtgacccg gctgcagcag acctatggtg 1801 aggtcacctt cccggagaca ggcgccgcct atacagtgcg ttttctgttc cagaaagacg 1861 tgtgcaccat cctgatggat acgtccggtg c // LOCUS sequence254 1887 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence254 VERSION sequence254 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1887 /mol_type="genomic DNA" /organism="" /note="sequence254" CDS complement(1069..1797) /product="aspartate/glutamate racemase family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011089550.1" /transl_table=11 /codon_start=1 /translation="MDMSKPRIGILRWEGGKVPEGLMQLERMTGNSTNPASYPFPVKMV EVKGATTETVIIHPSREVLSRMIEIVKEMEKEGICAVTTSCGFNAVFQKELAEAVNIPV FTSSILQVPFVQTIIGKNHSVGIITANKGSLTREHMRACNITDESNLYVVGLEDCKEWR KIFDEPDEPFDMEAVSAEILGAIAKGFEEHPDTAFIVLECTDLPPYAKQIRERFHVPVL DVNTMIGYMAYAIGQMKMYD" /locus_tag="LOCUS_6700" /note="WP_011089550.1 aspartate/glutamate racemase family protein (Bradyrhizobium diazoefficiens) [pid:34.5%, q_cov:88.4%, s_cov:89.5%, Eval:6.4e-31]" /note="MGA_1013" ORIGIN 1 cagggtcaga taaccgcccc agcaggaaag gcccgctctc agatactgat cttcttcgat 61 ggccttcttc gggcccttgt cggcgatcgc cagcagcatg ggcagcgtgg cgttggccag 121 ggtcacggaa gcggtctgcg cgaaggctgc ggggatattg tccacgcagt aatgcatgat 181 gccttcctcg aagtagaccg ggtcggtgtg cgtggtgctt tccgtcgtct cgatggcgcc 241 gtggtcgtcg caggccacgt ccacgatcat ggaacccttc ttcatgagcc ggacgtcttc 301 tctgtaaacg atgtggtctg tgcgttcttt cgcccactgc gtaccgttga agagaacatc 361 tgtctctttc agacactttt ccaggttttc ccggttggag aacatgaact tgacgttggg 421 caggtacttc tttgcctcca acatcgcatc gatgttgatg tccagaatac gaacgtccag 481 accccaagcg gaagccagtt ctgcgatggc ggtgccgatg ttgccgcagc cgaggcaggt 541 tacgatcgga gtcggtacgc ctgccacatt gcagagcagt ttgcccgggc cgccgtggat 601 cgtctgcata aagttgagcg ccgcgataaa gcctcccttg cctgcgatct cggacatcgg 661 gcgcagcagc gggaatttgc cattcttgtc agggatgtcc tcataggcga tagcggtgca 721 tttgctgtcc agcagcacgt cggtctctgc cggatgcgca ttggtatgga tataggtgaa 781 cagaatcttg tcctccgcca tccacttgaa ttcttcgggg aaaagttcct taaccttgta 841 atacagctga gccttctccc agactgtatc cttgtccgcg acgatggcgc cggccgcctc 901 gtaatcttcg tcgctgtagc cggagccgac gccggcgccg ctctggacgt atacggtatg 961 gccgtgcgct acgatctcct tgacggtcgc ggggatcgcg gcaactctgt attcattggg 1021 tttgatttcc tttaatacgc cgatgatcat agtgctctcc tttcttaact agtcgtacat 1081 cttcatctga ccgatcgcat acgccatgta gcctatcatg gtgttgacat ccagcacagg 1141 cacgtggaag cgctcgcgga tctgcttcgc gtagggcgga agatcggtgc attccagaac 1201 gatgaaagcg gtgtcgggat gttcttcgaa ccccttggcg atggcgccga ggatctccgc 1261 ggagacggct tccatgtcga agggttcgtc cggttcgtcg aagatcttgc gccactcttt 1321 gcagtcttcg agtccgacga catagaggtt gctctcatct gtgatgttgc aggcgcgcat 1381 gtgctcgcgg gtcagcgagc ccttgttcgc cgtgatgatc ccgacggagt ggttcttgcc 1441 aataatggtc tgcacgaacg gcacctgcag gatcgaagag gtaaagacgg ggatgttcac 1501 cgcttccgcc agttctttct ggaaaacggc gttgaagccg cagctggtcg tgaccgcgca 1561 gatgccctct ttttccatct ccttgacgat ctcgatcatg cgggacagca cttctctgct 1621 ggggtggatg atgacggttt ccgtggtcgc gcctttgacc tccaccatct tgacagggaa 1681 gggataggac gcgggattcg tgctgttgcc ggtcatgcgt tccagttgca tcagtccttc 1741 gggaaccttg ccgccttccc agcgaaggat gccgatcctg ggtttactca tatccattgg 1801 taacacctcc taaaagactt ctctacacct taatgatgaa atgggtcaga ggaaaagtca 1861 agaaataaat acaattttgt atacaaa // LOCUS sequence255 1882 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence255 VERSION sequence255 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1882 /mol_type="genomic DNA" /organism="" /note="sequence255" CDS 1353..1649 /product="STAS domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010939281.1" /transl_table=11 /codon_start=1 /translation="MTITKTIESDALTLALSGRLDTTTSPELEDEINASLAGIHKLTLD FTELSYISSAGLRVLLAAQKKMNVQGEMRVVGVNDTIMEIFEVTGFSEILTIE" /locus_tag="LOCUS_6710" /note="WP_010939281.1 STAS domain-containing protein (Desulfovibrio) [pid:33.3%, q_cov:99.0%, s_cov:90.8%, Eval:2.5e-09]" /note="MGA_1015" ORIGIN 1 gcgaattccg tcagccggga cggaacgccg aatttccggg tcacgatgct ctccgtttcg 61 ccgtaggagg caccggcaga agccgtcagg aacgaggtca tcatggccgg cttgagcgtc 121 ttcagcagcc atttcttttc cacaccgtat ttggtcgccg tgtggttgag catcaggacc 181 aacatcagga acatccccat cacgtagacg aggacgggct tccagatccc gtagagctgg 241 gagatctgac cgttccagat gtaactgatg atggtgagcg agatgaacac cggcgaatac 301 cggccgatgc tctccatcag gtagttgacc agagagttgc cctgggtgac gacacggcgc 361 agcgtgcccg ccgattcgcc catcgccaga agaccgacac ccagcgcaaa gcccatgaag 421 atcagctgga tggagtcgtt gtttgaaaaa ggcgagaccg ggttcgccgg gagtatgctg 481 gcgaccagtt tcagaaattc cgaaagactt tcacccggct ggatgctgcc gcttgtccgg 541 atcgtaaaga acggatagaa gattgcctcg gccaggacag cggccaggaa ggagaaggcg 601 atgaaccggt tcatcacccg tttgccgtag cggctgtacg taacgatatc ccccagattc 661 gatacggcac ttccgaggaa caggaacagc gacagactgg caaaggtgcc gaagacgccg 721 aggaacgcgt tgaaaaacag cgtaagcacg ttctcgtcga tgtagtcgcc tgccgcgtct 781 ggaagctgga agaacaggat gccgaaaaag atgccggcga acacgctgat ggggatcgtc 841 agggtggcaa aacgccgttc ctcgtggatc cgcagcgtaa cgcggttctt gctgccccgc 901 cggctccaga cgggcgcaaa gcccatgtcc accatcaggc ggcggctgaa ctcgtcttcg 961 ccggtgtcga gcgtcgtcgg gttaaaccgg tctccttcgt actcgatggt gatatagtcc 1021 cggcgcatcc gggaatccat atataccgtg cacgatatct tgccgccgaa gtgctcgcag 1081 atgcgcagca gcgtatcctc catcgcgaga cggatgcgga tgcggttgcg gttttccagc 1141 gaaagcgtct gcaggaactc ccagatgtct tccgagatcc tgtccacgcc gcggcggtcc 1201 agcagatata cagtttccac gagtcttctc ttcatgcctt tagtatacta cattttcgga 1261 aagttcagca ttctcccata atttattgtt ttacgaaaaa gcgaattcat gagataataa 1321 attgattatg tagtatgcat aaggaggtcc ctatgacgat cacaaaaacc atcgaatccg 1381 atgctcttac tctcgccctc tccggcagac tggacaccac cacttccccc gaactggagg 1441 atgagatcaa cgcttctctg gcaggcatcc acaagcttac gctggacttt acggaactga 1501 gctacatctc ttccgcaggc ctccgcgtgc tgctggctgc ccagaagaag atgaacgtcc 1561 agggagagat gcgtgtcgtc ggtgtcaacg acacgatcat ggagatcttt gaggtcaccg 1621 gattctccga gatcctgacg atcgaataat gcaggcggac ttatgaaaga agtcagcctt 1681 atcctaaatc aaaccattcc tacgctccgg ctgtctgggc gcatcgattc gacgaacgcc 1741 gcagccgcag agcaggagat ccaaacgctg ctgcaggacg tgcccggcac gcaggtgcag 1801 gtcgacgcgg aggacctgga gtacctttct tccgcaggtc tgcgcgtgct gctgcgtctg 1861 cgcaagagcc gcaccggtct ta // LOCUS sequence256 1870 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence256 VERSION sequence256 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1870 /mol_type="genomic DNA" /organism="" /note="sequence256" misc_feature complement(344..>1870) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011057686.1:M23 family metallopeptidase" /note="WP_011057686.1 M23 family metallopeptidase (Thermosynechococcus vestitus) [pid:60.2%, q_cov:19.3%, s_cov:25.5%, Eval:8.5e-28, partial hit]" /note="MGA_1018" /locus_tag="LOCUS_6720" ORIGIN 1 ccggtcgaat tccgcctgct ttttcttcaa gatctggtag ttcggaaatt cctcggcgtt 61 gcggtaaccg tatttcaggc ccagggccat cagactgccg gtgaccgccc cacagcgctc 121 gccgtgctgc gtgccccagc cgaagccgct ggatgccaaa agtgcctgct cctcatcgaa 181 gcccagcatc ttcgcgccat gcacgaatgc gcactgggag cacatcagct cgttcgcgaa 241 ggcgttcgcc ccctcttcca ccagtttggg atctacgctg tccaatattt ccgcatttct 301 tcctgggatc ttgtaatcgt gcactgttgg ggacggttct cttttagttc atttcgtccg 361 gctgctcggt gagttcgctc caggcatcct gcgcgccctt cagcacgaag ctgaaatacg 421 acgcgatctg caggatgtct tcgtccgtca gttcgatctc ctcgccctcc cagggaaccc 481 cggacctgct tacgacgcgg cctcctgcca ggtccaccag gcagctcagg gtcggtccgg 541 taatagcacc ggcggatacg ctgcttttgg taaagttgaa agacagcatc gtatacttcg 601 aaaaactgta gggaccgggt tcccactggg cggagccctc gacggtgacc ccttcaaaat 661 acggatgcgc aaaccgcggg ttcacaaagt acagccatcc gccgccgatc cgatcctcat 721 caggcgtcca ctgcacatac tccgcatcca atccgctcgc gagcaggccc tgcgtgctct 781 tctcgaagtc catcttttcg agtcccggat attcctgaaa tgcggctttg cccgtgtttg 841 ccccgatgcg cccgtctcct tccaggtagt ccatcgggtc taccgactct ccgtccaggc 901 gaacttcgaa atgcagatgg gggccggtgg aatacccggt gaccccgacc agcgctatcg 961 tctgcccctg ctctaccgca tcgccttcct caacaagcag ttcactgcag tgggcatacc 1021 aggtctccag tcctgctccg tgggaaacgg caacccgata accgtaagat ccatcccaac 1081 cggcaaacac gacagttccg gcctgcgcag catgaatctc ttctccttta tccgacttta 1141 agtccaagcc ggtatgcaat gcgggcatct cttctgtaga ataccagaac ggtccgaatt 1201 ccgcggatat cgtaatcgca tccagcggcc acacaaaacc gggagcatcg gcagcaagat 1261 cggcatctga agacggatct tccgatcctc ctttgtcctc ataagcccct tcgccggcaa 1321 agcttttctg gttttccagc acgtccagga cgcgttcctg caattctgcc agttccgtgt 1381 agtcgtaggc gccccagttg ccttccgccg cattttgcaa aagatgggtg atgactttag 1441 ccgcctgctc cgtatcttcc tgatatcctt gcggcagcac gagtcccatg tattccaatg 1501 cgctgcaata cccccgctca tccaattcca gcaaagcctt tgcaacagcc gagatcttct 1561 cccagtcccg ctgctgcgga tccaggaaga ccggcgcatt gccggatccg gccgggcaaa 1621 cggcagagac tgttacggtc ttaaaggtct tcccgccgat attgccgccg gcggaaagct 1681 cgtaggtttc tcccggggtc acgcgggcgg tgccctccat cagcagatag ccttcgccgt 1741 ccgcctccca ggacttgatg agcgtctccc cgcagcgcag ttctaaaacg gccttcagag 1801 gatcgccgga agcggacagg ctgaagcggc actgagcggt cctgccgtcg aaggacagta 1861 ccggcttggc // LOCUS sequence257 1866 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence257 VERSION sequence257 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1866 /mol_type="genomic DNA" /organism="" /note="sequence257" misc_feature <1..1465 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011987043.1:pyruvate:ferredoxin (flavodoxin) oxidoreductase" /note="WP_011987043.1 pyruvate:ferredoxin (flavodoxin) oxidoreductase (Clostridium botulinum) [pid:59.5%, q_cov:99.6%, s_cov:42.9%, Eval:2.8e-174, partial hit]" /note="MGA_1019" /locus_tag="LOCUS_6730" ORIGIN 1 cgacgttccc gaatgggata tgaccaagtg catccagtgc aacatctgct ccctcgtctg 61 cccgcacgcg gcgattcgtc cggctctgct cgacgaagaa gaagttgcaa acgcacccga 121 aggatttgag accaagaccg cgaacggcaa ggatctcagc aagtaccagt tccgtatgca 181 ggtcagcccc tacgactgca cgggctgcgg cagctgcgtg aacgtctgcc ccgccaagga 241 gaaagcgctg gctatgaagc cgctggcttc ccagctcgat caggcggaca actgggaata 301 cgctgttgag gaagtctccg tcaagaagga cgctgccaac aacaagagca tcaagaactc 361 ccagttctac aagccctact tcgaattctc cggtgcctgc gcgggctgcg gcgagacgcc 421 gtacatcaag ctcgtcaccc agctgttcgg tgagcgcatg tacgtcacca acgcgtccgg 481 ctgctcctcc gcttacggcg gctccacccc gagctccccg tactgcacgg acaaggacgg 541 caacggtccc tgctgggcaa tgtccctctt cgaggacaac gcagaatatg cttacggcta 601 cctgctcggt cagggcgctg tcaagcgcga actcgtcgac aaagtcaacg cacttaaaga 661 cgccggcgta gctgtcgatg catgccaggc atacctcgac aacgcgatgg atccggaagt 721 ttcccgcaag gtctccgatg atctgctcgc agcgatcgaa gcaaatgaca gcgaagaagc 781 tgccttcatc cgtcagaaca aagaattcct gaccaagaag agcgtctggg cattcggcgg 841 tgacggctgg gcatacgaca tcggttacgg cggtctggac cacgtcctgg cttccggcga 901 tgacatcaac gtcctcgttc tcgataccga agtctactcc aacaccggtg gtcagtcctc 961 caaggcgacc aactccgcgg cgatcgcgaa gttcgctgcc ggtggtaagt acacccgcaa 1021 gaaggacctt ggcatgatgg ctatgagcta tggctacgtc tatgtcgctc aggtcgcgat 1081 gggtgcggat cccgcacaga ccctcaaggc catccgcgaa gcggaagctt atccgggtcc 1141 gtccatcgtc atctgctact gcccctgcat cgagcacggc atgaaggcca gcatgggcct 1201 gtcccagctc gaagagaaga aggctgtcga gtgcggttac tggcatctgt acagatacaa 1261 cccgcagctc aaggaagaag gcatgaatcc gttcatcctc gacagcaagg agcccacagg 1321 cgacttccag gccttcctca tgggcgagaa ccgctacgca tccctggctc tctccttccc 1381 gcacaaggcg gaagagctct acgccaaggc tgctgctgac gcgaaagacc gtctcgaagg 1441 ctacaagaca ctggccggca gataaacatc aagcaatcac aaactgcaga aggtactacg 1501 gtgccttctg cagtcatgtc taccataagg aggattttca ctatggcact tatgactgca 1561 gaacaataca tcgaatccct gcgtaagctc ggcaccagag tctacatgtt cggcgaaaag 1621 atcgacaact gggtcgacca tccgatcatc cgcccctcca tcaactgcct ggcgatgacc 1681 tatgaactcg cacagcagga tgagtacaaa gacctgatga ccgctacgtc caacctgacc 1741 ggtcataccg tcaaccgttt cacgcatctg caccagggtc cggacgacct gatcaagaag 1801 gtcaagatgc agagactgct cggccagaag accgccagct gcttccagcg ctgcgtcggt 1861 atggac // LOCUS sequence258 1855 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence258 VERSION sequence258 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1855 /mol_type="genomic DNA" /organism="" /note="sequence258" CDS complement(596..1810) /product="S-methyl-5-thioribose kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000033250.1" /transl_table=11 /codon_start=1 /translation="MYTPQIAIEYIQKNLPGFFGSDARLKAAELSDGNINFVFRVEDEN TGRSLIIKHAEDTLRVNPSRHIGFDRSKIECEVLKLQRRYCPALIPEVYLYDEDEHNIV MEDMRGYENLRYELCSHKIFPNLAKDVAEFCGKALIGSTDMVVGAEQKKELVKRYTNPK LCEITERHVLTEPYYEDLDDNGVTEENDEFMRTWIYGSEELHAKVGMLKALFETKAQAL LHGDLHTGSIFVTPDKTCILDPEFAFYGPIGYDTGNFIANMIFAYANGLYTMEDGPEKT AYLEWILDTIEEFCGRFVENAKQLIREKSADRQMRSEAFFDLYLEDIFKDQAGFAGTEL IRRVVGTSKVKDIRSIEDEVQRAKAERLCMIAGMKFVMDPEFLKNGKSYTDYLRTFSDV VDFEG" /locus_tag="LOCUS_6740" /gene="mtnK" /EC_number="2.7.1.100" /note="WP_000033250.1 S-methyl-5-thioribose kinase (Bacillus) [pid:41.9%, q_cov:95.8%, s_cov:94.4%, Eval:6.2e-84]" /note="MGA_1022" ORIGIN 1 cgatcaagga ggcagatcct aacgctgtgg tcgtattcat cggaccctgc atggccaaga 61 aatacgaacg caagaaggat tgctccaagg attacatcga ccacgtgctg acgttcttcg 121 aactgcaggc gctgttcgat tccaaggata tcgttctgtc tgagcttgag cccacggatc 181 tgcaggacgg cagcagcttc ggcagagctt actgcaggag cggcggcgtt gcagcgtctg 241 tcgcgcaggc cgtgaaggag atgggaagag aagacctcgt cgtaaagccc gtcatctgca 301 acggcatcga ggaatgcaaa gcggcgctga tgaaggcgaa ggccggcaag ctggacggca 361 acatcatcga aggcatgtgc tgcccggacg gctgcatgcg cggcatgggc acgctggtga 421 acaagcagaa ctccatgaag ttcgtcgcag attatgcggc ctcggcggag aagaagacga 481 tcttagacta aagaatagat aatatgaaaa accgcggacg gtattgcgat ctctcgcttc 541 tgcataccgg ctcgcggttt tttattattt actctgtgct tttccgttcg atgctttatc 601 cttcgaaatc tacgacatcg gagaacgtcc gcagataatc ggtgtaggat ttgccgttct 661 tcaggaactc gggatccatc acgaatttca tgccggcgat catgcacagg cgttcggcct 721 tggcgcgctg cacttcgtct tcgatggatc ttatgtcttt tactttggaa gttccgacca 781 cacggcgtat gagctcagtc ccggcaaagc cggcctggtc cttgaagata tcttccagat 841 acagatcgaa gaaggcctcg gagcgcatct gccggtctgc agatttttcc cgtatcagct 901 gcttcgcatt ctcgacgaat ctcccgcaga actcctcgat cgtatccagg atccattcca 961 gataagcggt cttttccgga ccgtcctcca tcgtgtaaag gccgttcgca taggcgaaga 1021 tcatgttggc gataaagttg cccgtatcgt agccgatggg gccgtagaag gcgaattccg 1081 gatccaggat gcaggtcttg tccggcgtca cgaagatgga acccgtgtgc aggtctccgt 1141 ggagcagtgc ctgggccttg gtctcaaaca gggccttcag catgccgacc ttcgcgtgca 1201 gctcttcgct gccgtagatc caggtgcgca tgaattcgtc gttttcttcg gtgaccccgt 1261 tatcgtccag atcttcataa tagggttcag tgagcacgtg ccgttccgtg atctcgcaca 1321 gcttggggtt ggtgtagcgc ttcaccagct cttttttctg ttccgcgccg acgaccatgt 1381 cggtggatcc gatgagggct ttgccgcaga actctgcaac gtctttggcc agattgggga 1441 agatcttgtg gctgcagagt tcgtagcgca ggttctcgta gcccctcatg tcttccatca 1501 cgatattgtg ttcgtcctcg tcgtacagat agacttcggg aatgagggca gggcagtagc 1561 ggcgctgcag cttcagcact tcgcattcga tcttgctgcg gtcgaatccg atatggcggc 1621 tggggttgac ccgcagcgta tcctccgcgt gcttgatgat gagcgatctg ccggtgtttt 1681 cgtcctccac ccggaacacg aagttgatgt tgccgtcaga gagctcggca gctttcagcc 1741 tggcatcgct gccgaaaaag cccggcaggt tcttttggat atattcgatg gcgatttgcg 1801 gtgtgtacat aggatcctcc ttactggggt tgccgcttcg gcaagctaac gttca // LOCUS sequence259 1853 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence259 VERSION sequence259 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1853 /mol_type="genomic DNA" /organism="" /note="sequence259" CDS 268..768 /product="GNAT family N-acetyltransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011036326.1" /transl_table=11 /codon_start=1 /translation="MEKKFVLRDAEEKDYDFILRVNEENVEVLSPMPLERLKLFKEHAD MLQVAEVDGELAAFIICMKEGDDWYDSENYLWFCKTYPQFLYIDRIVLDKPFRHQGLGR FMYEAVFAKAKANGAPVVTCEVDTVPYNGPSLLFHEAMGFKEVGAQYVRGGSVKVSLQA AEV" /locus_tag="LOCUS_6750" /EC_number="2.3.1.-" /note="WP_011036326.1 GNAT family N-acetyltransferase (Xanthomonas campestris) [pid:35.3%, q_cov:94.0%, s_cov:77.8%, Eval:7.6e-19]" /note="MGA_1024" misc_feature complement(840..>1853) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_005812214.1:DUF401 family protein" /note="WP_005812214.1 DUF401 family protein (Desulfitobacterium hafniense) [pid:21.5%, q_cov:92.9%, s_cov:82.1%, Eval:1.6e-15]" /note="MGA_1025" /locus_tag="LOCUS_6760" ORIGIN 1 actacctcgt aacggagtac ggccgcgtga acctcgtagg caagaccacc tgggagcggg 61 cggaggatat catctcgctg gctcacccgg atttccggga ggcgctgatc gccgaggcgg 121 aagagttggg catctggcgc agatcgaaca aaagatgatg acgcagacag tgcgtatgct 181 ataatcatag atgcaagcgg gtgcgcttcg acaccttcgg cgtccggcga caggtgccgg 241 acgacaaaag atctaaagga gacaacgatg gaaaagaaat ttgttttaag agacgcagaa 301 gagaaggatt acgattttat tctgcgggtc aacgaagaaa acgtggaagt gctctctccc 361 atgccgctgg agaggttaaa actgtttaaa gagcatgcgg acatgctgca ggtcgcggaa 421 gtggatggcg agttggcagc gttcatcatc tgcatgaaag aaggggacga ctggtacgac 481 agcgagaact atctgtggtt ctgcaagacc tacccgcagt tcctgtacat cgaccgcatc 541 gtgctggata agccgttccg tcatcaggga ctgggcagat tcatgtacga agccgttttc 601 gcaaaggcga aggcgaacgg ggctccggtg gtcacctgcg aagtcgacac cgtgccctac 661 aacggaccgt ccctgctgtt ccacgaagcc atgggcttta aagaagtggg cgcccagtat 721 gtacgcggag gctctgtaaa ggtgagcctg caggccgcag aagtgtaaaa cgtaagaaga 781 ataaaagaac cgctccggaa aggggcggtt ttttcgtggg gcgtgttgga ctgaaattcc 841 tacagcacaa ccgtcagcag caggtagtac gcagcagcgg cggggagcag aatggccgcc 901 acgggcagca tgtagcgcgt gatcctccca aacggcacgt ggaaataatc cgctgtcatg 961 tggatgcaga tgtgcgtggg ggagaactgc atggcggtgt acatggtggt ctgcagcagc 1021 acggccagag gcgctccggc gccggggacc gcggagaagg ccatcacggt gaacatcgca 1081 gaagtcgcgt cgcagcccac cacgaagggc gccaggaaga agaggatcat aaagatcacg 1141 aaggccggca gcggaatgct cagcagcgct ttcggcagtt cttccgctgc gccgctggcc 1201 ttcaggatct ccttgaagac catgatgagg taggtgctgc acagcacgtt tccacggaag 1261 gctttcttca ggactgcagg tagctctgcc ggctggaagc ggtgcacggc cagcagcaga 1321 aggcaggcga tgcaggccga aaacagcacg ctgcggccga acgccagcac taacacaatg 1381 atcagaagaa gagaccacag gtgagaaagt gcacccaggg cctcttttgt cttgctttca 1441 cagggcggaa ggcccgtttc ctttggaatg cggcgcgcat aaagcagata gccaagaaga 1501 aagcacagcg ccgtcatggg gatctgcagc agcacaaagg aagcaagcga cgtgccgctc 1561 aggctgcaca tcagaatgat ggaaacgtag gtgggcagga tgctctccgg aatgtggcgg 1621 aaaaatgtcg taagaaaagc ctgcagctcg acggggatgt cgtcccggca ggtatcgcgc 1681 acgatctcgc cggcgatggt gaccgcagca gcggagggca aaagcccgat aaacaccggt 1741 gcgatcgctg tgttcagcct ccggttgttg aataaagcgc tcaggttttc ctgggccttt 1801 ttcagttcgc cgcgggcttc cagcaatccc tggatcacaa agatcgcgta gac // LOCUS sequence260 1852 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence260 VERSION sequence260 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1852 /mol_type="genomic DNA" /organism="" /note="sequence260" ORIGIN 1 cctcgttgac ggcggggctg taatcgatcc agaccgccac ggcgttcgta acgggcgcgg 61 gcggggtctc cggttccggt tcgatgacgg gttcaggcgc ttccggctct ttggatacca 121 ccaggtcgat ggtgtcgcct tccgcgatgg ccatgcccgg cgccgggctc tgggtgatga 181 ccgtatcttc cttgcggttg atatcttcca cataggagat ctcgcccagt ttaaggtcca 241 gttcttcgat ctgcttcttt gcttcgtcca ggctcttgcc ctccacgttg aactgggagc 301 gcgcgacatc cttctcggag cccagcgata cgacgagggt gatctccgag ccatcgggat 361 acgtcgtacc ggcgacgggg ctctggctga tgaccgtgcc cttgggaacg gtctcgctca 421 cctcttccga aacgacgccg accttgaatt tataggtttc cagcatggtg cgggcgttag 481 ccagggactt tccgaccacg tcgggtacgg agccgtccac cttgcccttg ctgacgttga 541 cctcgatgct ctgaccggac ttgatggaag cgccggcatc cggcgtctgg ctgaggatga 601 ccccttccgc cacgtcgttg ctgggcagtt ccatgcctac cttgacatcc agtccgaatt 661 ctttgaggat ctcctccgct tcgtccagcg tatggcccac gatctcgggc gcctgcacga 721 tgtcgccggg gcggatctca tccgggtcgc tgccgctcat catgctgcgc acaaacgcgc 781 tggcagggat cgccagcatc agcgccgcaa ggatgaggac gacatacgcc cagttgaatc 841 ttctgccgcc gctctcttcg ttttcctcgc tctccgcgtc gtcgcccttc tttctgccgc 901 cggtggtcac ctcttccgag cccttggcac ctttggccag cgccggtgta aggccgccgc 961 tgtttctggc cgtcttggag aacttgacga agttcagagc cgttatcatc tcgtccgcac 1021 tgcggtaccg gccggtctgc agtttgttcg tggctttcat gacgatctct tcgagatcct 1081 gcggaatgtc ggggttgagc tcgctgggcg gggtcatctc ctcgttcatg tgcttgaccg 1141 ccacagccac cgccgtatcg ccgtcgaagg gcactttgcc cgtcagcatc tcgtacagca 1201 cgatgcccag ggaatagatg tcggactttt cgtccacgta ggcgcctctg gcctgctccg 1261 gggagaaata gtgcacggag cccatgacgg cttcctgctg ctcgcccacc agcgtgccgc 1321 cggtgacggc cttcgcgatg ccgaagtccg tgatcttggc cgtgccgtcc tgggtgatca 1381 tgatgttatg gggctttacg tcccggtgga tcagttggtg cttatgcgcc atggaaagcg 1441 cggaagccac ctgtttggcg atatccgccg cacggtaagg atccagcgga ccttcctcct 1501 tgatgatgtc ggagagcggt ctgccttcga tgagttccat gacgatgtag tagatgttgc 1561 cctctttgcc tacgtcgtac acgttgacga tattgggatg cacgagaccc gccgcgatct 1621 gggattccct gcggaagctc tcgatgaaca tggcatcttt cgtatattcc ggccggagga 1681 tcttgatggc aacaaagcgg gagagcagac ggtctcttgc cttgaagacg acggccatgc 1741 cgccttcgcc gatcttgtcc tgcagctcgt atcttcctgc taaaattctg ctgcccatac 1801 gctatccccc tatccggatg cagacgacgg agatgttgtc cttgccgccc gc // LOCUS sequence261 1852 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence261 VERSION sequence261 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1852 /mol_type="genomic DNA" /organism="" /note="sequence261" CDS 536..1024 /product="5-(carboxyamino)imidazole ribonucleotide mutase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_008763604.1" /transl_table=11 /codon_start=1 /translation="MKKVAIIMGSDSDLPVVKKGTDLLKTLEIPFEVHVYSAHRTPDQV RDFVASAKANGFGVIIAAAGMAAHLAGVIAAGTTLPVIGIPCKSSVLDGMDALLSTVMM PPGIPVATVAIDGGANAALLAAEILALGDEELAARLQAKRKADADKVLDKDAAIMERL" /locus_tag="LOCUS_6770" /gene="purE" /EC_number="4.1.1.21; 5.4.99.18" /note="WP_008763604.1 5-(carboxyamino)imidazole ribonucleotide mutase (Bacteroides) [pid:55.2%, q_cov:82.7%, s_cov:79.3%, Eval:5.5e-35]" /note="MGA_1028" ORIGIN 1 gcagcctgct ccggcggcgt tatgggcgac cactgctccc ccatttccga taccaccatc 61 atggcttccg caggcgcgca ctgctaccac ctgaaccacg tgttcacgca gctgccctac 121 gctctcacgg tcgccgctgt tgcgttcgta tccttcatcc tggctggact catccagcag 181 gtatggatct gcctcatcat cgccatcgct ctgatgatcg caactctgct ggtcatcgac 241 aagatcgaga gaagcaagaa ccacgatatg tacaaggcta tcgacgaagc ttatgccgct 301 cacatggccg gcaagtaatc gaaacctgtc ttatccaaac cgggtccttc ggggcccggt 361 tttatttttc gaacgaaaag atcgtttttg ttaaccatca tccgtgtaaa tccgaacgtt 421 cgactttttg ccatcaaaat cgtttcaaat tcacaccgat ttcgttgtaa ttccaacccc 481 cgaagtgtag agttagactg tacgaaaatg aacgctgctc tattaaggag gcattatgaa 541 aaaagtcgcc atcatcatgg ggtccgacag cgatctgccg gtggtcaaaa aaggcaccga 601 tctgctgaag accctggaga tccccttcga agtccacgtc tattccgccc accgcacgcc 661 cgatcaggtc cgcgattttg tcgcgtccgc gaaggcgaac ggtttcggcg ttatcatcgc 721 cgctgccggc atggcagccc acctggccgg ggtcatcgcc gcaggcacca cgctccccgt 781 catcggcatc ccctgcaagt cttccgttct ggacggcatg gacgccctgc tttccaccgt 841 catgatgccc ccgggcatcc ccgtggcgac cgttgccatc gacggcggcg ccaacgcggc 901 tttgctggcg gctgagatcc tcgcgctcgg agacgaggaa ctggccgcga gactgcaggc 961 gaagcgcaaa gccgatgcgg ataaagtcct ggacaaggac gccgccatca tggaaagact 1021 gtaacaggag gcagctatgg gaggtttctt cggcatcaca tccggaaaag acgtcgtact 1081 ggacgtattc ttcggcacgg actatcattc tcaccttggg acgaagcgcg gcggcatggc 1141 cgcctgggac gagcagatcg gcctgcagcg cgagatccac aacatcgaaa attccccgtt 1201 ccgcacgaaa ttcgaccacg tgctggacga gatgaagggg accgcagcca tcggctgcat 1261 ctccgatacc tatccgcagc ctctgctcat ccgctccaac ctgggcgtgt acgccatcac 1321 aacgatcggc gtcatcaaca acgcgccgga cctcatcgac agctacctgt ccttctccgg 1381 cggccacttc ggcgtcatga ccggcggaca ggtgaacggc accgagctga tcgcagcgct 1441 catcaaccag aagagcacct tcgcggaagg catcagcttt gcgcagaaga gcatagaagg 1501 cacggccaac atcctcatct taaaggacga cggcagcctg atcgcggcga gagaccgcgt 1561 gggcagactg cctgtcaaga tcggcaaaga cgaagacggc ttcgccgttt ccttcgaaga 1621 cttcgcctac cagaagctgg gctacgaaga ttataaggaa ctgggcccgg gggagatcgt 1681 ggagatcacc ccgaagggca tcaaacagct gaaggccccc ggcaagaaaa agcgcatctg 1741 cgcgttcctg tggagctact tcggctatcc gacagccacc tatgaagggg tcaccgtgga 1801 atccatgcgc taccgcaacg gcgccatcct cgcggaaaac gacctggcca ga // LOCUS sequence262 1851 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence262 VERSION sequence262 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1851 /mol_type="genomic DNA" /organism="" /note="sequence262" CDS complement(114..782) /product="16S rRNA (guanine(527)-N(7))-methyltransferase RsmG" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011462328.1" /transl_table=11 /codon_start=1 /translation="MDRTQQLEKLRDVILEWNEKINVTAIRDPKEFDRKNVQDSLAILP LPEYEGAKEVLDMGTGGGFPGLPLAVCSPEKSFVLADAIGKKLKVVQAAAQELGLVNVE TVHARAEDMAKTKVHRERYDLVVSRAVANMATLSEYCLPFVKLGGFFIAYKTEDAAEEI EAAKGAIARLGGQIRRIEKTSPNNDALLNGHVFVVVEKIAKTPKEYPRKAGTPGKDPLK " /locus_tag="LOCUS_6780" /gene="rsmG" /EC_number="2.1.1.170" /note="WP_011462328.1 16S rRNA (guanine(527)-N(7))-methyltransferase RsmG (Desulfitobacterium) [pid:42.3%, q_cov:99.1%, s_cov:90.0%, Eval:1.5e-44]" /note="MGA_1031" misc_feature complement(787..>1851) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_009898858.1:tRNA uridine-5-carboxymethylaminomethyl(34) synthesis enzyme MnmG" /note="WP_009898858.1 tRNA uridine-5-carboxymethylaminomethyl(34) synthesis enzyme MnmG (Clostridioides difficile) [pid:60.5%, q_cov:98.3%, s_cov:55.3%, Eval:1.4e-116, partial hit]" /note="MGA_1032" /locus_tag="LOCUS_6790" ORIGIN 1 gtcccagagc tccttttccc ggccggcaaa ttccaggatg cagccccagc cgcccacgtt 61 ctcctcgttc tgattgccgg agcaggcgcc gtccgtgtac atgttgacga tcttcatttc 121 aggggatcct ttcccggcgt gcccgctttt ctcggatatt cctttggcgt tttcgcgatc 181 ttttccacca cgacgaaaac gtgaccattc aaaagcgcat cgttattagg cgatgttttt 241 tcaatgcgcc gaatctgacc gcccagcctg gcgatggccc cttttgcggc ctcgatctcc 301 tccgccgcgt cctccgtttt ataggcgatg aagaagcctc ccagctttac gaacggcagg 361 cagtattccg acagcgtcgc catgttggcc acggcccggg acaccaccag atcgtagcgc 421 tcgcggtgga ccttcgtctt cgccatgtcc tccgcccggg cgtgcaccgt ctccacattg 481 accagaccca gctcctgggc cgccgcctgc actaccttca gcttcttgcc gatggcgtcc 541 gccagcacga aggatttctc cgggctgcag actgccaggg gcaggccggg aaaaccgccg 601 ccggtgccca tgtccagcac ctccttcgcc ccttcgtact cgggaagggg caggatagcg 661 agactgtcct gcacgttctt acggtcgaac tccttgggat cgcggatcgc tgttacgttt 721 attttctcgt tccactccag gatgacgtcc cggagcttct ccagctgctg tgttctgtcc 781 atcgctctat tcctgcgctt tctgcgacgt gcggcgcatc ttctccaggg tcaccagcag 841 cacgccgatg tccgccggcg atacgccgga gatccgggac gcctgaccca cgctcagcgg 901 gcgctgcgcg tccagtttct gacgggcttc gatgcggaga ccgtccatgt tgagataatc 961 cagatccgcc ggaagcgctt tgtcttccag cttcttaaag cgttcgatct gcgccagctg 1021 cttctcgata tagccggcgt atttgagttc cacttctacc ttggatcttt cgtgggcgct 1081 taatgcgggc cggtccggat cgatagctgc caggttctcg taggtgacct ccggccgctt 1141 taaaagatcc gccaggctct gccggttgtc cgtcggcgca gagcccaggc tctccagata 1201 gggattcgcc tctgccggtg agaccgtcgc cgttttcagg cgggcgagct ccgcatccac 1261 tgcggtctgg gatttctgga accgctccca gcggtcatcc gagacgaggc cgatcttgcg 1321 ccccagcggt gtaagccggg tgtccgcatt gtcctggcgc agcaccaggc ggtattccgc 1381 ccgggacgtc atgatgcggt aaggctcgtt cgttcccttc gttacgaggt cgtcgatgag 1441 cacgccgatg taggcctggg accggtccaa gatgaagggg tctttgccgt ccagccaaag 1501 tgctgcgttg accccggcca tcagcccctg ggccgccgcc tcttcgtagc cggagctgcc 1561 gttgaactga cccgcacaga acacgccggg gaagtcccgg tgctccaggt taagctggat 1621 gtccagcggg tcgatgcagt cgtattcgat ggcgtaggcg gagcgcacga cctccagatt 1681 ttccaggccg ggcatggtct tatagaaccc gatctgcacg tcctccggca tgctggaaga 1741 catgccctgc aggtacatct cctcggtgga caggccctcc ggctccacga agcactgatg 1801 gcgctccttg tccgcgaagc ggttcacctt gtcctcgatg gagggacagt a // LOCUS sequence263 1849 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence263 VERSION sequence263 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1849 /mol_type="genomic DNA" /organism="" /note="sequence263" ORIGIN 1 ccgcatggca cggcgcagac catatcatgg tcatccgcca catgggtcag tcccacatcg 61 acggcctgat ggagggtact ccccagggta tcggcggcat ccccgtaacg agaaagcagg 121 ttagagccca gagaaaggcc ctggatctga tcgaggatga agtcggcaga cccatcaact 181 atcactccta catctccggc gttgcaggcc ccgacatcgc ggtcatgttc gctgaagaag 241 gcatcaacgg cgctcaccag gatcctcagt acaacgttct gtacagagac gtcaacatgg 301 taagatcctt cgtagacgcc tgcgaatcca agaagatcat gacctgggca gacatgctcc 361 agatcgacgg cgctcacaac gccaacgcca ccgcaagaga agcctggaag gtaatgccgg 421 agctgatcgt tcagcacgcc atcaactccc tgttctccga aaaggtcggc gaaaagcccg 481 aaaacatctc tctgtccacc gtacctccca cggctacgcc ggctccgtgc atgtatatgg 541 acctacccta cgctgtcgcc ctgagagaga tctgcaacag atataagatg agagcccaga 601 tgaacaccaa gtacatcgac tcctccgcaa gagaagcgac cgttactcac gttatgaaca 661 tgttcatctc caagctcacc cgcgcggaca tccagtccac cattacgccg gacgaaggca 721 gaaacgtacc ctggcacatc tacaacatcg aagctaccga caccgcgaag cagacgctga 781 ttggtctcga cggcctgatg gagatggtcc agctgaacaa cgaccccaac ggcccgctgc 841 gcaagaaggt ccgcgagctg aaggaaagag ccacgctgtt catggaagag atcgtagagg 901 tcggcggcta cttcaaggct gtccaggaag gcttcttcgt agactccgcc atgtaccccg 961 agagaaacgg cgacggtatc gcccgtaaga tcgagggcgg cgtaggcgta ggcaagatct 1021 tcgaaagaga tccggactac atggctcctg ttacggctca ctacggctac aacaacgtcg 1081 agcagtacgg cggcgacccg aaggatccct ccgctctcat cggcggctgc accttcgaag 1141 accgttccaa gatcgtctac atcgacgaac tggacgagac cgactgcgta gacagacgtc 1201 tggaaaagac cgcgaagtac agagacggcc acaccattaa gcccgaaatg gaatggtgcg 1261 gcgacggaac cgtcatgatg accatgtgca tcccgaccaa caagcgcgtt gcggaagcag 1321 tcgctgtcga gatcggtaag aagcttggtc tcgtggatcc ggaagtcatc tcccgcgaag 1381 ttctgcagga agcggaaggc accagaatcg agatgaaggg caaggtcgac ttcgatatcg 1441 acatcaacac catcgacatt ccggaagaac cgcactacat gtccgatgca gagctgtacc 1501 acgaatttga ggaagtcaag cacatgaagg ccatctgcgg caccgtgggc gaagacgaac 1561 actccgtcgg tatgcgcgag atcatgaaca tcaagcacgg cggcatcgag aagtggggca 1621 tcgaatgcat ctacctcggc acctccgtac ctctcgaaaa gatggtcgac gcagccatcg 1681 aagagaacgc ggaagccatc ctggcctcca ccatcatctc tcacgacaat atccactaca 1741 agaacatgaa gagactccat gagctctgcg tggaaaaggg tatccgtgac aaggtgatcc 1801 tctgcgccgg cggcacccag gtcattcctg aggaagccgt taagaccgg // LOCUS sequence264 1848 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence264 VERSION sequence264 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1848 /mol_type="genomic DNA" /organism="" /note="sequence264" CDS complement(625..1281) /product="tRNA (guanosine(46)-N7)-methyltransferase TrmB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003565908.1" /transl_table=11 /codon_start=1 /translation="MRQRSVKNRDAIAADCSAWIEDDPKAKRGSWRSAFADPSLPLHLE IGSGKGRFICEMARLHPDINFIAVEGGKKINVRILQKAKDYNLSNLLVIMDYIVDARDF FAEGELDRIYLNFSDPWPKARNAKRRLTYREKLKAYEACAAPGAVLQFKTDNDGLFDYS LEEIRSRGLLLRWVTRDLHHSPYAEWNVETEYEQKFSARGKSINCLQAVLKKCNE" /locus_tag="LOCUS_6800" /gene="trmB" /EC_number="2.1.1.33" /note="WP_003565908.1 tRNA (guanosine(46)-N7)-methyltransferase TrmB (Lacticaseibacillus) [pid:50.3%, q_cov:87.6%, s_cov:88.8%, Eval:5.8e-46]" /note="MGA_1035" misc_feature complement(1282..>1848) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011860635.1:energy-coupling factor transporter transmembrane component T" /note="WP_011860635.1 energy-coupling factor transporter transmembrane component T (Clostridioides difficile) [pid:67.2%, q_cov:95.7%, s_cov:67.4%, Eval:6.0e-64, partial hit]" /note="MGA_1036" /locus_tag="LOCUS_6810" ORIGIN 1 acttggcgtc gacgaccttc tgcttggcag ttgcggcgtg gatggtggac atcagaccgc 61 cgtcgatgcc gtattcagtc tgcaggacct tgcacagcgg agcgagacag ttcgtggtgc 121 agctggctgc agaaacgata tccattgaac tttcgtactt ctcctggttg acgccgtaga 181 cgaatgtcgg ggtcacctta tccttagccg gagcggacat gatgactttc ttcgcgccgc 241 cgacaaagtg ggccttcgca tcctcggact ttacgtaagc gccggtggcg tcgatgatgt 301 attcggcacc gagttccttc caggggatct tggaagcgtc gccttcgctg tagacgagga 361 tcttcttgcc gtcgatgatg atgccgtcgt ccgccttctc cagcttgccg gggaagcgtc 421 cgtagacggt gtcatatttg atcatataga gcatgtagtc gatgtccgct tcgcgctttg 481 cgatcgcgac gacgtcgaat acttccggct gctgcagagc gatgcgcaga gcgatgctgc 541 cgatgcggcc gaagccgttg attcctaact taatagccat tttctcctcc tcattggccg 601 cacagggcgg tcccaacctc tcagctattc gttacatttt ttcaaaactg cctgcaggca 661 gttgatggac ttgcctctcg cggagaactt ctgctcgtac tccgtctcca cgttccattc 721 cgcgtagggg ctgtggtgga ggtcccgggt gacccagcgc agcagcaggc cgcggctgcg 781 gatctcctcc agggaatagt cgaacaatcc gtcgttatcc gtcttgaact gcagtacggc 841 accgggcgcc gcacaggctt cgtatgcctt cagtttttcc cggtacgtaa gtctgcgctt 901 ggcgttgcgg gccttcggcc agggatcgct gaagttcagg tagatgcggt ccagttcccc 961 ttcggcgaag aagtcccgcg catccactat ataatccatt ataacaagaa gattggaaag 1021 attatagtct tttgcctttt gcaggatgcg gacgttgatc ttttttccgc cttccactgc 1081 gatgaaattg atgtccggat gcagccgtgc catctcgcag ataaaccggc ctttgccgga 1141 accgatctcc agatgcagcg gcaggctggg gtccgcaaag gcgctgcgcc agcttcccct 1201 ctttgctttc gggtcatcct cgatccaggc gctgcagtcc gccgcgatcg catctctgtt 1261 ttttacacta cgctgtctca tttagaacac cggcagcttt ccgatagcga tgaccgccgc 1321 aaaatacaat accaggatga ccgccgcgat gcggtcgcaa ttgtggaagg ccatgccgtt 1381 catgcgggtg cggccgtcgc cgccccggta gcagcgggct tccatggcca tggccaggtc 1441 cgccgcgatg cggaaggcgc tcacgaacaa gggcaccagc agtggaatga gccctttagc 1501 gcgctgcagc agattgccgc tctcaaaatc cgcgcccctc gctgtctggg ccttcatgat 1561 cttgtcggtc tcgtccagca gcgtggggat aaagcgcaga gcgatggtca tcatcatggc 1621 cagctcgtgg gaaggcaggc cgatcttgct taaaggcgag agcagccgct ccatgccgtc 1681 cgtcaaggcc acgggcttgg tggtgagggt caaaagggat gacccgaaga tgagcatgac 1741 gagccggatc gccataaagc aggcgcggta gatgccctcc cgggcgatct tcaggatgcc 1801 gaagcgccag atggggtcgc cgggggtcat gaacaggttg atgatggc // LOCUS sequence265 1844 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence265 VERSION sequence265 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1844 /mol_type="genomic DNA" /organism="" /note="sequence265" misc_feature <1..837 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011948404.1:UvrD-helicase domain-containing protein" /note="WP_011948404.1 UvrD-helicase domain-containing protein (Clostridium botulinum) [pid:44.2%, q_cov:98.6%, s_cov:30.9%, Eval:1.6e-63, partial hit]" /note="MGA_1037" /locus_tag="LOCUS_6820" ORIGIN 1 agtctgtaca cctgcctgca gaaccacctg gacgacgaga tcttcaaggg cacgaaagcc 61 gcgaagttta tcgatctgat cgagactttc gccaaacttg ccgagtctat gcccatctcc 121 gaactgtttt cgaaactggt ggaccaaagc ggctacgagg ccatgctgcg cacggaaggc 181 agccaggagc ggctcgacaa tctggcagag ctcaagcagt ccatctacga atacgagacg 241 agctgcgggg aggagacctc gctgcagcac tatctggagc atgtggcgct gttctccaat 301 gcggaacagc ccatcgcgga aggcaaggta aagctcatga cgatccacgc cgccaagggc 361 ctggaattcc cctacgtctt tctgtgctcc ttaaacgaag acgtcttccc ctccaagaaa 421 gtgagcacgc tgcaggccat ggaagaggag cggcgtctgg ccttcgtggc ccttacgaga 481 gcggagaagg cgctgttcct gtccgatgcg gaaggacgca cacacgaagg aacccagcgc 541 tatccgtccc ggtttctgtt cgacatcggg gaagaactgc tggatgtgga gaacaagccg 601 cctgaggatc tggtgcgcga cgcgaaggag atgatcgcgg tcaagacaaa gcgcatgccg 661 gaaaacctgg aaaaaactgc gctggcgccc ggcacccggg tgcgccacga catcttcggc 721 gaaggctgcg tggtggatac cgacgtcaac gcgggcgtct atatcatcca attcgatatg 781 ctcgataccc cgcgcagact gaatatgcgt ctaaaactgg aagtattggg ttcttaacag 841 atgcagaaga ccctcagagt atgttaaaat aaataaatta gcgcattatc gtagcagttt 901 tgagggcact atgggcatcc tgttttccag catgatcggt acgctggcgg tcatcttcgt 961 catcgcgttc tttatcggag gcagcgatct tctgccgatg ttcctcggca tgaagagaaa 1021 ctggaaattc atacttaccg ccggcgtcgt cggcggtgcg ttcggcatct acggcaatct 1081 gacgggcacg tctctgaacg gggccgtcat ttccgtgcgg gatatcggcc ccatgatggc 1141 cggctttttc ggcgggcctc tgggcggact gctgggtggg ctcatcgcag gcgcccaccg 1201 gctcaccatg ggcggcatta cggcaaaagc ctgcatcgtc gccacttgca tcatcggtgt 1261 cctctgcggc ctcttgtccc ggcgttccca cgatcagctc atccgtcccc ggttcgcgtt 1321 cagcgtcggc atcgtgatgg aagcgctcca tctgggcatc gttctgctga tggtcaaacc 1381 cttcgagacg gcgctggaca tcgtccggca gatcgccatt ccctttatcc tggtaaacgc 1441 gctgggcttt acgctgctca tcagtctgat gacttacgtg gaaaagcagc gcaatctgat 1501 cctggaacag aaccgcctcc agtcggagct gaacacggcc aacgtcatcc agcggtcgct 1561 gctgccgccg atcacggaca gctatccggg acggtccgag ttttccatcc gagcttccat 1621 gaccccggca aaagtggtgg gcggagattt ctacgacgtg ttcttcgtgg atcaggaccg 1681 catcgcgttc ctgatcgcgg acgtctccgg caagggcatt cccgctgcgc tgttcatggc 1741 aagcgcgaag atcacgctgc agaactgcat ccgggacttt tcggatctgg cggaagcggt 1801 ggaaaaagcc aacgacagcc tctgcgccaa caacgaggcg gaga // LOCUS sequence266 1822 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence266 VERSION sequence266 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1822 /mol_type="genomic DNA" /organism="" /note="sequence266" CDS complement(316..1056) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSDRVLEVNNLSVVYQDSTVFGKKSNFQALTDVTFHIDHGEIVGL VGESGCGKSTLSKAILGMLDDAKITGEIKHYTKRPQMVFQDPHGSLNPAKTVGWILEEP LRIFGKYDAPERKRRVLNMMTRVGLDHELITHKPNELSGGQKQRVSIATALIQRPRFVV ADEPVSALDVSIQGQILQLLLDLRDELDLSYLFITHDLNLCYSICDRVLVMYKGQLVEQ GPVDDVYEHPQHEYTKALLDAVLK" /locus_tag="LOCUS_6830" /note="WP_013384738.1 ATP-binding cassette domain-containing protein (Ketogulonicigenium vulgare) [pid:41.9%, q_cov:99.2%, s_cov:71.7%, Eval:5.2e-52, partial hit]" /note="MGA_1040" misc_feature complement(1049..>1822) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_004081442.1:ABC transporter ATP-binding protein" /note="WP_004081442.1 ABC transporter ATP-binding protein (Thermotoga) [pid:47.6%, q_cov:98.1%, s_cov:76.0%, Eval:2.8e-64]" /note="MGA_1041" /locus_tag="LOCUS_6840" ORIGIN 1 atcccgctgg acttctccga cgcgacggac gcctatatcg tttgctgcaa ggggctgcct 61 gtgggggtca ccgtggggga ggaacaggac ggcgtcctga atctcgttct ggactacacc 121 atccccgaat accgggactt ctccgtcggg cgcttcctcg ctgcggaatt aaaaaaacag 181 ggcgtccgca aactgtgtta cggaggccct gtggaatttc atctgccgta tctgcagaag 241 ctcggctacg tcaagaacgg ggagctctac gaaaaggaac tgtagtgcac agtgtacctg 301 tccccatggg acattttatt tcaggacggc gtcgagcagc gcttttgtgt attcgtgctg 361 cggatgctcg tagacgtcgt ctacgggtcc ctgctccacg agctggcctt tgtacatgac 421 gagcacgcgg tcgcagatgg aatagcagag attcaggtcg tgggtgatga acaggtagct 481 cagatccagt tcgtcgcgca ggtcgagcag cagctgcagg atctgcccct ggatggagac 541 gtccagagcc gagaccggct cgtccgccac gacgaagcgc ggtctctgga tgagggctgt 601 cgcgatggac actctctgtt tctgaccgcc ggacaattcg ttcggcttgt gggtgatcag 661 ctcgtgatcc agcccgactc tcgtcatcat attcagcacc cggcgcttgc gttcgggtgc 721 gtcgtatttt ccgaagatgc gcagaggttc ttccaggatc catcccaccg tcttggcagg 781 gttcaggctg ccgtggggat cctggaacac catctggggc cgcttcgtgt aatgcttgat 841 ctctcccgtg atcttcgcgt cgtccagcat gcccaggatc gccttggaca gggtggattt 901 gccgcagccg gattccccga ccaggccgac gatctcgccg tggtcgatgt ggaacgtcac 961 gtccgtaagc gcctggaaat tgcttttctt tccaaacacc gtagagtcct ggtacacgac 1021 ggacaggtta ttcacttcga gaacgcggtc actcatggcg tctcctcttg gggatggcag 1081 ccatcagctg ccgggtgtat tcgtctttcg gcgcgttgaa aatgtccagg gtcttgccct 1141 gttccacgat gtttccttta tacatgacgg cgacgttctc gcacagctgc ttcacgacca 1201 gcaggtcgtg gctgatcagc agaatgccga ccttgtattc gtcgctgagt tccttcagca 1261 gcttcaggat cttcgcctgc acgctgacgt cgagcgccgt ggtgggttcg tcgcagatga 1321 gcagcttcgg gtggatcacc atcgcggccg cgatcatggc gcgctgccgc tgacccccgg 1381 aaagctggtg cgggtatttg ctgtagatct cgtccggatt gggcagacct acgcggtcga 1441 gggcgtcgat cgcgagtttt ctgcgctctt cgggcgtttt tttcgtgtgg atgcgcagcg 1501 tctcttccac ctggtagccc accttgatga ggggattgag cgagttcatc ggctcctgga 1561 acacgacgcc catgcccggt ccctggatgg aacggagctg gctgcggctg cagcggtgca 1621 gatccatgcc ctcgaacacc acgtccccgg tcacggtcac gcggctgcgt tcgatcagtc 1681 cggtgatggc catggccgta acggtcttgc cggaaccgga ctcgcccacg aggcccagcc 1741 gttcgccttc ctgcatggag aaactgatgc cgtggagcgc ttccttgttg ttgtcgagga 1801 acgtgacccg caggtctttt ac // LOCUS sequence267 1821 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence267 VERSION sequence267 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1821 /mol_type="genomic DNA" /organism="" /note="sequence267" misc_feature complement(365..>1821) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010880620.1:AMP-binding protein" /note="WP_010880620.1 AMP-binding protein (Aquifex aeolicus) [pid:34.9%, q_cov:98.1%, s_cov:52.7%, Eval:1.1e-66, partial hit]" /note="MGA_1043" /locus_tag="LOCUS_6850" ORIGIN 1 atgacgttat gcactttatc cagcttttcg cagacgcggt tgagagcctt catgacctcc 61 agatcgctct ccagcgaata atccgccagt tccgcgactt cgtccagttc gcacatctgc 121 ggaacgcgca gcagcaggta ttcggtctcg aggcccgctt ctttcagttt gcggatctgc 181 gacagccggc tggtacccag ctgctttgca ccggcatcca gataggtctt cgccgcgatg 241 ggatcggacc agtaggcctt caccacgccg catacgtcga tgccgcagcg tctgcagcgg 301 tcaacgacct gcttcgcgtt ataccgcagc tttgccagat cgatctctaa ctggggatac 361 atgtttacca cctcttgatt ttctgtgtcg ttgttttttc gaattccgtg tcgcgcaggg 421 agaagcgctt gacccgcttg tacagcggca tcatgtcgtt gcagcggtcg atctccttct 481 tgatgagcgc ctggagggcg tcaccggaag gactgccggc ctccgccagc gcctctttgt 541 ccgggaagat ctccgccgta acagccatat cctgcttgtc gtcttcgccc cgcaccacga 601 cttccttgat gtaggggctc ttgagcagat aatactccac ttcctcgggg aagatgttct 661 tgccgttctt cgttacgatg acgttcttct tgcggcccgt gatgtacacg tagccgtccc 721 ggtcgatgta gccgtagtcg ccggtgtgca gccagccgtc ttcgctgagg actttcttcg 781 tttcatcttc gtccttgtag tagcccagca tgacggcggg actcttgcag acgatctcgc 841 cgatgccgtc ggagtcgggc tggtcgatga agaccttcgt cccgggaagc ggcagtccta 901 cggacgcggg cttgcaggcg taatccgggt tgagagcgat gatcggcgag cattccgtca 961 tgccgtaacc ctgcaccatg ttgatgccca tggccatgta gttgcggatg acgttcgggt 1021 cggatgccgc gccgcccacg atgaacagtt ttacatttcc gcccatggcg ttgtgcacat 1081 ctttaaacag ccgcgcggtg cgcttctgca ccttcttatc gatgtgggag agcgccttta 1141 ccatcttgat ggccttgcgc atcttatccg ccttgccggc cttttccgcc tgcttccaga 1201 tcttgttgtg catgttctcg aagatgaggg gtacggcgat caggtacgtc accttggcct 1261 gctccatgtt cttcgtgatg tatttcaggc cttcgcagaa cgccaccgtg ccgccctggt 1321 gcatcgagcc aagcaccgtc gccgtaaact cgaacgtgtg gtgcatgggg agcagcgaca 1381 ggcagacctt gcggtcctta aagcggtcca gttcgacgta ttcgtacaaa gcgctcacat 1441 cgtaggccag gttgcggtgg cagagcatga cgcccttcgc cagtcccgtc gtacccgacg 1501 taaagatgag cgtgcagaaa tcgtccggtt ccacgggcag ctgtgcatag ttgtccgaac 1561 ctacggaacg gagcgcaccg cccttgttgc gcagtttgcg ccaggacagc acctcttctt 1621 cgtcttccgc cagatccatg cagatgagct ggatgttgtc catcccctgc agcgcctctc 1681 tcactttcgc gccgaccttc gcagaataga cgatggcgga gatgtccgcg cgtccggcca 1741 gggccgatac ttcctgcacc ggaagttcct tgtcgagggg cacgatgacc cccagaccgc 1801 aggccacggc gaaataggtt a // LOCUS sequence268 1818 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence268 VERSION sequence268 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1818 /mol_type="genomic DNA" /organism="" /note="sequence268" misc_feature <1..1030 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_003440033.1:glycosyltransferase" /note="WP_003440033.1 glycosyltransferase (Clostridioides difficile) [pid:47.8%, q_cov:90.4%, s_cov:79.0%, Eval:7.9e-82]" /note="MGA_1044" /locus_tag="LOCUS_6860" CDS complement(1203..1796) /product="thymidine kinase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011073032.1" /transl_table=11 /codon_start=1 /translation="MAQLYYRYSTMNAGKSIELLKVAYNYEERGKHVLVLTPSFDDRYG VGKINSRIGISRDAIAISGDEDLLELYKKYEAQQHIDCMLIDECQFLKKHQVLELAHVV DDYNCPVLTYGLKNDFRNELFEGSHYLLLYADKIEEIKTICHCGRKATMVARVDENGNM LKEGAQLVVGGNDMYVSLCRKHYMAGDLGPDFKK" /locus_tag="LOCUS_6870" /EC_number="2.7.1.21" /note="WP_011073032.1 thymidine kinase (Shewanella oneidensis) [pid:56.5%, q_cov:94.4%, s_cov:96.9%, Eval:1.2e-60]" /note="MGA_1045" ORIGIN 1 cgacggctac gatttcgaga tggaagacaa ggagaacggc gcgcgggtcg gcaaggataa 61 ggcttttgct acagaactgc tcgtgagcgc cacgctggcg ctggatgaga tggctgcaga 121 acagatcgcc cgcattcagc ccgatctggt ggtttctgat tccgtagcgt tctggggcaa 181 actgaccgct atgaagtacg ggctaccgta cgtctgctcc accacgacat tcgcgttcaa 241 ccgctactct gccgcctata tgaaagaggg ccccttcgac atcgcgaaga tgctgctttc 301 cattccgaag atcaataaac agataaagcg gctgcgggag aagggctatc cggtgaaagg 361 gcttttggat atcgtgcaga acgacaatga cacgaacacc atcgtctaca cgtcgaagga 421 attccagccc cgcagcgaga cgttttcgga ccggtatcat tttatcgggc cgtccatccg 481 ccctgtgcag acgccggtgg aaaagacggc ggaaaagacc atctacatct ccatgggaac 541 ggtggataaa gacgaaggat tttaccaccg ctgcatcgaa gccttccggg atacggacgt 601 tcaggtgatc ctgtccatgg gtcagaatac ggagcagttt acggatctgc cgggcaacat 661 ccatgcgtat ccaactgtcg accagatggc cgtgctgtcc atcgccgact gcttcgtgac 721 ccactgcggc atgaattccg catcggaagg cctgtatttc gaagtacccc tcgtgctgtt 781 cccgcagacg cccgaacagg acgctgtggc aaaacgcacg gaggagctgg gcgccggtct 841 gcgcttgacc gatacgtctg ccgaaggcat ccgcagggcc gtcgagaccg tcctgaacga 901 tccatcctat cagcaagctg ctcaggagat ctccgcggga tttaaaagat gcgggggtta 961 tcaggaggca agggccttta tcgagtcttt gcagcgtgcc ggggagggtg gctttcaccg 1021 caaattatga tttgaccacc gcaatatgcc atctttttaa gggttttgtg tggttcttct 1081 ttcgaacaat aaaaaagaca ccattttcga gacgttttca cttcaaaaat ggtgtctttt 1141 tcgatgttct agaaatgtgc tccgctctca gggtcacgca aaagagcgca tggcacggac 1201 cgctatttct taaaatccgg ccccaggtcg cctgccatgt agtgcttgcg gcacagggac 1261 acatacatgt cgttgccgcc cacgaccagc tgggcgcctt ccttcagcat gttgccgttc 1321 tcgtcgactc tggccaccat ggtcgccttg cggccgcagt ggcagatcgt cttgatctcc 1381 tcgatcttgt ccgcatacag cagcagatag tggctgcctt cgaacagctc gttgcggaag 1441 tcgttcttca gcccgtaggt gagcaccggg cagttgtagt cgtccacgac gtgggccagc 1501 tccagcacct ggtgcttctt gaggaactgg cattcatcga tcagcatgca atcgatgtgc 1561 tgctgcgctt cgtatttctt ataaagctcc agcaggtctt cgtcgccgga gatggcgatc 1621 gcatcccggg agatgccgat gcggctgttg atcttcccca cgccgtagcg gtcatcgaag 1681 gatggcgtga gcaccagcac gtgcttgccc ctctcttcgt agttatatgc gactttcagt 1741 aattctatgg attttcccgc gttcatcgtg ctgtagcggt agtatagctg agccatgaca 1801 atatctcctt gtttttaa // LOCUS sequence269 1811 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence269 VERSION sequence269 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1811 /mol_type="genomic DNA" /organism="" /note="sequence269" CDS complement(124..885) /product="SDR family NAD(P)-dependent oxidoreductase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003436810.1" /transl_table=11 /codon_start=1 /translation="MNIAVITGASSGMGREFVYAVDREYELDELWVVARRKERLEELQE KCRAKVRPLAWDLADPASFERFRSLLEAEKPHIRVLVNAAGYGLFGTFEEMGLEEQLGI VDVNDKALTAMCLLSLPYMEKGDGIVNLGSNSSHQPVPFLNVYAASKAYVLSFSRGLGR ELKPRGVHVMCVCPGWIKTEFMDTAVRDDTIKYYDRWYTPQQVIEQGMKDLKMKKKVSI LGAPVRRQVRLVKFLPVDVVMDTWCRQQGKE" /locus_tag="LOCUS_6880" /note="WP_003436810.1 SDR family NAD(P)-dependent oxidoreductase (Clostridioides difficile) [pid:34.0%, q_cov:98.0%, s_cov:96.5%, Eval:5.4e-44]" /note="MGA_1046" CDS complement(928..1512) /product="helix-turn-helix domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_015943659.1" /transl_table=11 /codon_start=1 /translation="MDNYVTGAVIRQLREEKQMTQEELAGKVCVSSKAVSKWETGRGLP DISLLQPLAQALGISVIELFSGGIIQNRNRSSNMGKTVFYVCPVCGNVVRTVGEAVVSC CGIVLPPLEAESPDPDHMLNLEIVEDEYYVSVAHPMDKAHYIAFLAAIADQSVQFVKLY PEGNADARFPIRRVKYLYAYCNRHGLFRVKV" /locus_tag="LOCUS_6890" /note="WP_015943659.1 helix-turn-helix domain-containing protein (Desulfitobacterium hafniense) [pid:38.9%, q_cov:97.4%, s_cov:96.0%, Eval:1.6e-38]" /note="MGA_1047" ORIGIN 1 cagatgaaag taagtatttc tcaaacagaa ctgcaaagtg ccgatgatat cttatgcaat 61 ccaggttggt gaccgttctc tactacagac cggtacgcaa gcggttgatc cacgcagcct 121 gccctactcc tttccctgct gacggcacca ggtgtccatc accacatcta cgggcaggaa 181 cttcacgagc cgcacctgcc ggcgcacggg cgcgcccagg atcgagacct tctttttcat 241 cttcaggtcc ttcataccct gttcgatcac ctgctgaggc gtgtaccagc ggtcatagta 301 cttaatcgta tcgtcccgca cggcggtatc catgaattcc gtcttgatcc atcccgggca 361 gacgcacatc acgtgcacgc cgcggggttt cagctctctg cccaaacctc tggaaaagct 421 taaaacgtaa gccttgctgg ccgcgtagac gtttaagaac ggcacgggct gatggctgga 481 attggagccc aggttgacga tgccatcgcc cttctccatg tagggcagcg acagcagaca 541 catggcagtc agggctttat cgttgacatc cacgatgccc agttgctcct ctagtcccat 601 ttcttcgaat gtaccgaaca ggccgtagcc ggcggcgttc acgagcaccc ggatgtgcgg 661 tttctccgcc tccagcagcg agcggaagcg ttcgaaactg gcagggtcag ccagatccca 721 ggccagcggg cgcaccttgg cccggcattt ttcctgcagt tcctccagcc gctcttttct 781 gcgggcgacg acccacagtt cgtccaattc atattctctg tctaccgcgt agacgaattc 841 tcttcccatg ccggaggatg ctccggtgat gactgcgatg ttcatggcat atctccttgc 901 tccgtttgga gatattatac catattctca gaccttcacc cggaacagcc cgtggcggtt 961 gcagtatgcg tacaggtatt ttacgcggcg gatgggaaag cgggcatctg catttccttc 1021 cggatacagt tttacaaact gcacgctctg gtcggctatg gctgccagga aagcgatgta 1081 gtgggccttg tccatcggat gcgccacgga gacataatac tcgtcttcaa cgatctccaa 1141 gttcagcata tggtccggat ccggcgattc ggcctccagc ggcggcagca cgataccgca 1201 gcagctgacg accgcctccc cgaccgtgcg gacgacgttg ccgcagaccg ggcagacata 1261 gaacaccgtc ttacccatat ttgaggaacg gtttcggttc tgaatgatcc cgccggaaaa 1321 gagctcgatc acggagatcc ccagtgcctg tgccagcggc tggagcagac tgatatccgg 1381 cagacctctg cccgtctccc atttgctcac cgccttgctg cttacgcaga ccttcccggc 1441 cagttcttcc tgggtcatct gcttttcttc gcgtaattgt cggatcacgg cacctgtcac 1501 gtaattgtcc atctcagtct cctccttaca gactcagtgt aaggcacagc cgaagaaaac 1561 gccacctacg cggcgtagag tcccgttttt catccgtcga aaaaaggagg cctgccccct 1621 gcagacctcc ttgtagttgt tatctgtaat cccttttgaa cgttttactt ctgcactgcc 1681 tcgaccgccc ggtggagatc atcggtaaag ttcatctgca gcagcgcatt cagcacattt 1741 acataattct catttgcgtt aacatcgagt acaaggtgct taaaggtcgg atttcccgca 1801 tcgtcgtagt c // LOCUS sequence270 1810 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence270 VERSION sequence270 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1810 /mol_type="genomic DNA" /organism="" /note="sequence270" CDS complement(366..1586) /product="methionine gamma-lyase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003400106.1" /transl_table=11 /codon_start=1 /translation="MHDIDFSKVGFSTMAIHAGAYDDAAYGAEATPIYQTSTYTFKDLN EAEAVFRGELPKYGYGRHGNPTTATLERKIAALECAEAAAVTSSGMGAVSSVLLGELSC GDHMICADTVYGCTDKVVREYLPTFGIETTMLDTSDLEALEAAFKPNTKMVYFEAVANP TLRVTDIAAVAEIAHKHGAIVVVDNTFTPPPVCRPLTLGADIVLHSMTKYLNGHGDVIA GVIAGKKETISAIVSKCVGKLTGSELAPIASYMVIRGLKTLDVRMKVHSASAKAMAEYL EKQPYIKAVYHPTLPSNGKNYETAKKQFREGYCTGMITFETAKYKGMSEYEVARKLLDN LQIPGLGVSLGGADSLIQLPTAMTHAKVPAEGKKAAGITDGMVRFSVGLENIEDLIADF EQAAAKL" /locus_tag="LOCUS_6900" /gene="megL" /EC_number="4.4.1.11" /note="WP_003400106.1 methionine gamma-lyase (Clostridium) [pid:45.2%, q_cov:98.0%, s_cov:98.0%, Eval:4.3e-93]" /note="MGA_1050" ORIGIN 1 agacatcctg gaacgcagca ggttctgccg tgctggcagc cggcgcttcc atgggggtct 61 ccgggttgga gatgtagatc gtgcgggtat tgccgtccca gcgcaccgct ttgcccacga 121 attcgcagac cttggccaga ggcaggtagg tcgtgccctt atacaggatg ctgtagggca 181 cgtcgcccgt cgtgcgtacg aagctttctc cttccaccgc cgtctgaacg ccgtttacct 241 cgatattgat cttgttgaag ctcgcgtcca ccacagatgc aaaggcgctg gcagtcgaga 301 ccgccagtgc caatgcgagg gtcaacgcaa tccggagagt gcgtttcata ttcgatcctt 361 ttgctttaca gcttagcagc agcctgttcg aagtctgcga tgaggtcttc gatgttttcc 421 aggccgacag agaaacgaac catgccgtcg gtgatgccgg cagccttctt gccttctgcg 481 gggacctttg cgtgggtcat cgcggtgggc agctggatga gggagtctgc gccgcccagg 541 gatacgccca ggccggggat ctgcaggttg tccagcagct ttctggcaac ttcgtattcg 601 ctcataccct tgtatttagc ggtctcgaag gtgatcatgc cggtgcagta accttcgcgg 661 aactgcttct tggcggtctc gtagttcttg ccgttggagg gcagagtggg atgataaacg 721 gccttgatgt agggctgctt ctccagatat tccgccatag ccttggcgct ggcggagtgg 781 accttcatgc ggacatccag ggtcttgagg ccgcggatga ccatatagga ggcgatggga 841 gccagctcgg aaccggtgag cttaccgacg cacttggaga cgatcgcgga gatggtctcc 901 ttcttgcctg cgatcacacc cgcgatcacg tcgccgtggc cgttcaggta cttggtcatg 961 gagtgcagaa cgatgtcggc gcccagggtg agcggacggc atactggagg cggcgtaaag 1021 gtgttgtcta cgacaacgat ggcgccgtgc ttatgcgcga tctcggcgac cgctgcgata 1081 tcggtgaccc gcagagtggg gttggcgact gcttcgaagt aaaccatctt ggtgttgggc 1141 ttgaaagcag cttccagcgc ttccaggtcg gaagtgtcga gcatggtggt ctcgatgccg 1201 aaggtgggca gatattcacg gacgacctta tcggtgcagc cgtaaacggt atctgcgcag 1261 atcatatgat caccgcagct cagttcgccc agcaggacgg agctgacagc gcccatgccg 1321 gaagaggtaa cagcagcagc ttctgcgcat tccagagctg cgatctttct ctccagcgtc 1381 gcggtggtgg ggttgccgtg tctgccgtaa ccgtacttgg gaagctcgcc gcggaaaaca 1441 gcttctgctt cattcaggtc tttgaaagtg taagtggacg tctgatagat cggggtcgct 1501 tccgcgccat acgctgcgtc gtcataggcg ccggcatgga tcgccatggt ggagaaaccg 1561 accttagaga aatcgatatc gtgcataatt tcctccttac tcaatatcgt cggcggctgg 1621 tgccgcagtt ttaactatag tatagtttat ccccttttga cggtgtttgc aattcccaag 1681 aaccgcctgt tttatcctaa aatcttacac ttccaccgcc aattcttcga tggaggcgtt 1741 gatccccagg atgccttccg caatatttgt ggcgtggtcg gagatacgct ccaggtcgct 1801 caccatgtcg // LOCUS sequence271 1808 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence271 VERSION sequence271 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1808 /mol_type="genomic DNA" /organism="" /note="sequence271" misc_feature <1..1008 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_002680089.1:methylaspartate ammonia-lyase" /note="WP_002680089.1 methylaspartate ammonia-lyase (Treponema denticola) [pid:64.7%, q_cov:98.2%, s_cov:79.4%, Eval:1.7e-118]" /note="MGA_1052" /locus_tag="LOCUS_6910" CDS 1095..1376 /product="citrate lyase acyl carrier protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003566181.1" /transl_table=11 /codon_start=1 /translation="MSTLKKASCGTMESSDAYMELEPIAAGVQIDLQSVVEHQFGDSIR ALAADMLQQEGIDNVSLRIVDRGALECTLRARLETLIARAREAGGANA" /locus_tag="LOCUS_6920" /gene="citD" /EC_number="4.1.3.6" /note="WP_003566181.1 citrate lyase acyl carrier protein (Lacticaseibacillus) [pid:45.7%, q_cov:87.1%, s_cov:80.2%, Eval:5.0e-13]" /note="MGA_1053" ORIGIN 1 gcgaaggact tcatccccgt catcgacaag tacatcaagc ccatgctcgt aggcaaggaa 61 gccgataact tccgccagct ggcagccgag atggaagcca tccaggtcga aggcaagaga 121 ctgcacaccg ccatccgcta cggcgtatcc caggccatcc tggacgctgt cgccaaggcc 181 aagcacatga tgatgtgcga agtcgtcgcg gaagaatacg gctgcgaagt ttccgacaag 241 cccatcgaca tcttcaccca gtccggcgac gaccgctatg acaactccga caagatgatc 301 atcaagcagg cgcaggttct gccccacgct ctgatcaaca acgtcgagac caagctcggt 361 ccccagggcg aactgctcga aaagtacgtc gcatggctga gagacagaat cctgaacaac 421 agagcggacg agaactataa ccccatcttc cacatcgacg tatacggcac catcggcgcc 481 gcgttcggca acacgaactt caaggctatg gccgactatc tcgaaaagct ggcggagacc 541 gcgaagccgt tccacctgcg catcgaaggc cccatggact gcgacgttga cagagagacc 601 cagatgctcg ctctgaaggg cctgaccgaa gagatcgacc gcagaggcat cgacgtcgaa 661 ctggtcgccg acgagtggtg caacaccctc gaagacgtca agtacttcac cgacaaccac 721 gccggtcaca tggtccagat caagactccg gacctgggcg gcgtcaacaa caccatcgaa 781 gcggtcctgt actgcaagca gcacggcatg ggcgcctatc agggcggtac ctgcaacgag 841 accgaccgca gcgctcaggt ctgcacccag tgcgcgatgg cgacgcagcc cgctcagatc 901 ctggccaagc cgggcatggg cgtagacgaa ggctacatga tcgtttacaa cgaaatgcag 961 agagtcctgg cgctgagagc tgccaagaag gcctgcggct gcaaataagc gaaagcctgc 1021 ctgaaagggc gtactgaaaa gcccgaagcg tcgaaacttc gggctttttt caacaaggaa 1081 aggaacatcc tgatatgagt acactgaaaa aggcttcctg cggcaccatg gaatccagcg 1141 acgcttacat ggagctggaa cccatcgcgg cgggcgtgca gatcgacctg cagtccgtgg 1201 tggaacacca gttcggcgat tccatccgcg cgctggcagc ggacatgctg cagcaggaag 1261 gcatcgataa cgtatccctg cgcatcgtcg acaggggcgc gctggagtgc acgctccggg 1321 cccgtctgga gacgctgatc gcaagggcga gagaggcagg tggagccaat gcgtagatcc 1381 atgctgtttt taccgggcaa cacgccgaac atgatcctca gcggcgactg cctcggcgcg 1441 gacgccatca tcctggacct ggaagacgcg gtcgctcccg accagaagga cgcggccaga 1501 gtgctggtcc gcaacgcgat caagtatctg cagttccccg gcgtggagaa gatcatccgc 1561 atcaactccc tggatacgcc atactggcag aaggacctgg acgagatggt ccccctgaag 1621 ccggagctca tcatgacccc gaagacctcc tgcgcagcgg acgtgctgga attcgacgcc 1681 tacatgtccg aactggagga taagctggga ttcgaaagaa ataccgttaa gctgctgcct 1741 ctcatcgaga cggcgctggg cgtggagaac gcatttgcca tcgcctctgc cagcaagaga 1801 gtcgcagc // LOCUS sequence272 1803 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence272 VERSION sequence272 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1803 /mol_type="genomic DNA" /organism="" /note="sequence272" CDS 388..888 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MSDRTLLIIIFLLELLAVYNLYDTVWVMLLHLSRRGVSASGTIAE LKKAMRRDRARLFVPTNGKLDSRDINCDYLVDIDYEREGGETVHLKNYVIPSIMKLTAG SASPIYKEGQTLPLKVSRSIRKMAVVDLPEVRARQVSWLWLILWVVTVLVLGFVIVSLI SAL" /locus_tag="LOCUS_6930" /note="MGA_1056" CDS 912..1205 /product="GIY-YIG nuclease family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002379749.1" /transl_table=11 /codon_start=1 /translation="MSDPSRTALKKRVYSQRYVYLLRCKDGSLYCGISTDPEARLKQHN YGVGAKYTRSHGPCTLVYTEGPYEYGHALSREAAIKKMTKEQKERLLDTTNR" /locus_tag="LOCUS_6940" /note="WP_002379749.1 GIY-YIG nuclease family protein (Enterococcus) [pid:48.1%, q_cov:79.4%, s_cov:89.8%, Eval:5.9e-14]" /note="MGA_1057" ORIGIN 1 agatccaggg cccgttgttc ttcggcagcg tggagaaact gtcccagatc acggccaagg 61 agaagacgaa ggcgctggtg ctgcgcatgc ggagcgtaac ggcgctggat gccacggctc 121 tggcctctct ggagaagctg tatgaccgct gcatcgccca ggggacgaag gtcgtgttct 181 cccacgtcaa tccccagccc atgaaggtaa tggagcacag ccggtttacg gaaaaggtgg 241 gcagagaata cttttgcagc cacatcgacg aagccatcga gatggccgaa gcgatcgcca 301 tggaataaaa gcacagaaag cgaaacgata gcacagggaa accctccctg tgctataata 361 ttatattatg acaaaggagg atcgttcatg agcgacagaa cgctgctcat catcatattt 421 ctgctggaac tgctggcggt ctataacctg tacgacacgg tgtgggtgat gctgctgcat 481 ctgagccgcc gcggcgtgag cgccagcggt acgatcgcgg aactgaagaa agccatgcgc 541 cgggacagag ccagattgtt cgtccccacg aacggcaagc tggattcccg cgacatcaac 601 tgcgattatc tcgtggatat cgattacgag agggaaggcg gggagaccgt ccacctgaag 661 aactacgtta tcccgtccat catgaaactg acggccggtt ccgccagccc gatctataag 721 gaagggcaga cgctgcccct gaaggtgagc cgcagcatcc ggaagatggc cgtcgtggat 781 ctgcccgagg tgcgcgcccg ccaggtgagc tggctttggc tcatcctctg ggtggtcacc 841 gtcctcgttc tcggctttgt tatcgtttct ctcatctctg cgctgtaggc gcagaagaaa 901 ggaaaagggt tatgagtgac ccatccagga ccgcactgaa aaagcgggtc tacagccagc 961 gctacgtcta cctgctgcga tgcaaagacg gcagtctgta ctgcggcatc tcgacggatc 1021 ccgaagcgcg gctgaagcag cacaactacg gcgtcggcgc gaaatatacc cgcagccacg 1081 gcccctgcac gctggtctac accgagggcc cctatgagta cgggcatgcc ctcagccgag 1141 aagcggccat caagaagatg acgaaggagc agaaggagcg tttacttgac accacaaata 1201 ggtagtgtta ctatttgtgg taattcaaca aagcgtgttg aacttttttt atactctatc 1261 cccctggagg atccatgcat acccagaaac tcaaaggctc acagatcatt attgagaccc 1321 tcatcgagca gggtgttacc catattttcg gatatcccgg cggccaggtg ctgcagatct 1381 acgatcagct gtataaaaat caggagcgca tcactcacgt gctgacggcc cacgaacagg 1441 gcgcggcgca cgcggcggac ggctatgccc gcgcaacggg caaggtaggc gtcgtcctgg 1501 cgacttccgg tcccggtgcc acgaacctga cgacgggtct tgcggccgcc atgatggatt 1561 ccgttccggt ggtcgcgatc accggcaatg tgccgaccta tttcatcggc aaggactctt 1621 tccaggagat caacactatc ggcatcacca tgccgatcac caagcacaat ttctacgtca 1681 ccgacgttac aaagcttgcg gagaccatcc gcgaggcctt ccgcatcgcg aaatccgggc 1741 gtcccggccc cgtcctcgtg gatgtcccca gcgacgtgca ggcggcggaa acggatttta 1801 caa // LOCUS sequence273 1802 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence273 VERSION sequence273 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1802 /mol_type="genomic DNA" /organism="" /note="sequence273" CDS complement(604..1380) /product="arginine ABC transporter substrate-binding protein ArtP" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_004398706.1" /transl_table=11 /codon_start=1 /translation="MAKKLTALLLALCMIFTLAACSGGSSSDETWESELGTAGKLRVGM AADYPPYESYDAQGNVVGLDADIAAMIAEELGVELEIVPMEFDTIISAVTAGTVDMGIS CFSYTEERAKSVLFTETYMTSAQCCFASTEYGINTLEDLNGGLVGAGNGTTGMEVAEAM APEYGFSTQAGEIAVMSESLKSGAMQAIITEQCVADSYIAANPGKFQMIAEDLTVEEIK AITNMNNDKLQAKVDEIIKAFVDSEAYSELVVKWFD" /locus_tag="LOCUS_6950" /gene="artP" /note="WP_004398706.1 arginine ABC transporter substrate-binding protein ArtP (Bacillus) [pid:32.1%, q_cov:96.9%, s_cov:96.1%, Eval:5.4e-31]" /note="MGA_1060" ORIGIN 1 acgaagaatc cttcagcagg acgatgaatt cgttgatgta gggcggcaga atgcgcttaa 61 aggcctgggg caggatgatc tcctgcaggg tctgccggtg cgagaggcct atggtctgcg 121 ccgcctccca ctgccctttg tccacggact ggatggcgga gcggaacagt tccgtcgtgt 181 aggcgccgga gttgatgccc acggcgatgg tgcccaccag gatggggttg ggcgtataca 241 cgtaatggaa cagggccttg gtgaccacgg gaccgcccag gtagagcagc aagatctgca 301 gcatcatggg ggtgccgcgg atgacctcca catagatgtt ggcgatcagc ttgggcagct 361 tgtgtttgcc catcttcgcc atggcggaga gcaggcccag cacggaaccg ccggccaggg 421 cgcatacggc caccagcacg gaatagcccg cgcctttgat cataaactgg agattttcgg 481 gggtgaggat tctttcgatc gcgttcataa acgggtacct cttagacgac aatcatggca 541 ggaagggtct ccctgccatg atgcatgcgg tttcggttgt tccgggatct gcgttccgtt 601 gtcctagtcg aaccacttga cgaccagttc gctgtaagct tcgctgtcga cgaaggcctt 661 gatgatctcg tcgaccttag cctgcagttt gtcgttgttc atgttcgtga tggccttgat 721 ctcttctacg gtgagatctt cggcgatcat ctggaactta ccggggtttg ctgcgatata 781 ggaatcggct acgcactgct cggtgatgat ggcctgcatg gcgccgctct tgagggattc 841 gctcatgacg gcgatctcgc cggcctgggt ggagaagccg tattccgggg ccatcgcttc 901 ggcgacttcc atgccggtgg tgccgttgcc ggcgccaacc agaccgccgt tcaggtcttc 961 cagggtgttg atgccgtact cggtggaagc gaagcagcac tgggcggagg tcatgtacgt 1021 ttcggtgaac agaacggatt tggcacgttc ttccgtgtag gagaagcagg agatgcccat 1081 atcgacggtg cctgcggtga ccgcgctgat gatcgtatcg aattccatgg gaacgatctc 1141 cagttctacg cccagctctt ctgcgatcat ggccgcgata tcggcgtcga gaccgaccac 1201 gttgccctgt gcgtcgtagg attcataggg cggatagtct gccgccatgc cgactctcag 1261 cttgccggcc gtgcccagtt cgctttccca ggtctcgtcg gacgaggagc cgccggagca 1321 ggcagccagt gtaaagatca tacagagcgc cagaagcagt gcagtcagtt tctttgccat 1381 tttgttttcc ttctttcttg tcttatccta attgcaattt tatacgtgag gagtgattac 1441 gctaggattt tattctttgt tatgcgggtt gtcaaggggt attattcact atttaatcat 1501 ttttagaaag tttttatgca tttgtgtgca taaatcgtct gaacaacaaa aaaggaggcc 1561 gaggcctccc tgttctatgt gacccgtaca gggccgctcc gcttcgccgc agctcaggga 1621 tctggtgttt cgacggtttc tttcgcgtgc cgtttcggga ccgcgagacg acctcggccg 1681 gtttcgtctt tgcgaaacgc ggcctcaagc aacgtctcgc cgggtcaagc ccgcccgaaa 1741 cggattccgc tcagaaaccg gaaacacaga cgatcccttc acatccggct cataggagcg 1801 gc // LOCUS sequence274 1793 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence274 VERSION sequence274 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1793 /mol_type="genomic DNA" /organism="" /note="sequence274" CDS complement(79..651) /product="indolepyruvate oxidoreductase subunit beta" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393759.1" /transl_table=11 /codon_start=1 /translation="METKNIMIVGVGGQGSLLASKLLGKMLLEEGYDVKVSEVHGMSQR GGSVVTYVRYGDKVYSPIIDKGEADFIVSFELLEAARWMEYLKPGGQIVTSTQQIDPMP VVTGAAAYPEDLVAKMKAAGAKVDALDCLALAKEAGSSKAVNLVLMGRLSHYFGMADEV WQKAIETSVPAKFLELNKKAFELGKNA" /locus_tag="LOCUS_6960" /note="WP_011393759.1 indolepyruvate oxidoreductase subunit beta (Moorella thermoacetica) [pid:50.3%, q_cov:96.3%, s_cov:95.3%, Eval:1.2e-48]" /note="MGA_1061" misc_feature complement(655..>1793) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010965301.1:indolepyruvate ferredoxin oxidoreductase subunit alpha" /note="WP_010965301.1 indolepyruvate ferredoxin oxidoreductase subunit alpha (Clostridium) [pid:51.5%, q_cov:99.2%, s_cov:64.2%, Eval:4.2e-111, partial hit]" /note="MGA_1062" /locus_tag="LOCUS_6970" ORIGIN 1 atttccggtt gatagtaccg ctccatacaa atgtcctttc ttaaaatgtc tgctgtatcg 61 gtcgattttt atcgcaaact aggcattctt gcccagttca aacgctttct tgttgagttc 121 caggaacttg gccggcacgg aggtctcgat ggccttctgc cagacttcat ccgccatacc 181 gaagtagtgg gagagtcttc ccatcaacac caggttgacg gctttgctgc tgcccgcttc 241 cttggccagc gccagacagt ccagggcgtc gactttggcg cccgccgcct tcatcttagc 301 gaccaggtct tcagggtagg ctgctgcgcc tgtgaccacc ggcatcggat cgatctgctg 361 ggtggatgtt acgatctgtc cgccgggctt cagatattcc atccagcggg ccgcttccag 421 cagttcgaag gatacgataa agtccgcttc gcccttgtcg atgatggggg agtagacttt 481 gtcgccatag cgcacgtacg taacgacgct gccgcctctc tggctcatgc catggacctc 541 ggatacctta acgtcgtatc cttcttccag cagcatcttg cctagcagtt tgctggcgag 601 gaggcttccc tgtccgccta cgcctacgat catgatgttc ttggtttcca tgggctacgc 661 ctcctttccc gtgctctcga acgcatccat cgggcacagc tgcgtgcaga tgccgcagcc 721 cacgcacagc gtgtcgtcca catgggcctt gccttccttg atggatatgg ccgggcagcc 781 gatcttcatg caggacttgc agccgacgca cttgtccgtg ttcaccttca gcggtgcatt 841 gtgcttcacg tacttcagca gcgcgcaggg ccgtctggag atgatgacgg aaggttcttc 901 cgccgccagt tcttccttga ctgccgcatc gcaggctgcc aggtcgtagg gatccacgac 961 tcttacgcgg cggatgccca tggccttgca cagggattcc agatcgatct tgccggccgg 1021 gtctcccttg atgttgtagc ccgtggtggg gttctgctgg tgaccggtca tgccggtgat 1081 ggagttgtcc acgatgataa cggtggaatt gctctggtta taagcgatgt tggcgaggcc 1141 ggtcatgccg gaatgcataa acgtggagtc gccgatgacc gccacagtct tgcctttgct 1201 ctccttgccc agggctttgt taaagccgtg ggtggcggag acggacgcgc ccatgcacag 1261 ggtcatctcg atggaagaga ggggtggtgc cgcacccagc gtgtagcagc cgatatcgcc 1321 caaaaccgtg cacttgttct tcgccagggt gtagaacagg cctctgtggg ggcagccggg 1381 gcacatcacg ggaggacggc cgggcagcgc ttcgtccaga gcctttccgg tgtggacagg 1441 ctgctccagt ttctccgcga tgaggttctg ggagaattca cccagcaggg ggaatgcctc 1501 cttgccgcag caatccagac ccagctctct gacgtaggtc tcaatgaagc cgtccagctc 1561 ttcgacgatg acgagttttt ccacgctctt ggcaaattca cggatcttct gctcgggaag 1621 gggccagatc atgcccagtt ttaagaccgg gaactgcccc ttgcacactt cctgcacgta 1681 ctgataggac gtggaagagg tgatgatgcc gatgctctta ttcgcgccgt cttcgatgcg 1741 gttgagatcc gtcgtttcgg cgaactcggc cagtttcttc gtgcgctcct cca // LOCUS sequence275 1792 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence275 VERSION sequence275 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1792 /mol_type="genomic DNA" /organism="" /note="sequence275" CDS 89..838 /product="type I methionyl aminopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003421130.1" /transl_table=11 /codon_start=1 /translation="MIVLKSHEEIELMAKAASVTAAMLEEIPNILMPGMTTLELDHWCE DYILRHGMKPAFKGYGGFPGTACISVNEEVVHGIPTKRRVLNEGDIVSVDLGTIYKGFY SDAARTYPVGKVSAEAQKLMDVAEGSFFEGLKFCKKGHRLGDVSHAIQMYVEANGFSVI RDYVGHGVGRELHEDPQIPNYGKANHGPQLVPGMVIAVEPMIAAGEYDVEVLSNGWTAV TLDRSWAAHYENTIVITEDEPRLLTKL" /locus_tag="LOCUS_6980" /gene="map" /EC_number="3.4.11.18" /note="WP_003421130.1 type I methionyl aminopeptidase (Clostridioides) [pid:56.2%, q_cov:100.0%, s_cov:100.0%, Eval:7.7e-80]" /note="MGA_1064" CDS 861..1079 /product="translation initiation factor IF-1" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003421127.1" /transl_table=11 /codon_start=1 /translation="MAKKDSIEVFGTVLEALPNAMFKVKLENDFIVMAHISGKMRMNFI RILPGDRVRMELSPYDLSKGRITWRDK" /locus_tag="LOCUS_6990" /gene="infA" /note="WP_003421127.1 translation initiation factor IF-1 (Clostridioides) [pid:75.0%, q_cov:100.0%, s_cov:100.0%, Eval:5.8e-25]" /note="MGA_1065" CDS 1316..1684 /product="30S ribosomal protein S13" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_005810116.1" /transl_table=11 /codon_start=1 /translation="MARIAGVDLPREKRVEIGLTYIYGIGLPTSRLILEKAGINPDTRV KDLTEEEVGSIRKIIDSEYVVEGDLRREVSMNIKRLMEIGCYRGIRHRRNLPVRGQNTK NNSRTRKGPKKTVGRKKK" /locus_tag="LOCUS_7000" /gene="rpsM" /note="WP_005810116.1 30S ribosomal protein S13 (Desulfitobacterium) [pid:75.7%, q_cov:87.7%, s_cov:87.0%, Eval:1.2e-43]" /note="MGA_1066" ORIGIN 1 gaagagcgga acgcttgccg agatcgatgg cagcaagacg cccgacgaag tgttcgaaga 61 catctgcgcc atcctcggag agtaagtcat gatcgtactg aaatcccacg aagagataga 121 gctgatggcc aaggccgctt cggtaacggc cgccatgctg gaagagatcc caaacatctt 181 aatgcccggc atgacgacgc tggagctgga ccattggtgt gaggactaca tcctgcgcca 241 cggcatgaag cctgccttta aagggtacgg cggattcccc ggcaccgcct gcatctccgt 301 caacgaggaa gtcgtccacg gtattccgac caagagacgc gtcctcaacg aaggagacat 361 cgtaagcgta gacctgggaa ccatctacaa aggcttttac tccgacgctg cccggaccta 421 ccccgtaggg aaggtcagcg cggaagccca aaagctgatg gacgttgccg aaggcagctt 481 cttcgaaggt ctgaagttct gcaaaaaggg acatcgcctc ggcgacgtat ctcacgcgat 541 ccagatgtac gtggaggcca acggcttctc cgtcatccgc gattacgtag gacacggtgt 601 cggacgggaa ctgcacgaag atccgcagat ccccaattat ggcaaggcaa atcacggccc 661 gcagctggtc cccggcatgg tgatcgctgt ggaaccgatg atcgcagccg gtgagtacga 721 tgtggaagtt ctgagcaacg gctggaccgc ggtcacactg gaccgctcct gggcggctca 781 ctacgaaaac acgatcgtca tcaccgagga tgaaccgaga ttgctcacaa agctttagac 841 acgcaaagga ggagcccgct atggcgaaaa aagacagcat cgaagtattc ggcacagtgc 901 tggaagctct gcccaacgcg atgttcaagg taaagcttga gaacgatttc atcgtaatgg 961 cgcatatttc cggcaagatg aggatgaact ttatccgtat cctccccggc gaccgggtcc 1021 gcatggagct cagcccctac gacctgtcca agggacggat cacctggaga gataaataat 1081 cctaccaaca ggaggaatca aacaatgaaa gttagagcat cagtcaagcc catctgcgaa 1141 aagtgcaagg tgatcaagcg caatggcaaa gtcatggtca tctgcgaaaa ccccaagcat 1201 aagcaggtcc agggttaata accgaaacgg ttactgtgtt ccggcgggcg gcgaaccgcc 1261 ttatacggaa cgtaaattat aaacaatagt tgcagtacaa taggaggtaa catttatggc 1321 tcgtatagcc ggtgtcgatc tgcccagaga aaagagagtg gagatcggcc ttacctacat 1381 ctatggtatt ggtcttccca cttccagact catcctggaa aaggcgggca tcaaccccga 1441 caccagagtg aaggacctta ccgaagaaga agtaggttct atccgtaaga tcatcgattc 1501 cgaatacgtc gtggaaggcg atctcagaag agaagtttcc atgaacatca agcgcctgat 1561 ggagatcggc tgctatagag gaatcagaca cagaagaaac ctgcccgttc gcggacagaa 1621 caccaagaac aacagccgta cccgcaaggg cccgaagaag actgttggcc gcaagaagaa 1681 gtagggagaa ggaggtaagc tacaatggca acagtaaaga agactgtacg caaaaagaga 1741 agagagcgta agaacattga aagcggtcag gctcatatcc aggcttcctt ca // LOCUS sequence276 1787 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence276 VERSION sequence276 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1787 /mol_type="genomic DNA" /organism="" /note="sequence276" CDS 566..1621 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MELKAPDFRKREDKLSGWLDGEVRTFLFDSFSDDYCTRTGMEFLR GVDIPIKPGDLAAFHGEGGLPVTDLADNMACVMGANTQFKYRDAYIAYLALYFNEKLVD VLVQKGATELREQHYRKSCIYFRAALLLDDQNRDAMFGYACCCREWYLSMEGEDQQELI GILKKEATEYFEHVTRVYPDYAAAYYFLGYAYVNAGQYKKAELAWKKFLKLNEEKTAVA TEPVEGANESDEVKEIRERVASLEDPVKIEEGINALAAGHLEDGLRILERYVGTQYDNW WPLHYYLASAYRELGFFDEAIEGFKRVLALQPSHEESCECLADLYAADGDAENSEKYRR KAEIIRKNRME" /locus_tag="LOCUS_7010" /note="MGA_1069" ORIGIN 1 aggaactgat cgcaggcgtg cgccgggcgg aagacgccgg catcgcggca tccgtgtcct 61 ttatctcggg gctcggcggc cgggaactgt ggaaagagca tgcggtggat tcggcgacga 121 tgatctccga gatgcatccg tcgtatgcgt cctggcttac gctgatgctg gatccgtcgg 181 ctcctgttac gcaggacatc gcggaagggc ggttcgaact gctgaagcct gcggaggtcc 241 tggaggagat ggacgtgatg ctctcgcata tcgacatgcc ggagggctcg acctgcgtat 301 tccgcagcaa ccacgcatcg aactacctgt ctctgaaggg cgatctgccg aaggatacag 361 agaagatgct ggcggtggtg cggcaggcga aggagaatcg cgatatgctg cggccggagt 421 tctggcgggc gctgtaaggc ctgtcccggc atgcgggcgg aaacgcccgg tatactgttg 481 atctggagat gccgcagaag gcccctaatc ggcgctctgc ggcgttttta taggattttc 541 gggtacttac ccgtttggag gaaacatgga gctgaaagcc ccggatttta gaaaacgaga 601 ggataagctg agcggctggc tggacggcga ggtccgcacc ttcctgttcg acagcttttc 661 cgacgattac tgcacccgca ccggcatgga atttctgcgg ggcgtggaca ttcccatcaa 721 gcccggcgac ctggcggcct tccacggcga agggggtctg ccggtgacgg acctggctga 781 caacatggcc tgcgtcatgg gcgcgaacac ccagtttaag taccgggatg cctatatcgc 841 ctatctggct ctgtatttca acgaaaaact ggtggacgtc ctggtgcaga aaggcgcgac 901 tgagctgcgg gagcagcatt accgcaagag ctgcatctat ttccgggcgg cgctgctgct 961 ggacgatcag aaccgcgatg ccatgttcgg ctacgcctgc tgctgccggg aatggtacct 1021 gagcatggaa ggggaggatc agcaggagct gatcggcatc ctgaagaaag aagcgacgga 1081 gtatttcgag catgtcaccc gggtgtatcc ggactatgct gcggcttact acttcctggg 1141 ctatgcctac gtaaacgccg ggcagtacaa gaaagccgag ctggcgtgga agaagttcct 1201 gaaactgaat gaggagaaga ctgctgtagc cactgagcct gtcgaagggg caaacgaaag 1261 cgacgaagtc aaggagatcc gcgaacgggt cgcttccctg gaagatcccg tgaagatcga 1321 ggaaggcatc aatgcgcttg cggcgggtca cctggaggac ggcctgcgca ttctggaacg 1381 ctatgtgggg acccagtacg acaactggtg gccgctgcac tattatctgg cgtctgcgta 1441 ccgggagctg ggctttttcg acgaggcgat cgagggcttt aaacgcgtgc tggcgctgca 1501 gccgtcccac gaggaaagct gcgagtgcct ggcggacctt tacgccgccg acggcgacgc 1561 cgagaattcc gagaagtacc gccgcaaagc ggagatcatc cgcaagaacc ggatggaata 1621 gaaaaatctt caattcccat taaaaacgaa ggagaaatag catgaaactt ggtattatcc 1681 gctgtatgca aaccgaagat ttctgccccg gcacccggga tttccacacg atacgccaca 1741 agtccggcgt gttcgaaggt ttggacgagg atattacgct ggtaggc // LOCUS sequence277 1767 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence277 VERSION sequence277 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1767 /mol_type="genomic DNA" /organism="" /note="sequence277" CDS complement(451..1251) /product="mechanosensitive ion channel" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009902661.1" /transl_table=11 /codon_start=1 /translation="MDYKALIESATQVCIKVVIALIVLWIAFTIINKISKSLEKLLGKS GKLDKTITSTLAYVARIALKVLVVLGLVGYLGINTAGIATIIASLGVGVGMAINGAVAN FAGGLLILITRPFKVGDFIDVGGTVGTVEEIRLVHTKIATLDNKVVYVPNGTASGATVV NYSEKETRRVDQVFHISYESDANKALELLLQLADRNPAVLKDPAPFAKISGAGDSSIEL TTRLWCKGADYWDVYFYMLENAKPAFDAAGISIPYPQIDVHMKN" /locus_tag="LOCUS_7020" /note="WP_009902661.1 mechanosensitive ion channel (Clostridioides difficile) [pid:38.5%, q_cov:98.5%, s_cov:88.8%, Eval:1.5e-52]" /note="MGA_1072" ORIGIN 1 atctaaccag cggtattccg tggagacctt cgtcgtgacg gtgcccacga ccgccagacc 61 gcactcgttg gtgcagcagg cgtagtaggg gccgtccgtc gagaagcagg aatcctgcag 121 ataggtgtat ttgtaggtct tgtccggcag aggcacggcg aagccgtgct ggtacatgcc 181 ggtgtccacc atctcccgac cggactgaga agaagcgggc tgcacgaaga acatcttgtt 241 gcagacgccg ctgccctggt cctcggaccg tccgatgagg gtcgtgcctt ccgcgctcac 301 ctccttgccc acgtagacgc cggtgcaggc gtagacaggc gctgcggcaa acagcagaat 361 cgccaggaat aaagtcagag ttcgtttcat ggaaaaacac ctcgaatgaa agaagacggc 421 ccgcaagggc cgtctgtgtg tcctttcgga ctagttcttc atatgaacgt cgatctgcgg 481 atacgggatg gagatgccgg ctgcgtcgaa ggcaggcttt gcattttcca gcatgtagaa 541 gtagacgtcc cagtaatccg cgcccttgca ccagagtctc gtggtgagct cgatgctgga 601 atcgcctgcg ccgctgatct tcgcgaacgg agctgggtct ttcaggactg ccgggtttct 661 gtccgccagc tgcagcagga gttcgagggc cttgttcgcg tcggactcat aggagatgtg 721 gaagacctga tcgactcttc tggtctcctt ctcggagtag tttacgacgg tagcgccgga 781 ggcggtgccg ttgggaacgt agaccacttt gttgtccagg gtagcgatct tcgtgtggac 841 gagacggatc tcttcgacgg tgccgacagt gccgcccacg tctatgaaat cgccgacctt 901 aaacggccgg gtgatgagga tgagcaaacc gcccgcgaag ttggcgacag cgccgttgat 961 cgccatgccg acgcctacgc cgagggatgc gatgattgtc gcgatgccgg cggtgttgat 1021 gcccagatag ccgacgagcc ccagaacgac caggaccttt aaagcgatgc gggcgacgta 1081 agcaagcgtg ctcgtgatgg tcttgtccag tttgccgctc tttcccagca gtttttccag 1141 actcttgctg atcttgttga tgatcgtgaa agcgatccac aggacgatga gtgcgatcac 1201 gactttgatg cacacctggg tagcgctttc gatcagtgct ttgtagtcca tagcgtttgt 1261 ctccttctta ttaattcgtg aaaataaata tacatcagtt caactaatta tagcataaat 1321 aatatatcgg tctgaatatt ggtgataaaa tattagcata aatatatccg tctcaatttg 1381 agtctatcat ccgaggggtg acaggacccc gaggacgatg aggtgaaaac tatgcaacat 1441 accattacgg aactggaaac cgcgctccaa aagcgcatcg aagagatgaa actgcccggc 1501 gtctcggtct gtatccgcgg cccggaaggc gtcatttatg aaaagggctt cggcaagcgg 1561 agcatcgagc aggatctgga tgtgaccccg gacacggtct tcggcatcgc gtccatgagc 1621 aaatccttca ccgcgctgtc ctgctgcatc ctggcggcgg aaggcaagat gagtctggaa 1681 gaccccatta cgaagtattt cccgaacctg catctgaagg gcgtgcctga tgaactggtc 1741 accatccggc agatcggtct gcaccgg // LOCUS sequence278 1749 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence278 VERSION sequence278 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1749 /mol_type="genomic DNA" /organism="" /note="sequence278" CDS 561..1433 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLSYEEFKNAVRTDLKKYMPRSYADHKLVETKIYRINRCVDSFHL QPPGPVREAVPMPSLNFQDLYQSIVGGAKLEKVLRLIAQTMQYTLPASVERDCAWFDED KKPDPSRLHVALINRQRNEEYLKSIPHHDFLDLSAIAVLEEGDRSGYLCVVNHGILKEL DMDEDTLLKIACANTFEQYPAVLEQSHLGLNAWCEGSTFGAVCLLDEDMLKEAADVLDS DLYILPDSLHLLFIIAVKSIPRKIVLESFSRAMLLEPDAFDFLSDNVYYYDRKKGTLRI LSARTKKIS" /locus_tag="LOCUS_7030" /note="MGA_1075" ORIGIN 1 gcgccaaagc ttcgcagcag gctttcgcgt aggacttggg gatcatctcc gcaaagatga 61 acacgacaaa agccgttacg aacgtacaag cggtaacggc tctgtttccc caaagtttgg 121 atgctaaaag cgttgccgca gaggaacatg caatatgcat gacgttgttc ccgatgagca 181 gcgtcgtgag agccttgtcg aagtggtcca gcacgtacag ggccttcttc gccttagggt 241 ctccatcgtc cgcatcggaa atcatgcgta tcttgctgac cgacgcaaaa gcagtctcgg 301 ccgcggcaaa gtacgcgcct cccaaaagca gcaacgctat gaaaactaaa tatcgcggaa 361 taacggaaat acttccggcg tccataagga cgaatcacct cctggtctca aactgaggat 421 attatagcac actctgttcg acggcacaat agcattggca ttttattact atttttgtta 481 aatttatact ttacaatttc tggcatatcc agtactatga ttttacagta tatgccattt 541 tgttcaaaag gaggttattc atgctttctt acgaagagtt caaaaacgcc gtacgcaccg 601 acctgaagaa gtatatgccc cggtcctatg cggatcacaa actggtggaa acgaagatct 661 acaggatcaa ccgctgcgtg gattcgttcc acctgcagcc gcctggtccc gtccgggaag 721 ccgtaccgat gcccagcctc aactttcagg atctgtatca gagcatcgtg ggcggcgcca 781 aactggaaaa ggtgctgcgc ctgatcgcac agacgatgca gtacaccctg cccgcctctg 841 tcgaacggga ttgcgcctgg ttcgacgagg acaaaaagcc cgatccgtcc cggctgcacg 901 tcgctctcat caaccgtcag agaaacgaag agtacctgaa gagcataccc caccacgatt 961 ttctggatct gtccgccatc gctgtcctcg aggagggcga ccgcagcggc tacctgtgcg 1021 tggtcaacca cggcatcctg aaagaactgg acatggacga agataccctg ctgaagatcg 1081 cctgtgccaa tacgttcgag caatatccgg cggttttgga gcaatcccat ctgggattga 1141 acgcctggtg cgaaggcagc acgttcggcg ctgtctgcct gctggacgaa gacatgctga 1201 aagaagctgc ggacgtgctg gattccgacc tgtacattct gccagacagc ctgcatctgc 1261 tgttcatcat cgccgttaag agcataccga ggaagatcgt tttggagagc ttctcccgcg 1321 ccatgctcct cgagccggac gccttcgatt ttctgtccga caacgtctat tactacgaca 1381 ggaagaaagg cacgctgcgc atcctgtccg cgcggacgaa aaagatctct taggagagat 1441 ccggacaaca ggaaaggccc tgccgaagca gggcccgttt cgctatttta ttcagaccgg 1501 aaaccgttct attcttccgt ctccagcaga ccgtaagatc cgtcggctct cttgtagacc 1561 acgtttacac cgccgctctc gccgtccttg tagacgaaga aattgtgctc gagcagttcc 1621 atctgcagga tcgcttcttc ggaagtcatg gggttgaggc ggaaccgctt ggtgcggacg 1681 atgccttttt ccacttcttc tgcaggcgct gcatcgggga tctcttcgaa gacgatatcc 1741 ttctgctcc // LOCUS sequence279 1733 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence279 VERSION sequence279 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1733 /mol_type="genomic DNA" /organism="" /note="sequence279" CDS complement(240..1532) /product="GTPase HflX" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_009895824.1" /transl_table=11 /codon_start=1 /translation="MIRIKDDGTVVEREEYKAILVGVSLGEDISYSLEELEGLAEAAGI ETLGVMTQNAEKINAATYIGKGKLDELAELVHNMEADLVVFNDELSGMQLRNIEDACGC RVIDRTILILDIFADRATSMEGKLQVELAQLQYRMPRLLGFGKSLSRLGGGIGTRGPGE KKLETDRRHIQRRMDEIKKEIAEVKANRSVQRSKRQKSGLPVAALVGYTNAGKSSIMNR LLAASDKADKQVFEKDMLFATLDTAQRLITLDDRCTFLLIDTVGFVSKLPHALVDAFKA TLEEVTEADLLLHVVDASFEGSDFQQNVTREVLKSLGADGKPSLTVYNKIDLVDTEELT EKQLSSGKGSCFVSTKTGKGYDELIARIRSGLFADLQKVQLLVPYDKGSVVSAILAKTM PYETKYEENGTLLTVDLNEEDRGRYREFILA" /locus_tag="LOCUS_7040" /gene="hflX" /note="WP_009895824.1 GTPase HflX (Clostridioides difficile) [pid:48.9%, q_cov:96.0%, s_cov:98.1%, Eval:3.4e-104]" /note="MGA_1078" ORIGIN 1 catgggagga ccggacgtac cctggggctc cccgtcgtcg gatgtccact tcagttcgct 61 cttttcgccc acgataaaag ccggaacgtt gtgggtggcg tccttgtatt tcgcccggat 121 cgcagcgatg aaggcgtcgg cctcctcctt ggaatagacg ggcgcgatat gggcgataaa 181 gcgggaccgg tcgatggtct gctccgcttc cgcttccttt gcgacggtgg tgtagcgtat 241 catgccagaa taaactcccg gtagcgtccc cggtcctctt cgtttaagtc gaccgtcagg 301 agcgtaccgt tttcttcgta tttcgtctcg tagggcatcg tcttcgcaag gatcgccgat 361 acgacgctgc ctttgtcgta gggaacgagg agctgcacct tctgcagatc tgcgaacagg 421 ccgctgcgga tgcgggcgat cagttcgtcg taccctttcc cggtcttcgt ggatacgaaa 481 caactgccct ttcccgagga aagctgtttt tccgtcagtt cttccgtgtc caccagatcg 541 atcttgttgt agaccgtcag ggacggcttg ccgtccgcgc caaggctttt gaggacttcc 601 cgggtcacgt tctgctgaaa atcgctgccc tcgaaggacg cgtccaccac gtgcagcagc 661 agatccgcct ccgtcacctc ctccagcgtc gccttgaagg cgtccaccag ggcatggggc 721 agcttgctga cgaacccgac ggtatcgatc agcagaaaag tgcagcggtc gtccagcgta 781 atgagccgct gggccgtatc cagggtcgcg aacagcatgt ccttttcgaa cacctgctta 841 tccgccttgt ccgaagccgc cagcaggcgg ttcatgatgg aagacttgcc ggcgttggta 901 taacccacga gcgccgctac gggaaggccg gacttttgcc gtttactgcg ctgcacgctg 961 cggttggcct tgacttccgc gatctccttc ttgatctcgt ccatgcgccg ctgaatgtgg 1021 cgccggtcgg tctccagttt tttttcgccg gggcctctcg tgccgatgcc gccgcccagg 1081 cgcgataaag acttgccgaa gcccagaagg cgcggcatgc gatactgaag ctgagccagc 1141 tccacctgga gtttgccctc catggaggtg gcccggtcgg cgaaaatgtc caggatgagg 1201 atcgtccggt cgatgacccg gcagccgcag gcatcctcga tgttgcgcag ctgcatgccg 1261 gacagttcgt cgttgaacac gacaagatcg gcctccatgt tgtgcaccag ctccgccagc 1321 tcgtccagct tgcctttgcc gatgtaggtg gccgcgttga tcttctccgc gttctgggtc 1381 atgacgccca gggtctcgat gccggccgcc tccgccaggc cctccagttc ctccagggaa 1441 taggagatgt cttcgcccag ggagacgccc accaggatcg ctttatattc ttctctttcg 1501 acgacagtgc cgtcgtcctt gatccgtatc atttacagga taaaccggtc gatatcgtcc 1561 tcgtggatct gttcttcgaa cttctcgcgg acgtattcgg gggtgatgga aatgttcttc 1621 gtgttttcgt caggcaggtt gaaggagatg tcctccagca gcttttccat gatggtgtgc 1681 agtcttctgg caccgatgtt ctcggtctgc tcgttcacca taaacgccat gga // LOCUS sequence280 1728 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence280 VERSION sequence280 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1728 /mol_type="genomic DNA" /organism="" /note="sequence280" misc_feature complement(1172..>1728) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_178371730.1:NAD(P)/FAD-dependent oxidoreductase" /note="WP_178371730.1 NAD(P)/FAD-dependent oxidoreductase (Desulfitobacterium chlororespirans) [pid:32.1%, q_cov:94.0%, s_cov:45.7%, Eval:1.7e-18, partial hit]" /note="MGA_1081" /locus_tag="LOCUS_7050" ORIGIN 1 agcagtccgg aattcgcatt ctcgccgtcc cgtgcccgca ggctcatgcc gttcgtgcag 61 agaccgccct cttccgatgc ggacgccacg acctgcccgc cgggacacat gcagaacgta 121 tacacgcccc gccccgcctc cgtgcgcacc gacagtttat attccgccgc gcctatgccc 181 agttcttcgt gcagcgccgc gtactgcgcc ttatcgatat ccgcctggcg gtgttcgatc 241 cgtacgccca tggaaaaggg cttctgttcc atccaaaggc ccagtccgtg cagcatggca 301 aaactgtccc gtgcgctgtg acccagacca aggatgaggg cgtctgtcac gatccgctcc 361 gttgttcctt ccggaccggc ggcttcgacc gccgtcagtt tgccctcttc gatcgtaagg 421 cctgtcaact gcgtgcgaaa gcgcacttcg ccgcccaggg cttcgatctg ctttctgaga 481 ttcaccacga cgccccgcag cacgtccgtg ccgacgtggg ggtgttgccg gtacagaatg 541 tccggatcgg caccggcatc cacaaaacac tgcaggataa ggcggtgcac cggatccttt 601 gtccctgtcg tcagtttccc gtcagaaaag ctgcccgcgc cgccttcgcc gaactgcacg 661 ttcgtgcggg ggtcaagcac gccttcgctc cagaaacgct ccacggctgc cacgcgctct 721 tccatgcatg cgccccgctc cagcacgatg ggccgaaggc ccgccttcgc cagcgtgagc 781 gccgcgaaga tgccgcaggg gccaaaccct gccaccacag ggcgtttcgc gtctttgggc 841 agcacgcgtt tttctgggaa agaaacagcg gtctcctcta aaacggcagc cttgcaatgc 901 gagcgcctgg cctccgccag cagttcctca ggggcgaatt cgctgtccgt cacgtccagg 961 ctgaacaccc ggtagacgtc cggtttttcc ctggcgtcca gggattcctt cgcgatgcgg 1021 atctgccgta tgctgccgcc gggcagccgc aagcgccgct ccagtttctt cagcaaaagg 1081 gcctccagcg cctcctgctg cagtcccttg ccttcttccg ctcttatctt tatttcgtgt 1141 atcctgacga tctgcatcga tcctttttct cctatatgct ctctgctgcc gcaaggcctg 1201 ccgtccggcc gctgccgaac gcccaggtaa gactgtagcc tccgcagggc gcgtccacat 1261 ccaggatctc cccggcgaaa tacaagcccg gaacgagatg cgactgcagc gctaccggat 1321 cgacctccgc cagcgctacg cctccggacg tcgtgtgggc ctccttccag cctttgctgg 1381 caacaggcgt aaatgtcagg tttttcagca ggtgcgcagc cgcttcggga gcttgaccct 1441 ccccagccag ttccaggacc gcctccgcca gtttagcggg aagcagcgcg tcgaggaaca 1501 ggtcgccgag cgatgctttt cgctcctcca gtttcatcat cagatccatc tcgtgccact 1561 ccggcatcag atccagctgc agcacaaagg tcatgccttc ccggtgccgg taaaaaccgg 1621 agacgttcat gacgcagatg ccggacacgg aatccttatt aaactggatc tctccggtat 1681 cctgcgacaa acagatgccg ttttccgtgc ggccgccctc cgggaccg // LOCUS sequence281 1728 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence281 VERSION sequence281 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1728 /mol_type="genomic DNA" /organism="" /note="sequence281" CDS complement(62..1096) /product="A/G-specific adenine glycosylase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000171406.1" /transl_table=11 /codon_start=1 /translation="MEFIDLKTTAVSIADWYAKHKRDLPWRQGKDPYRIWISEIMLQQT RIEAVIPYYGRFLSELPDVAALAAVPEDRLLKLWEGLGYYSRARNLKKAAQTVMQEFGG QMPQTAAKLRKLPGIGEYTAGAIASIAFGEPEPAVDGNVMRVLARLSASKEDVMDAKVR KAAASRLREIYPAGEEAALLTEGLMELGERICIPNGTPLCGDCPCAGRCRGHALGIEAQ LPVRAEKKARKIEEKTVLVLRCGDRYALEKRPDTGLLAGLWGFPILDGSLTEDEIKARF DAASVRPLGKAKHIFTHIEWHMEGYLVECKELSNCHWVTKEDIEADYSIPTAFKTYKKA LQYL" /locus_tag="LOCUS_7060" /gene="mutY" /note="WP_000171406.1 A/G-specific adenine glycosylase (Bacillus) [pid:44.6%, q_cov:90.1%, s_cov:88.5%, Eval:2.0e-69]" /note="MGA_1082" ORIGIN 1 cgaaagagtg ggcctgccca ctctttagaa ataacgtata ccttaactat aatatcatgg 61 tttacagata ttgcaaggcc tttttataag ttttaaatgc cgtagggatc gaataatccg 121 cttcaatgtc ctctttcgtg acccaatggc aattgctcag ctctttacac tccaccaggt 181 acccctccat atgccactcg atatgggtaa agatatgctt ggctttgcct aaaggacgga 241 cggaagcggc atcgaatctt gctttgatct catcttctgt taatgatcca tccaggatgg 301 gaaaacccca tagaccagcg agcagtccgg tgtcgggacg cttttccagt gcatatctat 361 cgccgcagcg caataccagt acggtctttt cttcgatctt tcgcgctttc ttttccgcgc 421 gtacgggcag ctgcgcttcg atccccagag cgtgacccct acagcgccct gcgcagggac 481 aatccccgca aagcggcgtt ccgttgggga tgcagatccg ttcgccgagt tccatcaggc 541 cttctgtgag cagcgcggcc tcttcccctg ccggatagat ctcccgcagt ctgcttgccg 601 ccgcctttcg caccttggcg tccatcacgt cttccttgct cgcggacagt ctagccagta 661 cccgcatcac gttgccatcc accgcgggtt ccggctcgcc gaacgcgatg gatgcaatgg 721 cgccggccgt atactccccg atcccgggaa gtttgcgaag ttttgccgcc gtctgcggca 781 tttgcccgcc gaattcctgc ataacagtct gcgcagcctt cttcagattg cgggcgcggc 841 tgtaataccc caggccttcc caaagtttta acagcctgtc ttcgggaacg gcagccagcg 901 cagcgacatc cggcagttcg gataaaaacc tgccgtaata cggaatgacc gcctcgatgc 961 gggtctgctg cagcatgatc tccgagatcc agatgcggta agggtctttc ccctgccgcc 1021 agggcagatc tcgcttatgc tttgcgtacc agtccgcgat cgaaacggcc gtcgttttta 1081 aatcgataaa ttccatgtcc gttattggaa actgttgatg gtctggatga gcgcgaacag 1141 aaggcccagg atcgtcagga tcgtcaccat gcggttcgtc gtggtgctgt acagcagatc 1201 caggtcggat tccaccagct ccaggaagct gcggatgctc tcgatcttct gggaagcgtc 1261 cagattcttc agcacgaggt cgtccagggc gcccagctcc gtaatgttta cctgatccag 1321 tttgttgagt gtgcggatca tctcagcgcg gatgtgcttg ttgcgcttga tgtcgtcggt 1381 cacgaagaaa ccgtgggagg cggcgacttt cggagaaccg ctcatcagcc gctccgtgct 1441 ggtgcggatg atctgcccca tctccacgga gaagaacagg ccgtggttga cccccgcagt 1501 gggcgcatcc atcgtaaaat actcgttgag agagccgaaa taatgatcct gatagggttt 1561 ctggtaatcg atatagtcgg cgtaggtctc gccccggtta aagttgagca ggacgtaatt 1621 gctgctgaat gcgatcacct tgacgaaatc ccggctggtc caggtctccg ccatgcgctc 1681 ttcgatgagc gccttgggga catgcagata cccttcgtcc cctgtcag // LOCUS sequence282 1728 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence282 VERSION sequence282 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1728 /mol_type="genomic DNA" /organism="" /note="sequence282" CDS complement(297..1460) /product="pyridoxal phosphate-dependent aminotransferase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011016536.1" /transl_table=11 /codon_start=1 /translation="MLKYVDRRGTNCSKWDALESMYGDKDLLSMWVADMDFEIAEPIRA AVRNYVDNVPWGYYNPGPGYKEAFIEWEKKYHGYEVKPEWICFSSGIVSAFYYVTCMAA KPGEAVILLAPIYYPMKDGVNFNGRKLVLCDMIHEGNTYRVDYEKFEKDIVDNDVKLFI MSSPHNPVGKVWTAEELKTLMEICRKHNVLVVSDEIHQDFEWNGHKHVPTATLGDYDDM LITMCAVSKTFNLASCQNSFIIIPNEKLREQYETFSRNVHGNGGNGFGYVAVEAACREG RPWFEEVKKQIWENYCYVRDTFAKELPDVTVADLQGTYLLWLDFSKYFKTQKETEEFMQ GKCKLAFDYGNWFGHGGDDYCGFVRMNLATSLENVKEACDRMIKNLK" /locus_tag="LOCUS_7070" /note="WP_011016536.1 pyridoxal phosphate-dependent aminotransferase (Fusobacterium nucleatum) [pid:43.4%, q_cov:99.0%, s_cov:95.7%, Eval:8.7e-96]" /note="MGA_1085" ORIGIN 1 caggaagcca tcaaaaacct ggtggaacac ggcttcgggg tttccttcat ctcggaactg 61 gctgcagcag accgggtaaa ggaaggccgc ctgctggcgt tcgacaccgg ccttgcggaa 121 gcgaagagga ccttttatct ggtccgccgc aagaacatcg cacttacgga aagcgcagaa 181 ctctttgtga agtgctgcct caaagaatag cgaatagggg cagatcccct gtgttttggc 241 aaaaagagat cctccgggag atttcccgga ggatcttaaa ttatttcggt accgaactat 301 ttcaggttct tgatcatacg atcgcaggct tccttgacgt tctccaggga agttgccagg 361 ttcatgcgga cgaaaccgca gtagtcgtcg ccgccatgac cgaaccagtt gccgtagtcg 421 aaggccagct tgcacttgcc ctgcatgaat tcctcggtct ccttctgggt cttgaagtac 481 ttggagaaat ccagccacag caggtaggtg ccctgcaggt ctgcgaccgt tacgtcgggc 541 agttccttgg cgaaggtgtc gcggacatag cagtagttct cccagatctg cttctttact 601 tcctcaaacc agggacggcc ttctctgcag gctgcttcca ccgccacgta tccgaaacca 661 ttgccgccgt tgccgtggac gtttctggag aatgtctcgt actgctctct cagcttctcg 721 ttggggatga tgatgaagga gttctggcag gaggccaggt tgaaggtttt ggagacggcg 781 cacatggtga tgagcatgtc gtcgtagtcg cccagggtag cggtaggaac gtgcttgtga 841 ccattccatt cgaagtcctg atggatctcg tcggagacca cgaggacgtt gtgcttgcgg 901 cagatctcca tgagggtctt cagctcttct gctgtccaga ctttgccgac cgggttgtgg 961 ggggaggaca tgatgaacag cttaacgtcg ttgtctacga tgtccttttc gaacttctcg 1021 taatccacgc ggtaggtgtt cccttcgtgg atcatgtcgc agagcaccag cttgcggccg 1081 ttgaagttaa cgccgtcttt catggggtag tagatgggtg ccagcaggat gacggcttcg 1141 ccgggctttg ccgccatgca ggtaacgtaa tagaacgcgg agacgatgcc gctggagaag 1201 cagatccatt cgggctttac ttcatagccg tggtacttct tctcccactc gataaaggct 1261 tctttatagc cagggccggg attgtagtat ccccagggta cgttgtcgac ataattgcgg 1321 acggctgcgc ggatcggttc tgcgatctcg aagtccatat ctgcgaccca catggaaagc 1381 aggtccttat cgccgtacat ggattccagg gcgtcccact tggaacagtt cgtgcctctt 1441 ctgtctacgt atttcagcat tcttgctacc tcctgatatg gcaaattcaa gcatttgacg 1501 gtggatagtt cttctctaaa aatataacac tttttccttg caattcaaag agccggctta 1561 tataatatat aggcattcgt ctgcccgggt cctggtccgg gagggacgaa gctctctgcc 1621 gcgggggagc accgcggccg caaacagacc atagggaggt gaaagaatga ataagtacga 1681 actgatgttc atcgtagaac ccagtctgga cgacgccaag aaggacga // LOCUS sequence283 1723 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence283 VERSION sequence283 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1723 /mol_type="genomic DNA" /organism="" /note="sequence283" misc_feature complement(160..>1723) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011987043.1:pyruvate:ferredoxin (flavodoxin) oxidoreductase" /note="WP_011987043.1 pyruvate:ferredoxin (flavodoxin) oxidoreductase (Clostridium botulinum) [pid:55.2%, q_cov:98.8%, s_cov:44.6%, Eval:1.3e-164, partial hit]" /note="MGA_1088" /locus_tag="LOCUS_7080" ORIGIN 1 gccaacctcg tgacccgcgc agaagcggct gtcttcatca gcaacatcat cgacgcgatc 61 ggaaaataaa aatctttgag acaagcgaag accgcagccc ctcggggctg cggtcttctt 121 ttgtgttttc tatcgattca gttttgagga gaatttgctt tagccttctg ccagcttctt 181 gtagctgtcc agtctttcct tcgcgtcctt ttctgccttt tcgaacagtt ccttcgcgat 241 ctcggggaac gtgagttcca gacccgcata gcggttctcg ccgcgcagga aggtcttcag 301 gtcgcccgtc ggctccttgc tgtcgagctg gaacgggttg aggccctgtt ctttccgtct 361 cgggtcgaaa cggtagcagt gccagtagcc tgcttcgacc gcggccttct cttcgagctg 421 ggacttgccc atgccgcact tcgggccgtg ctcgatgcac gggcagtagc agatgatcag 481 ggacggtccg tcgtactctt ccgcttcgcg gatggccttc agggtctgct cggggtcata 541 gcccatcgcg acctgtgcca cgtagacgta gccatagctc atggccatca tgccgaggtc 601 cttcttcttg gtcttcttgc cgtcggctgc gaacttggcg accgcgccgg ctgcggtgga 661 cttggaggac tgaccgccgg tgttggagta gacttcggta tcgaggacga ggcagttgat 721 gttcttgccg gaagccagga cgtggtccag accgccgtag ccgatatcat aagcccagcc 781 gtcgccgccg aaggcccagt agcttctctt gcgcaggtaa tccgtgttgg ccaggatgaa 841 ttccttggct tccttctgga tgtcgctctt gggctcaaac gccgcaacag catctgcaaa 901 ggccttggag acttccttgc tcttggcgtc atcctcgcgg tctgccaggt aggcatccag 961 agcgggttcg acctcggtgc cgcggaagtt ctccgcatag cccttgatgg tctcgtttac 1021 cttggtggag ccgagcagca taccgaagga gtattcggca gcatcttcga acagggacat 1081 ggcccatgcg ggaccttcgc ctgccttgtt cttggagtag ggaactcccg ggggcgatcc 1141 gccgtaagcg gtggagcatc cggaggcgtt tcctacggtc atgtgatcac cgaacagctg 1201 cgtgaccagc ttgatgtacg gggtctcgcc gcagcctgcg caggcgccgg agaactcgaa 1261 caggggctga gcgaactggc tgaacttggt gttcttgttg gagacagcgt ccttcttgat 1321 ggtgacttcc tctacgccga actcccagtt ctcggcctgg gcagcctggc tgtcgaaggg 1381 catcatcttg agcggagtcg gatccatctt ggaagccggg catacgttga cgcagctgcc 1441 gcagccggtg cagtcgtaca gggatacctg cattctatac tggtacttct cgagctcctt 1501 gcccttggcg ggtacggtct cgaaggcagc gggcttcttg gccatttctt cgtcgttaag 1561 cagtatggga cggatggcag catgcgggca gaccagtgcg cagcggttgc actgcaggca 1621 cttggtggca tcccattcgg gcagggtgac cgccacaccg cgcttctcgt acttggtgag 1681 ggcgctgggg aaggtaccgt ccggcatgtt gaacttgtcg tac // LOCUS sequence284 1721 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence284 VERSION sequence284 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1721 /mol_type="genomic DNA" /organism="" /note="sequence284" CDS complement(488..1300) /product="electron transfer flavoprotein subunit beta" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986693.1" /transl_table=11 /codon_start=1 /translation="MRIIVCAKQVPDTSEVKIDPKTNRIIRDGVPSILNPDDANALEEA LLIKDSQPDTEVIVVSMGPPQAKDMLIECLAMGADKCYLLSDRAVGGSDTWATSNAVTS LIEKVVEECGPFDMIFAGRQAIDGDTAQVGPQIAEKMHLPQVTYVQKFEISEDKKVVTV QRQLEDGYEVIEVPTPCMLTCIKELNNPRYMTVSGIVKACKADAPIYVKSAKDCGCDLS KVGLEASPTVVFRSFTPAPKAPGQIIQGEDERTQSQNLLAKLKEKHAI" /locus_tag="LOCUS_7090" /gene="etfB" /note="WP_011986693.1 electron transfer flavoprotein subunit beta (Clostridium botulinum) [pid:61.5%, q_cov:100.0%, s_cov:100.0%, Eval:3.2e-85]" /note="MGA_1090" ORIGIN 1 tcctggatcg catcgcagat gaccttggtg taaccgtcgg tgttgaagtg ctcgagcagc 61 gggctctcga tgaggatgga gccgtcagcg ccccattcga tcgcttcctg accaagagca 121 tccaggttgt tgcctaccag cagcgcatag cacttggtgt cggcggagat gtctctggaa 181 agtctgcggc cgcaggcgat gagttccttg gctacgccca tgagctcgcc gtctctctgt 241 tctgcgaata cccagatatg cttataagcg gacagatcga ctgcatcggt ctcgtccttg 301 gagatggcct tgaacgggca cttggaaatg cagacggagc aagccgtgca cttctcgtta 361 atggttgctt ttctggcgac atcatcgaaa tcgatggcct ggaacgggca tgcctttacg 421 cagatctggc aacctttgca taattcatga ttaacaacta ctgccatttt agtttcctcc 481 ttctacatta aatagcgtgc ttttccttca gcttggccag caggttctgg gactgggttc 541 tttcgtcctc gccctggatg atctggccgg gagccttcgg agccggtgtg aaggaacgga 601 atactacggt cggagaagct tccagaccta ccttggacag gtcgcatccg caatcctttg 661 cgctctttac gtagatggga gcgtcggcct tgcaggcctt tacgataccg gaaacggtca 721 tgtatctggg gttgttcagt tccttgatgc aggtgagcat gcagggagtg ggaacttcga 781 tgacttcgta gccgtcttcc agctgtctct gaacggtaac gaccttcttg tcttcggaga 841 tctcgaactt ctgaacgtaa gtgacctggg gcaggtgcat cttttctgcg atctggggac 901 cgacctgagc ggtgtcgccg tcgatggcct ggcggcctgc aaagatcatg tcgaagggac 961 cgcattcttc aacgaccttt tcgatcagag aagtaacagc gttggaggtt gcccacgtat 1021 cggagccgcc tacggctctg tcggacagca gatagcactt atctgcgccc atcgcgaggc 1081 attcgatcag catatccttg gcctggggag gtcccatgga aacgacgata acttcagtat 1141 ccggctggct gtccttgatc agcagcgctt cttccagagc gtttgcatcg tcggggttga 1201 ggatgctggg tacgccgtca cggatgattc tgttggtctt cggatcgatc ttaacttcgc 1261 ttgtatccgg tacttgcttt gcgcaaacaa taattctcat aatacttatc ctccctctag 1321 cctacttaaa cacagcgccg gagataacca tcttctgtac ttcggtggtt ccttcgtaga 1381 tctcggtgat ctttgcgtct ctcatcatgc gttctacggg gtagtcggtg gtgtaaccgt 1441 agccgccgtg cagctgaaca gccttggtgg tgacgtacat agcggtctct gcagcgtagt 1501 acttagccat agcagcgtct acagagtacg gcatgtgctg atccttcttg aacgcagcgc 1561 tgtaaaccag aagtcttgcc gcttcgatgc gggtcttcat ttcagcaact tcgaaagcca 1621 gagcctggaa cttgttcagg gacttgccga actgctttct ggacttcatg tagtcgacgg 1681 tgacgtccag agcgccctgc gcgataccca gagcctggga a // LOCUS sequence285 1721 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence285 VERSION sequence285 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1721 /mol_type="genomic DNA" /organism="" /note="sequence285" misc_feature <1..536 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_001830810.1:trigger factor" /note="WP_001830810.1 trigger factor (Staphylococcus) [pid:39.1%, q_cov:75.1%, s_cov:30.3%, Eval:1.6e-23, partial hit]" /note="MGA_1092" /locus_tag="LOCUS_7100" CDS 540..1193 /product="ATP-dependent Clp endopeptidase proteolytic subunit ClpP" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003417102.1" /transl_table=11 /codon_start=1 /translation="MSAGGTQKFRLNHPQDKLERMEHMSNLIPYVVEQTSRGERSYDIY SRLLKDRIIFLDGEVNDAAASLIVAQLLFLESEDPDKDINLYINSPGGVITAGLAIYDT MQYVKPDVSTICVGMAASMGAFLLAAGAKGKRYALPNAEIMIHQPLGGAQGQASDIKIQ AEHILHLREKLNAILAEKTGQSLETIAADTERDNYMTAAEAAAYGLIDQVVEKR" /locus_tag="LOCUS_7110" /gene="clpP" /EC_number="3.4.21.92" /note="WP_003417102.1 ATP-dependent Clp endopeptidase proteolytic subunit ClpP (Clostridioides difficile) [pid:76.4%, q_cov:88.0%, s_cov:98.5%, Eval:1.1e-78]" /note="MGA_1093" ORIGIN 1 aggacaaggt gctgcagcag gtctacgaag ccaaccccct cgaactgccg caggccatga 61 tcgacagcga agccgccaac atgctgaacg aattcggtta ccagctgcag tcccagggac 121 tgaacctgga tcagtactgc aagtatctga acaagaccca gcagcagatg atcgacgaat 181 tcaagcccga cgcggagaag agagtcaaga gcagactcat cgtcgaagcc gtcgccaagc 241 aggaaggcgt cgaagttacc caggaggata tcgacaagga actggccgcg atggccgcgc 301 agtacggcat ggcgcagtcc cagatcaagt ccatcttcgg cgaagagaac atggattatc 361 tgaagaagga tatcatgagc cgcaaggcca tcgatctgat gtacgaggca gcggagatca 421 ccgaggtcga agaaaagaag gaagaagaaa agaagcctgc caagaaggct gcgaaaaaga 481 aaacttccaa gaaggccgag gaagaacctg ctgaagaagc aaaggacgaa gaataaacga 541 tgagcgcagg cggaacccaa aagttccgcc tgaatcatcc gcaagataaa ttggaaagga 601 tggagcacat gagcaatctc atcccctatg tcgtagagca gacgtcccgc ggggaacgtt 661 cctacgatat ctattcccgc ttactcaaag accgcatcat cttcctggac ggcgaggtga 721 acgacgcggc cgcgagcctg atcgtggcgc agctgctgtt cctggaatcc gaagacccgg 781 acaaggacat caacctgtat atcaacagcc ccggcggcgt catcaccgca ggcctcgcga 841 tctatgacac catgcagtac gtcaaacccg acgtgtccac catctgcgtc ggcatggcgg 901 cctccatggg cgcttttctg ctggcggcag gcgcgaaggg caagcgctac gcgctgccca 961 acgccgagat catgatccac cagcctttag gcggcgcgca gggtcaggcc agcgatatca 1021 agatccaggc ggagcatatc ctccacctgc gggagaaact gaacgcgatc ctggcggaga 1081 agacgggcca gagcctggag accatcgccg ccgatacgga gcgggacaat tacatgaccg 1141 cggccgaagc ggccgcctac ggcctgatcg accaggtcgt ggaaaaaaga tagataatac 1201 ggagaaagta tggcaaaatt cgatagttca aaagaattga cctgcagttt ctgcggaaaa 1261 ccccagagcc aggtgcgccg gctgatcgcg ggtccggacg tctacatctg cgacgagtgc 1321 gtcaaactgt gcgaagacat tctggcggag gaattccccg agatcaagga ggaagcctcc 1381 ctgcagttcg gcggagagct gcccaagccc agagagatcg acgccaccct ggcggattac 1441 gtgatcgacc aggaccgcgc gaagaagatg ctggccgtgg cagtctacaa tcattataag 1501 aggatcaaca acctcccgtc ggctccggcg aagaagggca ttaaggccgc gcaggcggac 1561 gacggcgtcg agatccagaa gagcaatatc gtcatgatcg ggccgaccgg ttccggcaag 1621 acgctgctgg cccagacgct ggcgaagatc ctggacgtgc cgttcgccat cgcggacgcg 1681 acgaccctga cggaagccgg ctacgtcggc gaagacgtgg a // LOCUS sequence286 1705 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence286 VERSION sequence286 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1705 /mol_type="genomic DNA" /organism="" /note="sequence286" CDS complement(38..823) /product="tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex dimerization subunit type 1 TsaB" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011393646.1" /transl_table=11 /codon_start=1 /translation="MPHRPVILAIETTGPLASVALSGVRGPVEGSAATEDGFLELVNQT HYSHLEEIAPMVKEILQTAGMQPEELDAIAVSRGPGSFTGIRIGMATAKAFAQVWNKPI VCVPTLASFAYMDVDPQAIEGFPEGVDPLICPLFDARRSQVYAGVYLPGCKDALLADGA YDVPDYLEKLGALLTPDKTAVFFGDGCDAYRETLENSGLPHVFAPQNVKFQLAHADLNL ALELYEEGQLTDCYNAQPEYLRLAEAERKLKAGALRKMP" /locus_tag="LOCUS_7120" /gene="tsaB" /EC_number="2.3.1.234" /note="WP_011393646.1 tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex dimerization subunit type 1 TsaB (Moorella thermoacetica) [pid:34.3%, q_cov:86.6%, s_cov:95.2%, Eval:2.7e-22]" /note="MGA_1095" CDS complement(805..1227) /product="tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex ATPase subunit type 1 TsaE" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003434423.1" /transl_table=11 /codon_start=1 /translation="MEKTISLKNELDTRNLGASLAKQMQPNQVYALIGDLGAGKTTLAK AIARGLGVTETLTSPTFTIVQEYETGRLPLYHFDVYRVSDEDELFEIGLEDYFHKGGVC LVEWADLIEDLLPADVITITLSYGEEEGERICRIDR" /locus_tag="LOCUS_7130" /gene="tsaE" /note="WP_003434423.1 tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex ATPase subunit type 1 TsaE (Clostridioides difficile) [pid:49.6%, q_cov:93.6%, s_cov:86.7%, Eval:3.7e-35]" /note="MGA_1096" CDS complement(1199..1558) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLDYYALLGVPRFTASQDDIRKAYRTQIAFFHPDKGYVNENIALE RTQQLNEAYDTLKNPSRKAVYDDAREGKSSRDDGHHVLQQPQFRHFPGEDHRFIADLPH LWYDIWHGKDHFFKK" /locus_tag="LOCUS_7140" /note="WP_010943043.1 DnaJ C-terminal domain-containing protein (Geobacter sulfurreducens) [pid:38.2%, q_cov:84.0%, s_cov:32.6%, Eval:8.9e-10, partial hit]" /note="MGA_1097" ORIGIN 1 atccggtcga tatcgttttt atccgcgcgg cgcagcatca tggcatcttc ctcagcgcgc 61 cggccttcag cttgcgctcc gcttccgcca ggcgcagata ttcgggctgc gcgttgtagc 121 aatccgtcaa ctgcccttct tcgtacagct ctaacgccag attcagatcc gcatgagcca 181 gctggaactt gacgttctgc ggcgcgaaaa cgtgcggcag cccgctgttt tccaacgttt 241 cccggtatgc gtcgcatccg tcgccgaaga aaacggccgt tttgtccggg gtcagcagcg 301 cacccagctt ctccaggtag tccggcacgt cgtaggcgcc gtccgccagc aatgcgtcct 361 tgcagcccgg caggtacacg ccggcgtaca cctgactgcg gcgggcgtcg aacagcgggc 421 agatgagggg gtcaacgccc tctgggaacc cctcgatcgc ctgcggatcc acatccatat 481 acgcaaagga cgccagcgtg ggcacgcaga cgatgggctt attccagacc tgcgcgaaag 541 ccttggccgt cgccatgccg atgcggatgc cggtaaacga tccgggccct ctggatacgg 601 cgatcgcatc cagttcttcc ggctgcatgc cggcggtctg caggatctcc ttcaccatgg 661 gtgcgatctc ctcgaggtgg gagtaatgag tctggttcac cagctccaga aaaccgtcct 721 ctgtggcagc ggagccttcc acaggccccc gaacgccgga gagcgcaacg gaagccagcg 781 gtcccgtggt ctcgatggcc agtatcaccg gtctatgcgg catatccgtt ctccctcctc 841 ttctccgtaa cttaaggtta tcgtaatgac gtctgccggc agcagatcct cgatgaggtc 901 tgcccactcc accaggcaga cgccgccttt gtggaaataa tcctccaggc cgatctcgaa 961 cagttcgtcc tcgtcgctca cccggtaaac gtcgaaatgg tacagcggca gacggccggt 1021 ctcgtactcc tgcacgatgg taaacgtggg gctggtaagg gtctctgtga cccccagacc 1081 cctcgcgatg gccttcgcca gcgtggtctt gccggcgcca aggtctccga tgagggcgta 1141 gacctggttc ggctgcatct gctttgccag cgaagcgccg agattcctgg tatctaattc 1201 attttttaaa gaaatggtct tttccatgcc aaatatcata ccataaatgg ggaaggtctg 1261 ctataaaacg atgatcctca cccggaaagt gtcgaaattg cggttgttgg agaacgtgat 1321 gaccgtcgtc ccgggatgat ttgccttcac gtgcatcgtc gtagaccgct ttgcgggacg 1381 gattcttcag cgtatcgtaa gcctcgttca gctgctgtgt ccgttccagc gcgatgtttt 1441 cgtttacgta gcccttatcc ggatgaaaaa acgcgatctg cgtccggtaa gccttcctta 1501 tgtcgtcctg ggacgccgta aagcgcggca cgcccagcag cgcgtagtaa tccagcatgc 1561 ggccgtcttc gggtagctgt gcgtgcggct acgcttccgt ggggatctcg tccatctgcg 1621 cttcgagcgc ctcggacaca tcctctgtct gcggcagcgc tctctcagcg gtcacagtgc 1681 agtctttggc ttcgcgccat gcggc // LOCUS sequence287 1695 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence287 VERSION sequence287 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1695 /mol_type="genomic DNA" /organism="" /note="sequence287" CDS complement(813..1694) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MEAYVICVDDEETVILESESVAKELLSETQNEYAAASTGAVIDEV SYDQKVEIRPSYCLLGDIWNRSDAKKVLQGNKEGTDEPLITIRSTETATYTEAVAYDVQ YIDNASLYEGETEIKSQGSEGTDLIVATVERVNGQEVARTVVSTTRITEPVAEVQYRGT KPIPATQGTGAFQYPLASYTISSYFGMRWGTLHTGVDLAAPMGSKIYASDGGTVTFAGW KGSYGYLVIISHGGLFETYYAHCSKILVSVGENVYQGQNIALVGSTGYSTGPHCHFEVR YNGTPNNPLNYL" /locus_tag="LOCUS_7150" /note="WP_005811628.1 M23 family metallopeptidase (Desulfitobacterium hafniense) [pid:31.9%, q_cov:99.7%, s_cov:71.8%, Eval:4.1e-41, partial hit]" /note="MGA_1100" ORIGIN 1 ggctggcagt ctctggggaa cagcttgatg gtgtcctccg tcgccttatt ggagccgtag 61 aggccgtagt tttcgttgta gccggagccg tttacgggag cggtcatgat gtcgctcagg 121 ttgagggcga tctccgcacc cgcttccttc agcagtctct tgcttctctc tctgctgtgg 181 atgtcgcagg ccagcacgtt cttcgtatat ttcaggatgg cacgcacgtc gttggcgaag 241 aagatctcgc actcagcgcc ggcgtcttcc accagctgtt tatagtattc cacgtaatcc 301 acgccggtaa atctgtgttt cttgtagccg aacagctcgc ggtacttcgc ttcgctcagc 361 acgtcggaat aggggttgac ccccgcagca tccagatcat ccagagagat gaggtggttg 421 cccacttcgt cgctgggata agacagctgc agccagatct tcttcgcgcc cttcgcgatg 481 ccgcgcaggc agatcgcgaa gcggttgcgg gacaggatgg ggaatacgac gccgaactca 541 ccggaaggga acttagcccg tacatccgca gcgatatcct ctacgcccac atagttgccc 601 tgggctctcg cgaccactgc ttcggtcaca gcgacaacgt ccttgtcgcg cagatcctta 661 ccgccgttgc ttgcggccag gatgctgtcg gtcacgatct tgacgatgtc gtcgccctcg 721 cggatgatgg gcgcacggac gcctctggat acggttccga tcattctttc cataaaacac 781 atgcctcctt tggtctttgc tgtgtggttt gactacagat aattcagcgg gttgttcggc 841 gtgccgttgt agcgcacctc gaagtggcag tgggggccgg tggaataacc ggtgcttccg 901 accaatgcga tattctgacc ctgatatacg ttttcgccca cgctgactaa gatcttgctg 961 cagtgagcgt aatatgtctc gaacaggccg ccgtggctga tgatgaccag atagccgtaa 1021 ctgcccttcc agccggcgaa tgtaacggtg ccgccgtcgc tggcgtagat cttcgaaccc 1081 atgggagccg ccaggtcgac gcctgtgtgc agcgtgcccc agcgcatgcc gaagtaggac 1141 gagatcgtgt aggatgccag cggatactgg aatgcgccgg tgccctgggt ggccgggatg 1201 ggcttcgtgc cccggtactg gacctccgcc acaggctccg tgatgcgggt ggtggacacc 1261 acggtgcggg ccacttcctg gccgttgacc ctttcaaccg tcgcaacgat gaggtcggtg 1321 ccttcggagc cctggctctt gatctcagtc tcgccttcgt acagcgacgc gttgtcgatg 1381 tactgcacgt cgtaggcgac ggcttcggta taggtcgcgg tctccgtgct gcggatcgtg 1441 atgaggggtt catccgtccc ctccttgttg ccctgcagca ccttcttggc gtcggaccgg 1501 ttccagatgt cgcccagcag acagtagctg ggacggatct ccaccttctg gtcgtaggac 1561 acctcgtcga tgacggcgcc ggtggacgcc gctgcgtatt cgttctgggt ctccgagagc 1621 agttccttgg ctacgctttc gctctccagg atgaccgtct cctcgtcgtc gacacagatg 1681 acgtaggcct ccacc // LOCUS sequence288 1691 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence288 VERSION sequence288 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1691 /mol_type="genomic DNA" /organism="" /note="sequence288" CDS complement(719..1486) /product="ABC transporter ATP-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_002680085.1" /transl_table=11 /codon_start=1 /translation="MRMLEVKNLSVRYGTLDIVKNVSFSVEEGEWLMIAGPNGAGKSTV VSAVAQSVASTGDVLFCGKNVRNYKPQELARHIGVLEQNHAVNYAFSVREVVGLGRYAY SSGIFAGKSDADDDAVERALALTGLDALADKSVLKLSGGELQRVFLAQIFAQDPDLLIL DEPTNHLDLVYQKQVFSLIEEWRKEPGRAVISVVHDLSLALAYGSTAVLMDRGEAVAFG PVQEVLNADHLDAAYGMDVKAWMQSLLKQWEHI" /locus_tag="LOCUS_7160" /note="WP_002680085.1 ABC transporter ATP-binding protein (Treponema denticola) [pid:38.2%, q_cov:98.0%, s_cov:96.9%, Eval:1.2e-46]" /note="MGA_1102" ORIGIN 1 accatgatga tgccctggat aaagtcgttg atcgctgtcg ccatgtagcc gccggcgatg 61 acgtaaacgc ccgtaaggat cgccatgacg atgacgcaca cggaataatc gatgttgaag 121 gccataccga acagacggga caggccgttg tagaggcttg cggtatacgg aatgaggaag 181 atgaagatga tgaccgaaga gcagaccttg agcgccgggc tgtcgaaccg ggcggagaag 241 aactgcggca tcgtggcact gttgaggtgc tgggtcatga tgcgggtgcg ccggcccagg 301 atggcccagg ccataaagga gccgatgagg gcgttgccga tccccaccca ggtggacgca 361 atgccgtatt tccagccgaa ctggccggca tagccgacga agataacggc agaaaaatac 421 gaagtgccgt acgcgaaggc cgtaagccag gggccgacgg aacgtccgcc cagcacgaag 481 ccgtcgacat tggtcgcgtt gcggcggcag tacatgccga tgcctaccat gatgccgaaa 541 aacactacga gcattactac tttgatgaac attgcattgc gtcctttctg aaatgggtat 601 ttgctttaac gcattaaatc gtaacgcata aaagcgtaaa agtcaagcgc tgtttgcaag 661 aaaaaaaggg tctgaaaaag accctcagaa tggacagtca ggaaccgtca ccaactgttc 721 aaatatgctc ccactgtttc agcaggctct gcatccacgc tttcacgtcc atgccgtagg 781 cggcatccag atggtccgca ttcaggactt cctgcaccgg gccgaaggca acggcttcgc 841 cccggtccat cagcacggcg gtactgccgt aagccagcgc caggctcaga tcgtggacca 901 cggagatgac ggcccgtccc ggctctttgc gccattcctc gatcagggag aacacctgtt 961 tctgatagac caggtccagg tggttcgtcg gttcatccag gatgagcaga tccggatcct 1021 gggcgaagat ctgcgcgaga aatacccgct gcagctcgcc gccggagagc tttaagaccg 1081 atttgtccgc cagcgcatcc agccccgtaa gcgccagcgc acgctccacc gcatcgtcgt 1141 ccgcatcgct ctttcctgcg aagatcccgg aggaataggc atagcggccc agacccacga 1201 cttcccgcac ggaaaacgca taattcaccg catggttctg ttccagcaca ccgatatgcc 1261 gggccagttc ctgcggcttg taattccgca cgtttttgcc gcagaacagc acgtctccgg 1321 tgctggcgac gctctgcgcg accgcgctca cgaccgtgga tttgcccgcg ccgttggggc 1381 cggcgatcat cagccactcc ccttcttcca cggaaaaact cacgtttttc acgatatcca 1441 gcgtgccgta gcgcacgctt aaattcttta cttccagcat gcgcattacg agatcctcct 1501 cgaacggtag aagatgacga taaacagaac ggcaccgata agggacgtca cgacgccgat 1561 gggcagctgc agaggattgg cgatcatgcg ggctgccagg tcgcagagca tcagaaaact 1621 cgcgccgccg aacaggcagg cgggcatcag cttcgcatgg ttgggtcccg tgatcatacg 1681 aactatgtgg g // LOCUS sequence289 1689 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence289 VERSION sequence289 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1689 /mol_type="genomic DNA" /organism="" /note="sequence289" CDS complement(347..1165) /product="transketolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_177224003.1" /transl_table=11 /codon_start=1 /translation="MEHTQLQQIAKTVRQDIIREVYSAGSGHPGGSLSAADLLTALYFS EMRIDPAQPAMEDRDRFVLSKGHAAPALYACLAERGYFPKEDLVTLRKIGSRLQGHPSM KMLPGVEMSTGSLGQGISAAVGMALAGRLDGGSGRVYTLLGDGELQEGIVWEAAMAAGH YKLDNLCAIVDHNGLQIDGRNEDVMNVMPIAEKFAVFGWNVLEIDGHDFEQILDALEMA RKCKGMPTVIVAETVKGKGVSFMEGQAGWHGKAPNEEQAKQAMAELGGEL" /locus_tag="LOCUS_7170" /note="WP_177224003.1 transketolase (Moorella thermoacetica) [pid:69.5%, q_cov:95.2%, s_cov:98.5%, Eval:9.8e-103]" /note="MGA_1105" misc_feature complement(1167..>1689) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011393842.1:WecB/TagA/CpsF family glycosyltransferase" /note="WP_011393842.1 WecB/TagA/CpsF family glycosyltransferase (Moorella thermoacetica) [pid:44.6%, q_cov:96.0%, s_cov:68.3%, Eval:1.9e-34, partial hit]" /note="MGA_1106" /locus_tag="LOCUS_7180" ORIGIN 1 ccgtcttcgc ccacggtgac ccctgcatgg gtcgcgcaga tcttgacgtt ggcgcctgta 61 taggcgatgg aattgcggat gatctcatac gctctgccgg aagcaaacat ggcgaagctg 121 ctggcgaaca cggtcttgcc ggaaacggcg aggcctgcgg ccatgcccat catgttggct 181 tctgcgatgc ctgcgttgaa gaagcggtcc ggatagacgt cggcaaactt cttcgtctgt 241 gtggatccgg acaggtctgc gtccagaacg acgatatcgg ggttttcggc gcccagttcc 301 accagagcct tgccgtaact ggctctcgtt gcgatctttt ctgccattac agctcacctc 361 ccagttctgc cattgcctgc ttcgcctgtt cctcgttcgg cgccttgccg tgccagccgg 421 cctggccttc catgaaagaa acgcccttgc ccttgacggt ctctgccacg atgacagtgg 481 gcataccctt gcactttctc gccatttcca gagcgtccag gatctgttcg aaatcgtgtc 541 cgtcgatctc cagcacgttc cagccgaaca ccgcgaattt ttccgcgatg ggcatgacgt 601 tcatgacgtc ttcgttgcgt ccgtcgatct gcagaccgtt gtggtctacg atggcgcaca 661 ggttatccag cttgtaatgc cctgccgcca tggcagcttc ccagacgatg ccttcctgca 721 gttcgccgtc tccgagcagc gtgtagacgc gcccgctgcc tccgtccagt ctgccggcca 781 gcgccatgcc gactgccgcg gagatcccct ggcctaaaga gccggtggac atctccacgc 841 cgggcagcat cttcatgctg ggatgacctt gcaggcggct gccgatcttg cgaagggtca 901 caagatcctc cttggggaaa tagccccgct ccgccaggca cgcgtacagc gccggcgccg 961 catgaccttt ggagagcacg aatctgtccc ggtcttccat ggccggctgc gccgggtcga 1021 tgcgcatctc gctgaagtac agcgcggtga gcagatccgc cgccgaaagg ctgccgccgg 1081 gatgtccgct ccctgcggaa tagacttctc tgatgatatc ctgccttact gtttttgcga 1141 tctgttgcag ctgcgtgtgt tccatgttac ctccgtattg ccgctttgat caaaaagacg 1201 ggaagagccg ggagccgttt taaacgcttg ggctcctgga tcatccggta cagccattcc 1261 aggccgtgat cgatatagaa cttgggggcg cggttgagct gaccggacca gatgtccaga 1321 ctgccgccca ggcctgccgc cgcctttact tttaaagcat cgcgatgctt tatcacaaaa 1381 tattcctgct tcggagaacc gagcgccacg cacaggaaat ccgcaccgct ggcgttgatc 1441 tccgccacga cggatggttc ctcgtcctcc cggaagtagc cgtcccggaa gcctgcgatc 1501 ttcaggcccg ggatctcctt ctccaggttt gctgccgccg cttccgcgac gccgggcttg 1561 ctgcccagca gatagacgct gcggcccagc tttgcgcaca gttcgatggc gctatgggca 1621 aaatcgatgc cggcgacctt ctcctggatg gggtcaccct tgagtttcga cgcgtagatg 1681 aggcctacg // LOCUS sequence290 1680 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence290 VERSION sequence290 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1680 /mol_type="genomic DNA" /organism="" /note="sequence290" CDS complement(465..1505) /product="ABC transporter substrate-binding protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948969.1" /transl_table=11 /codon_start=1 /translation="MKNVNAKKWMVLLLSIAMVLSVLAGCTSGGSGSGKAEVPESMTAP LNIGTLMGPTGMGMAGLISEENAPMMNVTVYDAPDQAMAGLLNGDLDVAAIPSNVAAVL YNKTEGGVQLLGVNTGGVLYLLSNNAESVSSLADLKGKTVYASGMGGVPEYAFKALMQN AGLAEDDIELVWMNSHADVVSTLLSQGGYALVPEPQVTVAGSKADTVSVDLDINAMWKE AFGYDLPMGVVACRKEVAETRPGDLLYFLNEYNKVLESYNADKDAAAETIAAAGILPAA GIAKQAMPRCNIMLETGFDAAKGILTPLYETLFSYNPQAVGGKIPEDDFYFAKDHESNF SIKLEF" /locus_tag="LOCUS_7190" /note="WP_011948969.1 ABC transporter substrate-binding protein (Clostridium botulinum) [pid:35.7%, q_cov:94.2%, s_cov:98.5%, Eval:7.8e-53]" /note="MGA_1108" ORIGIN 1 agctcccggt attcggcagg cacgctgtcg aagccctgca ggatattggt atacatcacc 61 ggaaagcaca tcagaaaaca cacgaacgtg ggcacgatgc tgctggcaag gcaaaggagc 121 gcgatgagga tgacggacat gacgggcacc gacttgatga ccgccgccgg caccgaaagg 181 atggccctca tccagctgct cttcgttgcc gcccaggcgc cgaggaaccc cagcagggat 241 gccagcgcga gccccgcagc cacccgcagc atcgttacgc cgcaggagcg ccagaacagg 301 ggctggacca gaagatccag cagcgcttta caggtaaaga ccggcgaagg cagcacaaag 361 gatctgccga aggtcatggc gcccagctgc cagagggcaa gccagagcag gaccgcgacg 421 gtcttctttc ctatgcgctt ttcgccggtc tttggtttca ttcgttaaaa ttccagttta 481 atgctgaagt tcgactcgtg atccttggcg aaatagaaat cgtcctcggg gatcttgccg 541 cccacagcct ggggattgta ggagaacagc gtctcgtaca gcggggtaag gatgcccttc 601 gctgcgtcaa acccggtctc caacatgatg ttgcagcggg gcatggcctg ctttgcgatg 661 cctgcagcgg gcaggatgcc tgccgctgcg atggtctccg ccgctgcgtc cttatctgcg 721 ttgtagcttt ccaggacctt gttgtattcg ttcaggaaat agagcaggtc tcccggccgg 781 gtctccgcga cttccttgcg gcaggcgacg acgcccatgg gcagatcgta gccgaaggcc 841 tctttccaca tcgcgttgat gtccagatcc acggaaacgg tatccgcctt ggagccggcc 901 accgtcacct ggggttcggg caccagcgca tagccgccct gggagagcag ggtggagacg 961 acgtccgcgt gggagttcat ccacaccagt tcgatgtcgt cctccgcaag gcctgcgttc 1021 tgcatcaggg ccttgaaggc gtattcgggc acgccgccca tgccggacgc gtacacggtc 1081 ttgcccttca gatccgccag gctgcttacg ctttccgcgt tgttggagag cagatacagc 1141 acgccgccgg tgttgacccc cagcagctgc acgccgcctt cggtcttgtt atacagcacc 1201 gccgctacgt tggacgggat ggctgccacg tccagatcgc cgttcagcag gcctgccatg 1261 gcctggtccg gcgcgtcata gacggtcaca ttcatcatag gtgcgttttc ttcagagatg 1321 agcccggcca tgcccatgcc ggtgggaccc atcagggtgc cgatgttcaa aggcgccgtc 1381 atggattcgg gcacttcggc tttgccgctg ccggaaccgc cggaggtgca gcctgccaga 1441 acagacagca ccatcgcgat gctcaagagg agcaccatcc attttttcgc gttaacgttc 1501 ttcatattcg atctcttcct cctcggattc cttgtaggag atgcctatgt catttcccag 1561 ggcgcctccg tgcattatag aatatttgcc gaatttatcc cgtatggaat ccatcgcggc 1621 atcgatggct tcgttctgtt tgcgtttttc ctcgagcacc ggctcgaaca ggctgatctg // LOCUS sequence291 1671 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence291 VERSION sequence291 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1671 /mol_type="genomic DNA" /organism="" /note="sequence291" CDS complement(276..731) /product="DIP1984 family protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_027479829.1" /transl_table=11 /codon_start=1 /translation="MKLAESLQERADLNRKIEQLRMRIQNNVLVQEGEKPAEDPDKLMK ELEESLARLEYLIRQINLTNCAYKVDGQTLTELIAKKDVLRVKQSAYRDILYAASQSTQ RARNTEIKIVPVLKAAQLQKKADELAKAIRLLDNKIQQANWTADLME" /locus_tag="LOCUS_7200" /note="WP_027479829.1 DIP1984 family protein (Deinococcus radiodurans) [pid:44.0%, q_cov:98.7%, s_cov:96.8%, Eval:3.0e-26]" /note="MGA_1110" CDS complement(745..1374) /product="M15 family metallopeptidase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_000237711.1" /transl_table=11 /codon_start=1 /translation="MDPSGFVVLGEYVPGIVQEIRYYSTYNFIGDRIDGYEEPVALCTI EAARALKAVANEMNVYGYRLKIFDAYRPAPAVRHFVLWGIEDTDVRMKPYFYPDLQKTE LFEKGYVASKSSHSRGSTIDLTLLDMKTGKEVDMGGPFDFFGELSHPDFKGVTKEQYAN RMLLQSTMVRCGFVPIDCEWWHFTLKDEPYPDTYFEFPVNSEYLRK" /locus_tag="LOCUS_7210" /note="WP_000237711.1 M15 family metallopeptidase (Salmonella) [pid:43.9%, q_cov:95.7%, s_cov:87.1%, Eval:8.9e-49]" /note="MGA_1111" ORIGIN 1 agcacgcggc gtccctgttt atcgatcttt tctaccggtt caaaacgcat aataaaaaat 61 cccctttccc gccctcgttc tgcaggcaaa tatctggtcg tgcgcgatac gcaatgccgg 121 atgcgtggat acgcgatcgg agcatgcggt attctcgggg attcgaaccc cgggcgggct 181 ctgccgccct cttccaactg atggtcttgc gaccggtgca gctgtccgcc gctgccgcgt 241 gatattcacc cctgtagaac taccgtctgc aaaacttatt ccatcaggtc ggccgtccag 301 ttcgcctgct ggatcttgtt gtccagcagc cggatcgcct tggccagttc gtccgctttc 361 ttctgcagct gcgccgcctt cagtacggga acgatcttga tctccgtgtt gcgggcccgc 421 tgcgtggact gggaggcggc gtacagaatg tcgcggtaag cgctctgctt gacccgcaga 481 acgtccttct tcgcgatcag ctccgtcagc gtctgcccgt ccactttata ggcgcagttc 541 gtcagattga tctgacggat gaggtattcc agccgcgcga ggctctcctc cagttccttc 601 atcagtttgt ccggatcctc cgccggcttt tcgccttcct gcaccagcac gttgttctgg 661 atgcgcatgc gaagctgctc gatcttgcgg ttgagatccg ctctttcctg taagctttct 721 gctaatttca tcgtcttttg ctccttattt tcttaaatat tccgaattca ccggaaactc 781 gaaatatgta tccggatacg gttcgtcttt cagcgtaaaa tgccaccatt cgcagtcgat 841 gggcacgaaa ccgcagcgca ccatggtgct ctgcagcagc atgcggttgg catattgttc 901 cttcgtgacc cctttgaaat ccggatgcga cagttctccg aagaaatcga agggcccgcc 961 catatccact tccttaccgg tcttcatgtc cagcagtgta aggtcgatgg tgctgccacg 1021 gctgtggctc gacttgctcg ctacgtagcc cttttcgaac agctctgtct tctgcagatc 1081 cgggtagaaa tacggtttca tccgcacatc ggtatcctcg atgccccaca gcacaaaatg 1141 ccgcacggca ggagccggac ggtaggcgtc gaagatcttc agccggtagc catagacgtt 1201 catttcattc gcgacggcct tcagcgctct tgccgcttcg atggtgcaca gcgccaccgg 1261 ctcttcgtag ccgtcgatgc ggtcaccgat aaaattatag gtggagtaat accgtatctc 1321 ctgcacgatg ccgggcacgt attcccccag gacgacgaat ccggaaggat ccatcgtcac 1381 cttcttctca aaatcagtca taatctattc cgtttgtttt atgagccacg caaagccctt 1441 cgccatgcgc agatccggtt ctttaaagtg attgcccgga ttccactcca ggacggtccg 1501 catgccgttc tccgaaagat aggcatgggc ctcccgcaca cagtcgccca cggtgcgcat 1561 cacagggttg cgggtcttct cttccttatc gccgaggctg agatagacgg cctctgtctg 1621 cagggggtga cccttcataa agtccagaaa tcccggaaac cacagcgatc c // LOCUS sequence292 1668 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence292 VERSION sequence292 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1668 /mol_type="genomic DNA" /organism="" /note="sequence292" CDS 57..1247 /product="membrane protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011948736.1" /transl_table=11 /codon_start=1 /translation="MNPESKYTVKKTFSAETVVFPVIFLAFFAYLAHVMGMANMINTIM KTAFDLLINTVLYIVAVCVIMGAVSELLTEFGFVALMDRVLRPLMRPVFGLPGAASLGI VTTFLSDNPAILALTANPRYKYYFKAYQFPALTNIGTSFGMGLIVCTYMLSLASITGES YGKAVVIGLAGATVGAVVSTRIMLHFTKKVYGTDLPAHDAFPSAQDTEIGELEPGLRPV RKGNLGNRVLGALLDGGASGLTLGAGIVPGVLIICTLVMILMNGPSDSGLYTGAAYEGV GLIPAVAAKLNFILEPLFGFSNTQAIGVPVTALGAAGAAISLASGLASRGLLAAGDVAV FTAMCMCWSGYLSTHTSMMDSLHCKELTGKALISHTIGGIAAGFAAHWIFILVNLL" /locus_tag="LOCUS_7220" /note="WP_011948736.1 membrane protein (Clostridium) [pid:48.5%, q_cov:99.0%, s_cov:95.8%, Eval:1.4e-104]" /note="MGA_1113" ORIGIN 1 caggcttctg cttttattgt atcatatgct ataatgtgcg cagaggtgtg tattcaatga 61 atccggaaag taaatatacg gtcaagaaga ccttcagtgc ggagactgtg gtattccctg 121 ttatttttct cgcctttttt gcctatctgg cccacgtgat gggcatggcc aacatgatca 181 atacgatcat gaagacggcg ttcgatcttc tgatcaacac cgtcctgtat atcgtggcgg 241 tctgcgtcat catgggcgca gtatccgaac ttcttacgga gttcggtttc gttgcgctga 301 tggaccgggt actgcggccg ctgatgcggc ctgtcttcgg gctgccgggc gctgcctccc 361 tgggcatcgt caccacgttc ctctcggaca atccggctat cctggcgctc accgcaaatc 421 cccgctataa atattatttc aaagcctacc agttcccggc gctcacgaac atcggcacgt 481 cctttggcat gggacttatc gtgtgcacct acatgctgtc gctggcgtcc atcaccgggg 541 aatcctacgg caaagccgtc gtcatcgggc tggccggcgc gacggtcggc gctgtcgtga 601 gcacccgcat catgctgcat ttcacgaaga aggtctacgg gacggatctg cccgcgcacg 661 atgccttccc ttccgcgcag gacaccgaga tcggggagct ggaaccgggt cttcgcccgg 721 tgaggaaagg aaatctgggc aaccgggtgc tgggagctct gctggacggc ggcgccagcg 781 gtctcaccct tggggcaggt atcgtgcccg gtgtgctcat catctgtacg ctggtgatga 841 tcctgatgaa cgggccttcg gacagcggtc tttacacggg agccgcctac gaaggcgtcg 901 gactgatccc ggcagtcgct gccaaactca attttatcct ggaacccctg ttcgggttca 961 gcaacaccca ggccatcggc gttcccgtaa cggcgctggg cgctgccggc gctgccatca 1021 gcctggcctc ggggctcgct tcccggggac ttttggccgc gggcgacgtg gccgtcttta 1081 ccgccatgtg catgtgctgg agcggctatc tcagcacgca cacgtccatg atggacagcc 1141 tgcactgcaa ggagctgaca ggcaaagcgc ttatctcaca cacgatcggc ggcatcgcag 1201 caggatttgc cgcgcattgg atcttcatac tcgtcaacct tctgtaacaa aaatgcagaa 1261 cggggacagt tctttgtctc acccttcgac agagaaccat ccccgtttat ttccatgttt 1321 tcttactgtg cgtttgcgtg ctccttgttg tagcggtacc acttccagta gccgtagcag 1381 gtattcacca tcatggcggc gacggtcacc agcatgatgt aggcgcctcc gcggatgtac 1441 agcgtggcat ccatgatgag agtgatgatc caggcgtacc actgctcccg gtagcgggcc 1501 agaagcagca cgccgttggc gatgccgaag cccgaagaca gcgcatccac gtaggaatcc 1561 gcagcgccgg ggctcatccg gatgagcgat cccgcgataa aggcaaaggc gaagatagct 1621 gcgatcgcca ggatatcctg cttcggcgta agggtcttca ccaccgtc // LOCUS sequence293 1660 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence293 VERSION sequence293 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1660 /mol_type="genomic DNA" /organism="" /note="sequence293" misc_feature complement(1005..>1660) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011860948.1:tRNA 4-thiouridine(8) synthase ThiI" /note="WP_011860948.1 tRNA 4-thiouridine(8) synthase ThiI (Clostridioides difficile) [pid:62.5%, q_cov:95.9%, s_cov:53.2%, Eval:5.7e-70, partial hit]" /note="MGA_1116" /locus_tag="LOCUS_7230" ORIGIN 1 aacttcgaaa gccagagcct ggaacttgtt cagggacttg ccgaactgct ttctggactt 61 catgtagtcg acggtgacgt ccagagcgcc ctgcgcgata cccagagcct gggaagcgat 121 accgatacgg ccgccgtcca gagtcgccat agcgatcttg aagccctggc cgacttcgcc 181 cagcaggttt tccttgggaa cgatgcagtc ttcgaaaatg agctcggtgg tggaagaagc 241 gtggataccc agcttatctt cggtcttacc gatggagaag cccttgaagc ccttctctac 301 gatgaaagcg gtaatgccat gattaccctt gctcttgtcg gtcattgcga aaacgacgaa 361 ggtgtctgcg tagccgccgt tggtgatgaa caccttagcg ccgttgagca gccagtggtc 421 gcccatgtcg acagccttag tctgctgtcc ggatgcgtcg gtacccgcgt tgggctcggt 481 cagaccgaaa gcgccaagct tacggccgga gagcaggtcg ggcaggtact tctgcttctg 541 ttcttctgta ccgaagttga agatcggcca gcagcacaga gaagtgtgag cagagacgat 601 aacgccggtg gatgcgcaaa ctctggagag ttcttccaca gcgatcgcat aagagatgtg 661 gtcggaacct gctccgccgt attcagcggg gaagggaatg cccatcatac cgagcttagc 721 catcttttcg acattttcct tggggaatct gtgttcctta tcgatgtcgg cagcgatggg 781 ttcgacttcg gcaagggcaa acttccttac cagttctctt actttctctt gctctttcga 841 aagttgaaag ttcattcttt tgcctcctta tattttctac aggtccatat taactatgtc 901 ctaaaaataa cagtgcttaa gacaacgcac ccagagcccc gggcgcgttg ccgccaacta 961 ctattaaaca atattttaac aaactttgca aggggaaaca ggcattaaat gccctctctt 1021 tgagaaataa ttatcaattc cgcagattcc acggcttgcg agacaagagc cttgacgtcc 1081 agcctgcttt cggacgcctc gatccgctcc agctttggct gggtcaccgg gtgcttgggc 1141 aggaatacgg tgcagcagtc ctcgtagggc tggatggatg tttcgaacgt gccgatatcc 1201 cgggcgatgt ccatgatctg ggtcttgtcc atggcgatga gcggccgcat gacgggcagc 1261 gacaccgcag cgtcggtgac cacgagagaa gccgccgtct ggctggcgac ctgaccgagg 1321 ctttcgcccg tgatgagcat caggtcccct tcccgcttcg cgatcgcctc ggcgatgcgc 1381 atcatgaagc gccgcaccag gatggtggtc tcctcctccg gacagttctg cacgatctgc 1441 tcctggatgg gcagcaggtt gatggagaac atgcggatgc gcccgcagta atccgtcagg 1501 atgcctgcca gttccttcac cttttcgaac gcgcgctcgg aggtgtacgg ataggaatgg 1561 aaatggacag cgtccatgta catgccgcgg tgagccatca taaacgtcgc caccggagaa 1621 tcgattccgc cggacagcag caccatgccc cggccgttgg // LOCUS sequence294 1657 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence294 VERSION sequence294 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1657 /mol_type="genomic DNA" /organism="" /note="sequence294" CDS complement(1370..1657) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MWICRKGMEKMPTYRADLKEAGGTQFVFDLTDLKSAGTAALLVTV TREDGPVESSLALAEQDLTSGKTQVQYKVASDRYQLSGTLPLDAPVFQWK" /locus_tag="LOCUS_7240" /note="MGA_1118" ORIGIN 1 gtgccacggt tatgaggagc ttctgcttgc ggttctcctt ctgcacgccg cccagatcct 61 ccaggatcgc cggcgttttc aggatcttta tgctttgtgt gtcggtatcc ttcaggccgt 121 tggaagccgt tgccgtcagc ttcacctgat aggtgccggg tttcgtgaac accgcgatcg 181 caccggtctt gccggacttg cggatgctgc cgacgccttt ctgcacgatg gtaaagctgc 241 tcttgcccag ccccagctcc gcagcccggg cggcattcat gctcttgccg tcgacttcgt 301 accaggagca gtcccgcgcc tccacatcgt gacccgcata agcgaccgcc ggcagttcca 361 ggatcgcatc cagaccggta atgtcgtcgc cgtccgcagg cagcgccggg tcggtgggat 421 cgccgggatc gaccggatcg tccgggtcac cgccgggatc gcccccggga cctgtgcccg 481 gaccgtcgcc tcccgtcccg ggaccgtccg gaccctctcc cggatccgga tcttccggca 541 cgggcgtgcg cagatccgta aataccaggc tgacgggaaa ctcgaagtgc aggccgcagg 601 cacccgccgc cgcgaacgtg ccgctgccga tggaatagcc ggcggaatcc acgacgttta 661 cgcccagggt aatggggtga cccccttcca gcgcaccgct cttccccgtg atgaaggacg 721 gatggatggc gttgctgccg gtgtcggaag gatcgtcttc gttatagtag ccgaggccct 781 gcacggcgga ctgtccgttg ccgaagatgg aatagatgtt atagccgtat tttttgtcca 841 ccagcggcac cgtgacagac atgccgggca cgtaatcccg caggctggcg ttgctgtcgc 901 tgaagtgaaa caccggcgtt gcggagaatt cgacctggct gccgctcttg agggtcacct 961 ccgcggggga actttccgcg aacagcatcg agcagtcgcg cccccggtag tccgtaaagg 1021 ccacctgcca gtccgtgccg cgcgtgcctt ccgaaagcag tgccgcaact tctgccggca 1081 cgctgaccgc aaaaacggcc ttctgattcg cctgcagata ctggtccagc gcgcggatct 1141 gcgaatcctc gatgcggatc tgctcgctgc ccttgttgcc gactttccag taaccgccgg 1201 agtaatgcca cagatccagc gtccaggtgc cggacacctt ggccatctga gaagagctcg 1261 tctccgccgg agacagagcc gaagcaggag cgctgccgaa gaggagtgtt cccgaaagaa 1321 gcagggagat gcccctgcga agcaggtttc gcagtttcat ggccgtcacc tacttccact 1381 ggaataccgg ggcgtccagg ggcagcgtgc cggacagctg atagcgatcc gatgccactt 1441 tgtactgcac ttgcgttttg cccgacgtca gatcctgttc cgccagggcc aggctgctct 1501 cgacggggcc gtcctcccga gtgaccgtca ccagcagcgc tgcagtcccg gcgctcttca 1561 gatccgtcag atcgaagacg aactgtgtgc cgccggcttc cttcaaatcc gccctgtagg 1621 tcggcatctt ttccatgcct ttgcggcaga tccacac // LOCUS sequence295 1649 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence295 VERSION sequence295 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1649 /mol_type="genomic DNA" /organism="" /note="sequence295" misc_feature complement(425..>1649) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011948757.1:MBL fold metallo-hydrolase" /note="WP_011948757.1 MBL fold metallo-hydrolase (Clostridium botulinum) [pid:51.6%, q_cov:67.1%, s_cov:53.2%, Eval:1.8e-78, partial hit]" /note="MGA_1120" /locus_tag="LOCUS_7250" ORIGIN 1 caggatgcgt acgtccgcat ccgtatccac gaacagttta atgtcgaaca ggttgcgcag 61 gctttcgtcg gcaaagatca ggatgccttc gatgatgatg acccgcgcag gctttacctc 121 cacgacttcc ttcgcccggt tgtggtcgga aaaatcatag accggccggt ggatcgtaat 181 gccctgcttt aacagctgca ggtgttccac cagcatatcc gtatcgtagg cgttgggatg 241 gtcgtagttg agcaggcagc gctgttcgta gggcatgtcg tcatgcgcct tgtagtaata 301 gtcgtggctg agtaggcata cggaatcctg gaattccgct gcgatctcct gcacgagcgt 361 ggatttgccg gagcctgtac cgccggcaat gccgatgagg atgggttctt tcatgggggt 421 gctcctactt tttcttggac ttctttcctt ccttctccgg aatctccttc gggggcagtt 481 cgccctccag cggcagttct tcgtccgccg gccggtcttc cttcgtaatg gtggagccca 541 gattgatgac gtccttctcc aaggaggcca ccaggttctt gatctccgcc agtttctcgg 601 cgcttacggt ggtttccacc gtctcattgg tattgtagag cacgttgtcc agcgtcttgt 661 gcatctcctg cagacgggcc ttcaggtcgt cgatctgctc gggagaagtg aattccttca 721 gagccgcatc ttccgcaggc gcagccttcg atgcatgccg ttcctcgtgg gcggagagtc 781 tcgtctcgtc cgtcagttca tattcggaga taccgtctac gacgacgcag tcccagccct 841 tatgttcctt tacgtacgct gcgaaatccc gcttggcgtc catttcaccg tggaccagga 901 agatgtcgtg gggctgctgc gtaaagctgg agatccagtg gtacagggcg tctctgtccg 961 catggccaga gaacccttcc aggttgtgga tctgcgcctt gacggcaatg tcttcgccga 1021 acagttttac ctcctggatg ccctcgatca gggagcgtcc cagagtgcct tcggcctggt 1081 agccaacgaa cacgatgctg ttggccggat tgtacagatt atgctttaag tggtggcgga 1141 tacggcccgc gtcgcacata ccgctggcgg agatgatgat cttgggtttc gtatccacgt 1201 tgatcatccg gctctcatcg ctggtgcggg tgaagtgcag gttggggaaa tccaggggat 1261 ggtcgccccg cagaatgaat tcccgcatct cgtcgtcgta agtctgggcg ttattcttga 1321 agatctccgt cgcctgggca gccatagggc tgtcgacata gacatggaca tccttcagcg 1381 cctgcttgta ttcactgttg ccgtcgtaga tccggttgag ctcgaagatg agctcctggg 1441 tacggcctac cgcgaagctg gggatgacga cattgccgcc ccgcttggtc gtttcgacaa 1501 tgatgtccag cagtttttta atgctggttg cgttcttttc gtgcagtcgg ttgccgtagg 1561 tggtctccat cacgacgtag tcggctttgt ggatggtgac ggggtcacgc aggatcggac 1621 ggttcgtcat gcccaggtcg ccggagaag // LOCUS sequence296 1642 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence296 VERSION sequence296 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1642 /mol_type="genomic DNA" /organism="" /note="sequence296" ORIGIN 1 cgttgcctcc tttacctatc atgggatccg ggaaacgctg agctacgtgc ctgtagaagg 61 tacggactgg atgcttacct acctgatccg cgagagcgtt atcagcgagg agatcggcag 121 catctccgac gggatcatca accgcagcat gctgcagtcc gcgctcatga tattcgcgct 181 tctcgccatc ttcgcataca tcatccagca gaaccgcagc aacgcaaagc tgaccctgga 241 gaaggagacg gcagatgcgg agaaccgggt gcgccagcag gaactggagc accgtctggc 301 gctgcaggaa gaactgctgg agcaggaggc gcagagaaag cagcaggacg aactgatcac 361 ggcgctgtcc gccgactact ggagcgtcta ttacctcgaa ctggatacgg acgacggcat 421 ctgctaccag gctcactccg acgtggacgg ctttaaggta ggagagcgct ttaagtatct 481 gaagtccgtt acggattatg ccaaacgcta catcaccgat aaataccggg aggtatttct 541 gcagttcgtt cagcccgacg ccatccggga gggcttaaag catcagcagg tcatctccta 601 cacctatacc gtgttccgcc acgatcatga atcctacgag accgtccgct ttgccagggt 661 ccaccgcccg ggcgaacaga aagacgatca catcaacagc gtgggagcct gtttcgccaa 721 caccgatgcg gagacccgca agaacatggt gcagcagcag gcgctcagcg atgcgctggc 781 gtcggcggag gaggcgagca gggccaagac ggcgttcctg tccaacatga gccacgagat 841 ccgcacgccc atgaacgcca tcatcggtct ggacaacatc gccttaaacg atccggatac 901 gccggaaaag acgaagggct atctggagaa gatcggagat tccgcggatc acctgctgga 961 actcatcaac gacattctgg acatgtcccg catcgaatcc ggccggatga ccctcaagaa 1021 cgaggaattc tccttcccga aactgctgga atccatcaat acgatgttca gcgggcagtg 1081 cgacgacaga ggattgaaat accattgcca tatcaacacg ccagtcgacg attattacat 1141 cggcgaccag atgaagcggc ggcaggtgct catcaacatc ctgggcaacg cagtgaagtt 1201 tacgccggaa ggcggcaaag tggaactgac cgtggaacgc accgcgcaga tggacaacca 1261 ctccacgctg cagtttaaga tctccgatac cggcatcggt atgagcgaag acttcctgcc 1321 ccacattttt gacaccttcg ccccggagga ttcctccacg acgaaccggt acggcagttc 1381 cggactgggt ctcgccatta ccaagcgcat cgtcgagatg atgaacggct ccatcgaagt 1441 ggcaagcgaa aagggcaagg gctccgtctt taccgtgacc gtgccgttga tggattccgt 1501 gcgcaagggt gcggaaggtg acccggacga gatccatccg caggacatga gcgtgttgat 1561 cgtcgatgac gaccccgtcg cctgccagca cggcaaactg gtgctggaga aggtgggcat 1621 cgcctccgag atcgcatcct cc // LOCUS sequence297 1642 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence297 VERSION sequence297 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1642 /mol_type="genomic DNA" /organism="" /note="sequence297" misc_feature <1..1134 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011101393.1:L,D-transpeptidase family protein" /note="WP_011101393.1 L,D-transpeptidase family protein (Lactiplantibacillus) [pid:31.6%, q_cov:40.8%, s_cov:73.4%, Eval:4.6e-09, partial hit]" /note="MGA_1122" /locus_tag="LOCUS_7260" ORIGIN 1 gaagcgaccg gaaagaatct gctgggcaaa ccgctctacg aggtgacgca gatccgcggt 61 gccgcgcaga ccgaagtgat cggcgcaaag cagtcggtgt tcttcgtgga cgacagggac 121 gccgaagtca cgatcacgga aaacgacgaa tctctgttcg ggtcacgcgc cgtatcgaac 181 accgtcgagg ggatctttac cgacctgcag atcgagcccg gggatggcta tacgctggta 241 aaggcccagg aagagtgcct gtacctgacc gtccccgcgg tggaggacga ggtggaaaac 301 atccgggaag cgctctcgga agcccttacg aacgaactgt tcccggatgg tgaggaagta 361 aaatctctgg agctcaccga tccgctgttc ctggaggagg attccgccgt cgtcttcggc 421 cgctatatcc acggaacgcc ggaggaagaa ggcgtgcaga gcagcgatgc tttcctgctg 481 aggcagaaca gccggggcta ttggaccatc cgggccgagg cggaagacga agagtcgatc 541 ctcccctaca cggaagagta cgtcttcgac atgccaagct atctggaacc gccgaaatct 601 gcgccccgca gccatccgta ttacatcatg gtcaaccggc agatgaacac ggtaacgatc 661 tacgaaaagg gcaaggacgg cagctacagt gaacccatca aagccatgat ctgctcctgc 721 ggcagagaag ggcacgagac gcccacaggc gacttcaaga tcctcagctt taaggcggcc 781 tggtgctaca tgatcgacgg cagctacggc cagtatgcta ctggattcct ggacggcggc 841 tatctgttcc actccgtctg ctatacggct caggacaggg cgaccctgat gcgggacgaa 901 tacaacgcgc tcggcgattt tgcctccgcg ggatgcgtgc gcctgcaggt ggcagatgcc 961 cagtggatct tcgataactg cgaggagggc accggcgtta cgatctatga cggtcccaac 1021 cccgggcctc tgggtaagcc tgaaaaagcg gtggaggaga tcacggaaga aaacgacaac 1081 ggctgggagc cgacagaccc cgatcccttc aacccctgga acgatctcaa ttagggtcaa 1141 aaaccgcaat tgtaattgaa attgcaagct ttttcgggat ataataattt attgagcaat 1201 cacgaaagga cagttgatat atgacgacag acaagcggtt cgcggtcctc atcgacgcgg 1261 acaatatttc ggaccggtac atcaagacca tcctggacga gatggccggc gaaggcgagg 1321 tgacgtacaa gcgcatctac ggcgactgga cgaaaccggc gctggcgccc tggaaaaagg 1381 tgcttctgga gtattcggtg accccgatcc agcagtacag ctacaccacg ggcaagaacg 1441 ccacggactc cgccatgatc atcgatgcca tggacatcct gtattccggc aacgtggaag 1501 gcttctgcct ggtcaccagc gacagcgact ttacccgttt ggccagccgc ctgcgggaat 1561 ccggcatgct ggtcgtaggc atgggcgaaa agaagacgcc gaaggccttc accaccgcct 1621 gcaataagtt taagtatctg ga // LOCUS sequence298 1634 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence298 VERSION sequence298 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1634 /mol_type="genomic DNA" /organism="" /note="sequence298" CDS 343..1353 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKLLYTDFADKATLRDLSKRYQIPGFNYCLIKEGVAQPVHAYGVQ NAETGEPMLPSTIFEAASLTKTLFACLVLRLVDRGVLTLDEPIAKLAPNVQVSQDERIQ TITARQVLSHGTGLPNWDKKPYLKFLFDPGTSYSYSGEGYYYLQKIVNEITGKDFTDHY WDEFLKPLGMTHSFPVWEPAVSEIESRKHDAKGALLPDRRHLDLEGDAPEPNAAWSLYS GAEDYTKYMLEILNAHGHLSDAMFREMTTPQNKATDGVFWGLGWGIPAKDPNVIWHWGD NGGYRSFTVMDLKTKDGACIFANGFQGNDMEIEFLDYLTDGDFWPDVADFVAHAE" /locus_tag="LOCUS_7270" /note="WP_008671701.1 serine hydrolase (Rhodopirellula europaea) [pid:26.8%, q_cov:71.4%, s_cov:31.9%, Eval:4.6e-18, partial hit]" /note="MGA_1125" ORIGIN 1 acagaacctg gagctggtct gcggccccgg gaaagaccgg gagatcacag aggctctggc 61 cctgatggaa ctgacggatg cggcggacaa aaagccgtcg gagctgtccg gcggcatgca 121 gcgaagagca gcgctggcgc gggccatcgc ctacggaggc gacatcctgg tgctggacga 181 gccgttcacc ggcctggacg aagcgctgaa ggagcgtatc gcgggcaaat tggcggcgca 241 gtggcgggcg gagaagaaga ccgttctttt cgtgacccac gacagcgctg aagcgaaaga 301 atacgcggat aagatcgtaa aactgaacga aggaggtagt ttatgaaact gctttatacg 361 gattttgcgg acaaagcaac gctgcgggat ctgtccaaac ggtaccagat cccgggattc 421 aactattgcc tcatcaagga aggcgtagcc cagccggtcc acgcctacgg cgtgcagaat 481 gcggagacgg gcgagcccat gcttccctct acgatcttcg aagccgcgtc tctgacgaag 541 acgctgttcg cctgcctggt gctgcggctc gtcgaccgcg gcgtgcttac gctggacgag 601 ccgatcgcaa agctggcgcc gaacgtgcag gtctcccagg atgagcgcat ccagaccatc 661 accgcccggc aggtgctgtc ccacggcacg ggacttccca actgggataa gaaaccgtat 721 ctgaagttcc tgttcgatcc cggcacctcc tattcctact cgggagaggg ctattactat 781 ctgcagaaga tcgtcaacga gataacagga aaggatttta cggaccacta ttgggacgaa 841 ttcctcaaac ccctgggcat gacccattcc ttcccggtgt gggagccggc ggtctcggag 901 atcgagagcc gcaagcacga cgcaaagggc gctctgctgc cggaccgcag acacctggat 961 ctggaagggg acgcgccgga gcccaacgcg gcctggtcgc tgtacagcgg ggcggaggat 1021 tacacaaaat atatgctgga gatcctgaac gcccacgggc atctgagcga tgccatgttc 1081 cgggagatga cgacgccgca gaacaaggcg acggacggtg tgttctgggg cctgggctgg 1141 ggcattccgg ccaaggaccc gaatgtcatc tggcactggg gcgacaacgg aggctaccgc 1201 agctttaccg tgatggactt aaagacgaaa gacggcgcct gcatcttcgc caacggattc 1261 cagggcaacg atatggagat cgaattcctg gactatctga cggacggcga tttttggccg 1321 gacgtggcgg attttgtagc gcatgcagaa tagaagaatg aggatcggta tattatgttg 1381 gatctgatca ttaaaaacgc aacgatcgta gatggaaccg gcgcagagcc tttcgagggg 1441 tctatcccca tccgggatgg caagatccgg gcgatctggc acggcggatt tccggcaggt 1501 gtcgaggcaa aagagatcta cgatgccaag gggctggtgg taagcccggg ctttatcgac 1561 atccactgcc acagcgacga gacattctat aaatatccga aggaggaagg caagatcctg 1621 cagggggtca ccac // LOCUS sequence299 1634 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence299 VERSION sequence299 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1634 /mol_type="genomic DNA" /organism="" /note="sequence299" CDS 1..1218 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDIKRERGFGVLAVEKTEWVMKQMVKDKVPFSMIEHGLDMVVPHA GYLQNFDLRKCRSGLVIRIPEDTHPGGLAPAVDNRNLYKAFQVQRKWAEKLNILTCADL NRAIAAGQINDIIQVSEALQEKKIARIADEIVRSGKRIVLIAGPSSSGKTTFAHRLCTQ LWVNGEKPVYMGTDDYYLDRDLVPVGPDGTQNFENLDSIDVELFNEQLKTLLAGGEVDL PRFDFNQGKKIFGERKLKLGPHQPMVIEGIHGLNEALTPAIPKTDKYKIYISPLTQIRI DDYTRIPLTDMRKLRRIVRDAKKRGWDARQTIEAWPKVRVGEAQNIFPYSDEADAIFNS AFVYELAALKKDALPMLVNIPEDDEYYTEAQRLARLLSHVDVIEDTKYIPNNSILREFI GGSVIV" /locus_tag="LOCUS_7280" /note="WP_003436982.1 nucleoside kinase (Clostridioides difficile) [pid:47.3%, q_cov:91.9%, s_cov:67.0%, Eval:1.5e-90, partial hit]" /note="MGA_1127" ORIGIN 1 atggatatta agcgcgagcg gggcttcggc gtgctcgccg tggagaagac cgaatgggtg 61 atgaagcaga tggtgaagga caaggtgccg ttctccatga tcgaacacgg tctggatatg 121 gtggtgcccc atgccggcta tctgcagaac ttcgatctgc gcaagtgccg cagcggtctc 181 gtcatccgca tccccgaaga tacccatccc ggcggactgg cgcctgccgt ggacaacaga 241 aatctgtaca aggccttcca ggtacagcgc aagtgggcgg agaagctcaa catcctcacc 301 tgcgcggatc tcaaccgcgc catcgcggca gggcagatca acgacatcat ccaggtgtcc 361 gaagcgcttc aggagaagaa gatcgcgcgc atcgccgacg agatcgtaag gagcggcaag 421 cgcatcgtcc tcatcgctgg accgtcctct tccggcaaga ccaccttcgc ccacagactg 481 tgcacgcagc tctgggtcaa cggcgaaaag ccggtctaca tgggaactga cgactattat 541 ctcgaccgcg acctcgtgcc cgtgggcccg gatggcaccc agaatttcga aaatctggac 601 tccatcgacg tggaactctt taacgaacag ctcaagactc tgctggctgg cggcgaagtg 661 gacctgcccc ggttcgattt caaccagggc aagaagatct tcggcgagcg caaactcaag 721 ctgggacccc accagcccat ggtcatcgaa ggcatccacg gcctgaacga agcccttacg 781 ccggccattc ccaagaccga taaatacaag atctacatca gcccgctcac ccagatccgc 841 atcgacgact acacccgcat tccgcttacg gatatgcgca agctccgccg catcgtgcgc 901 gatgccaaga aacggggctg ggacgcccgc cagaccatcg aagcctggcc caaggtaaga 961 gtcggagaag cgcagaacat cttcccctac agcgacgagg cagatgccat tttcaactcc 1021 gccttcgtgt acgagctggc ggcgctcaag aaggacgcgc tgcccatgct ggtgaacatc 1081 cccgaagatg acgagtacta cacggaggcg cagcgcctgg cgcgcctgct gtcccatgtg 1141 gacgtcatcg aagacacgaa atatattccg aacaactcca tcctgcgcga attcatcggc 1201 ggcagcgtca tcgtatagga gcgcagcatg ccggaatatt tatcaaaact caacccgcag 1261 cagctcgagg ccgccacgac gctggagggc ccgctgctga tcttagccgg cgccggttcc 1321 ggaaagaccg gcacgatgac ccaccgcatc gcctacatga tcaaggatca aggggtcagc 1381 ccgtattcca tcctggcggt gaccttcacc aacaaggctg cgacggagat gcgcgaccgc 1441 gtggaggccc tcgtaggccc tgctcccggc atgtggatcc agacatttca ctcggcctgc 1501 cttcgcatcc tgcgcatgga cgcggacaag atcggctacg aacgcaattt cgtcgtctac 1561 gaccccgcgg accagaaggc tctgatgaag agcatcgtta aggagctgca gtacgacgaa 1621 aagcagtatg cgcc // LOCUS sequence300 1633 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence300 VERSION sequence300 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1633 /mol_type="genomic DNA" /organism="" /note="sequence300" ORIGIN 1 accttcgcgt tcaaaatgtc cttggggtcg atggtataaa ggtctctgtc catggtgata 61 aagtccgcta agaagcctgc ctttacctta cccttaatgt tttcttcgcc tgtattccag 121 gcagattccg ccgtataggc gtaaatggcg tcttcaacag acagcgcctg ctcgggcagg 181 tacggtccgt ctccgttctt cgccagtctc gtaacggcgc agtagatacc ctgcaccggt 241 tcgaagcttt ccaccgggca gtcggtgccg aagctcatgt ggatgcccat gtccttgtac 301 cacttccagc agtaggagct ttccgccatc tccttaccca ctctgtcgta gatcacgtgc 361 atgtcgtagt cgatgaagat gggctgcacc attacggaga tgcccagatc cttcatccgc 421 tgcagcatgg cgcggtccgt cacctggctg tgcaccacgg tgtgtctggg atgcacgtgg 481 ggatacttct tctgcgcggc ctccacggcg ttgatcacca tctcgatggc gccgtcgccg 541 atggcgtgga ccgccacggg cacgttctgc cgctgggaga tctccaccat ctcgttcagg 601 ccttcctgat cccacagggc gaggcccgtc gtggacgggt catccgcgta gggctttctc 661 atgagagccg ttctggcgcc cagggaaccg tcggagagca gcttggtgca ggagatcttc 721 atggtgtcgt tgccgaaggt gttgtcgtag ccttcggaga aggcccactt cagcttgtcg 781 gcgttgaagt acagcatctg ggaagccaga cgaagcttga aggtgccctt ttctgcccgc 841 tctctcatga gtttctgcag atcgtggtat ctgcccgccg gcgtgtagtt gccctcgtcg 901 gactgtacgg acgtaagacc cttttcgaac agatcgtact ggtgctcctc catcaggtcc 961 atcagttttt ccagagacgg agcgggaagc gtcgtcttca tgtagtcgaa cagattttcc 1021 ttgatgacgc cgttcagctt gccgtccggg ccgacttccg catattcctt gtactttaag 1081 ccttctccct ggctcatgtc gaatttctcg atccccttgg aattcagcac gcccacgtgg 1141 ccgcaggtgc gctggatcat gatgggccag tcggcagtga tggtgtccag atcctccttg 1201 gtggggaaac gcttttcatc ggtgaaatag tcctggttcc agccttcgcc cacgaaccac 1261 aggccgtcgt tcttgtcgaa ggtcttgtag gcttccttca tgcggtccag cacttccttc 1321 aaggacgtgc agcccaccag atccacgtgg atgcgggtct ttacgtagtg caggaagtgc 1381 atgtgggagt cgttgaaccc gggcagcagc agctgtccgc cgcagtccac ttcctcgcag 1441 gtgccgtcgt tatgggccgc gatgtattcc ttcgcgccct cctcgctgcc tacgtaggcg 1501 aaatacttcc ccgtgaccac agcagcctgc gctctgggct ggtcgctgtc catggtcgcg 1561 atgttggcgt ttctgatgag caatgacatc gtctttcctc cttattcttc cgctgctctg 1621 gatctccaga acg // LOCUS sequence301 1628 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence301 VERSION sequence301 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1628 /mol_type="genomic DNA" /organism="" /note="sequence301" misc_feature complement(785..>1628) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_021374035.1:murein biosynthesis integral membrane protein MurJ" /note="WP_021374035.1 murein biosynthesis integral membrane protein MurJ (Clostridioides difficile) [pid:35.1%, q_cov:98.6%, s_cov:70.6%, Eval:2.8e-44, partial hit]" /note="MGA_1131" /locus_tag="LOCUS_7290" ORIGIN 1 atgaggtcga tgagcgaagg catgatcttt accttgcact tcgtctggtg gcagatctcc 61 aggatctcgg aaatgacctt cttcggcgcg gaaggaatgg ctacgacgat ctcgtcgatg 121 tcgtactttt ccacggcctt ggggatgtaa tcccggttgc ctacgacctt gatgccgtga 181 gccgtgcggc cgatcttcgc cttgtcgtcg tcgatgaggg cgacgatgcg gcggtcatcg 241 ttctccgcgt tgcggatctc cttgatgacc gtgccggccg cgttgccggc gcccaccagg 301 agcacccggg tgtattcccg gtcggagccc aggccggcca ggcctctgtg cttggagccg 361 ggcagcgtaa aatagccggg atagcggtat tcgcggatgt agcggtagat aaagcggatg 421 ccgccgatga ggacgacgtc caggaaggtg cagatgatgt agaaggaccg gggcatggac 481 tgctgggtca tggccatgta ggtgaggaag cccatgttgc ccacgacgca ggccacaaag 541 accttcagga gctcgtccga gcccgcgtag cgccataggc tgcggtagat accgaacagg 601 atgagggacg cctccttgat gaggagcatc caggcccagt tgtccagaag caccgccagg 661 taggtgatga actggaggtt gtccggatcc agctcgaagc ggatgagcaa cgccaaaatg 721 gacatgatgg cgatgcagat caggtccagg gctgcgagga gtatgatttt taatctatga 781 ttcgtcatcc gcgctttaca agatccttca ggatgttcaa ttcttcgaac tttgcggcct 841 tcagcaggat aaggtacgcg atgcctgccg aggcgacggc gcccgcaaga cttacaagct 901 gcggactatt tattttatca cttaagagcc taaagcacaa ataggagatg ccgacggata 961 cggcggagaa caccgcgatc cgcaccagct tgcgtttgga gctcagaagc ttaatgtcgg 1021 gatatttctt cttaaatgtg taatacagca gcagcgcgtt aatagcctgg gcgatggagg 1081 tggccagggc cagccccgcg tgagccatgg ggcgcaccaa gatcaggttg agcacgatgt 1141 tgcacacgac cgccgccacg gagcagtaca ccgccgtctt cgtatcgtgc agggaataaa 1201 agaccttggt gatgagctgg ttgaccgcca ggaacgttaa tccgatcgca tagcagaaga 1261 acgcggaggc ggtcaccgcc gtatcctccg cggtaaacgc gccgcgctgg tagacgatct 1321 ggatgacggg ctgcgcgtag accatggcac ccagggaaag cggcacggcc agcagcgcca 1381 atacgttgat gccccgttcc gtcatcgtgc cgatggagag ccggtcgcct gcggcgaagg 1441 cctggttgag cttcggatag atgatagtga ccaggatgga gaccgtcagc atgacgatcg 1501 cgttgatgat ctcgttaccg taggttagcg ccgagacgct gcccttgggc agagtggatg 1561 ccagcatgcg gtccacgaag gtgttgatct gctgcacgct gccgccgatg aagatcggca 1621 gcgccagc // LOCUS sequence302 1626 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence302 VERSION sequence302 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1626 /mol_type="genomic DNA" /organism="" /note="sequence302" CDS complement(84..1568) /product="threonine synthase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011986278.1" /transl_table=11 /codon_start=1 /translation="MIFKSTRGQAPEKNLSGAVIQGIAADKGLYVPSEFPKLKKTWAEY AAMDYKTLAQEVLGPYAVEFTPEELKACIDGAYTNKFEAEDVVPLVHAGGADFLELYHG PTAAFKDMALALMPYLMTTALAKEKEDKTVCILVSTSGDTGMAALKGFEDVPGTCIIVF FPDHAVSPVQEQQMRTATGSNTYVTSIFGNFDDAQTTQKAILNDKPFGEEIGALGYRFS AANSMNVGRLLPQVAYYIWAYAQMVKNGRVKAGEPINICVPSGNFGNILSAYYAKQMGV PVNKLICASNKNKVLTDFFHTGVYDARRDFYVTNAPSMDIIISSNLERLLYHLSGCDDT AVRSMMDALAEEKHYEASPAIREGLKDFAAGFATEEEILAAIGEIYREDHYLMDTHTAV AYKVYRDYKAQTGDETPTVIASTASPYKFAAAVSGAIGLPKAEDEFAAIEALNAESGVR VPYGLKDLKSREILHKGAIAREDMKDFVRETIKNRI" /locus_tag="LOCUS_7300" /gene="thrC" /EC_number="4.2.3.1" /note="WP_011986278.1 threonine synthase (Clostridium botulinum) [pid:49.0%, q_cov:98.6%, s_cov:99.0%, Eval:1.6e-135]" /note="MGA_1133" ORIGIN 1 cgatcccgga aaggccgatg ccgccgatac cgacgcaatg tacatgctta taattcttca 61 gatccatata ctttcatctc cgatcagatt ctgtttttta tcgtttcgcg cacgaagtcc 121 ttcatatcct cccgcgcgat cgctcccttg tgcaggatct ccctgctctt caggtccttt 181 aagccgtaag gcactcttac gccgctttcc gcattgagcg cctcgatggc cgcaaattcg 241 tcttccgcct taggcaggcc gatggcgccg ctcaccgcag cagcgaactt gtaggggctg 301 gcagtggagg cgatgacggt gggcgtctcg tcgccggtct gggctttata atcccggtag 361 accttgtagg cgacggccgt gtgggtatcc atcaggtaat ggtcttcccg gtagatctct 421 ccgatggctg ccaggatctc ctcctccgtg gcaaagccag cggcgaaatc cttcaggcct 481 tcccggatgg ccgggctcgc ctcgtaatgc ttctcctccg ccaaagcgtc catcatggac 541 cgcactgccg tgtcgtcgca gccgctcagg tgatagagca ggcgctccag attgctggag 601 atgatgatgt ccatcgaagg cgcgttcgta acgtagaaat ctcttctcgc gtcgtagacg 661 ccggtatgga agaaatccgt cagcaccttg ttcttgttgg acgcgcagat gagcttattg 721 acaggcacac ccatctgttt cgcgtaatag gcgcttaaaa tgttgccgaa attgcccgaa 781 ggcacacaga tattgatggg ctcaccggcc ttcacccggc cgttctttac catctgcgca 841 taggcccata tgtagtaagc gacctggggc agcagccgtc ccacgttcat ggagttggcc 901 gcggagaaac ggtaacccag tgccccgatc tcctcgccga agggtttatc gttgaggatg 961 gccttctgcg tcgtctgcgc gtcgtcgaaa ttgccgaaga tgctcgtaac gtaggtgttg 1021 ctccccgtcg ccgtgcgcat ctgctgctcc tgcacggggc ttacggcgtg atccgggaag 1081 aacacgatga tgcaggtgcc cggcacgtcc tcgaagccct tcagggccgc catgccggtg 1141 tctccggatg tggagaccag gatgcagacc gtcttatctt ccttctcttt ggccagtgct 1201 gtggtcatca ggtagggcat gagcgccagc gccatgtcct taaaggccgc cgtcggaccg 1261 tgatacagct ccaggaagtc cgcgccgccg gcgtgaacca ggggcactac gtcctccgcc 1321 tcgaacttat tcgtgtaggc accgtcgatg caggccttca gttcctccgg ggtgaattcc 1381 accgcgtagg ggccaagcac ttcctgtgcc agcgttttat aatccatggc ggcgtattcc 1441 gcccaggtct ttttcagttt cgggaattcg gacggaacgt acagtccctt atccgctgcg 1501 atgccctgga tgacggctcc cgagagattc ttttccggag cctgccctct cgtactcttg 1561 aaaatcatga tgcctcctct gtttgccctg cgcgtctgcc tactgcagcg ccgcttccgc 1621 tttgtc // LOCUS sequence303 1614 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence303 VERSION sequence303 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1614 /mol_type="genomic DNA" /organism="" /note="sequence303" ORIGIN 1 agctctgcag caggctgaga tccttatcca gatccgtcaa ggccttgtac aggctggtga 61 ggttcccgga gacggtgccc agagaaccgt cgagcgcggc cagatcctcc gcagctgcat 121 ctacggtctt ctgcaggtcc gccgcgtttt ccgatgccgt cgtcaggtct ttctgcagcg 181 tgtcgacgtc gctcaacgcc gtatccgcct gttcgtacag gccctcttta tcgccggaca 241 gaacagcccg tccctcgttg agctcgtcca ggccgtctgc ggtctcccgc aggctggcgg 301 acatgccgga gaaggagttc agcagcgtgt cgatgctgct gtccagctta tgatagttgt 361 cctccagctg atctttctta tcggacagct ccgagatctg gtccagtgcg ccgagattgg 421 cgggcaccat cagcatcgtc agaccgtcga aggcgaaatc ctccgcaccg acttcgatca 481 cgaagtgctc ctcctcgccg ggaagtccca ggaacaggac cgcccgcagg ttgccgatca 541 gctgcacctg ggcgccgggc gccttcaggg acaggatgtc gtcctggttg aacaggccca 601 tcacctccag ggtgtagttg tttctcgcgt attcggatgc cgtctcccgg ggaatggcgt 661 ccacgtcgat ctcgatcatg ccggtcttgc ctgccagatc ttccgccttc gtgggcacgc 721 cgttcagttt ataactgacg gtgatggtcc agggcagttc ctcgaaaggc ttgtccgtct 781 tcccttcaaa atagaagtgg ctgggcgcat cttctccgaa acggaacacg tgggctccgc 841 cttcttcggt aggcgccgtt ccatccgtca aattattgat ggcgtcgtat tcgccgtaat 901 ccgtaacggt atcgacaccg tttaagatgt agctcttgac catgctggca tccttcagat 961 tgccgtaata gtccagattt gcgtagtacg cttcatcata ggtggcgtac acaccgtttc 1021 cgatctctcc ttctgcgaag accgggacga cgctcgtcag ggtcagcgca gcggaaagac 1081 acactgccaa aacttttctc atattccctc catctgtgaa tttaattcac acttgttatt 1141 ttatgcacac ttgttgcttt ttcaaacgat gttaattata atccacatct gttgattagt 1201 caatatcgct tgaatataat aaagatggat gtatgagatc ttctacagaa gcgcagaaga 1261 tcgtggaaaa agttgaagga aagtgatcac catgcacaaa aacaccgatg acagaagagc 1321 aaaacgatcg agaagactgc tgaaggaagg gcttctgtct ctgatgcagg aaaagaaatt 1381 caaggatatc tcggccagag acatcacgga gagcgcggat ctcaaccgcg gtaccttcta 1441 cctgcactac ccggacaccc aggccctgct ggaaagcatc gaagacgatc tcctgggcga 1501 agcgcagcag atcgtggacc agcatctgga ggaattccac gccggcgtct ccctggagcc 1561 gctgctgctc cccatcctgg acttcatcca ggagaagtac aagacgatca ccct // LOCUS sequence304 1609 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence304 VERSION sequence304 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1609 /mol_type="genomic DNA" /organism="" /note="sequence304" ORIGIN 1 agacggtttt cctttacgag cttctgcagc ccttcgatat gggtggagcc gcagcccatg 61 ttgatattcg tgccgtcggg tctgtcgttg atgacaaagg tcttggcacc cagcgcgtcg 121 aatacgctgc gggcgatctg ccacgtgctg ccgttggagc aatccagtcc gatccactta 181 cctttatagg acgtggtggc cagggagatg aggtagccga tgtaacggtt gcggccggcg 241 gaatagtcga tcacctgacc gatgtcgctg ccggtggcaa ggggaacgtc acaggtctcg 301 ccttcaaacc cttcgggctt atagacgccg tccagatagg cttccacatc ggcgatgacg 361 tcgtccggca tcttctcgcc gttctcgttg ataagcttaa tgccgttgtc gtggaacgga 421 ttgtggctgg cggagatcat gatgccgcag tcgaaatctc ccgttctggt aacataagcg 481 acgctgggcg tcgacgttac atgcagcata tagacgtctg cgccggaggc tgcgaggcct 541 gcggacagcg cgtcttcaaa catataactg gaaagtctgg tatccttgcc gagaacgatg 601 ttcgccttgt agccctcggc gtgtttcatc ttcggatcct tcgcgtaata ccatcccagg 661 aaaagtccga tcttgaaggc atggatcgct gtaagatcta cgttggcatt tcctctaaat 721 ccatctgttc caaaatactt tcccatactc tgcttccttt ctgaaatcta ttcgtcctct 781 tccggcgcga gggcttccac gagaacgtgg agctgggccg gttctataac ggtttccagc 841 gattcaccga tcgtcgttcc ggtgtaaata ggcagatcgt attcgcccgc ttcttcgatc 901 gtagaaagat ccacatagta ggcgaacata tccgcagtaa gatccgagat cgtctccacg 961 ggacctttga cggtgacctg catggtgaac ggttcaccgg aggctgccgc tgtaaatcct 1021 tccggcaggt tttccagcac gatctgggaa ctgtccgcct ccatcgtcat gctggcctga 1081 tcggacagcg taaagctggc gatgaggtcg ccgttattcg ctgccagcgc aatgccatcc 1141 gggagcaccg gcaccaccgg cagttccgta ttcgtcgtga tatctgtaat atccagcggc 1201 tgagcgtcga cgtaattcac cttcgccaga tccagcagcg ttcccttgat gcttacggca 1261 gaggggatgc tggagctgag cagttccagg ccgtagccgg gagcgccgtc cacccgcgta 1321 taaaggggca cgctcttgac ggtataaagc gtggaggaca tcgaaacgaa cggactctcc 1381 agttttaccg cctttacgac gtttccttcc gcatccatcg gggttagcgc atattgctgc 1441 tccgtcgctt catccaccga cagtccgccg gcatccacgt gcacggtgag atagtccacc 1501 atatccacca ggctctttgc gccggagaca aggatctgct cctggctgag gtccagcacg 1561 gtgaactccg tgtcggaggg gacattcgcc acatccagca ccacaggct // LOCUS sequence305 1605 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence305 VERSION sequence305 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1605 /mol_type="genomic DNA" /organism="" /note="sequence305" ORIGIN 1 ctccgaggac tttggccatt tcgcgaaact cacgaagggc gccatgttct tctactgcta 61 cggcaaggac aacccggata tgcactccac ggaattcaac ttccacgacg agatcatcga 121 ccgggtgatc gatatctacg acgaactcat caagatgtac taggaggcag ctatgagcaa 181 gacagcattc tacaacgcga aagtctacgt agagaagggc gtatacgccg aagcgatcct 241 gcaggaagac ggctggatca aggctgtcgg cacgaccggc gagatcctca ctctggccgg 301 ctacgacgcg gagaagatcg actgcggcgg caagaccatc gttcctgggt tcaacgactc 361 ccacatgcac atcctgcagg tgggcatggc gatgaaccag ctggacgtga gcggctgcaa 421 gagcgtcgaa gagatcgttg cggcaggcag acagtatctg gcggatcacc ccgactgcca 481 gggcctgttt acgcagacct ggaatgacga catgttcgat ccggacaaga agcgtctgcc 541 cgataagcac gactgcgacg ccatctccac cgagatcccc gtgttcctgg gccgcatctg 601 cggacactcc gcggcggtca acagtctcat cctggagaag atggggctgg ataaggatca 661 ccacaccatt cccggcggcg aagtggtctt gggcgaagac ggcgaaccca acggctacct 721 gttcgaggca gcgcaggcgg aagcccgtct tacgatcccg cagatgaccg tcgaggaagc 781 gaagaaatat tatctgatgg ccatggaata cggcgtatcc cacggcatga ccaccaccca 841 gtccaacgac tacaccaccg ttgcaccgaa ggagattgtc aaggcggctc tggaagggtt 901 gtacggggca ggggaagcgc ccatgcgcta cgttgcccag tgcggctgcg agaacatgaa 961 gcaggcggag gagttcgtcg ccgaagactg gggcagaaaa gtgggcatga tggaatacgg 1021 ccccgccaag atgtttaagg acggttccct gggcgcccgc tccgccatga tgagaaacgg 1081 ctatgcggat gcgccgggcg ttatgggcgt cgaccgcatt ccggacgacg agcagatggc 1141 gatgatccag ttcttccagg ataaaggggt caccatcgcg acccactgca tcggcgacgg 1201 cgccatcgac gtcacccaga agatgtacgc caaggtcgcc ggcaccgaga acaagtaccg 1261 ccacaacatc atccattacc agatcacgga tatggatatg gtgaagttta caagagaaca 1321 caacatcctc gtatcctatc agcccgtctt cctgcagtac gacctccata tcacggagag 1381 ccgctgcgga cacgacctgg ccatgcagtc ctactgcttt aagaccgccc acgacatggg 1441 catccacgcc tcctacggca cggacagccc ggtggaagac tgcaatccgc tggcgaacat 1501 ctacgtcgcc gttacccgca aggacttcaa gggtcagccg ctggaaggct ggaacccggc 1561 ggagcgcgta gatgtggaga ccgctgtgga cgcctacacc tacga // LOCUS sequence306 1605 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence306 VERSION sequence306 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1605 /mol_type="genomic DNA" /organism="" /note="sequence306" ORIGIN 1 aagatcgtct gcgactactt cgaaaagaag aagaacgact taaacgagat catccgcgag 61 cgcggcgtgt tctacgggtt ctccagctac aaacatctgc tggagctggc gaaggaacac 121 cactgcgtgg gcatgggtat gaagatggga gaaggatggc ttctcacgtc cgagatgctt 181 gaactgtgtg agatgggcgt ctccaacatc gtttgctgcc agcctttcgg ctgtctgccg 241 aaccacatcg tgggcaaggg catgatgcgg ccgatcaagg cgtgctatcc ggacgccaac 301 atcgtagcca tcgactttga ccccggtgca tcccgcatca accaggaaaa ccgtttaaag 361 ctcatgatga gcaacgcaag aaagtaggca taccatgaca cccagacagc agcagatcgt 421 aaaaaacgta gacaagtaca gacaggacat cttagacgcg gagcgctgga tctggcagca 481 tccggaagta ggctacaccg agtggcagac gaacgcgtat ctgctggaga aattccgctc 541 ctacgggtat gagcctgtgg aagcggggga tattcccgga ttctatgtag acatcgacac 601 aggaagaccc ggtccctgcc tggccatcat gggcgaactg gatgcgctgg acatcgcgaa 661 tcacccggaa tccgtcaacg ggatgacgca ctgctgcggt cacaactgcc agtgcgcgga 721 gatggtcggc atcgcagcgg ctctcaaaga gcccggcgct ctggacggtc tctgcggcaa 781 gatccgtctt atgctggtcc cggcggaaga gatgatccag ctggagttcc gcaaggggct 841 catcgacgag ggaaagatca aatatctggg cggcaagccg gaattcatgc gccgcggcta 901 tttcgacggc gtggatctgt cgctgatggt ccacacggac aacaacaacg attacgactt 961 tacctgccag gacggcttta acggcatcat cgccaagatc ctcacctata aaggccgcag 1021 cagccatgcc ggcggctctc ctgaggacgg catcaacgcc cagtatgcag cgacgctggg 1081 tctggacggc tgcaacgcgc tgcgggaaac gttccgcgac gaggaccaca tccgtttcca 1141 cccgatcctg aaaggtgtca agagtgccgt caacatcatc ccggatgaga tgcgcatcga 1201 aagctacacc cgcggcaaag gcctggatgc ctacgtgagc gcaaacagaa aactcaaccg 1261 cgcgctggct gcgggcgccg tcgccatggg cgcgcagctg cacatctgcg acatgcccgg 1321 ctacgcgacg gagtaccacg accacatgtt catggatctg tgccagaagt gctgcgaaga 1381 tctgtccggc aaggaaaaag taaagttcga ccacaacgcc tggagcaagg ggtcttcgga 1441 cttcggcgac cttacgatgg tgatgcccgg cgtgcagttc tatgcgaacg gccacacggg 1501 gctgggccac ggcatcgatt tctgcgtggc ggacccggaa agagcctgcg tgaacccggc 1561 aaaagcggaa ctctttatcg ccgacgcgct gctatcggat ggcgc // LOCUS sequence307 1605 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence307 VERSION sequence307 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1605 /mol_type="genomic DNA" /organism="" /note="sequence307" CDS 226..1593 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MENMDQNSIDKSIKGLSIQRLHRFMMAVAVLLAILLLYATYSVMT GYDILQEATDRYIEMERSTQDLMAASDYLTESVQSFVVTADPDYVDDYFEEAKVARRRD NALETMEKTLAGTETYRYLEEALWYSNNLMEIEYYAMRLTIDANGMEVSNFPEELQNIV VRPRHAWLSDESKRSIAIDLVFNDEYQRYKNNIRRDVDLCAGALVTDAQNSQRQSADHF REVIRRLTICIFLLLLSVLFMVILTARLIIDPLNNGIRHIRKKELFPVAGSLEMRYLAQ TYNDLYESSRKEQETLSYEASHDALTGLGNRAMFERVRNDCDPATTAMILIDIDYFKEV NDTYGHEAGDQLLKRAAKVFRASFRSEDCVCRIGGDEFAVLMMHSGTHLKALVQRKIEL AQAQLKDEENGVPGVTISVGVAFPDRDNPTEDIYQDADTALYKVKNAGRNGLAFYE" /locus_tag="LOCUS_7310" /note="WP_002223940.1 diguanylate cyclase (Yersinia pseudotuberculosis complex) [pid:35.4%, q_cov:46.4%, s_cov:53.2%, Eval:9.6e-28, partial hit]" /note="MGA_1143" ORIGIN 1 attcgagatc atgaaatcta cgaccgccat ccagaacatg atccgcgaag acaagctcca 61 ccagctggag tccgccatgc aggcgggagg cgcggagggc atgtgcacca tggacggcag 121 cctgttaaag ctttataagg aaggacgcat cagccgggag acggcgctga tggcctgcgc 181 aaattacgag aacatggtta agagattggg ctagttcccg caaatgtgga aaatatggac 241 cagaacagca tagacaaaag cataaaaggc ctttcgatcc agcggctcca ccggtttatg 301 atggccgttg cggtcctcct tgcgatcctg cttctgtacg ccacgtacag cgtcatgacg 361 ggctacgata tcctgcagga agcgacggac cggtatatcg agatggaacg gagcacccag 421 gatctgatgg cggcttccga ttatctgacg gagagcgtgc agagttttgt cgttacggca 481 gatcctgatt acgtggacga ctattttgag gaggcgaaag tggcccgccg cagggacaat 541 gcgctggaga cgatggagaa gaccctggcc ggcacggaaa cctaccgcta tctggaagag 601 gcgctctggt attccaacaa cctgatggag atcgagtatt acgccatgcg gctcacgatc 661 gacgcaaacg gaatggaagt cagtaacttt ccggaggaac tgcagaacat cgtggtacgc 721 ccccggcatg cgtggctcag cgatgaatcc aagcgaagca tagcgatcga tctggtcttc 781 aacgacgagt atcagcggta taagaataac attcgcaggg acgtggacct gtgcgccggc 841 gccctcgtca cggatgcgca gaacagtcag cggcagagcg cagaccattt ccgggaggtc 901 atccgccggc tcacgatctg cattttcctt ctgctgctct ccgttctctt tatggtgatc 961 ctcacagcga ggctcatcat cgatccgctc aataacggca tccggcatat ccgaaagaag 1021 gaactgtttc ccgtggcagg ctcgctggag atgcggtatc tggcgcagac ctacaacgat 1081 ctatacgaat cctcccgcaa agagcaggag accctgtcct acgaggcatc gcacgatgcg 1141 ctcacgggtc tgggcaaccg ggcgatgttc gaaagggttc gcaacgattg tgaccctgcc 1201 accacagcca tgatcctcat cgacatcgac tatttcaagg aggtcaacga cacctacgga 1261 cacgaggcgg gcgatcagct cctgaagcgc gccgccaagg tcttccgggc cagcttccgt 1321 tccgaagact gcgtctgccg tatcggcggg gacgagtttg cggtgctgat gatgcattcc 1381 ggtacccatc tgaaagccct ggtgcagcgg aagatcgaac tggcgcaggc gcagctgaaa 1441 gacgaggaga acggcgttcc cggggtcacc atcagcgtag gcgtcgcctt cccggaccgg 1501 gacaatccta cggaagatat ttaccaggac gcggataccg ccctttacaa agtcaaaaat 1561 gcaggccgca acgggctcgc gttttatgaa tagaactctt ttttc // LOCUS sequence308 1604 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence308 VERSION sequence308 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1604 /mol_type="genomic DNA" /organism="" /note="sequence308" CDS complement(575..1522) /product="glycyl-radical enzyme activating protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_012870179.1" /transl_table=11 /codon_start=1 /translation="MTTGRLYDIQGFSVQDGPGIRTTAFLKGCPLRCPWCHSPESQAFY KQLSWMSMRCLGLDACRNRCMNACPKGAIEEGPPKTDVQTGEQLRTVHVRRDLCDNCGA CADKCYAEALTLCGRDYTSEELVDRLLQDKNFFDNSGGGVTISGGEPLCQIDFVVEVLQ GLKANGIHTALDTTGFAPWETVERTTPYVDLYLYDLKHMDSAKHKATVGVPNEQIKENA QKLAACGKKLQVRIPVIPRFNEDEENIRATAEFCVGLGEAVQVVQLLPYHNMGVMKYLR ISDGKPLEATPPSDEKMEHLRGIMASYGLNVTIH" /locus_tag="LOCUS_7320" /note="WP_012870179.1 glycyl-radical enzyme activating protein (Thermanaerovibrio acidaminovorans) [pid:42.9%, q_cov:99.7%, s_cov:99.3%, Eval:1.3e-64]" /note="MGA_1145" ORIGIN 1 ctcaggattg cgttgaagac atagaaatag gggttttccg tcgtggacgc gatcagtgtg 61 atggagccgt tttcaatgaa ttccagcagg ctctgctgct gcttcttgtt gaaatactgg 121 atctcgtcga gatagagcag gatgccgccg ggggcgagaa aggtgtccag ctcgtcgatg 181 atcgccttga tgtccgcgat gccggcggtg gtggcgttga gcttgcgcag cgtgcggttg 241 gtctgctgcg caatgatgcg ggctacggtg gtctttccgg taccggaggg gccgtaaaag 301 atcatattgg ggatgctgcc gctttccacg atgcggcgca gcataccatc ctgaccgagg 361 atgtgggtct gtcccacgac ctcgtccagc gtctgcggcc ggatctcgtc cgccagcggt 421 ctgtacatgc ttactcacct gctttccgac atgattaaca ctactatttt atcaattgcg 481 gcgcagaaat acaacacaat tcgcacgcag gcggcgaaaa gcggtcaaaa accggcgggc 541 ccgaagcgcg ggcccgccgg tatgcggggt ttattcagtg aatggtgacg ttgaggccgt 601 aggaggccat gatgccgcgg agatgctcca tcttttcgtc ggagggcggg gtcgcctcaa 661 gaggcttgcc gtcgctgatg cggagatact tcatgacgcc catgttgtgg tatggcagaa 721 gctgtaccac ctgcaccgcc tcccccagac ccacgcagaa ctccgccgtc gcccggatgt 781 tttcctcgtc ctcgttgaag cgcgggatca ccgggatgcg gacctgcagc ttcttgccgc 841 atgcggccag cttctgcgcg ttttccttga tctgctcgtt cggcacaccc accgtcgcct 901 tgtgcttggc gctgtccatg tgcttcagat cgtagaggta cagatccacg tacggcgtcg 961 tccgctctac cgtctcccac ggcgcaaagc ccgtcgtgtc cagcgcggtg tggatgccgt 1021 tcgccttcag accctgcagt acctccacca caaagtcgat ctggcacagc ggctcgccgc 1081 ccgagatcgt caccccgccg ccggagttgt cgaagaagtt cttgtcctgc agcagacggt 1141 ccacgagctc ctcagaggtg tagtccctgc cgcagagcgt cagcgcctcg gcgtagcact 1201 tgtccgcgca tgccccgcag ttgtcgcaga gatcgcgcct gacgtgtacc gtgcgcagct 1261 gttccccggt ctgcacgtcc gtcttcggcg ggccttcctc gatcgccccc ttcgggcagg 1321 cgttcatgca gcggttcctg caggcgtcca gacccagaca gcgcatgctc atccagctca 1381 gctgcttgta gaaggcctga gactccggac tgtggcacca ggggcagcgc agcggacagc 1441 ccttcagaaa ggccgtcgtg cggatgccgg ggccgtcctg tacggaaaag ccctgaatgt 1501 cgtaaaggcg tccagtcgtc atacgctcat ctccgttctg cggatcagat cgtcctgggc 1561 ctccttgtag acctcgacga agtaggcgga gaagccggcg atgc // LOCUS sequence309 1602 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence309 VERSION sequence309 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1602 /mol_type="genomic DNA" /organism="" /note="sequence309" misc_feature complement(763..>1602) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_010875269.1:transketolase" /note="WP_010875269.1 transketolase (Sinorhizobium fredii) [pid:40.9%, q_cov:75.3%, s_cov:76.0%, Eval:5.7e-37]" /note="MGA_1148" /locus_tag="LOCUS_7330" ORIGIN 1 gatgacgttg tggttctcgt aagtgactgc gccgtacttc accttcttca gggcgtccac 61 gacctgcgga tcggtgaagg gcttgagggt ggaaacggac agcatctgca cggatacgcc 121 gtggttctgc agcaccttga ccgccttcag gccttcttcg gtcgcgatgt tctccgtgaa 181 cagcgccacg tcggagcctt ccgccgcgat cctcgcgtgg ttgaactgga tgggctgatc 241 cgccgggaac agtctgggaa cggacttgcg gagcattctt acgtagaacg ggccgccggc 301 ttcataggcc atgggcagga agccctcgat atccgtcgcg tcggcgatgg agtagatgcg 361 catgttgggt acggagcgca gcgtgccgat gtcgttggtg gactggtggg aaacgccgcc 421 gggcgtggtg aggccgggga cgaagcccac gaggccgacc ggcaggttgc cgtaagccac 481 ggacatctcc acctggtcca gaacgcgtct gtacaggaac acgccgaagg agtgcagata 541 gggcaggaag ccctctctgg ccaggcctgc ggcccagccg atcatgttct gctcggcgat 601 acccagggag aaataacggt ccggataatt cttcttaaat tccatgatct cgcaggaggt 661 gcccaggtcc gcggaaagta cgacggtctc gggatgttcg gcgccccaag ctgtgatgct 721 cttggagtat acgttggttt ccatgatcat agcgcgttcc tcctattcca tgctgtcgta 781 gaaagccttg gcttctgcga tctgttcggg tgtcttgacg tttacgaagt gcagtctctc 841 cgttctgtga tccaggaacg gcatgccgtg ggtcggcttg gtattgcaca gcacgacgag 901 cggctgaccc ggatgggccg ttctgcaagc gtctttgatc gcctggatgt cgtggccgtc 961 gatctcgacg gtcttggcgc cgaacgcggt aaatctgtcg tacaggggct gggtgttcat 1021 gatctccttc gtcggacctt cgatctgctg gccgttgatg tcgcagacga ggacgaagtt 1081 atcgagcttg tagaacgcgg ctgcctggac ggcttcccac agctgtcctt cttccagttc 1141 gccgtcggac atgaagcacc agatcgtgcc ttcctcgccc ttcagctttc tggcgtgcgc 1201 gtgaccgcag gcgacggaga tggtctgcgc cagcgatccg gccgtggtct cgaaaccggg 1261 ggagtgctcc gcgccgatct gttcgaagat ccagccgtct ttgttgaaac gttcgatgcc 1321 tgtctcggag actctaccta cagcgaacag ggtgcagtac agggtgcatg cgtagtgagc 1381 cggagagagg aagaatctgt cgtacggtgc cttcgtgggt ccgttgtaca ggcttcctct 1441 ggggaagtcc atattgtcgg gaccgggaac gccggggaac ggaatgccgt cgggatcgcc 1501 gaggctgtcg cccagattca tcacgtcgag atacagcgtt gccaggatct ccgcggacga 1561 attcgtctgc gtgatgtagc acccgcctct ctcaatggca aa // LOCUS sequence310 1594 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence310 VERSION sequence310 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1594 /mol_type="genomic DNA" /organism="" /note="sequence310" misc_feature <1..768 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011391791.1:S41 family peptidase" /note="WP_011391791.1 S41 family peptidase (Moorella thermoacetica) [pid:40.8%, q_cov:59.6%, s_cov:38.5%, Eval:9.7e-25, partial hit]" /note="MGA_1149" /locus_tag="LOCUS_7340" ORIGIN 1 gccaagctca acctgatcgc ggacggcatg gaaaaactga tcgtcgacgt ccgggacaac 61 ggcggcggcg tgatgggcga tgccctgaac atcgccggca tgctcattcc ccagggaaaa 121 ccgctggtgt tctacgaaca acagggagag atcatcgacg aggagtattc cgccggcggc 181 atctacaaag acgtgcctct ggtcgtcctc atcaacgatc atacggccag cgcctccgaa 241 tgcctggcag cagccgtcaa ggacaacggc gcaggcacgc tggtgggggt cacgacctac 301 ggcaagggcg tggcacagga gctggtgacc atggacaacg gcgacagctt taagctgacg 361 ttctgccatt tcctcacccc gaacaagcag cggatcgaca aggtcggcat cgcgccggat 421 attgccattt ccaacggttc tgccctgacg caggagcaga tcgcgaaata tctggagtcc 481 gtgcttccca tggacgaagg caagaagtat ttcaagggcc agcgcggatt gaacgtgctg 541 gcagcccagc agcggctgaa catcctcggt tataaagtac cgcagaatgc ggtgatggag 601 gcggctacga tggacgcgct caagcgcatc caggcgctct acggcgcatc gccctacggc 661 ggactggatt tctgcaccat cgagctggtg gaccgggcgt tctacgaatt cctgtatggc 721 gacggcaccg ataaacagct gcagaaagcg atcgaggtgc tgcaatgagg cttctgagaa 781 aagcggcggc cgttctggct gcggcaggga tcgtgctgac cggcgcagtt cccgtcagcg 841 ccatgacgtt cttctacggc gagacaccca tcgatctgcg catggacgcg ctgcaggaga 901 tcatcgagga agtgcgggaa aactataagg acgaaacgaa gctggacgat atcttcatcg 961 gcatctatca ggggctgttc agcagcctgg gcgatccctg gtccgcctac gttacggtgg 1021 acaagaccga cgacggcacg aatttcgtga ccaacgacgt ggacgaggtc tacgaaggca 1081 tcggcatcgt catccgcaag acgaattccg gcatccgcat ctccagcgtg gtgagcgggt 1141 caccggccca gctggccggc atccgttccg gcgactatat cttaaaagtc ggcgctcagg 1201 acgttacgca gatgacgtcc gaagaggtgt ccctcctcat ccggggcagc tccggcagca 1261 ccgtgtcgct caccgtggac cggcagggcg atacccgggt gttcgaggtg gtgcgccagg 1321 tgatccgcac agacaccgtc tcctccaaga tgctggatga gaccacgggt tacgtgcagg 1381 tgacctcctt cgcggcgggt acggcagacc gtttcgctgc agaatacgac gcgctggcgg 1441 cgcaaggcgc gaaggccatc gtgctcgacc tgagaggcaa cggcggcggc tccgtgggcg 1501 aagccgtggc ggtggcggac catctcatcc acaaggatgg cgtcatctcc atctttaagc 1561 gccagggcga agtgatcgag accgtgcgct cgac // LOCUS sequence311 1583 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence311 VERSION sequence311 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1583 /mol_type="genomic DNA" /organism="" /note="sequence311" CDS 897..1334 /product="GatB/YqeY domain-containing protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_011475872.1" /transl_table=11 /codon_start=1 /translation="MEFKALQAEMIKALKAGQKDRKDSISMLVAAVKKAAIDAGCREDI PEDMVDAAILKEVKTAKEQVDTCPASREDLLAQYKAHLAVVEEFAPKQLSAEEVKALLT EKYAEVIASKNRGLIMKTVMADLKGKADGKVISAVVGELCK" /locus_tag="LOCUS_7350" /note="WP_011475872.1 GatB/YqeY domain-containing protein (Ligilactobacillus salivarius) [pid:37.8%, q_cov:96.6%, s_cov:95.9%, Eval:3.3e-16]" /note="MGA_1152" ORIGIN 1 gtaaaaaccg gagacgttca tgacgcagat gccggacacg gaatccttat taaactggat 61 ctctccggta tcctgcgaca aacagatgcc gttttccgtg cggccgccct ccgggaccgt 121 cagcaggcgc accgtgccgt gcgctcttac gcccgccagc ttcgcaagaa ggtctgtctc 181 ggcgcataga aaaccggtaa gcgcagggat gggccgtacg accgtgtgtc ccaggctctc 241 tgcgatcttc aggcctctgc cgtcgcagcc gtactggatg ccggctttgc cgcccgtcgt 301 caggatcacc ctttccgcga gcaactctct atcatccgct gcggtgaggc ggaatctgcc 361 atccggcacc ttcgtaatat cccgcacctc gaatccgcag atcaactggg cagggttgcc 421 gctgccggct tttccgaaag cgccgcgctc taacgcatgc accacggaag ctgcctgcag 481 gctgcgggga taaagccttc cttccccctc ttccacggca tccagaccga gatgcgcaaa 541 gacctgccgc atcgcttctg ggccgcagtt tttcaggacg gacgcagtaa aacctgccgc 601 atcgcctttc ccgctgcggt agtctttcgc atcagccgtc cggttgagca gattgcaccg 661 tccgttgccg gtggcgtaga gcttcttacc cgctttttca tttttttcga cgaccgcgat 721 gcgcagagac cggttccggg aacttctggc cgcaatggca gccatcaggc ccgccgcgcc 781 gccgcctacg atcgcgatat cgtaacttac ttcgtttctc atacgattat tttaaactat 841 ccgcgggaat cgtgatagaa taatttctat acaaagcgta acggaggtat tgatatatgg 901 aattcaaagc attacaggca gaaatgatca aagctctcaa agcgggtcag aaagacagaa 961 aagactccat ctccatgctg gtggcagcgg tcaagaaggc agccatcgac gccggatgcc 1021 gggaagacat ccccgaagac atggtggacg cagccatcct gaaggaagta aagaccgcca 1081 aggagcaggt agacacctgc cccgccagcc gggaagacct gctggcgcag tataaggctc 1141 acctggcagt cgtggaggag ttcgcgccca agcagctgtc tgcagaagag gtcaaggcgc 1201 tcctcactga aaaatacgcg gaagtcattg catccaagaa ccgcggcctc atcatgaaga 1261 ccgtcatggc cgacctcaag ggcaaggccg acggcaaggt catctccgcc gtcgtgggcg 1321 agctgtgcaa ataagggtgt gacccatgga attcgtgttt ccctgcgagc gggttctgga 1381 ctcctaccgc gaagcctacg cggaagacat tgcggtaaac aaaggtgaac tgcagatgct 1441 gatccatccg gacatcgcca tcgcccgctc agaatcagaa cgcagcggcg aaaatctgcc 1501 cgcaggctac gtgccggcca cgacgctgtg gctcgtggat ggagaccgct ttatcggcag 1561 ggtcaacatc cggcaccggc tca // LOCUS sequence312 1577 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence312 VERSION sequence312 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1577 /mol_type="genomic DNA" /organism="" /note="sequence312" CDS 217..1191 /product="D-2-hydroxyacid dehydrogenase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_010906252.1" /transl_table=11 /codon_start=1 /translation="MYNVLCVLPVNEEEKEMLKAAGGGQCEYCWSTQEGVTREELEWAD VLIGCVDTDKLVDLPKMKFVQLDSAGSDGYAKLKMFHEPQSCLLSNSTGAYGGTIAEYM IGSIIMLIRHFQVYRDHMKEHKWQRVELPTCITEHHALVIGLGDIGVNFAERMKALGCS VSAVRRTVGEKPDCVDEVGTLEDLPRLLPEADFVALCLPNSPATQKVINKETLAMMKPG AILVHVGRGTAVDSDALAEALNSGHLGGAALDVTDPEPLPADHPLWDCRNCLVTPHVAG LFRQLYPFRRIVERSVTNLGHFVKSEPLESVVDLATGYRVSRS" /locus_tag="LOCUS_7360" /note="WP_010906252.1 D-2-hydroxyacid dehydrogenase (Lactococcus) [pid:37.8%, q_cov:90.7%, s_cov:89.8%, Eval:9.3e-53]" /note="MGA_1154" ORIGIN 1 aacagccgcc cagagtacga ggatgaggac ctgccaccaa tatctatgct gatgtcgcaa 61 aggcgattcc tcctcgtgtg cgtgtgcaca gacagttatt atatcataaa gtctgcagaa 121 tatgcaattt taaggggttg atggcagttt acggcctatg atataatcat aatacataat 181 ctagatatac acaaattctg caaaaaggag atcgtcatgt acaacgtatt gtgtgtgctt 241 cctgtcaacg aagaagaaaa agaaatgctc aaggcagccg gcggcggcca gtgcgaatac 301 tgctggtcca cccaggaggg tgtgacccgc gaagaactgg aatgggccga cgtgctgatc 361 ggctgcgtgg ataccgacaa gctggtggat cttccgaaga tgaagttcgt gcagctggat 421 tccgccggtt ccgacggcta tgcgaagctg aaaatgttcc atgaacccca gagctgtctg 481 ctgtccaact ccacgggcgc ttacggcggc accatcgcgg aatacatgat cggttcgatc 541 atcatgctca tccggcactt ccaggtatac cgcgaccaca tgaaggaaca taaatggcag 601 cgggtggaac tgcccacctg catcaccgag caccatgcgc tggtcatcgg cctgggcgat 661 atcggggtca acttcgcaga gcggatgaaa gccctgggct gcagcgtttc cgccgtccgc 721 agaacagttg gcgaaaagcc ggactgcgtg gacgaggtcg gtacgctgga ggacctgccc 781 cggctgctgc ccgaagcgga tttcgtagcc ctgtgcctgc ccaattctcc ggcgacccag 841 aaggtcatca acaaagagac gctggccatg atgaagcccg gcgccatcct cgtacacgtg 901 ggccgcggca ccgctgtgga ctccgatgcc ctggcggaag cgttgaattc cggccatctg 961 ggtggtgcag cgctggacgt taccgatccg gaaccgctgc cggcggatca tcccctgtgg 1021 gattgccgca actgcctggt cacgcctcac gtggcagggc tgttccgtca gctgtatccc 1081 ttccgccgca tcgtggagcg gtccgtcacc aatctgggcc acttcgtaaa gagcgaaccc 1141 ctggagagcg tcgtggacct tgccaccggc taccgggtga gcagatcgta acggcataaa 1201 gagaagatta aaagaagcgc aggcatcgca gcctgcgctt ttctcgtata cgctttttac 1261 agatagatct cgccttccgc caggatggct gccacgccgc ccacgcggat ctttacagat 1321 ccgtcttcca gaatgcttaa acggctggag atcttggagg gtctgtccat ggcctcgccc 1381 tggataaaca ggttgtcggc ttccggcttt acgatgccgc gcttgtagag ataataggtg 1441 agcgcgccgt tggaagtgcc ggtggccgct tcttcgtcga tgtcgtacag cggcgcgaag 1501 ttgcggcagt ggacgccgtc ggactcggac agcgtaaagg catgcacgcc cgttacgtta 1561 taggcggcgg acagatc // LOCUS sequence313 1573 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence313 VERSION sequence313 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1573 /mol_type="genomic DNA" /organism="" /note="sequence313" misc_feature complement(830..>1573) /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011861408.1:tRNA (adenosine(37)-N6)-dimethylallyltransferase MiaA" /note="WP_011861408.1 tRNA (adenosine(37)-N6)-dimethylallyltransferase MiaA (Clostridioides difficile) [pid:37.1%, q_cov:98.8%, s_cov:77.2%, Eval:3.7e-42]" /note="MGA_1157" /locus_tag="LOCUS_7370" ORIGIN 1 agaagcagcg cgtccttatt ctcctcggac agcgtgtcgt ccggcgccct ctccagggtc 61 acatattcgt tataggcctc ggtgatggtg ttgttgatgg gcatcaccga ttccttgccc 121 cgcttgcggt agatcttgaa ttcgccgcgc tcgaagttga aggaactcag gttgagctgc 181 tgcatctccg aaagacgcag gccgtaggtg accagcagca ggagcatcag cttgtcgcgg 241 tacttcgtcc tctcccagaa cttcttttcc ctgtccgtca ggccctctcc cgagaccacc 301 gcatccagca tgcgcatcac ttcgtcgtcc tgcagcgcct tgatgacccg ttcgccgggc 361 ttgggcagcc ggatgggatc gaagccgtcg gtgatgttct tctctaccag accgtcgcgg 421 tacaggtact tgaagaacac ggagaccgca gattttttat gggccagggc cgcattgccg 481 ttctcgtaga ctgtcacgtt gcccttctca tcctcgactt tgtagcgccg gcagtaatcg 541 ataaagagat tcacgtccat ggacgtgatc ttattgagat cgccgggctg gatcttcttc 601 atttccgtgc acgtctcctg cagttccgtt tccttcagca gatagtgcag gaaaaaccgc 661 agctcccgca ggtacgaaag ccgcgacatg ggaagaacgc cgttgcgcag atacatgaag 721 tagccccgca tccagccagg cagctccctt tcgatcttct cgcattcctc gaatatttcg 781 ttttcccggg ccaccacgtt atcgggcttg tctgacttgt tgtggaccct tatcttccgt 841 tcttcagcca tgttgctatc gtttctttca tgcggctgta cgcctcttcg tcgaaggcgt 901 ctccctgcag cgtgacccag tgcatctgcg gataacgccg cagccagatg agctggcgtc 961 tggcatagtg ccgggtgttt ttgcggatga gttccgcagc ttcttcgatg ggacggcctt 1021 cggaaaggca gtcgatcact tctttatacc cgatgccctt catggcgatg tctttgctcg 1081 taaagccctt cgccatcagg ctgcggacct cgtccttcag ccatgcctcc aggatcttgt 1141 ccaccctgcg gtcgatacgg tcgtacaact cgctgcggtc ccggtctaag ccaattaaga 1201 ggctgtcgta gtccgggtac ggagtctcga tgtcggtgaa cgccgccagt ttcgcttcgc 1261 cgtgctccag gcgttcgatg gcccgcagca tgcgcttgac gttgttggga tggatggctt 1321 cggcggcatc cggatccagg gaacgcaggc gttcgtggac tttctgcggg tcctccccgc 1381 attcctgcca gacccgctgc cggaaaccgt catctccctt aggcgccgaa aagtccatgt 1441 cgtacaacag cgcgttgata tacagccccg tgccgccgct tacgatgggc agtttgccgc 1501 gcgctgcgat ctccgcgata taggagcggg ccagtttctg atagtccgag acgttgaaag 1561 gcgtcttcgg atc // LOCUS sequence314 1564 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence314 VERSION sequence314 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1564 /mol_type="genomic DNA" /organism="" /note="sequence314" CDS complement(259..1206) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MAKEMPVYLFTGFLEAGKTQFIQTTLEDPNFNAGEKTLVIQCEEG IEEFRHERFWEDNVVVEVLDEPEQINNAFLKSLEKKHKPERVMIEYNGMWMLDQLFQEM PENWIIYQEYSFYDANTFLTYNQNMRQLVYDKLKSADCVVFNRYREGMDRMPLHKVVRG VSRRPDIFYELPSGDAIVDDIEDPLPFDKEAPVIEIKDEDFALWYRDLSEDMNGYDGKT VRVKGITGASGVLEGSDFIFGRQVMTCCVEDIQMAGLVCEWHGVKPAKRSWVIVTAKIR IGKSRAYGSKTGPILVVQKVEGAEPPEQEVATFY" /locus_tag="LOCUS_7380" /note="WP_005815046.1 permease (Desulfitobacterium hafniense) [pid:37.4%, q_cov:30.5%, s_cov:18.5%, Eval:5.7e-07, partial hit]" /note="MGA_1159" CDS complement(1208..1480) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MFTSWGETTAARFTVAEIEEKLKELDDTWTYGFVLRAKGIVQDKE EGWIHFDYTPGEINVRKGPAAATGMLCVIGAQMKEDEVKHLFGVA" /locus_tag="LOCUS_7390" /note="MGA_1160" ORIGIN 1 atgatagcct ggatgaagtt gccgtaggtg agctgcgcgc tgcccacggt gaccgccagt 61 tcgctgaagc tgacgccgcc catcagcatg ccgatgatcg gggtgatgat gtcagcgacc 121 agagatccga cgatcgcggt gaacgcgccg ccgatgataa tgcctacggc catgtccatg 181 acgttgccgc gggagatgaa ttccttaaat tccttcatca tagtagtttt cctcctttct 241 tgattgaact tataaaaact aataaaacgt tgctacttcc tgttcgggag gctccgcccc 301 ctcgactttc tgcaccacca ggatgggtcc ggtcttgctg ccgtaagccc tgctcttgcc 361 gatgcggatc ttcgcggtca cgatgaccca ggagcgcttc gcgggcttta ccccgtgcca 421 ttcgcacacg agcccggcca tctggatgtc ctcgacgcag caggtcatca cctgccggcc 481 gaagatgaaa tcgcttccct cgagcacgcc ggacgcgccg gtgatgccct tgacccgcac 541 ggtcttgccg tcgtagccgt tcatatcttc cgacagatcg cggtaccaca gcgcgaagtc 601 ctcgtccttg atctcgatga cgggtgcctc cttatcgaag ggcagcgggt cttcgatatc 661 gtccacgatg gcgtcgccgg agggcagttc gtagaagatg tccggccggc gggacacgcc 721 ccgcacgacc ttgtgcagcg gcatgcggtc catgccttcc cggtagcggt tgaacacgac 781 gcagtccgcg ctcttcagct tgtcgtagac cagctggcgc atgttctgat tgtacgtcag 841 gaacgtgttc gcgtcgtaaa aactgtattc ctggtaaatg atccagttct cgggcatctc 901 ctggaacagc tggtccagca tccacatgcc gttgtactcg atcatgaccc gctctggctt 961 gtgctttttc tcgagggact tcaggaacgc gttgttgatc tgttccggtt cgtccagcac 1021 ttcgaccacg acgttatctt cccagaaacg ctcgtggcgg aactcctcga tcccttcttc 1081 acactgaatg acgagggtct tctcccccgc gttgaaattc gggtcttcca gggtcgtctg 1141 tataaactgt gtcttacctg cttccagaaa accagtaaac aggtagacgg gcatttcctt 1201 ggccatatta cgcaactccg aacaggtgct tgacttcgtc ttccttcatc tgggcgccga 1261 tgacgcacag catgccggta gcggctgcag ggcccttgcg gacgttgatc tcgcccggcg 1321 tgtagtcgaa gtggatccag ccctcttcct tatcctgcac gatacccttg gctctgagta 1381 cgaagccgta ggtccaggtg tcgtccagtt ccttgagttt ttcttcgatc tctgcgacgg 1441 tgaaccgggc agcggtcgtc tcgccccagc tggtgaacac ctcgtccgcg tcgtgctcgc 1501 cgtcgtgatg atgatgatgg tggtgatgat gtccgtgctc atcgtggtcg tgatgatgat 1561 ggtg // LOCUS sequence315 1562 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence315 VERSION sequence315 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1562 /mol_type="genomic DNA" /organism="" /note="sequence315" misc_feature <1..635 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_011203082.1:SpoIIE family protein phosphatase" /note="WP_011203082.1 SpoIIE family protein phosphatase (Bacteroides fragilis) [pid:38.6%, q_cov:94.3%, s_cov:51.4%, Eval:1.6e-29, partial hit]" /note="MGA_1161" /locus_tag="LOCUS_7400" CDS 619..1476 /product="carbon-nitrogen hydrolase" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_015909400.1" /transl_table=11 /codon_start=1 /translation="MNRKVNVSCVQMQPHAADYEYNLKKMEGFVESVMRSRPETDLIVF PELATTGYVCTNDEFEAMTRTAAEDPSVKRMGALAAKYGVMLIYGFSERDPDDPSILYN AAAILGKDGTLMGTYRKVHPFLNEKKWCTAGSEYPVFDTDFGRIGVMICWDTAFPEVAR TYALKGCDLLVVCTNWEITEAEDWPMDTAADWDLVTRARAFDNTLHLVSANRVGSDRGL GFFGHSNIIDPVGKVLESLDEPVEGDIHAELDLSLTEKRRREYYTILADRRPDTYGTLT EPID" /locus_tag="LOCUS_7410" /note="WP_015909400.1 carbon-nitrogen hydrolase (Chloroflexus aurantiacus) [pid:32.3%, q_cov:97.9%, s_cov:96.6%, Eval:2.2e-31]" /note="MGA_1162" ORIGIN 1 gagatttcta cgacgtgttc ttcgtggatc aggaccgcat cgcatttctg atcgcggacg 61 tctccggcaa aggcattccc gctgcgctgt tcatggcaag cgcgaagatc acgctgcaga 121 actgcatccg ggacttttcg gatctggcgg aagcagtgga aaaagccaac gacagcctct 181 gcgccaacaa cgaggcggag ttgttcgtca ctgcctggat cggcattctg gacattcctt 241 ccggacgggt ggagtacgtc tgtgcgggtc acaatccgcc ggtgctcatc gcgcgggaag 301 gcgcccgttt tatccgggac cgcggcggtt tcgtgctggg cggcatggaa ggtacgccct 361 accggcagca ttcgctgcag ctgcagccgg gcgacagcat ctatctgtac accgacggcg 421 taacggaagc catgaacaca gttcgcgagc tctacggcga gggccgtctg caggaatgcc 481 tcaaatggct gcacaacgta gatccccaga ccgtgctgga ccgggtgcac tacgacgtgg 541 cgcaacatgt aaaaagggcg gaacagttcg acgacatcac gatgctctgc ttaagatggg 601 atggaaagga agtttccggt gaacaggaaa gttaacgtct cctgcgtgca gatgcagccg 661 cacgcagcgg actacgaata caatttgaag aagatggagg gattcgtcga atccgtcatg 721 cgcagccgtc cggagacgga tctcatcgtg tttccggaac tggcgacgac aggctatgtc 781 tgcaccaacg acgaattcga ggcgatgacc cgcacagcgg cggaagatcc gtccgtaaaa 841 cggatgggcg ccctggccgc gaagtatggc gttatgctga tctacggctt ttcggagcgc 901 gacccggacg atccgtctat cctctacaac gctgcagcga tcctgggcaa agacggcacc 961 ctgatgggca cctaccgcaa ggtgcatccc ttcctgaacg agaaaaaatg gtgcaccgcg 1021 ggcagcgaat atcccgtttt cgatacggac ttcggccgca tcggcgtcat gatctgctgg 1081 gatacggcgt ttccggaagt cgcccgcacc tatgcgctca aaggctgcga ccttctcgtc 1141 gtgtgcacga actgggagat cacggaagcg gaggactggc ccatggatac ggcggccgac 1201 tgggatctcg tgacccgcgc cagagccttc gacaacacgc tgcatctggt ctccgccaac 1261 cgggtaggca gcgacagagg gctgggattc ttcggtcaca gcaacatcat cgatcccgtg 1321 ggaaaggtcc tcgaaagcct ggacgagcct gtggaagggg acatccacgc ggaactggat 1381 ctctctctga cggagaagcg ccgccgcgaa tactacacga tcctggcgga ccggcggccg 1441 gatacctacg ggacgctcac ggaacccatc gattaaaatt tttgataatt tccataaaaa 1501 taatcagtcg tttgattgaa aacggctgat tttttatata aactggaagg aggaggagac 1561 ac // LOCUS sequence316 1547 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence316 VERSION sequence316 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1547 /mol_type="genomic DNA" /organism="" /note="sequence316" CDS 114..590 /product="transcription elongation factor GreA" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /inference="similar to AA sequence:RefSeq:WP_003422204.1" /transl_table=11 /codon_start=1 /translation="MSEEILLTKEGYDKIVEEHEYLTSVRRIEVSEHLKEAKSYGDLSE NAEYDAAKNEQAELEDRIQKLETMMRKGKIVSEEELTGDHVNLGLGVRVKDMKSKEEFT YTIVGITEADPFEDKISNESPVGKALLGRKKGETVEIQTENGVLNYKILEIIKG" /locus_tag="LOCUS_7420" /gene="greA" /note="WP_003422204.1 transcription elongation factor GreA (Clostridioides difficile) [pid:58.4%, q_cov:97.5%, s_cov:96.9%, Eval:5.1e-43]" /note="MGA_1164" ORIGIN 1 aaggcgccgc ggcgctgcgc aggcaggcca gcgaagccga gagtctggac gaaatgttta 61 cgatattaga gggtctcaaa aatctggccc tgtaaaatat aaggagaagg aaaatgagtg 121 aagaaatctt acttaccaag gaaggctacg acaagatcgt agaagagcat gaatatctga 181 catccgtaag aaggatcgaa gtctctgaac acctgaagga agccaaatcc tacggcgacc 241 tttccgaaaa cgccgaatac gacgccgcca agaacgagca ggcagagctg gaagaccgga 301 tccagaagct ggagaccatg atgcgcaagg gcaagatcgt ctccgaagag gaacttacgg 361 gcgaccacgt caacctgggg ctgggcgtgc gcgtaaagga tatgaagtcc aaggaagaat 421 tcacatacac catcgtaggc atcaccgagg cggatccctt cgaggacaag atctccaacg 481 aatctcccgt cggcaaggcc ctgctgggcc gcaaaaaggg agagaccgtc gaaattcaga 541 cggaaaacgg agttctgaac tataagatct tggaaattat caagggatag gaagaaaaaa 601 tgagcgaaga aagaatcaac agccagcagg ctccccaggc ggaactcacc gaagagcagg 661 cagcccgcga actcagcgag cagtgcctca tccgcagaga aaagctggcc gcactccagg 721 cagagggcag agatcccttc ctgcagaccc gcttcgaccg caccagcaac gccacccaga 781 tcaaggcgaa cttcgaggag ctggaagggt caacgcagcg gctcgccggc cgcctcatga 841 gcaagcgcgg catgggcaag gcctccttct gcgacctgca ggaccaggac ggccgcatcc 901 agatctatgt ccaggtagac gatctgggaa aggaagaata cgaccggttt aagaagctgg 961 acatcggcga tatcatcggc tgcgagggcg aagtgttccg caccaagcgc ggcgagatct 1021 ccctgcacgt caagagctac gtgctgctgt ccaagtccat ccgtccgctg cccgacaagt 1081 ggagcggcct caaggacatg gatacccgct accgccagcg ctacgtggac ctcatcgtca 1141 atccggaagt ccgggagacc tttaagaaga gagccctcat ttaccgcgcc atccgccggt 1201 acttcgacga cctgggctac atcgaatgcg agacgcctat cctgaatacg gtgcagggcg 1261 gcgctaccgc gcgtcccttc gtgacccatc acaacgccct gaacatcgat ctgtacctgc 1321 gcatcgccac cgagctgcac ttaaagcgat gcatcgtcgg cggattcgac cgggtctacg 1381 acatgggccg catcttccgc aacgaaggca tggatacccg ccacaacccg gaattcacga 1441 ccatcgagtt ctacgaagcc tacacgaaca tcgaaggcat gatggaacgc acggaaggcg 1501 tcatcaagta cgtcaaccag atcgtcaacg gcaaggataa gatcccc // LOCUS sequence317 1546 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence317 VERSION sequence317 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1546 /mol_type="genomic DNA" /organism="" /note="sequence317" CDS 267..731 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKDIMLKITGKTVTQDEGSEKHENIMEFVTAGQLYRRGTTTFIRY PESELSGLEGCTTSLIITKDKVKMRRTGQALAADTEMEFKKGERFYGMYETPYGPIGME LLTNDVTGLQDVGEGKQALSIDYHISLRGFMEARNKLDIEITHPKEGVAQ" /locus_tag="LOCUS_7430" /note="MGA_1167" ORIGIN 1 cggcgccagc cagctgctca tccccgctcc catcagcgaa gagcaggaag cgcaggtgct 61 ggacatggcc aaaagggcgt ataaggcctg cggctgctgc agttttgcca gggtggattt 121 cctgatggac aagaacaccg gggagatcta catcaacgag atcaatgcca tcccgggctt 181 tacgaagacc agcatgttcc ccatgctgat gcaggcggca ggcataaagt attcggagat 241 catcgaccgg atcgtggagt tgggttatga aagatatcat gctgaaaatc accggtaaga 301 cggtaacaca ggacgaaggc agcgaaaagc acgaaaacat catggaattc gttacggcag 361 gccagctgta ccgccggggt acgacgacgt tcatcaggta cccggagagc gagctgtccg 421 ggctggaagg ctgcaccacg tctctcatca ttacgaagga caaggtcaag atgcgccgca 481 ccgggcaggc tctcgccgcg gacacggaga tggagttcaa aaaaggcgag cgcttctacg 541 gcatgtacga aacgccctac ggccccatcg gcatggaact gctcaccaac gacgtaacgg 601 gtctgcagga cgtgggcgag ggcaagcagg cgctgtccat cgattatcac atcagcctcc 661 gggggtttat ggaggcgaga aataaactgg atatagagat cacacatcca aaggaagggg 721 tagcacagtg aacagaaaac agcagaggaa ccggactgcg gcgcgcatcc tggcgatcat 781 cgtcgccctg tcgatgatcc tgatgtcggg cttttatctc attacggcct ttacggcagg 841 ggggacgtct ttcttcgtct acgcggcgga aagccaggag accatcgaca agaatctcag 901 caagctggac atgctgcgcg acgtggtgaa gtacatcgac gagcactacg cggacgacgt 961 aaacgtggaa gatcttacgg atgctgctta caacggcgtg ttcgaggccc tcgacaagtg 1021 gtccgtgttc tacaagacgc aggaagagaa ggatgcgttc gtaagccagg tgacgggcaa 1081 ctacgccggt atcggggtca ccatgaccct ggacggcagc ggacggtgcg tcatcaccca 1141 ggtgaacacg ctgggtcccg cttacgaagc gggcgttaaa gccggcatga tcatcgtgtc 1201 ggtggacggc aaggcggcgc aggggcttac gctggaggag atctccggcc tggtccgggg 1261 cgaaccgggt acgaaaaccg agcttcagct cgagctcgag ggcgagaccc tcaccaagag 1321 catcgagcgc aggagcatca aggcccagac cgttacctac gagatgctgg acggcaagac 1381 cggctatatc gccatctccc agttctccgg cgagagctgg aaggaattcc gcatcgcaaa 1441 gctcaacctg atctccgaag gcatggagaa gctcatcgta gacctgcgcg acaacggcgg 1501 cggcgtgctg ggcgatgccc tgatcgttgc cggcatgctc gttccc // LOCUS sequence318 1539 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence318 VERSION sequence318 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1539 /mol_type="genomic DNA" /organism="" /note="sequence318" ORIGIN 1 agcgggcagg tgaagccttc cggcagttct tccccttcgt aaacatatcc gcagatcttg 61 cagacccact tggtcttggg cgcttcgggg ctgcagggcg tatcgccgca gccgcagtcc 121 gcttcgctgt agcttgccgc cagctcttct gccagcgcca tcagctgtgc ggtgctggtc 181 tcgttgagcg cggacaggat cgtgacgttg ttctcggtgt aggagatatt cttcaggccc 241 tccagtttgc tcttcatcac cttcatggcc atgggagccc aggagccgtt ttcgataaag 301 ccgatggtgc gcttctgata gcctctctcc accagcatgt tgatgaactc gcgcatgtag 361 gggaagatct ccgcattgta ggtcgtggtg gccagcacca gcttgtcgta gcggaaggcg 421 tcctctacgc attcgtacat gtcgtctctg gccagatccg cgatggccac cttgggcacg 481 ccgcgcttct ccagttcttc cgccagcatc tcggctgcct tcttggtgtg accataaaca 541 gacgtataca tgatggcaac gcccttgttc tccggttcat aggcggacca ggtgttgtac 601 aggtcgagat agaagcccag atcctcgttc agaacggggc cgtgcagcgg cgcgatcacc 661 tggatgtcca gagcagcagc cttcttcagg accgcctgca cctgagcgcc gtacttgccg 721 acgatgccga agtagtagcg gcgggcttcg caggcccagc cttccggatc ttccacgtcg 781 ttggcgccga acttgccgaa gccgtccgcg gagaacagca ccttatcgca ggcgtcgtag 841 gtcatcatga cttccggcca gtgcaccatg ggagcaaaga cgaaggtgag ttcgtgcttg 901 cccagggaaa gcgtatcgcc gttcttgact tccagcttat tggcgatctc caggcccggg 961 aagaactggg agatcatctt gaaggtctta ttgttgccga cgaccgtggt ctcgggatac 1021 ttctgcagga atgcttcgat ggaagcggag tgatccggct ccatgtgctg aacgatcaga 1081 taatctggtg ccttggcggc cttggcttcc acattgccca accattcttc cgtcttgctc 1141 tggtcgatgg tgtccatcac cgcgaccttt tcgtcgttga tgacgtagga attataggcc 1201 atgcccaggg gcacgtcgaa gtgaccctcg aacagatcga tgtcgtggtc attcgcgccg 1261 atgtacagga tgtctttgga aactgctgta ttattcataa atctacctct cttttccggg 1321 tgaaacgata caatctctaa cttatttatc atatcacgaa gaccgctttt ttcccacaga 1381 aaaagagcag ccaaaaggag ctgctcttaa gaattcctgt tcatttacgg ccgcagcacc 1441 cgttcttccg tcacgatgca gggcaccggc acgtcccagg gctccgccgg gaccgcttcg 1501 cagccctggc attcgtaggc caccagcatc acgtccgca // LOCUS sequence319 1518 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence319 VERSION sequence319 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1518 /mol_type="genomic DNA" /organism="" /note="sequence319" misc_feature <1..899 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_012048077.1:coproporphyrinogen III oxidase" /note="WP_012048077.1 coproporphyrinogen III oxidase (Clostridium botulinum) [pid:41.3%, q_cov:97.0%, s_cov:61.6%, Eval:5.9e-59, partial hit]" /note="MGA_1171" /locus_tag="LOCUS_7440" ORIGIN 1 cgagcaacca gatttccaaa gaagcagcga cggactatct gcaggcgctg tttacggaga 61 tggatgcggt caaagatctg atgacccgaa gaggccagac ggcggaatcc atctacatcg 121 gaggcggaac gcccaccagc ctggatccgg aagacctgaa agctttcctg aataaagtgc 181 acgagctgtt cgtggacgaa aacaccgtgg aattcacggt ggagggcgga agaccggaga 241 ccattacggc ggaacagctg cagatcatca aagacgcagg cgccggacgc atctccatca 301 acccgcagtc catgaagcag cgcacgctgg atctcatcgg acgaaggcac agtccggagc 361 agatccggga agccttcgcc ctggccgagg aggcgcagat ccccgtggtc aacgccgacc 421 tcattacggg gctcccagag gaagaaccgg aggatttccg cagcagtctg gcggaggtca 481 tcggcctggg acccgccaac atcacggtcc ataccctggc tgtgaagaaa gccagccgca 541 tgatcgaaga agatcccggc gtcgcgagac gacaggcgga caacgtgcgg cagatgctgg 601 acgatgcgga ccgcatgctg acggaagcgg ggtacgaacc ctattacatg taccgccaga 661 agcatatggc gggcaacttc gaaaacgtgg gctggtgcct gcccggcacg gaaagccttt 721 acaatatccg catcatggag gaggatcaga cgatcgtcgc catgggcgca ggtgccatct 781 ccaaggtcta tttcccggag gaaaaccgcc tggagagggt gccgaacgta tcgaattatc 841 agatctatat cgaacgcatc gaagaaatga tagcgagaaa ggaagccgga ctcttatgat 901 cataaacata ccaaagggaa cgaaggacat cctgccttcc gaatcctaca aatggcagtg 961 gctggagagc cgcatccgcg aaacggcagc gcgctacgga tttaaggaga tccgcacgcc 1021 gatgttcgag catacggagc tgttcgccag aggcatcggc gatacgacgg acgtggtcca 1081 gaaagagatg tacacgttcg agatcgcgga gagaagcctt accttaaagc ccgagggcac 1141 cgcaggcgtc gtccgttcct atatcgagaa caaactgtac gcagaaccgc agcccggcaa 1201 gtacttctac atcatcccgt gcttccgcta tgagaagatg cagaagggca gacagcgcca 1261 gttccatcag ttcggcatcg agatcttcgg cagcgagaac atgatggcgg atgccgaggt 1321 catcggcctg gcctgggact tcctcaccgg cctgggcatt acggacctca agctgcacat 1381 caacagcatc ggctgcccga actgccgcgg cgaataccgc aaggctctgc aggacttcct 1441 gcggccccac tacgacgagc tgtccgagac cagcaagggc cgcttcgaga agaaccccat 1501 gcgcatcctg gattccaa // LOCUS sequence320 1517 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence320 VERSION sequence320 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1517 /mol_type="genomic DNA" /organism="" /note="sequence320" CDS complement(711..1376) /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MTKGDMLHEIQHLLGGRVAEALVMGDISTGASNDLERATKIAHDM VAKYGMSETIGPLNYSSADEVFLGRDFTSKQNFSEELASKIDKEVHDIMTTAYAETEKI LLEHREELHRVAEALLEMETLDADQFEALYTNTSTVEELENIQKEADAARAEKERLEAE KKAFLEAEEKRRVEEQMREAMEKGKRVAVMDEKGNIIIRDASEVRKAREEAQKKGRDE" /locus_tag="LOCUS_7450" /note="WP_021373798.1 ATP-dependent zinc metalloprotease FtsH (Clostridioides difficile) [pid:41.7%, q_cov:98.6%, s_cov:28.7%, Eval:1.9e-36, partial hit]" /note="internal stop codon at [1389:1391](-)" /note="MGA_1174" ORIGIN 1 cagcagggac atgcgcttgg cgaaggcttt ccactcagtt tcgacgtatt ccttcgtctg 61 ggaggatttg aggatgaggc cggcgatctc gccttccgtt accatcttca gggtgcggat 121 gttgaactcg ttctcgaagg aagcgagttc cttcagaccg ccttccttct tgacgccggg 181 ggtatagaac acgccccaga actcttcctg ggacagatcc agctcctgca tcagggaata 241 ggccaggccg cggttgcctc tgcgcagcgc gcggatgaat tccgctaccg ggtcacgctc 301 cggggcaaaa ttccacatgc ccatcgccag ctcgatgatc tccgctaatt tgaagatatc 361 gtcctggctg tagttatcgt cgttgtccac cagcagcagg tagtatttct cgcctgctac 421 cgtaacgggt ccccagtagg tcgtaagacc ttccagctgc agcttcgtgg attttctctc 481 ctcgatgttg aggcccatct ccgtgctctt gcgcacggct tcctcgatgg tgatgttgtg 541 gcgggtctcc acggagaaca gggcgttgaa gtcggaggag aacagcacga tctggaaggc 601 gttgctgagc gcggcctccc gggctgccat gggaaagctg ctgtactttt cgaagttcag 661 cagatggtag atgctgttgg tgatcagact gttggagaaa gtctcagcca ttattcgtct 721 ctgcctttct tttgggcttc ctcccgcgcc ttacgcactt cggaagcgtc ccggataatg 781 atgtttccct tttcatccat gacagcaacg cgtttgccct tttccatggc ttcgcgcatc 841 tgttcttcca cgcggcgttt ctcttccgcc tctaaaaatg ccttcttttc tgcctccaga 901 cgttcctttt ccgctctcgc agcatccgct tccttctgga tgttctccag ctcttccacg 961 gtgctggtat tggtatacag cgcttcgaac tgatcggcgt ccaaagtctc catctccagc 1021 agagcttccg ctacgcggtg cagctcttct ctgtgctcca gcaggatctt ttcggtctct 1081 gcgtaagccg tcgtcatgat gtcgtgaact tccttgtcga tcttggaagc caattcttcg 1141 gagaagttct gcttggacgt aaagtctctg cccaggaata cttcgtcggc gctgctgtag 1201 ttcagcggtc cgatggtctc gctcatgccg tatttcgcga ccatgtcgtg ggcgatcttc 1261 gtagcccgct ccaggtcgtt gctggcgccg gtggagatgt cgcccatgac gagcgcttcc 1321 gccacgcgtc cgcccagcag gtgctggatc tcgtggagca tgtcgccctt ggtcatgtag 1381 tatttatctt actcgggcag ctgcatcgta aatccgcctg ctctgccgcg gggcatgatg 1441 gtcacctgat ggacagggtc ggcgccgggg gtcgatatca tgacgacggc gtgtccggct 1501 tcgtggaagg cggtgag // LOCUS sequence321 1512 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence321 VERSION sequence321 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1512 /mol_type="genomic DNA" /organism="" /note="sequence321" CDS 2..868 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MDEKLQNSLDERLARSFAQVRGSLDQVYRGLGEMQGLAQDVGDLR KLMTNVKSRGVIGELQLGSILEQILAPGQYETNAQVKPNTQERVEYAVKMPGNGGGSVY LPIDSKFPGDIYGALQDAYDNADSAYAEVQRKRLAQFIKLSAKEIRDKYVEPPYTTDFA VMFLPFEGLYAEVVNLELMEICQRDYKIMIAGPSTLAALLNSLQMGFRTLAIQKRSTEV WGVLGQVKGEFDKFADVLASAQQRINQANAELDKLIGVRTRSIQKTLSGMQKLSDPDEE EQGRWLP" /locus_tag="LOCUS_7460" /note="WP_008765517.1 DNA recombination protein RmuC (Bacteroides) [pid:52.2%, q_cov:100.0%, s_cov:70.4%, Eval:1.5e-80, partial hit]" /note="MGA_1176" ORIGIN 1 cgtggacgaa aaactgcaga attctctgga cgagcggctg gcccgctcct ttgcccaggt 61 gcggggcagc ctggatcagg tgtaccgggg cctcggcgag atgcagggcc tggcgcagga 121 cgtgggcgat ctccgaaaac tcatgaccaa cgtcaagagc cgcggcgtca tcggcgagct 181 gcagctggga tccatcctgg agcagatcct ggcgccgggt cagtacgaga ccaacgccca 241 ggtaaagccg aacacccagg aaagggtgga atatgccgtc aagatgcccg gaaacggcgg 301 cggcagcgtt tatctgccca tcgattccaa attcccaggc gacatctacg gcgcgctgca 361 ggacgcgtac gacaacgcgg acagcgccta tgcggaagta cagagaaaac ggctggcgca 421 gttcatcaaa ctgtccgcga aggagatccg cgacaaatat gtcgagcctc cttacacgac 481 ggattttgcc gtcatgttcc tgccgttcga agggctgtat gcggaagtcg tcaatctgga 541 actgatggag atctgccaac gggattataa gatcatgatc gcagggccct ccacgctggc 601 ggcgctgctc aacagcctgc agatgggttt ccggaccctg gcgatccaga agcgctccac 661 ggaagtctgg ggcgttttag ggcaggtaaa gggcgagttc gataagttcg cggacgtgct 721 ggcttccgcg cagcagcgga tcaaccaggc caacgccgag ctggataagc tgatcggcgt 781 gcgcacccgc agcatccaga agaccctgtc cggcatgcag aaactcagcg atccggacga 841 agaagagcaa ggcaggtggc tgccatgaac gtatgggcca tcggcgacct gcatctgtcg 901 cttgaccccc gcatcgaaaa gcccatggac atcttcggcg gcagctgggt gggtcacgat 961 aagaaactga aggagatctg gctgcgcatg gtggagccgg aagacctggt cgttctcgcg 1021 ggcgacatct cctgggcgct gcgcctggag gaagcgctgg aagatctgaa gtggatcgat 1081 gcgctgcccg gcacgaaact cattttaaag ggcaatcacg atctgtggtg gtccggcatc 1141 tcgaaggtga agaacgcctg caaggacatg ccgacgctgc gctttctgca gcacgacgcc 1201 ttcgtctggg gccgctgcat cgtcttcggt tcccggggct ggacctgtcc cggcgccaag 1261 gattaccacg aggaagaaga cggtgccatc taccgcaggg aggtgctgcg gctggagatg 1321 agcgcaaagg aagccgcgag gctggcggag ggcgtggatg acccttgcat cgtcggcgtc 1381 atgcattatc cgcccatgaa cgagaagttc gagccaaacg gatttacgca gatcctggag 1441 cagagcggtg caaagcaagt cgtttacggc catctccacg gccagaacgc tttcaagaac 1501 ggtccgcagg gc // LOCUS sequence322 1507 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence322 VERSION sequence322 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1507 /mol_type="genomic DNA" /organism="" /note="sequence322" CDS 264..989 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MKELLNEKLKAYRELGPVLPEARKWLEDSNLWMLLYTVLCQRGVR VEKKTLVDILSGRIMEDVNIDLYGFCFRLRDVYKDMISSVEMQATLNTKMLDGWYEDLL EPEGPVHRRDNAVVYDIGFIPCHYSEISERMDHLFRAMDSVSDGALKAAELQMGIINIY AYGQDTITMALLAAAYALLQAGIPLPSYPVSEDEYRRLMSACINDGDEAPFCNMHYRSL VNRLETVIQVYREALENQE" /locus_tag="LOCUS_7470" /note="MGA_1179" ORIGIN 1 caacgacaac aacgagaccg ttatgtacgc tcctgccggc ggcttctaca agaccccggg 61 tgcaggcatc aacgagatgc gtatcgcgta catcctcaac tgcgacgacc tgagaagagc 121 catccagctc ctcggcaagg gtatcgagca gtacaacgcc agaaagtaat ttcggcgcca 181 taacagggaa acaaagagcc ggagcacaac gctccggttc tttttctgtt tttcgtcaac 241 caaaattgtg ttatcataga accatgaagg aacttctgaa cgaaaaactc aaggcttaca 301 gggaattggg acctgtcctt ccggaggcgc gcaagtggct ggaggactcc aatctctgga 361 tgctgctgta caccgtgctg tgccagcggg gcgtgcgggt ggagaagaag actctggtgg 421 acatcctgtc cggccgcatc atggaagacg tgaatatcga cctgtacggc ttctgcttcc 481 gcctgcggga cgtctataag gatatgatca gttccgtgga gatgcaggct acgctcaaca 541 cgaagatgct ggacggctgg tacgaagacc ttctggaacc ggagggaccg gtccacagaa 601 gagacaacgc cgtcgtgtac gacatcggct ttatcccctg tcattacagc gagatctcgg 661 agcggatgga tcacctgttc cgggcgatgg acagcgtttc cgacggcgcc ctgaaggctg 721 cagaacttca gatgggcatc atcaacatct acgcctacgg ccaggatacc atcaccatgg 781 cgctgctggc tgccgcctac gcgctgctgc aggcaggcat tccgcttccg tcgtatcctg 841 tgagcgagga cgaataccgc cggctgatga gcgcctgcat caacgacggc gacgaagctc 901 ccttctgcaa catgcattac cgcagcctgg taaaccgcct ggagacagtc atccaggtgt 961 accgggaggc attggagaat caggaatgaa catacaggag atcaaagaac agctcttttc 1021 ctataccgac gaggaccggg tggccgaata tgagcccatg gacctgcata ccagtttccg 1081 ctgcggaggc gcggcggatc tttttgtcac accgggaagt ctgggggaac tgatgaacgt 1141 gctggacctg gtccgcacgc agaagatccc ctatctcgtg ctgggcaacg gcagtaacgt 1201 gctgtttagg gacggcggct accacggggt ggtcatccgc atcggagagg gtatggaccg 1261 ggtgcgcatc gaggggcaga ccgtgtttgc agagcccggc gtgagcctgg caaaactcgc 1321 gaagatggta gcggaagaag gcctttccgg tctggaattc gcctgcggca tccccgggtc 1381 tctgggcggc gccgtcttca tgaacgccgg tgcgtacgat cacgaactga aggaagtgct 1441 gctgtccgtc tcttccatca accatctggg catgatgaaa gaccgcaagg cggaggactg 1501 cggactc // LOCUS sequence323 1503 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence323 VERSION sequence323 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1503 /mol_type="genomic DNA" /organism="" /note="sequence323" CDS 31..999 /product="hypothetical protein" /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /transl_table=11 /codon_start=1 /translation="MLLLGGAYFAAAETAFASVSKIRMISDADDGDPKAKKALYVLDHF DKALTTLLIGNNIMHIACSSAATLLASKLWGNRAVTACTFVTAFVVFIFAEMIPKSYAK ACCEALAPRIAPSLIFLMKVLTPVSVLFSGVSRLAARLIGAADTEEPTVTEEELFDIIE NIDEEDKIDEDAAELVQSALEFTVKTVRLALTPWEKTVKITRSMTDEEILQIITDGHFS RIPVLDDDGGVEGILHIRKFLKAKIRGRKVLKARSMLDKAFWLPLEMPIDDALDALSSN RAHMAIVHRQDGSIAGIVTVEDILEELVGEIYDEEEGGLPK" /locus_tag="LOCUS_7480" /note="WP_012869172.1 hemolysin family protein (Thermanaerovibrio acidaminovorans) [pid:30.3%, q_cov:98.1%, s_cov:73.7%, Eval:1.1e-37, partial hit]" /note="MGA_1181" ORIGIN 1 gttattccgc gatatttagt tttcatagcg ttgctgcttt tgggaggcgc gtactttgcc 61 gcggccgaga ctgcttttgc gtcggtcagc aagatacgca tgatttccga tgcggacgac 121 ggagacccta aggcgaagaa ggccctgtac gtgctggacc acttcgacaa ggctctcacg 181 acgctgctca tcggaaataa cattatgcac attgcatgct cctctgcggc aacgctttta 241 gcatccaaac tctggggaaa cagggccgtt accgcatgta cgttcgtaac ggcttttgtc 301 gtgttcatct ttgcggagat gatccccaag tcctacgcga aagcctgctg cgaagctttg 361 gcgccccgca tcgcgccgtc cctcatcttc ctgatgaagg tgctgacccc ggtcagcgtg 421 ctgttctccg gggtcagccg gctggcggcc cgcctcatcg gcgctgccga cacggaagag 481 cccaccgtaa cggaggaaga attgttcgac atcatcgaaa acatcgacga agaggacaag 541 atcgacgaag atgcggcgga actggtgcag tccgccctgg aattcaccgt aaagacggta 601 agactggccc ttacaccctg ggaaaagaca gtcaagatca cccgctccat gacagacgag 661 gagatcctgc agatcatcac ggacgggcat ttttcccgca tccccgtgct ggatgacgac 721 ggaggcgtgg aaggcatcct gcacatccgc aaattcctga aggcgaagat ccggggccgc 781 aaggtcttaa aggcccgctc catgctggac aaggcgttct ggctgccgct ggagatgccc 841 atcgacgacg cgctggacgc gctcagcagc aaccgggcgc atatggcgat cgtccacagg 901 caggacggca gcatcgccgg catcgttacc gtggaggaca tcctcgagga actcgtgggc 961 gagatctacg atgaagagga aggagggctg ccgaaatgat aggcaatatc cttctgatcg 1021 tctgcctcat cttcctgtct gcggtgttct cggggtccga gatcgccttc gccagctcca 1081 gcgaggtaaa gctgcgcaag gcggcggaag aggcaaaaag ggcgtcctcg aagaacgcct 1141 ttcatataaa ggaacattac gacgacgcgc tcattacgat cctcatcggc aacaatctgg 1201 tgaacatcgc atcgtctgcc gttgctacgg tcatcgctgt ctctctcatg ggcgacgcag 1261 gcgcgtggat cgcgaccctc atcatgaccg tcatcatcat cacgttcggc gaaattacgc 1321 cgaagatcct ggccagcaag aagccggaag gctttgcccg ccgggtggcg aatccgctgc 1381 aggcgctgtg cgtggtcaca aagcccctcg tcgttgtctt cggcgccatg atggacggcc 1441 tcggccactt atggaagaag agcgtcgtgg acgaagccgt aacggaggat gacctcgaga 1501 cca // LOCUS sequence324 1501 bp DNA linear BCT 20-JUN-2023 DEFINITION . ACCESSION sequence324 VERSION sequence324 KEYWORDS . SOURCE ORGANISM . FEATURES Location/Qualifiers source 1..1501 /mol_type="genomic DNA" /organism="" /note="sequence324" misc_feature <1..1170 /inference="COORDINATES:ab initio prediction:MetaGeneAnnotator" /note="partial CDS similar to WP_000033250.1:S-methyl-5-thioribose kinase" /note="WP_000033250.1 S-methyl-5-thioribose kinase (Bacillus) [pid:43.2%, q_cov:94.9%, s_cov:90.5%, Eval:4.5e-84]" /note="MGA_1183" /locus_tag="LOCUS_7490" ORIGIN 1 ctgcccgact ttttcgggaa agatgcccag ctgaaagcgg ccgaactctc cgacggcaac 61 atcaactacg tgttccgggt ggaggacgaa aacggcaagt ctctcatcat caagcacgcc 121 gaggatacgc tgcgggtcaa cacgaaccgg cacatcggtt tcgaccgcag caagatcgaa 181 tgcgaagtgc tgaagctgca gcgggaatac tgccctgccc tcatccccga agtctatctg 241 tacgacgagg cggagcacaa catcgtcatg gaggatatga agggttacga gaacctgcgc 301 tacgagcttt gtgaccataa gatcttcccg aaccttgcca aagacgtggc agaattctgc 361 ggcaaggccc tcatcgggtc cacggacatg gtcgtgggtg cggaaaagaa aaaagaactg 421 gtgaagcgct acaccaaccc gaaactgtgc gagatcacgg agcggcacgt gctcaccgag 481 ccctattacg aggatctgga cgataacggg gtcacggagg aaaacgacga attcatgcgc 541 acctggatct acggcagcga agagctgcac gccaaggtgg gcatgctgaa ggcgctgttt 601 gagaccaagg cacaggctct gctccacggc gacctgcaca ccggctccat cttcgtgacc 661 ccggacaaga cctgcatctt cgacccggaa tttgccttct acggccccat cggctacgat 721 acgggcaact ttatcgccaa catgatcttc gcctatgcga acggcctcta caccatggaa 781 gatggctccg aaaagacgga gtacctggag tggatcctgg acacgatcga ggagttctgc 841 ggccgtttcg tcgaaaatgc gaagcagctg atgcgggaaa agtccatgga ccggcagatg 901 cagtccgaag ctttcttcga cctgtatctg gaagacatct tcaaggatca ggcgggcttt 961 gccggaacgg agctcatccg ccgcgtcgtc ggaacctcca aggtaaagga catcaagtcc 1021 atcgaggacg aagtgcagcg cgccaaggcc gagcgcctct gcatgaccgc cggcatgaaa 1081 ttcgtgatgg atcccgaatc catgattacc ggcagatcct acaccgacta tctgcgcacc 1141 ttctccgacg tcgtggattt tgaaggataa aactttataa aaatcattaa aaaagccacg 1201 agcgttgaat accggtcgtg gcttttatta tgtcttatat aattaattaa tcgaaaatcg 1261 tcttcttctg cgccgacgcc gcgtaatccg cgacgaactt catggagttc tgcttgttca 1321 ccagggtccc catgccgcgc atgcagccgt ccgggcagca catgccttcg atgatgttgc 1381 cgtccagctt gcctaccttc gccttcatca gcgctgctct gcattcttcg atgccgttgc 1441 agatgacagg cttgacttcg aagtcttccc ttcccatctc cttcacagcc tgggctacgg 1501 a //