# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_1	LOCUS_00010	sequence01:466..609(-)	internal_stop_codon	466..468(-)		WP_002437845.1	YSIRK domain-containing triacylglycerol lipase GehC	85.1	5.8	65.0
MGA_4	LOCUS_00040	sequence01:4163..4444(+)	internal_stop_codon	4442..4444(+)		WP_002294467.1	DUF1801 domain-containing protein	98.9	75.4	43.5
MGA_6	LOCUS_00060	sequence01:5807..6190(+)	frameshift		6151	WP_003244520.1	(S)-ureidoglycine--glyoxylate transaminase	93.7	30.3	52.4
MGA_7	LOCUS_00070	sequence01:6157..7032(+)	frameshift		6151	WP_003244520.1	(S)-ureidoglycine--glyoxylate transaminase	98.6	69.2	49.7
MGA_11	LOCUS_00110	sequence01:10187..11452(-)	frameshift		11468	WP_010706747.1	DUF1116 domain-containing protein	98.1	41.4	68.3
MGA_12	LOCUS_00120	sequence01:11454..13214(-)	frameshift		11468	WP_010706747.1	DUF1116 domain-containing protein	99.1	57.9	50.4
MGA_79	LOCUS_00790	sequence01:69831..70235(-)	partial			WP_011970650.1	SRPBCC family protein	83.6	72.0	31.4
MGA_84	LOCUS_00840	sequence01:74055..75371(-)	partial			WP_010990014.1	autolysin Ami	49.5	24.2	46.9
MGA_108	LOCUS_01080	sequence01:85723..86730(+)	partial			WP_000526910.1	3'-5' exonuclease	45.1	47.3	39.7
MGA_109	LOCUS_01090	sequence01:86887..87225(+)	partial			WP_047210621.1	site-specific integrase	97.3	26.8	85.3
MGA_133	LOCUS_01330	sequence01:110149..110733(-)	partial			WP_012027610.1	phosphatase PAP2 family protein	68.6	67.7	29.5
MGA_134	LOCUS_01340	sequence01:111176..111454(-)	partial			WP_001830097.1	FtsW/RodA/SpoVE family cell cycle protein	92.4	20.9	42.4
MGA_137	LOCUS_01370	sequence01:113076..113744(+)	internal_stop_codon	113742..113744(+)		WP_005170765.1	N-methyl-L-tryptophan oxidase	90.1	53.6	44.5
MGA_154	LOCUS_01540	sequence01:130481..131662(-)	partial			WP_000676339.1	YhgE/Pip domain-containing protein	37.2	23.3	33.1
MGA_195	LOCUS_01950	sequence01:180710..180847(-)	partial			WP_000240855.1	50S ribosomal protein L34	60.0	60.0	100.0
MGA_202	LOCUS_02020	sequence01:191120..191404(+)	frameshift		191456	WP_095092556.1	IS1182 family transposase	63.8	10.3	65.0
MGA_242	LOCUS_02420	sequence01:238655..239359(+)	internal_stop_codon	239357..239359(+)		WP_025455914.1	SIR2 family protein	100.0	46.6	57.0
MGA_243	LOCUS_02430	sequence01:239396..239860(+)	frameshift,internal_stop_codon	239357..239359(+)	239818	WP_025455914.1	SIR2 family protein	94.2	29.0	52.4
MGA_255	LOCUS_02550	sequence01:248803..248976(+)	partial			WP_002455937.1	hypothetical protein	80.7	28.6	89.1
MGA_256	LOCUS_02560	sequence01:248931..249557(-)	partial			WP_002437889.1	MFS transporter	99.0	52.8	60.7
MGA_268	LOCUS_02680	sequence01:260594..260986(-)	partial			WP_000417018.1	2-hydroxyacid dehydrogenase family protein	76.9	31.5	62.0
MGA_280	LOCUS_02800	sequence01:274732..275247(+)	frameshift		275241	WP_011067908.1	amidohydrolase family protein	89.5	37.4	46.3
MGA_281	LOCUS_02810	sequence01:275427..276011(+)	frameshift		275241	WP_011067908.1	amidohydrolase family protein	90.7	40.1	53.4
MGA_287	LOCUS_02870	sequence01:284688..285032(-)	partial			WP_083485680.1	metalloregulator ArsR/SmtB family transcription factor	73.7	79.2	40.5
MGA_311	LOCUS_03110	sequence01:311425..312858(+)	partial			WP_000678077.1	YhgE/Pip family protein	52.6	24.6	32.7
MGA_317	LOCUS_03170	sequence01:315993..316571(+)	frameshift		316547	WP_000497497.1	AEC family transporter	95.3	60.0	35.0
MGA_318	LOCUS_03180	sequence01:316588..316917(+)	frameshift		316547	WP_000497497.1	AEC family transporter	99.1	35.4	47.2
MGA_327	LOCUS_03270	sequence01:325631..328282(+)	partial			WP_011082831.1	MSCRAMM family adhesin SdrF	39.5	20.1	22.4
MGA_332	LOCUS_03320	sequence01:332442..333383(-)	partial			WP_003404247.1	DsbA family protein	59.4	83.8	28.6
MGA_333	LOCUS_03330	sequence01:333523..333876(+)	partial			WP_001789900.1	TetR/AcrR family transcriptional regulator	89.7	56.1	36.8
MGA_336	LOCUS_03360	sequence01:334528..334707(-)	internal_stop_codon	334723..334725(-)		WP_003437484.1	hypothetical protein	96.6	37.0	40.4
MGA_358	LOCUS_03580	sequence01:356464..357636(+)	partial			WP_124797038.1	putative glycoside hydrolase	88.7	72.6	36.9
MGA_414	LOCUS_04140	sequence01:427607..428128(+)	frameshift		428092,428276	WP_002901609.1	PEP phosphonomutase	94.2	54.7	57.1
MGA_415	LOCUS_04150	sequence01:428121..428327(+)	frameshift		428276,428095	WP_011675065.1	haloacid dehalogenase-like hydrolase	80.9	17.8	65.5
MGA_416	LOCUS_04160	sequence01:428293..428505(+)	frameshift		428276,428095	WP_002901609.1	PEP phosphonomutase	100.0	23.5	75.7
MGA_420	LOCUS_04200	sequence01:431587..431712(+)	frameshift		431679	WP_001147974.1	PTS ascorbate transporter subunit IIC	75.6	6.9	90.3
MGA_421	LOCUS_04210	sequence01:431820..432944(+)	frameshift		431679	WP_001147974.1	PTS ascorbate transporter subunit IIC	97.6	81.5	74.8
MGA_436	LOCUS_04360	sequence01:444851..445210(+)	partial			WP_000454151.1	hypothetical protein	47.9	49.2	45.8
MGA_451	LOCUS_04510	sequence01:460599..461261(+)	partial			WP_011101912.1	ABC transporter permease	95.5	50.5	54.8
MGA_482	LOCUS_04820	sequence01:486195..486917(+)	frameshift		486899	WP_000823221.1	nucleoside hydrolase	98.8	76.2	76.8
MGA_483	LOCUS_04830	sequence01:486898..487134(+)	frameshift		486899	WP_000823221.1	nucleoside hydrolase	96.2	24.1	74.7
MGA_501	LOCUS_05010	sequence01:506800..507030(+)	frameshift		507027	WP_000136487.1	sugar O-acetyltransferase	98.7	37.7	48.0
MGA_502	LOCUS_05020	sequence01:507087..507362(+)	frameshift		507027	WP_000136487.1	sugar O-acetyltransferase	100.0	45.7	61.5
MGA_506	LOCUS_05060	sequence01:511837..512274(+)	partial			WP_002456715.1	DUF4064 domain-containing protein	89.0	63.3	25.6
MGA_568	LOCUS_05680	sequence01:586681..586947(+)	partial			WP_135351025.1	transposase	84.1	56.5	75.7
MGA_592	LOCUS_05920	sequence01:615944..616411(+)	internal_stop_codon	616409..616411(+)		WP_003245721.1	MFS transporter	85.8	29.0	58.6
MGA_593	LOCUS_05930	sequence01:616412..617347(+)	internal_stop_codon	616409..616411(+)		WP_003245721.1	MFS transporter	98.1	66.4	37.5
MGA_602	LOCUS_06020	sequence01:625867..626496(-)	frameshift		626507	WP_000592610.1	imidazole glycerol phosphate synthase subunit HisF	97.6	44.2	71.6
MGA_619	LOCUS_06190	sequence01:645191..645964(+)	partial			WP_002468207.1	type II CAAX endopeptidase family protein	72.8	76.2	49.5
MGA_624	LOCUS_06240	sequence01:650984..651454(+)	internal_stop_codon	650918..650920(+)		WP_001291519.1	YdeI family protein	100.0	78.4	65.4
MGA_672	LOCUS_06720	sequence01:694004..695056(+)	frameshift		695038	WP_001118725.1	nitrite reductase large subunit NirB	99.1	43.3	73.8
MGA_673	LOCUS_06730	sequence01:695016..696389(+)	frameshift		695029	WP_002485232.1	nitrite reductase large subunit NirB	98.9	56.4	79.6
MGA_675	LOCUS_06750	sequence01:696698..696967(+)	frameshift		696880	WP_000109877.1	uroporphyrinogen-III C-methyltransferase	87.6	24.0	60.3
MGA_676	LOCUS_06760	sequence01:696922..697638(+)	frameshift		696880	WP_002485238.1	uroporphyrinogen-III C-methyltransferase	94.1	72.0	43.8
MGA_690	LOCUS_06900	sequence01:713298..713522(-)	frameshift		713312	WP_000516798.1	DUF4889 domain-containing protein	74.3	50.0	47.3
MGA_699	LOCUS_06990	sequence01:724847..725302(+)	frameshift		725293	WP_002209403.1	erythritol/L-threitol dehydrogenase	94.7	38.3	72.7
MGA_700	LOCUS_07000	sequence01:725427..725930(+)	frameshift		725293	WP_002209403.1	erythritol/L-threitol dehydrogenase	100.0	45.0	71.3
MGA_712	LOCUS_07120	sequence01:736756..737580(+)	partial			WP_000827010.1	hypothetical protein	40.1	53.9	50.0
MGA_738	LOCUS_07380	sequence01:766961..767962(+)	frameshift		766959	WP_201626527.1	Na+/H+ antiporter NhaC family protein	99.1	75.5	50.0
MGA_741	LOCUS_07410	sequence01:769580..770116(-)	internal_stop_codon	770153..770155(-)		WP_002456635.1	ribulokinase	98.9	32.8	71.6
MGA_742	LOCUS_07420	sequence01:770153..771199(-)	internal_stop_codon	770153..770155(-)		WP_002456635.1	ribulokinase	100.0	64.6	71.8
MGA_882	LOCUS_08820	sequence01:894671..897067(+)	partial			WP_004552628.1	N-6 DNA methylase	47.7	41.8	24.8
MGA_883	LOCUS_08830	sequence01:897094..898533(+)	partial			WP_002680807.1	restriction endonuclease subunit S	31.1	29.3	25.5
MGA_908	LOCUS_09080	sequence02:1..1497(+)	partial			WP_002437845.1	YSIRK domain-containing triacylglycerol lipase GehC	98.6	74.6	62.5
MGA_934	LOCUS_09320	sequence05:1..1006(+)	partial			WP_001582045.1	plasmid recombination protein	15.9	49.1	54.7
MGA_941	LOCUS_09370	sequence06:139..>1239(-)	partial			WP_010903904.1	valine--tRNA ligase	95.9	40.2	55.6
MGA_942	LOCUS_09380	sequence07:46..>1122(-)	partial			WP_010903200.1	anthranilate synthase component I	98.9	67.2	57.1
MGA_1003	LOCUS_09920	sequence12:55761..56435(-)	internal_stop_codon	56604..56606(-)		WP_001060842.1	Nramp family divalent metal transporter	99.6	49.6	75.8
MGA_1004	LOCUS_09930	sequence12:56604..57104(-)	internal_stop_codon	56604..56606(-)		WP_002469506.1	Nramp family divalent metal transporter	98.8	36.6	78.7
MGA_1061	LOCUS_10500	sequence12:114813..115703(+)	partial			WP_002470268.1	FtsQ-type POTRA domain-containing protein	99.7	63.5	56.6
MGA_1131	LOCUS_11200	sequence12:195588..196331(+)	internal_stop_codon	196329..196331(+)		WP_001829468.1	DNA-processing protein DprA	98.4	83.8	44.9
MGA_1176	LOCUS_11650	sequence12:250422..250766(+)	partial			WP_002485463.1	poly-gamma-glutamate hydrolase family protein	78.9	20.2	44.4
MGA_1184	LOCUS_11730	sequence12:257732..258085(+)	partial			WP_001832558.1	poly-gamma-glutamate hydrolase family protein	92.3	52.7	44.4
MGA_1368	LOCUS_13570	sequence12:455467..455652(+)	frameshift		455737	WP_181746991.1	IS1182 family transposase	100.0	12.9	45.9
MGA_1369	LOCUS_13580	sequence12:455772..456017(+)	frameshift		455746	WP_083498292.1	IS1182 family transposase	81.5	14.2	48.5
MGA_1399	LOCUS_13880	sequence12:489288..490196(-)	partial			WP_004524980.1	bifunctional enoyl-CoA hydratase/phosphate acetyltransferase	67.9	43.9	35.1
MGA_1456	LOCUS_14450	sequence12:538719..538895(-)	partial			WP_000048060.1	30S ribosomal protein S21	74.1	74.1	95.3
MGA_1468	LOCUS_14570	sequence12:552061..553968(-)	frameshift		552081	WP_011082702.1	DNA internalization-related competence protein ComEC/Rec2	91.8	77.4	39.4
MGA_1598	LOCUS_15870	sequence12:693183..693356(+)	partial			WP_135351025.1	transposase	66.7	29.0	78.9
MGA_1628	LOCUS_16170	sequence12:729429..730232(+)	frameshift		730205	WP_000285020.1	NAD(P)/FAD-dependent oxidoreductase	98.9	62.3	81.1
MGA_1629	LOCUS_16180	sequence12:730189..730689(+)	frameshift		730208	WP_000285020.1	NAD(P)/FAD-dependent oxidoreductase	97.0	38.2	68.3
MGA_1684	LOCUS_16730	sequence12:786877..787350(+)	frameshift		787281	WP_000894660.1	formate C-acetyltransferase	86.6	18.2	80.1
MGA_1685	LOCUS_16740	sequence12:787344..789125(+)	frameshift		787284	WP_000894660.1	formate C-acetyltransferase	100.0	79.2	90.4
MGA_1710	LOCUS_16900	sequence23:1..3355(+)	partial			WP_001074534.1	glucosaminidase domain-containing protein	77.4	71.7	40.2
MGA_1799	LOCUS_17790	sequence23:103633..103827(+)	partial			WP_002439051.1	NAD(P)-binding domain-containing protein	87.5	14.6	55.4
MGA_1842	LOCUS_18220	sequence23:140777..141001(+)	frameshift,internal_stop_codon	140715..140717(+),140736..140738(+)	140635,140732,140966	WP_002494449.1	IS1182-like element ISSep1 family transposase	89.2	11.8	68.2
MGA_1849	LOCUS_18290	sequence23:144604..145281(+)	frameshift		145245	WP_003227205.1	citrate transporter CitH	85.8	45.3	59.6
MGA_1850	LOCUS_18300	sequence23:145353..145898(+)	frameshift		145248	WP_000880464.1	CitMHS family transporter	98.9	41.2	54.7
MGA_1853	LOCUS_18330	sequence23:147595..147801(-)	partial			WP_001548522.1	TM2 domain-containing protein	94.1	69.6	70.3
MGA_1879	LOCUS_18590	sequence23:165567..166118(+)	partial			WP_002485100.1	Ltp family lipoprotein	70.5	57.9	48.8
MGA_1886	LOCUS_18660	sequence23:169346..169780(-)	frameshift		169381	WP_009894741.1	hypothetical protein	95.8	60.6	38.4
MGA_1900	LOCUS_18800	sequence23:177676..178149(-)	partial			WP_003900701.1	phage terminase small subunit P27 family	63.1	66.7	35.6
MGA_1905	LOCUS_18850	sequence23:181545..183887(-)	partial			WP_010714140.1	DNA primase family protein	57.7	56.0	51.8
MGA_1925	LOCUS_19050	sequence23:200948..201595(-)	partial			WP_000070831.1	DUF4887 domain-containing protein	20.9	21.5	60.0
MGA_1932	LOCUS_19120	sequence23:206257..206547(-)	partial			WP_000664359.1	DUF1722 domain-containing protein	93.8	70.9	45.6
MGA_2036	LOCUS_20160	sequence23:311648..312040(+)	partial			WP_002438866.1	DUF1361 domain-containing protein	97.7	62.0	54.3
MGA_2054	LOCUS_20340	sequence23:328096..328308(-)	partial			WP_000733432.1	hypothetical protein	94.3	50.4	42.4
MGA_2056	LOCUS_20360	sequence23:328916..329413(+)	frameshift		329338	WP_001832056.1	DUF1129 family protein	84.8	62.0	71.1
MGA_2061	LOCUS_20410	sequence23:333815..334543(-)	partial			WP_000865624.1	DUF402 domain-containing protein	71.1	80.4	83.1
MGA_2188	LOCUS_21640	sequence29:81084..81968(-)	frameshift		82075	WP_009891031.1	CDP-glycerol glycerophosphotransferase family protein	74.8	56.3	30.0
MGA_2190	LOCUS_21660	sequence29:83055..84230(-)	partial			WP_000975351.1	poly(ribitol-phosphate) beta-N-acetylglucosaminyltransferase	56.8	37.0	32.9
MGA_2208	LOCUS_21840	sequence29:101756..104272(-)	partial			WP_010905630.1	CDP-glycerol glycerophosphotransferase family protein	73.3	76.2	37.3
MGA_2216	LOCUS_21920	sequence29:109946..110350(-)	internal_stop_codon	110420..110422(-)		WP_000121299.1	kinase	97.8	77.2	43.9
MGA_2321	LOCUS_22970	sequence30:70289..70483(-)	partial			WP_000681968.1	hypothetical protein	73.4	81.0	68.1
MGA_2327	LOCUS_23030	sequence30:76177..78069(-)	partial			WP_049387514.1	MSCRAMM-like protein SdrH	44.1	62.6	35.1
MGA_2332	LOCUS_23080	sequence30:81462..82124(+)	frameshift,internal_stop_codon	82123..82125(+)	81912,81866	WP_010959211.1	GHKL domain-containing protein	99.1	50.8	37.2
MGA_2333	LOCUS_23090	sequence30:82134..82670(+)	internal_stop_codon	82122..82124(+)		WP_010959211.1	GHKL domain-containing protein	100.0	41.0	65.2
MGA_2341	LOCUS_23170	sequence30:91420..92322(+)	frameshift		92319	WP_001832478.1	AAA family ATPase	94.7	52.8	48.6
MGA_2342	LOCUS_23180	sequence30:92331..93011(+)	frameshift		92319	WP_000106332.1	MutS family DNA mismatch repair protein	98.2	41.6	62.8
MGA_2418	LOCUS_23940	sequence31:55806..56348(-)	partial			WP_000701483.1	DNA-directed RNA polymerase subunit delta	71.7	73.3	75.2
MGA_2501	LOCUS_24750	sequence33:7935..8060(-)	partial			WP_001059054.1	DMT family transporter	85.4	11.4	65.7
MGA_2505	LOCUS_24790	sequence33:10173..10418(+)	frameshift		10364,10694	WP_001105984.1	IS6-like element IS257 family transposase	84.0	30.4	94.1
MGA_2506	LOCUS_24800	sequence33:10355..10696(+)	frameshift		10364,10694	WP_001106057.1	IS6-like element IS257 family transposase	99.1	50.0	92.9
MGA_2518	LOCUS_24920	sequence33:20343..20747(-)	partial			WP_011222005.1	protein rep	72.4	29.8	39.2
MGA_2521	LOCUS_24950	sequence33:23239..24237(+)	partial			WP_010989615.1	ABC-F type ribosomal protection protein Vga(G)	93.4	59.1	40.1
MGA_2524	LOCUS_24980	sequence33:25296..25967(-)	frameshift		25367	WP_011117537.1	relaxase/mobilization nuclease domain-containing protein	88.8	68.6	77.8
MGA_2530	LOCUS_25040	sequence33:30809..30961(-)	frameshift,internal_stop_codon	31130..31132(-),30985..30987(-)	30846,31036,31102,30759	WP_000690635.1	recombinase family protein	76.0	19.3	78.9
MGA_2536	LOCUS_25100	sequence33:36638..36898(-)	partial			WP_000412130.1	acyl-CoA thioesterase	98.8	49.4	44.7
MGA_2565	LOCUS_25390	sequence34:21322..21540(-)	partial			WP_003246542.1	glucose starvation-inducible protein GsiB	80.6	43.9	67.2
