# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_46	LOCUS_00460	sequence001:35558..36523(+)	partial			WP_010965544.1	alpha/beta hydrolase	82.9	73.8	34.3
MGA_50	LOCUS_00500	sequence001:40433..41185(+)	internal_stop_codon	41183..41185(+)		WP_012972561.1	IS110 family transposase	98.4	61.8	46.8
MGA_51	LOCUS_00510	sequence001:41204..41656(+)	internal_stop_codon	41183..41185(+)		WP_003549893.1	IS110 family transposase	98.0	35.8	59.9
MGA_52	LOCUS_00520	sequence001:41914..42975(+)	frameshift		43098,42903	WP_115276001.1	ISL3 family transposase	94.1	77.8	34.9
MGA_58	LOCUS_00580	sequence001:49802..51982(+)	partial			WP_003434402.1	ATP-dependent RecD-like DNA helicase	47.0	50.2	24.7
MGA_129	LOCUS_01200	sequence015:909..1166(+)	frameshift		876	WP_011102204.1	6-phospho-beta-glucosidase	96.5	17.0	65.1
MGA_146	LOCUS_01370	sequence015:25363..26754(-)	partial			WP_002287386.1	NlpC/P60 family protein	24.8	22.1	69.0
MGA_149	LOCUS_01400	sequence015:30121..30651(+)	partial			WP_003641616.1	signal peptidase I	81.8	73.8	40.0
MGA_171	LOCUS_01600	sequence017:5403..6791(+)	partial			WP_003546132.1	bifunctional acetaldehyde-CoA/alcohol dehydrogenase	97.0	51.1	65.6
MGA_173	LOCUS_01620	sequence017:8121..8525(-)	partial			WP_002263094.1	amino acid permease	92.5	26.7	31.5
MGA_174	LOCUS_01630	sequence017:8443..8751(-)	partial			WP_011102117.1	amino acid permease	78.4	17.4	59.3
MGA_265	LOCUS_02540	sequence019:83027..83317(-)	partial			WP_219718821.1	hypothetical protein	88.5	16.5	48.2
MGA_271	LOCUS_02600	sequence019:84714..86597(-)	partial			WP_013230933.1	DEAD/DEAH box helicase	72.9	71.2	31.4
MGA_283	LOCUS_02700	sequence020:5558..5845(-)	partial			WP_003098742.1	flagellar biosynthesis anti-sigma factor FlgM	78.9	70.1	33.3
MGA_294	LOCUS_02810	sequence020:14678..15949(-)	partial			WP_011462131.1	methyl-accepting chemotaxis protein	93.1	59.4	29.9
MGA_300	LOCUS_02870	sequence020:21363..22442(-)	internal_stop_codon	22452..22454(-)		WP_011986950.1	fused FliR family export protein/FlhB family type III secretion system protein	95.8	56.5	39.7
MGA_301	LOCUS_02880	sequence020:22452..23210(-)	internal_stop_codon	22452..22454(-)		WP_010965447.1	fused FliR family export protein/FlhB family type III secretion system protein	99.6	41.5	27.8
MGA_306	LOCUS_02930	sequence020:25300..25557(-)	partial			WP_005816224.1	flagellar FlbD family protein	65.9	74.7	48.2
MGA_308	LOCUS_02950	sequence020:26572..26925(-)	partial			WP_011986955.1	TIGR02530 family flagellar biosynthesis protein	82.1	71.2	44.4
MGA_316	LOCUS_03030	sequence020:34013..34327(-)	partial			WP_011986961.1	flagellar hook-basal body complex protein FliE	71.2	71.2	41.9
MGA_341	LOCUS_03270	sequence022:1..654(+)	partial			WP_081581110.1	N-acetylmuramoyl-L-alanine amidase	98.6	20.1	57.4
MGA_388	LOCUS_03740	sequence024:10212..10460(-)	partial			WP_002287688.1	tyrosine-type recombinase/integrase	95.1	20.8	58.2
MGA_389	LOCUS_03750	sequence024:10913..11257(-)	internal_stop_codon	11309..11311(-)		WP_003703269.1	IS200/IS605 family transposase	89.5	71.3	72.5
MGA_396	LOCUS_03820	sequence024:20849..21790(+)	partial			WP_002369211.1	glycerophosphodiester phosphodiesterase	73.5	38.2	40.9
MGA_439	LOCUS_04250	sequence024:70571..70990(+)	partial			WP_011476136.1	cell division protein SepF	75.5	74.7	47.3
MGA_446	LOCUS_04320	sequence024:78395..78562(+)	partial			WP_011475897.1	RNA-guided endonuclease TnpB family protein	78.2	10.1	67.4
MGA_465	LOCUS_04490	sequence027:1408..1767(-)	partial			WP_011476362.1	CrcB family protein	68.1	62.8	53.1
MGA_485	LOCUS_04690	sequence027:23500..24612(+)	partial			WP_081581110.1	N-acetylmuramoyl-L-alanine amidase	55.4	19.4	58.7
MGA_490	LOCUS_04740	sequence027:30811..31656(+)	partial			WP_225355332.1	6-pyruvoyl-tetrahydropterin synthase-related protein	95.4	45.2	24.9
MGA_492	LOCUS_04760	sequence027:32765..35053(-)	frameshift,internal_stop_codon	35174..35176(-)	35167	WP_000200226.1	YfhO family protein	48.6	40.7	24.5
MGA_494	LOCUS_04770	sequence029:268..402(-)	partial			WP_011476585.1	RNA-guided endonuclease TnpB family protein	97.7	10.1	74.4
MGA_548	LOCUS_05310	sequence029:52721..53071(-)	partial			WP_010496068.1	hypothetical protein	75.9	74.6	38.6
MGA_567	LOCUS_05500	sequence029:71230..71415(+)	partial			WP_003694124.1	30S ribosomal protein S21	70.5	70.5	100.0
MGA_591	LOCUS_05730	sequence030:269..643(-)	frameshift		274	WP_003429214.1	cysteine hydrolase family protein	98.4	70.5	63.1
MGA_635	LOCUS_06140	sequence037:14159..14863(-)	frameshift		14985	WP_011101070.1	LCP family protein	91.5	53.1	50.9
MGA_639	LOCUS_06180	sequence037:18104..19132(+)	partial			WP_011083160.1	FIST N-terminal domain-containing protein	74.9	67.0	29.9
MGA_640	LOCUS_06190	sequence037:19152..20129(+)	partial			WP_011948292.1	methyl-accepting chemotaxis protein	84.3	39.2	29.5
MGA_648	LOCUS_06270	sequence037:25804..26007(+)	partial			WP_137628160.1	helix-turn-helix transcriptional regulator	98.5	47.5	40.9
MGA_698	LOCUS_06760	sequence038:17196..18719(-)	partial			WP_002286053.1	SpaH/EbpB family LPXTG-anchored major pilin	67.9	55.4	30.4
MGA_702	LOCUS_06800	sequence038:25877..26791(+)	internal_stop_codon	26789..26791(+)		WP_003642221.1	PTS sugar transporter subunit IIC	97.4	81.3	58.4
MGA_713	LOCUS_06880	sequence041:1790..2518(-)	partial			WP_011017006.1	sugar phosphate nucleotidyltransferase	93.8	41.9	35.2
MGA_715	LOCUS_06900	sequence041:4334..4564(-)	frameshift		4581	WP_011987017.1	TPR domain-containing glycosyltransferase	98.7	15.9	44.0
MGA_720	LOCUS_06940	sequence043:713..1177(+)	partial			WP_003438111.1	gamma-glutamyl-gamma-aminobutyrate hydrolase family protein	84.4	53.9	45.5
MGA_722	LOCUS_06950	sequence044:421..999(+)	frameshift		996	WP_011674398.1	YfhO family protein	92.7	19.2	33.7
MGA_756	LOCUS_07280	sequence045:42308..43060(-)	partial			WP_010905168.1	MATE family efflux transporter	96.4	54.5	23.4
MGA_772	LOCUS_07430	sequence046:382..702(-)	partial			WP_037616840.1	IS200/IS605 family transposase	77.4	50.6	42.7
MGA_778	LOCUS_07480	sequence047:1..873(+)	partial			WP_002287525.1	IS200/IS605 family element RNA-guided endonuclease TnpB	98.6	70.4	38.2
MGA_809	LOCUS_07790	sequence048:2697..3092(+)	partial			WP_000227333.1	polymorphic toxin type 50 domain-containing protein	98.5	31.5	60.5
MGA_826	LOCUS_07960	sequence048:20036..20962(+)	frameshift		20013	WP_011475733.1	competence protein CoiA family protein	77.9	78.6	42.9
MGA_837	LOCUS_08070	sequence049:1596..2519(+)	partial			WP_011861238.1	IS200/IS605 family element RNA-guided endonuclease TnpB	80.5	62.6	24.0
MGA_838	LOCUS_08080	sequence049:2902..3216(+)	frameshift		3189	WP_002286721.1	arginine-ornithine antiporter	91.3	20.5	53.6
MGA_840	LOCUS_08100	sequence049:3823..4194(+)	partial			WP_007054380.1	acylphosphatase	52.8	67.0	49.2
MGA_883	LOCUS_08510	sequence053:5407..6234(-)	partial			WP_011476061.1	DUF805 domain-containing protein	51.6	40.2	29.4
MGA_899	LOCUS_08670	sequence053:18796..19011(-)	partial			WP_011254133.1	RNA-guided endonuclease TnpB family protein	93.0	17.1	66.7
MGA_937	LOCUS_09020	sequence058:10386..10625(-)	partial			WP_003641297.1	hypothetical protein	94.9	70.9	35.5
MGA_968	LOCUS_09330	sequence059:38..460(-)	frameshift		476,581	WP_011987017.1	TPR domain-containing glycosyltransferase	88.6	26.0	31.2
MGA_969	LOCUS_09340	sequence059:531..791(-)	frameshift		584,500	WP_010989544.1	glycosyltransferase family 2 protein	75.6	10.5	49.3
MGA_994	LOCUS_09570	sequence062:12762..15617(-)	partial			WP_081581110.1	N-acetylmuramoyl-L-alanine amidase	67.7	60.4	39.8
MGA_1016	LOCUS_09780	sequence065:20341..21129(-)	partial			WP_011476109.1	hypothetical protein	77.5	68.1	34.5
MGA_1038	LOCUS_09990	sequence068:7376..7831(-)	partial			WP_011475718.1	sigma-70 family RNA polymerase sigma factor	59.6	46.4	47.8
MGA_1060	LOCUS_10210	sequence068:19962..20735(+)	partial			WP_011860997.1	phage recombination protein Bet	61.1	52.0	51.9
MGA_1092	LOCUS_10530	sequence068:38388..39818(+)	partial			WP_010905926.1	phage tail tape measure protein	98.1	27.7	34.7
MGA_1094	LOCUS_10550	sequence068:40332..44201(+)	partial			WP_010905926.1	phage tail tape measure protein	97.6	72.0	29.0
MGA_1100	LOCUS_10610	sequence068:49646..49891(+)	partial			WP_011475670.1	hypothetical protein	77.8	58.3	42.9
MGA_1102	LOCUS_10620	sequence070:1..1197(+)	partial			WP_011254350.1	GH25 family lysozyme	57.8	59.9	36.7
MGA_1103	LOCUS_10630	sequence070:1299..1811(+)	partial			WP_003695998.1	DUF4065 domain-containing protein	72.4	60.9	28.7
MGA_1112	LOCUS_10720	sequence070:10457..10813(+)	frameshift		10407	WP_011460716.1	helix-turn-helix domain-containing protein	59.3	32.2	48.6
MGA_1113	LOCUS_10730	sequence070:11496..11888(+)	internal_stop_codon	11886..11888(+)		WP_041272192.1	transposase	100.0	28.0	35.4
MGA_1145	LOCUS_11040	sequence071:31547..31891(+)	partial			WP_003700554.1	preprotein translocase subunit YajC	75.4	68.3	55.8
MGA_1168	LOCUS_11270	sequence071:52911..53162(+)	partial			WP_002295087.1	cell division protein ZapA	95.2	54.5	48.1
MGA_1192	LOCUS_11500	sequence072:14865..15065(-)	internal_stop_codon	15159..15161(-)		WP_000214765.1	AAA family ATPase	90.9	6.5	46.7
MGA_1199	LOCUS_11570	sequence072:19932..20369(-)	partial			WP_002917164.1	type III-A CRISPR-associated protein Csm2	89.0	68.2	40.5
MGA_1219	LOCUS_11760	sequence072:43447..43803(-)	internal_stop_codon	43927..43929(-)		WP_010922509.1	type I-C CRISPR-associated endonuclease Cas1c	97.5	33.7	59.1
MGA_1220	LOCUS_11770	sequence072:43927..44469(-)	internal_stop_codon	43927..43929(-)		WP_010932802.1	type I-C CRISPR-associated endonuclease Cas1c	98.3	51.6	42.4
MGA_1228	LOCUS_11850	sequence072:52827..53168(-)	frameshift		53136,53161,53402	WP_003813444.1	nitroreductase family protein	78.8	42.4	33.7
MGA_1232	LOCUS_11890	sequence072:54819..54992(-)	partial			WP_011987099.1	methyl-accepting chemotaxis protein	89.5	8.9	58.8
MGA_1253	LOCUS_12100	sequence072:82629..82916(-)	partial			WP_002303793.1	lipopolysaccharide assembly protein LapA domain-containing protein	87.4	56.5	36.1
MGA_1289	LOCUS_12460	sequence072:114294..116435(-)	partial			WP_011101414.1	DNA translocase FtsK	72.1	51.2	63.8
MGA_1314	LOCUS_12710	sequence072:138117..138443(-)	frameshift		138593,138422	WP_011100915.1	peptide ABC transporter substrate-binding protein	94.4	18.4	55.9
MGA_1315	LOCUS_12720	sequence072:138394..138588(-)	frameshift		138426	WP_011254634.1	peptide ABC transporter substrate-binding protein	89.1	10.5	54.4
MGA_1382	LOCUS_13360	sequence074:54531..55478(-)	partial			WP_004398990.1	inositol 2-dehydrogenase	75.2	73.0	24.2
MGA_1397	LOCUS_13510	sequence074:68595..69545(+)	frameshift		68648,68700	WP_011475746.1	competence type IV pilus assembly protein ComGB	94.6	84.0	47.3
MGA_1400	LOCUS_13540	sequence074:70554..70874(+)	partial			WP_011475896.1	IS200/IS605 family transposase	93.4	67.1	36.6
MGA_1401	LOCUS_13550	sequence074:70871..72040(+)	partial			WP_011254604.1	RNA-guided endonuclease TnpB family protein	55.8	74.7	54.5
MGA_1408	LOCUS_13620	sequence074:77962..78336(+)	internal_stop_codon	78334..78336(+)		WP_003703917.1	metallophosphoesterase family protein	98.4	60.7	59.8
MGA_1409	LOCUS_13630	sequence074:78343..78564(+)	internal_stop_codon	78334..78336(+)		WP_003703917.1	metallophosphoesterase family protein	100.0	36.3	53.4
MGA_1423	LOCUS_13760	sequence076:5950..6309(-)	internal_stop_codon	6463..6465(-)		WP_084742643.1	IS607-like element ISSto11 family transposase	74.8	48.9	39.3
MGA_1442	LOCUS_13950	sequence076:25225..25644(+)	partial			WP_002670247.1	AraC family transcriptional regulator	65.5	28.9	34.1
MGA_1490	LOCUS_14420	sequence079:325..1065(-)	partial			WP_003082313.1	peptide cleavage/export ABC transporter	94.3	31.6	37.6
MGA_1492	LOCUS_14440	sequence079:3150..3782(-)	partial			WP_015613327.1	GHKL domain-containing protein	95.2	47.3	33.7
MGA_1495	LOCUS_14470	sequence079:5037..5516(+)	partial			WP_002263742.1	thioredoxin family protein	70.4	32.4	26.5
MGA_1505	LOCUS_14570	sequence079:14213..14662(+)	frameshift		14608	WP_003643171.1	ABC transporter substrate-binding protein	72.5	24.0	61.1
MGA_1506	LOCUS_14580	sequence079:14625..15014(+)	frameshift		14608,14981	WP_003643171.1	ABC transporter substrate-binding protein	91.5	26.2	55.9
MGA_1507	LOCUS_14590	sequence079:15017..15535(+)	frameshift		14981	WP_003643171.1	ABC transporter substrate-binding protein	98.3	37.6	47.9
MGA_1522	LOCUS_14740	sequence080:3112..3402(-)	frameshift		3491	WP_011254472.1	RNA-guided endonuclease TnpB family protein	99.0	24.7	70.5
MGA_1524	LOCUS_14760	sequence080:3851..4261(-)	frameshift		3882,4188,3725	WP_011254472.1	RNA-guided endonuclease TnpB family protein	71.3	27.0	58.7
MGA_1536	LOCUS_14880	sequence080:16789..18147(-)	frameshift		18139	WP_011475728.1	ATP-dependent Clp protease ATP-binding subunit	99.1	61.4	76.4
MGA_1537	LOCUS_14890	sequence080:18134..18943(-)	frameshift		18139	WP_011475728.1	ATP-dependent Clp protease ATP-binding subunit	99.6	37.8	73.6
MGA_1551	LOCUS_15030	sequence081:5679..6725(+)	partial			WP_007056327.1	thiazole biosynthesis adenylyltransferase ThiF	30.2	39.0	40.0
MGA_1553	LOCUS_15050	sequence081:8361..9914(+)	partial			WP_011948347.1	ABC transporter ATP-binding protein	79.3	74.4	25.0
MGA_1601	LOCUS_15530	sequence083:21753..22463(-)	internal_stop_codon	22467..22469(-)		WP_041272513.1	flagellin	96.2	70.4	32.7
MGA_1602	LOCUS_15540	sequence083:22467..22811(-)	internal_stop_codon	22467..22469(-)		WP_011392281.1	flagellin	99.1	29.7	61.9
MGA_1608	LOCUS_15600	sequence083:29174..29647(-)	partial			WP_003700642.1	ComF family protein	100.0	68.4	45.9
MGA_1611	LOCUS_15630	sequence083:32017..32265(-)	frameshift,internal_stop_codon	32053..32055(-)	32061	WP_003703269.1	IS200/IS605 family transposase	82.9	47.6	63.2
MGA_1650	LOCUS_16000	sequence086:1405..2328(-)	partial			WP_011475863.1	DNA internalization-related competence protein ComEC/Rec2	81.1	33.2	58.8
MGA_1679	LOCUS_16280	sequence087:11385..12542(-)	partial			WP_053240438.1	glycosyltransferase family 1 protein	47.5	43.8	27.5
MGA_1696	LOCUS_16440	sequence088:1161..1829(-)	partial			WP_000359383.1	hypothetical protein	51.4	48.0	36.0
MGA_1753	LOCUS_16990	sequence091:14302..15282(+)	partial			WP_010870531.1	phosphoglycerate dehydrogenase	82.2	50.6	33.3
MGA_1762	LOCUS_17080	sequence091:23948..24496(-)	partial			WP_010868022.1	SagB/ThcOx family dehydrogenase	70.9	65.8	38.6
MGA_1764	LOCUS_17100	sequence091:25620..25751(-)	frameshift		25759	WP_011254325.1	transporter substrate-binding domain-containing protein	95.3	14.3	65.9
MGA_1765	LOCUS_17110	sequence091:25745..25933(-)	frameshift		25759	WP_011254325.1	transporter substrate-binding domain-containing protein	93.5	20.3	79.3
MGA_1777	LOCUS_17220	sequence092:6628..7584(-)	partial			WP_002263236.1	sensor histidine kinase	74.2	72.9	36.0
MGA_1779	LOCUS_17240	sequence093:362..1606(-)	partial			WP_010957062.1	TIR domain-containing protein	38.9	42.0	37.1
MGA_1780	LOCUS_17250	sequence093:1747..2124(-)	frameshift,internal_stop_codon	2132..2134(-)	2107	WP_011166415.1	Eco47II family restriction endonuclease	86.4	40.2	42.0
MGA_1826	LOCUS_17680	sequence098:539..808(+)	frameshift		384,540	WP_140224180.1	ClbS/DfsB family four-helix bundle protein	100.0	52.2	54.3
MGA_1830	LOCUS_17720	sequence098:4665..4829(+)	frameshift		4814	WP_010890794.1	GNAT family N-acetyltransferase	88.9	35.0	50.0
MGA_1831	LOCUS_17730	sequence098:4838..5083(+)	frameshift		4814	WP_010890794.1	GNAT family N-acetyltransferase	100.0	59.1	35.8
MGA_1837	LOCUS_17790	sequence098:9088..11082(+)	internal_stop_codon	11080..11082(+)		WP_003244282.1	class I SAM-dependent DNA methyltransferase	100.0	75.8	56.4
MGA_1838	LOCUS_17800	sequence098:11209..11775(+)	internal_stop_codon	11080..11082(+)		WP_003244282.1	class I SAM-dependent DNA methyltransferase	91.0	18.7	55.0
MGA_1852	LOCUS_17940	sequence098:26496..27563(+)	partial			WP_011103073.1	restriction endonuclease subunit S	34.1	34.2	33.3
MGA_1862	LOCUS_18040	sequence098:34613..34882(+)	partial			WP_002262851.1	cardiolipin synthase	95.5	16.6	48.2
MGA_1865	LOCUS_18070	sequence098:39583..40593(+)	partial			WP_000643829.1	GNAT family N-acetyltransferase	43.8	82.5	39.7
MGA_1866	LOCUS_18080	sequence098:40654..40845(+)	partial			WP_012027683.1	methylenetetrahydrofolate reductase [NAD(P)H]	50.8	11.2	65.6
MGA_1870	LOCUS_18120	sequence098:43812..44615(+)	frameshift		43767	WP_003437109.1	MATE family efflux transporter	94.8	56.5	46.3
MGA_1875	LOCUS_18170	sequence098:49834..50097(+)	frameshift		49980,50110	WP_009895475.1	NUDIX hydrolase	44.8	19.1	61.5
MGA_1876	LOCUS_18180	sequence098:50280..51092(+)	partial			WP_051532688.1	DUF3578 domain-containing protein	61.1	45.5	37.3
MGA_1877	LOCUS_18190	sequence098:51319..52479(+)	partial			WP_143185615.1	DUF262 domain-containing protein	62.2	54.1	23.3
MGA_1881	LOCUS_18220	sequence100:121..261(+)	frameshift		240	WP_003642100.1	DUF554 domain-containing protein	82.6	16.9	63.2
MGA_1882	LOCUS_18230	sequence100:252..791(+)	frameshift		240	WP_003242513.1	DUF554 domain-containing protein	97.2	76.0	63.8
MGA_1904	LOCUS_18450	sequence104:737..997(+)	partial			WP_061603534.1	HAD family hydrolase	90.7	27.9	57.7
MGA_1924	LOCUS_18650	sequence105:3551..4108(-)	partial			WP_010931764.1	alanine--glyoxylate aminotransferase family protein	93.0	45.6	33.9
MGA_1927	LOCUS_18680	sequence105:7618..8940(-)	partial			WP_010880882.1	glycerol-3-phosphate cytidylyltransferase	28.0	72.6	52.8
MGA_1929	LOCUS_18700	sequence105:9806..11269(-)	partial			WP_015263274.1	hypothetical protein	82.8	49.5	30.2
MGA_1931	LOCUS_18720	sequence105:12393..13889(-)	partial			WP_015263274.1	hypothetical protein	84.5	50.8	33.3
MGA_1937	LOCUS_18780	sequence105:18469..20643(-)	partial			WP_009898508.1	glycosyltransferase family 2 protein	27.1	50.8	25.7
MGA_1943	LOCUS_18820	sequence107:6380..6853(+)	partial			WP_100190734.1	IS3 family transposase	96.8	30.1	36.9
MGA_1949	LOCUS_18880	sequence107:13842..14276(-)	partial			WP_003722849.1	LytTR family DNA-binding domain-containing protein	73.6	70.2	45.3
MGA_1952	LOCUS_18910	sequence107:16401..16868(-)	internal_stop_codon	16896..16898(-)		WP_011476518.1	DUF308 domain-containing protein	91.6	81.6	51.4
