# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_2	LOCUS_00010	sequence1:501..1307(-)	frameshift		626	WP_011707240.1	retention module-containing protein	78.0	4.1	38.1
MGA_3	LOCUS_00020	sequence1:1291..3693(-)	frameshift		3692	WP_005477759.1	tandem-95 repeat protein	82.2	23.2	31.2
MGA_4	LOCUS_00030	sequence1:3582..5048(-)	frameshift		5062,5047,5065,3692,3695	WP_005477759.1	tandem-95 repeat protein	88.5	14.1	28.8
MGA_5	LOCUS_00040	sequence1:5045..6316(-)	frameshift		6345,5065,6342,5047	WP_005477759.1	tandem-95 repeat protein	92.2	13.3	28.7
MGA_9	LOCUS_00080	sequence1:7213..8736(-)	frameshift		8753,6948,7227,8750	WP_005477759.1	tandem-95 repeat protein	91.7	13.9	29.0
MGA_11	LOCUS_00100	sequence2:60..461(+)	frameshift		45	WP_000375433.1	ABC-ATPase domain-containing protein	100.0	24.4	91.8
MGA_12	LOCUS_00110	sequence2:789..1007(-)	frameshift		1089,668,643,1032,776,972,792,891,1020,731	WP_001284008.1	DNA-J related domain-containing protein	76.4	26.3	63.6
MGA_13	LOCUS_00120	sequence2:1521..1784(+)	frameshift,internal_stop_codon	1426..1428(+)	1668,1608,1449,1419,1773,1713,1497,1695	WP_001131372.1	DUF2238 domain-containing protein	83.9	37.9	61.0
MGA_14	LOCUS_00130	sequence2:1784..1969(+)	frameshift		1666,1606,1495,1771,1693,1711	WP_001131372.1	DUF2238 domain-containing protein	98.4	30.8	88.3
MGA_16	LOCUS_00150	sequence2:2903..3283(-)	frameshift		3330	WP_000140419.1	HAD family hydrolase	84.1	46.9	86.8
MGA_17	LOCUS_00160	sequence2:3304..3609(-)	frameshift		3330	WP_000140419.1	HAD family hydrolase	92.1	41.2	90.3
MGA_112	LOCUS_01110	sequence2:116553..117209(+)	partial			WP_000135747.1	VWA domain-containing protein	92.7	63.5	93.6
MGA_215	LOCUS_02140	sequence2:239719..240951(-)	partial			WP_005769303.1	HPr kinase	71.7	71.3	26.8
MGA_219	LOCUS_02180	sequence2:243933..244664(-)	partial			WP_010964224.1	alanyl-tRNA editing protein	97.9	57.6	28.8
MGA_221	LOCUS_02200	sequence2:245723..246403(-)	partial			WP_005477420.1	LysR substrate-binding domain-containing protein	95.1	69.4	83.7
MGA_222	LOCUS_02210	sequence2:246393..246740(+)	partial			WP_005477481.1	6-phospho-beta-glucosidase	100.0	26.3	91.3
MGA_311	LOCUS_03100	sequence2:344704..344892(-)	partial			WP_000070352.1	type VI secretion system toxin VasX	100.0	5.7	87.1
MGA_358	LOCUS_03570	sequence2:404990..406918(-)	partial			WP_011073324.1	metallophosphoesterase	46.4	77.3	31.7
MGA_380	LOCUS_03790	sequence2:436450..437124(-)	partial			WP_011267286.1	LuxR C-terminal-related transcriptional regulator	25.0	23.3	51.8
MGA_421	LOCUS_04200	sequence2:480870..481790(+)	partial			WP_206819201.1	PAS domain S-box protein	42.2	31.8	62.8
MGA_425	LOCUS_04240	sequence2:483166..486327(+)	partial			WP_011704393.1	response regulator	71.2	82.4	42.4
MGA_469	LOCUS_04680	sequence2:535387..536121(-)	partial			WP_005481536.1	hypothetical protein	94.3	48.3	49.6
MGA_518	LOCUS_05170	sequence2:588157..592917(+)	partial			WP_011268103.1	CHASE domain-containing protein	55.5	65.0	36.2
MGA_527	LOCUS_05260	sequence2:601871..604165(-)	partial			WP_011142717.1	tetratricopeptide repeat protein	43.2	43.1	23.1
MGA_529	LOCUS_05280	sequence2:606288..607379(-)	partial			WP_002210712.1	DUF4297 domain-containing protein	73.6	74.6	33.2
MGA_538	LOCUS_05370	sequence2:612966..613934(+)	partial			WP_000104945.1	helix-turn-helix domain-containing protein	40.4	41.2	39.6
MGA_553	LOCUS_05520	sequence2:630018..630536(+)	partial			WP_011072618.1	N-acetylmuramidase	84.3	69.9	32.9
MGA_567	LOCUS_05660	sequence2:640790..642766(+)	partial			WP_000038927.1	DUF1983 domain-containing protein	59.3	84.1	32.3
MGA_578	LOCUS_05770	sequence2:651324..664034(+)	partial			WP_010774229.1	DEAD/DEAH box helicase family protein	21.6	27.8	30.7
MGA_580	LOCUS_05790	sequence2:664698..664865(+)	partial			WP_000692622.1	L-threonine 3-dehydrogenase	96.4	15.5	98.1
MGA_590	LOCUS_05890	sequence2:674996..676834(-)	partial			WP_011267513.1	PAS domain S-box protein	41.0	35.4	39.5
MGA_609	LOCUS_06080	sequence2:710971..712758(-)	partial			WP_010943149.1	EAL domain-containing protein	69.7	47.8	40.2
MGA_667	LOCUS_06660	sequence2:785854..786243(+)	partial			WP_001894072.1	translation initiation factor IF-3	100.0	70.5	89.9
MGA_700	LOCUS_06990	sequence2:814962..815447(+)	partial			WP_099245403.1	hypothetical protein	44.1	58.7	40.8
MGA_809	LOCUS_08080	sequence2:907137..907460(+)	internal_stop_codon	907029..907031(+)		WP_011705794.1	N-acetyltransferase	95.3	62.8	36.9
MGA_831	LOCUS_08300	sequence2:926359..927012(+)	partial			WP_012582467.1	peptidoglycan DD-metalloendopeptidase family protein	74.2	55.4	30.6
MGA_832	LOCUS_08310	sequence2:927213..927767(+)	partial			WP_005462179.1	hypothetical protein	31.0	21.9	57.9
MGA_843	LOCUS_08420	sequence2:938128..939324(-)	partial			WP_004080646.1	ATP-dependent Clp protease proteolytic subunit	31.7	46.8	32.8
MGA_848	LOCUS_08470	sequence2:942271..942636(+)	partial			WP_014206488.1	FMN-binding negative transcriptional regulator	100.0	57.8	43.4
MGA_856	LOCUS_08550	sequence2:947474..948382(+)	partial			WP_047815565.1	lipase family protein	64.6	56.9	27.1
MGA_921	LOCUS_09200	sequence2:1009483..1009998(+)	internal_stop_codon	1009996..1009998(+)		WP_011391484.1	P-loop NTPase fold protein	100.0	38.1	38.2
MGA_922	LOCUS_09210	sequence2:1010041..1010844(+)	internal_stop_codon	1009996..1009998(+)		WP_011391484.1	P-loop NTPase fold protein	67.0	39.0	30.7
MGA_925	LOCUS_09240	sequence2:1012934..1013176(+)	frameshift		1012889	WP_014164108.1	hypothetical protein	100.0	68.4	100.0
MGA_952	LOCUS_09510	sequence2:1031011..1032654(+)	partial			WP_005694526.1	type I restriction endonuclease subunit R	65.4	39.9	23.0
MGA_977	LOCUS_09760	sequence2:1051657..1053003(+)	partial			WP_188614543.1	SIR2 family protein	46.7	38.4	27.4
MGA_980	LOCUS_09790	sequence2:1054423..1054734(+)	frameshift		1054728	WP_164922377.1	GNAT family N-acetyltransferase	91.3	71.4	42.9
MGA_987	LOCUS_09860	sequence2:1058645..1059010(+)	frameshift		1058911	WP_003097816.1	glutathione S-transferase family protein	66.9	40.5	65.4
MGA_988	LOCUS_09870	sequence2:1058911..1059252(+)	frameshift		1058911	WP_014208018.1	glutathione S-transferase family protein	95.6	69.7	72.2
MGA_998	LOCUS_09970	sequence2:1067147..1067824(+)	partial			WP_010990036.1	helix-turn-helix domain-containing protein	52.4	43.3	29.5
MGA_1060	LOCUS_10590	sequence2:1145463..1145831(+)	frameshift		1145828	WP_003113745.1	MFS transporter	100.0	30.4	59.8
MGA_1061	LOCUS_10600	sequence2:1145896..1146666(+)	frameshift		1145828	WP_003973162.1	MFS transporter	96.1	58.4	42.3
MGA_1075	LOCUS_10740	sequence2:1161795..1162733(+)	partial			WP_005796357.1	AraC family transcriptional regulator	32.1	29.9	41.0
MGA_1079	LOCUS_10780	sequence2:1172557..1184682(+)	partial			WP_011104106.1	type I polyketide synthase	25.2	31.9	47.9
MGA_1106	LOCUS_11050	sequence2:1212172..1213488(+)	partial			WP_011073743.1	insulinase family protein	91.3	46.7	26.4
MGA_1142	LOCUS_11410	sequence2:1253151..1254380(+)	partial			WP_012047848.1	helix-turn-helix transcriptional regulator	16.9	47.9	44.9
MGA_1143	LOCUS_11420	sequence2:1254377..1255285(+)	partial			WP_010965577.1	thioether cross-link-forming SCIFF peptide maturase	93.4	65.2	21.7
MGA_1211	LOCUS_12100	sequence2:1321918..1322139(-)	partial			WP_005481274.1	Flp family type IVb pilin	71.2	61.9	59.6
MGA_1214	LOCUS_12130	sequence2:1324041..1327103(-)	partial			WP_005481331.1	M6 family metalloprotease domain-containing protein	70.8	71.7	48.4
MGA_1263	LOCUS_12620	sequence2:1386907..1387104(-)	partial			WP_005477197.1	hypothetical protein	69.2	63.4	57.8
MGA_1317	LOCUS_13160	sequence2:1446657..1448072(-)	frameshift		1448146	WP_181712488.1	LTA synthase family protein	100.0	72.0	95.1
MGA_1318	LOCUS_13170	sequence2:1448051..1448383(-)	frameshift		1448530,1448425,1448458,1448379,1448524,1448142	WP_181712488.1	LTA synthase family protein	70.9	11.9	88.5
MGA_1319	LOCUS_13180	sequence2:1449154..1449423(-)	frameshift		1449409,1449370,1449178	WP_001233647.1	GlyGly-anchored extracellular serine protease VesA	71.9	19.4	73.4
MGA_1320	LOCUS_13190	sequence2:1449359..1449694(-)	frameshift		1449409,1449370,1449181	WP_001233647.1	GlyGly-anchored extracellular serine protease VesA	85.6	28.8	81.1
MGA_1321	LOCUS_13200	sequence2:1449825..1450421(-)	frameshift		1450528,1449952	WP_001154248.1	DEAD/DEAH box helicase	60.1	18.5	87.4
MGA_1322	LOCUS_13210	sequence2:1450469..1450915(-)	frameshift		1450528,1450929,1450898,1451188	WP_001154248.1	DEAD/DEAH box helicase	87.8	20.2	92.3
MGA_1323	LOCUS_13220	sequence2:1450912..1451166(-)	frameshift		1450896,1451186,1451336,1451405,1450927	WP_001154248.1	DEAD/DEAH box helicase	97.6	12.8	95.1
MGA_1325	LOCUS_13230	sequence3:123..665(+)	frameshift		61	WP_005480862.1	ATPase	98.3	78.0	59.3
MGA_1327	LOCUS_13250	sequence3:1482..1607(-)	frameshift		1626	WP_001884322.1	RNA-binding protein	100.0	27.0	85.4
MGA_1350	LOCUS_13480	sequence3:39743..41686(-)	partial			WP_019439542.1	methyl-accepting chemotaxis protein	54.1	55.9	51.3
MGA_1389	LOCUS_13870	sequence3:83384..83812(+)	frameshift		83297	WP_011706755.1	ion channel	99.3	44.7	49.7
MGA_1484	LOCUS_14810	sequence3:189068..190219(+)	partial			WP_011461034.1	glycosyltransferase	67.1	62.7	24.0
MGA_1492	LOCUS_14890	sequence3:200404..201021(-)	partial			WP_000947937.1	O-antigen ligase	99.0	46.3	83.7
MGA_1632	LOCUS_16290	sequence3:354985..355860(+)	partial			WP_011263006.1	LysR family transcriptional regulator	59.1	55.3	30.7
MGA_1635	LOCUS_16320	sequence3:357248..358150(+)	partial			WP_011461506.1	methyl-accepting chemotaxis protein	85.0	44.7	24.3
MGA_1730	LOCUS_17270	sequence3:458346..458876(-)	partial			WP_000098720.1	23S rRNA pseudouridine(2457) synthase RluE	100.0	73.0	97.2
MGA_1837	LOCUS_18340	sequence3:582370..582993(+)	partial			WP_011262129.1	heme lyase (NrfEFG) for insertion of heme into c552, subunit NrfG	67.1	64.7	52.5
MGA_1844	LOCUS_18410	sequence3:589745..590164(+)	partial			WP_011262122.1	heme lyase NrfEFG subunit NrfF	78.4	73.2	62.4
MGA_1919	LOCUS_19160	sequence3:677477..680617(+)	partial			WP_011704874.1	HD domain-containing protein	38.8	41.1	49.1
MGA_1953	LOCUS_19500	sequence3:721899..722657(+)	partial			WP_001881132.1	ABC transporter substrate-binding protein	99.2	73.7	78.8
MGA_1972	LOCUS_19690	sequence3:749278..749928(+)	frameshift		749913	WP_000870878.1	methyl-accepting chemotaxis protein	93.1	35.7	68.2
MGA_1973	LOCUS_19700	sequence3:749916..750968(+)	frameshift		749913	WP_000870878.1	methyl-accepting chemotaxis protein	100.0	62.2	80.3
MGA_1993	LOCUS_19900	sequence3:769680..770327(+)	partial			WP_013095455.1	4-hydroxyphenylacetate degradation bifunctional isomerase/decarboxylase	89.3	44.5	39.1
MGA_2004	LOCUS_20010	sequence3:781292..783343(+)	partial			WP_000212116.1	type VI secretion system tip protein TssI/VgrG	99.4	58.4	93.4
MGA_2005	LOCUS_20020	sequence3:783340..784128(+)	partial			WP_055064297.1	DUF4123 domain-containing protein	74.8	73.2	64.8
MGA_2012	LOCUS_20090	sequence3:791477..793342(-)	partial			WP_010895594.1	PAS domain-containing protein	72.9	51.3	47.8
MGA_2091	LOCUS_20880	sequence3:885400..885687(+)	partial			WP_000958712.1	NlpC/P60 family protein	100.0	57.2	88.4
MGA_2170	LOCUS_21670	sequence3:966127..973104(-)	partial			WP_011707240.1	retention module-containing protein	98.3	45.7	28.6
MGA_2171	LOCUS_21680	sequence3:973058..979840(-)	frameshift		973081,973102	WP_005477759.1	tandem-95 repeat protein	86.3	57.8	24.3
MGA_2191	LOCUS_21880	sequence3:1004904..1006856(-)	partial			WP_012067720.1	YDG domain-containing protein	76.8	28.8	28.4
MGA_2193	LOCUS_21900	sequence3:1007892..1008968(+)	partial			WP_011073736.1	efflux RND transporter periplasmic adaptor subunit	87.7	72.0	45.9
MGA_2300	LOCUS_22970	sequence3:1137903..1139318(-)	partial			WP_011086955.1	winged helix-turn-helix domain-containing protein	24.0	12.0	32.7
MGA_2317	LOCUS_23140	sequence3:1153825..1156410(+)	partial			WP_011202282.1	glycoside hydrolase family 31 protein	86.9	58.6	33.0
MGA_2329	LOCUS_23260	sequence3:1173376..1176081(+)	partial			WP_009292032.1	GH92 family glycosyl hydrolase	95.9	72.5	30.6
MGA_2360	LOCUS_23570	sequence3:1212231..1212596(+)	partial			WP_001881606.1	YchJ family protein	88.4	70.2	71.0
MGA_2428	LOCUS_24250	sequence3:1297102..1297656(+)	partial			WP_005477075.1	hypothetical protein	51.1	62.7	43.6
MGA_2475	LOCUS_24720	sequence3:1349363..1351903(+)	partial			WP_011261692.1	basic endochitinase	17.8	27.4	44.8
MGA_2570	LOCUS_25670	sequence3:1456928..1457875(+)	partial			WP_015444337.1	AraC family transcriptional regulator	31.1	29.3	34.7
MGA_2721	LOCUS_27180	sequence3:1608138..1608566(+)	partial			WP_001881906.1	flagellar basal body P-ring formation chaperone FlgA	100.0	55.7	92.3
MGA_2865	LOCUS_28620	sequence3:1768884..1769153(-)	partial			WP_000589998.1	DUF3293 domain-containing protein	97.8	68.5	81.6
MGA_3091	LOCUS_30880	sequence3:2023219..2023821(-)	partial			WP_000687664.1	peptidylprolyl isomerase	74.0	73.6	93.2
MGA_3146	LOCUS_31430	sequence3:2082237..2083160(-)	internal_stop_codon	2083176..2083178(-)		WP_000138832.1	group II intron reverse transcriptase/maturase	99.7	54.2	47.6
MGA_3147	LOCUS_31440	sequence3:2083176..2083895(-)	internal_stop_codon	2083176..2083178(-)		WP_235893157.1	group II intron reverse transcriptase/maturase	96.7	39.8	65.8
MGA_3195	LOCUS_31920	sequence3:2136999..2139185(-)	partial			WP_011262166.1	glycosyl hydrolase family 18 protein	25.3	24.3	27.4
MGA_3230	LOCUS_32270	sequence3:2175065..2175247(-)	frameshift		2175317,2175085	WP_000244705.1	hypothetical protein	91.7	51.4	70.9
MGA_3280	LOCUS_32770	sequence3:2241959..2242750(-)	frameshift		2242982	WP_010895430.1	peptide chain release factor 2	100.0	72.1	99.2
MGA_3503	LOCUS_35000	sequence3:2501482..2501946(-)	partial			WP_139685680.1	type II secretion system protein	57.1	56.6	64.3
MGA_3634	LOCUS_36300	sequence3:2670521..2671528(+)	partial			WP_011793001.1	sugar transferase	71.3	53.3	49.8
MGA_3637	LOCUS_36330	sequence3:2673464..2674495(-)	partial			WP_001221227.1	glycosyltransferase family 4 protein	75.5	68.8	27.3
MGA_3638	LOCUS_36340	sequence3:2674492..2675463(-)	partial			WP_011176648.1	polysaccharide pyruvyl transferase family protein	93.5	47.4	32.5
MGA_3662	LOCUS_36580	sequence3:2701598..2702506(-)	partial			WP_011962185.1	class I SAM-dependent methyltransferase	50.7	54.6	29.7
MGA_3810	LOCUS_38060	sequence3:2873939..2874157(+)	partial			WP_000263365.1	hypothetical protein	54.2	70.8	71.7
MGA_3900	LOCUS_38960	sequence3:2977065..2977223(-)	frameshift		2977496,2977081,2977274	WP_000118232.1	sodium:proton antiporter	98.1	11.5	92.2
MGA_3901	LOCUS_38970	sequence3:2977171..2977410(-)	frameshift		2977496,2977081,2977650,2977274	WP_000118232.1	sodium:proton antiporter	78.5	14.0	77.4
MGA_3902	LOCUS_38980	sequence3:2977476..2977631(-)	frameshift		2977496,2977650,2977891,2977274	WP_000118232.1	sodium:proton antiporter	90.2	10.4	100.0
MGA_3903	LOCUS_38990	sequence3:2977639..2977917(-)	frameshift		2977496,2977650,2977894	WP_000118232.1	sodium:proton antiporter	89.1	18.5	96.3
MGA_3905	LOCUS_39010	sequence3:2978530..2978787(+)	frameshift		2979011,2978772,2978893	WP_000514261.1	methionine synthase	95.3	6.6	96.3
MGA_3906	LOCUS_39020	sequence3:2979044..2979454(+)	frameshift		2978896,2979344,2978772,2979014,2979402,2979326	WP_000514261.1	methionine synthase	87.5	9.7	94.1
MGA_3907	LOCUS_39030	sequence3:2979406..2979861(+)	frameshift		2979401,2979827,2979325,2979343	WP_000514261.1	methionine synthase	92.7	11.4	98.6
MGA_3908	LOCUS_39040	sequence3:2979830..2982214(+)	frameshift		2979825	WP_000514261.1	methionine synthase	100.0	64.8	98.0
MGA_3909	LOCUS_39050	sequence3:2982293..2982505(-)	partial			WP_000102995.1	lysine-sensitive aspartokinase 3	100.0	15.5	97.1
