# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_1	LOCUS_00010	sequence1:122..337(+)	frameshift		48,344,331	WP_002359372.1	lysine--tRNA ligase	98.6	14.1	94.3
MGA_2	LOCUS_00020	sequence1:415..942(+)	frameshift		347,331	WP_010989378.1	lysine--tRNA ligase	99.4	34.9	78.2
MGA_7	LOCUS_00040	sequence1:7789..8562(+)	frameshift		8517	WP_002378875.1	ATP-dependent Clp protease ATP-binding subunit	95.3	30.0	65.1
MGA_8	LOCUS_00050	sequence1:8537..9118(+)	frameshift		9173,9082,8517,9318	WP_002378875.1	ATP-dependent Clp protease ATP-binding subunit	100.0	23.2	74.6
MGA_9	LOCUS_00060	sequence1:9166..9363(+)	frameshift		9200,9321,9082,9427	WP_003585669.1	ATP-dependent Clp protease ATP-binding subunit	55.4	4.3	69.4
MGA_10	LOCUS_00070	sequence1:9435..9881(+)	frameshift		9321,9427,10115,9878	WP_002289035.1	ATP-dependent Clp protease ATP-binding subunit	100.0	17.8	87.2
MGA_11	LOCUS_00080	sequence1:9887..10141(+)	frameshift		10115,9878	WP_002289035.1	ATP-dependent Clp protease ATP-binding subunit	97.6	9.9	68.3
MGA_44	LOCUS_00400	sequence2:33210..33956(+)	partial			WP_002355609.1	WxL domain-containing protein	78.2	74.0	36.6
MGA_48	LOCUS_00440	sequence2:36458..37270(+)	partial			WP_077275481.1	WxL domain-containing protein	98.5	34.2	24.0
MGA_52	LOCUS_00480	sequence2:39758..40591(+)	frameshift,internal_stop_codon	39663..39665(+)	39701	WP_010989522.1	DUF916 and DUF3324 domain-containing protein	79.4	60.7	37.7
MGA_54	LOCUS_00500	sequence2:40909..43959(+)	partial			WP_011101989.1	cell surface protein	14.1	28.5	30.8
MGA_59	LOCUS_00550	sequence2:48171..48458(-)	partial			WP_009932617.1	effector binding domain-containing protein	95.8	70.9	51.1
MGA_65	LOCUS_00610	sequence2:53065..53583(+)	partial			WP_000473177.1	PTS glucose transporter subunit IIABC	84.3	21.0	52.4
MGA_67	LOCUS_00630	sequence2:54492..55010(+)	partial			WP_000938900.1	N-acetylglucosamine-specific PTS transporter subunit IIBC	68.0	28.4	37.3
MGA_82	LOCUS_00780	sequence2:67079..68173(+)	partial			WP_011837107.1	ATP-binding protein	59.3	40.0	36.2
MGA_88	LOCUS_00840	sequence2:71532..71663(+)	internal_stop_codon	71661..71663(+)		WP_002287732.1	type I restriction-modification system subunit M	100.0	8.1	88.4
MGA_89	LOCUS_00850	sequence2:71769..73127(+)	internal_stop_codon	71661..71663(+)		WP_000819001.1	type I restriction-modification system subunit M	99.3	84.7	84.0
MGA_97	LOCUS_00930	sequence2:81115..83904(+)	partial			WP_106518812.1	DEAD/DEAH box helicase	52.7	66.0	43.8
MGA_110	LOCUS_01060	sequence2:93108..93671(+)	partial			WP_002322202.1	hypothetical protein	81.8	26.0	32.7
MGA_138	LOCUS_01340	sequence2:128404..129894(+)	partial			WP_002321200.1	helix-turn-helix domain-containing protein	78.4	73.5	21.3
MGA_141	LOCUS_01370	sequence2:131409..132047(+)	partial			WP_003732646.1	WxL domain-containing protein	73.1	70.5	32.7
MGA_156	LOCUS_01520	sequence2:148655..150094(+)	partial			WP_002326835.1	hypothetical protein	41.3	62.3	28.6
MGA_178	LOCUS_01740	sequence2:171623..178336(+)	partial			WP_013389449.1	glycoside hydrolase N-terminal domain-containing protein	25.1	26.5	24.7
MGA_210	LOCUS_02060	sequence2:215091..216572(-)	partial			WP_012972623.1	helix-turn-helix domain-containing protein	32.5	32.0	27.5
MGA_301	LOCUS_02970	sequence2:295883..296773(-)	frameshift		296831	WP_205010568.1	tyrosine-type recombinase/integrase	98.3	71.9	49.8
MGA_306	LOCUS_03020	sequence2:301031..301354(-)	partial			WP_010989667.1	Cd(II)-sensing metalloregulatory transcriptional repressor CadC	72.0	69.4	42.9
MGA_315	LOCUS_03110	sequence2:308043..309461(+)	partial			WP_011860826.1	PTS transporter subunit IIBCA	98.9	74.8	58.2
MGA_317	LOCUS_03130	sequence2:310183..320439(+)	partial			WP_000815762.1	isopeptide-forming domain-containing fimbrial protein	66.0	60.3	23.7
MGA_325	LOCUS_03210	sequence2:327866..328075(-)	partial			WP_010877980.1	copper-translocating P-type ATPase CopA	92.8	8.0	42.2
MGA_360	LOCUS_03560	sequence2:367039..367389(-)	frameshift,internal_stop_codon	367150..367152(-),367144..367146(-)	367080,367167	WP_001273859.1	recombinase family protein	91.4	57.3	44.3
MGA_373	LOCUS_03690	sequence2:380301..383000(+)	partial			WP_162225034.1	SpaA isopeptide-forming pilin-related protein	80.4	51.5	35.8
MGA_453	LOCUS_04490	sequence2:481519..482364(-)	partial			WP_000586891.1	GNAT family N-acetyltransferase	44.5	83.4	27.7
MGA_501	LOCUS_04940	sequence2:529379..530512(+)	partial			WP_003731931.1	YbbR-like domain-containing protein	86.5	71.0	37.3
MGA_526	LOCUS_05190	sequence2:554345..555853(-)	partial			WP_002287463.1	glycoside hydrolase family 73 protein	50.8	64.0	44.8
MGA_577	LOCUS_05700	sequence2:616807..617238(+)	partial			WP_009930948.1	hypothetical protein	89.5	25.5	35.9
MGA_587	LOCUS_05800	sequence2:626256..626759(-)	partial			WP_001548522.1	TM2 domain-containing protein	37.7	68.5	57.1
MGA_609	LOCUS_06020	sequence2:653960..654610(-)	frameshift,internal_stop_codon	654008..654010(-)	654043	WP_002287140.1	helix-turn-helix domain-containing protein	97.2	42.8	36.2
MGA_620	LOCUS_06130	sequence2:664610..665401(-)	partial			WP_011836379.1	membrane protein	95.1	57.6	41.8
MGA_636	LOCUS_06290	sequence2:683563..684186(+)	partial			WP_000687254.1	pentapeptide repeat-containing protein	75.8	74.4	37.6
MGA_642	LOCUS_06350	sequence2:688372..688737(-)	partial			WP_000849163.1	YxeA family protein	76.0	74.6	42.4
MGA_659	LOCUS_06520	sequence2:703562..705814(+)	partial			WP_003147473.1	Ig-like domain-containing protein	25.3	7.7	29.9
MGA_666	LOCUS_06590	sequence2:715108..717177(+)	partial			WP_011102031.1	BspA family leucine-rich repeat surface protein	31.6	23.9	37.7
MGA_675	LOCUS_06680	sequence2:725768..728206(+)	partial			WP_010989368.1	LapB repeat-containing protein	15.5	32.3	31.6
MGA_687	LOCUS_06800	sequence2:738274..738924(+)	partial			WP_010905524.1	MarR family transcriptional regulator	81.9	61.9	34.2
MGA_712	LOCUS_07050	sequence2:760199..760414(+)	partial			WP_011837061.1	hypothetical protein	81.7	43.0	49.2
MGA_726	LOCUS_07190	sequence2:771954..772307(+)	partial			WP_003359348.1	single-stranded DNA-binding protein	86.3	68.9	42.2
MGA_756	LOCUS_07490	sequence2:802630..803262(+)	partial			WP_003228938.1	exo-glucosaminidase LytG	94.3	69.5	48.5
MGA_793	LOCUS_07860	sequence2:842201..842962(-)	partial			WP_002304851.1	response regulator transcription factor	49.4	25.9	38.4
MGA_818	LOCUS_08110	sequence2:867060..867716(+)	partial			WP_002355609.1	WxL domain-containing protein	75.7	73.2	30.9
MGA_827	LOCUS_08200	sequence2:875279..875797(+)	partial			WP_003575983.1	restriction endonuclease	70.3	64.7	47.9
MGA_843	LOCUS_08360	sequence2:891925..892923(+)	partial			WP_011176648.1	polysaccharide pyruvyl transferase family protein	89.2	46.5	28.4
MGA_875	LOCUS_08650	sequence2:933466..934272(+)	partial			WP_000617045.1	GNAT family N-acetyltransferase	43.7	41.8	30.5
MGA_877	LOCUS_08670	sequence2:935007..935279(+)	internal_stop_codon	935277..935279(+)		WP_011948196.1	DUF5692 family protein	83.3	22.3	44.0
MGA_878	LOCUS_08680	sequence2:935394..935924(+)	internal_stop_codon	935277..935279(+)		WP_011948196.1	DUF5692 family protein	96.0	52.7	56.1
MGA_942	LOCUS_09320	sequence2:1003842..1006580(+)	partial			WP_011101414.1	DNA translocase FtsK	54.3	49.2	65.1
MGA_956	LOCUS_09460	sequence2:1021655..1022377(+)	partial			WP_003549457.1	MerR family transcriptional regulator	47.5	46.9	41.7
MGA_969	LOCUS_09590	sequence2:1033577..1034767(+)	internal_stop_codon	1034765..1034767(+)		WP_000899106.1	EndoU domain-containing protein	14.4	60.6	68.4
MGA_973	LOCUS_09630	sequence2:1036584..1036784(+)	partial			WP_011100982.1	pre-toxin TG domain-containing protein	100.0	11.1	65.2
MGA_976	LOCUS_09660	sequence2:1038501..1038734(+)	partial			WP_011100983.1	hypothetical protein	62.3	34.5	75.0
MGA_1006	LOCUS_09960	sequence2:1069855..1070877(+)	partial			WP_010989623.1	MBL fold metallo-hydrolase	75.0	66.0	44.7
MGA_1017	LOCUS_10070	sequence2:1080770..1081048(-)	partial			WP_003546474.1	DUF1827 family protein	75.0	74.2	44.9
MGA_1055	LOCUS_10450	sequence2:1122652..1123929(+)	partial			WP_011109429.1	C39 family peptidase	62.6	37.2	37.0
MGA_1083	LOCUS_10730	sequence2:1147322..1148911(+)	partial			WP_002382239.1	membrane protein	75.8	40.9	24.9
MGA_1088	LOCUS_10780	sequence2:1152569..1153354(+)	partial			WP_011101863.1	SH3 domain-containing protein	60.5	20.0	60.1
MGA_1120	LOCUS_11100	sequence2:1182255..1182659(+)	partial			WP_002369327.1	LapA family protein	76.1	68.4	44.3
MGA_1133	LOCUS_11230	sequence2:1192301..1193272(+)	internal_stop_codon	1192256..1192258(+)		WP_000056102.1	T7SS effector LXG polymorphic toxin	82.4	48.3	28.2
MGA_1143	LOCUS_11330	sequence2:1205304..1206923(-)	partial			WP_010989367.1	lmo0171 family class 1 internalin	52.9	33.4	28.1
MGA_1185	LOCUS_11750	sequence2:1255035..1255421(+)	partial			WP_011861025.1	phage terminase small subunit	57.0	32.6	58.7
MGA_1186	LOCUS_11760	sequence2:1255637..1256647(+)	partial			WP_010905725.1	phage tail spike protein	37.2	14.9	37.0
MGA_1205	LOCUS_11950	sequence2:1277042..1277740(+)	frameshift		1276985	WP_011674913.1	hypothetical protein	97.4	80.2	24.9
MGA_1209	LOCUS_11990	sequence2:1279971..1280813(+)	partial			WP_004080600.1	YgcG family protein	58.2	65.5	40.9
MGA_1224	LOCUS_12140	sequence2:1292814..1293656(+)	partial			WP_000078841.1	sortase SrtA	51.1	59.1	40.4
MGA_1230	LOCUS_12200	sequence2:1298335..1299225(-)	internal_stop_codon	1298335..1298337(-)		WP_010989529.1	serine/threonine-protein kinase	95.9	74.7	38.7
MGA_1261	LOCUS_12510	sequence2:1334298..1336052(+)	partial			WP_010706747.1	DUF1116 domain-containing protein	99.7	57.9	55.0
MGA_1262	LOCUS_12520	sequence2:1336111..1337373(+)	partial			WP_010706747.1	DUF1116 domain-containing protein	99.3	41.9	67.1
MGA_1283	LOCUS_12730	sequence2:1361219..1362148(-)	partial			WP_003722812.1	glycerophosphodiester phosphodiesterase	77.3	41.9	32.0
MGA_1338	LOCUS_13280	sequence2:1417535..1418014(-)	partial			WP_012027226.1	EbsA family protein	76.1	74.1	28.9
MGA_1347	LOCUS_13370	sequence2:1425553..1428150(+)	partial			WP_003565607.1	PBP1A family penicillin-binding protein	74.2	83.9	50.2
MGA_1406	LOCUS_13960	sequence2:1482988..1483191(-)	frameshift		1483011	WP_002378961.1	cysteine hydrolase family protein	94.0	38.0	58.7
MGA_1407	LOCUS_13970	sequence2:1483336..1484433(-)	partial			WP_011674041.1	family 20 glycosylhydrolase	95.9	61.0	52.6
MGA_1441	LOCUS_14310	sequence2:1518315..1518491(-)	frameshift		1518544	WP_029645128.1	TrkH family potassium uptake protein	100.0	12.6	51.7
MGA_1442	LOCUS_14320	sequence2:1518482..1519675(-)	frameshift		1518544	WP_002304549.1	TrkH family potassium uptake protein	95.2	84.0	52.5
MGA_1466	LOCUS_14560	sequence2:1542920..1544251(-)	partial			WP_011674729.1	sortase	55.1	83.7	30.0
MGA_1475	LOCUS_14650	sequence2:1553867..1554223(-)	frameshift		1554337,1554178,1554172	WP_001103118.1	GNAT family N-acetyltransferase	83.9	57.6	59.6
MGA_1597	LOCUS_15870	sequence2:1679637..1680062(-)	partial			WP_011704421.1	GNAT family N-acetyltransferase	73.8	74.6	39.4
MGA_1625	LOCUS_16150	sequence2:1708229..1708606(-)	partial			WP_002262088.1	cell division protein FtsL	72.0	84.1	35.6
MGA_1671	LOCUS_16610	sequence2:1753737..1754102(-)	partial			WP_003700554.1	preprotein translocase subunit YajC	72.7	69.8	40.9
MGA_1673	LOCUS_16630	sequence2:1755381..1755950(-)	partial			WP_003244088.1	TetR/AcrR family transcriptional regulator	31.7	31.7	48.3
MGA_1741	LOCUS_17310	sequence2:1823909..1824619(-)	partial			WP_007335847.1	WecB/TagA/CpsF family glycosyltransferase	80.5	61.7	30.1
MGA_1766	LOCUS_17560	sequence2:1851144..1851512(-)	partial			WP_011674405.1	VanZ family protein	87.7	56.7	46.5
MGA_1797	LOCUS_17870	sequence2:1884872..1885153(-)	partial			WP_002295087.1	cell division protein ZapA	98.9	63.4	39.1
MGA_1816	LOCUS_18060	sequence2:1901722..1902003(+)	partial			WP_002903682.1	DUF4352 domain-containing protein	88.2	38.8	40.9
MGA_1817	LOCUS_18070	sequence2:1901960..1902262(+)	frameshift		1901985	WP_011674335.1	Ltp family lipoprotein	94.0	42.7	66.0
MGA_1856	LOCUS_18460	sequence2:1944335..1944853(-)	partial			WP_000938894.1	N-acetylglucosamine-specific PTS transporter subunit IIBC	68.0	28.4	38.0
MGA_1870	LOCUS_18600	sequence2:1959164..1960267(-)	partial			WP_011476432.1	zinc ribbon domain-containing protein	52.9	40.2	25.0
MGA_1927	LOCUS_19130	sequence2:2014736..2015224(-)	partial			WP_069591551.1	serine O-acetyltransferase	66.7	46.2	46.8
MGA_1939	LOCUS_19250	sequence2:2031012..2031326(+)	frameshift,internal_stop_codon	2031472..2031474(+)	2031067,2031260	WP_002287705.1	site-specific integrase	73.1	20.0	53.9
MGA_1940	LOCUS_19260	sequence2:2031238..2031474(+)	frameshift,internal_stop_codon	2031472..2031474(+)	2031064,2031624,2031254	WP_010707087.1	site-specific integrase	92.3	18.9	59.7
MGA_1941	LOCUS_19270	sequence2:2031588..2031812(+)	frameshift,internal_stop_codon	2031472..2031474(+)	2031603	WP_002287688.1	tyrosine-type recombinase/integrase	89.2	17.6	55.2
MGA_1957	LOCUS_19430	sequence2:2045732..2047858(+)	partial			WP_168488820.1	CDP-glycerol glycerophosphotransferase family protein	79.4	48.0	27.0
MGA_1974	LOCUS_19600	sequence2:2065321..2065713(+)	partial			WP_003564504.1	DUF4828 domain-containing protein	69.2	76.3	31.5
MGA_1979	LOCUS_19650	sequence2:2070064..2071242(-)	partial			WP_003245877.1	serine hydrolase domain-containing protein	75.8	74.9	36.6
MGA_1998	LOCUS_19840	sequence2:2087684..2088001(+)	partial			WP_003732213.1	metalloregulator ArsR/SmtB family transcription factor	67.6	73.2	56.3
MGA_2002	LOCUS_19880	sequence2:2092069..2093493(-)	partial			WP_004399426.1	peptidase G2 autoproteolytic cleavage domain-containing protein	76.8	44.9	41.8
MGA_2014	LOCUS_20000	sequence2:2106990..2107262(-)	frameshift		2107257	WP_000620148.1	GNAT family N-acetyltransferase	84.4	49.3	44.7
MGA_2016	LOCUS_20020	sequence2:2107665..2108525(+)	partial			WP_003722722.1	HlyD family secretion protein	53.8	69.8	29.0
MGA_2019	LOCUS_20050	sequence2:2110541..2111509(-)	partial			WP_002387476.1	family 20 glycosylhydrolase	94.1	36.8	41.3
MGA_2043	LOCUS_20290	sequence2:2138020..2138826(-)	partial			WP_002385163.1	WxL domain-containing protein	57.8	63.9	25.3
MGA_2049	LOCUS_20350	sequence2:2145238..2146764(-)	partial			WP_003566131.1	helix-turn-helix domain-containing protein	43.3	45.2	25.2
MGA_2059	LOCUS_20450	sequence2:2154950..2158798(-)	partial			WP_002296199.1	Ig-like domain-containing protein	51.1	66.3	29.7
MGA_2062	LOCUS_20480	sequence2:2163778..2164500(+)	frameshift		2164476	WP_011102026.1	DUF916 and DUF3324 domain-containing protein	87.5	60.2	31.1
MGA_2123	LOCUS_21090	sequence2:2219300..2220034(-)	partial			WP_002359986.1	phage tail tip lysozyme	38.9	11.8	32.4
MGA_2124	LOCUS_21100	sequence2:2220095..2220757(-)	partial			WP_010905391.1	peptidoglycan amidohydrolase family protein	66.4	56.8	52.7
MGA_2172	LOCUS_21580	sequence2:2267229..2270960(-)	partial			WP_010989523.1	hypothetical protein	54.8	81.2	39.9
MGA_2188	LOCUS_21740	sequence2:2287551..2288204(-)	partial			WP_001041726.1	class A sortase	71.4	72.9	29.7
MGA_2209	LOCUS_21950	sequence2:2312462..2312797(-)	partial			WP_002304776.1	GIY-YIG nuclease family protein	70.3	83.0	66.7
MGA_2247	LOCUS_22270	sequence2:2353128..2354189(-)	partial			WP_000014237.1	nucleoside triphosphate pyrophosphohydrolase	98.6	71.8	47.0
MGA_2267	LOCUS_22470	sequence2:2378337..2379764(-)	partial			WP_001241086.1	DUF4430 domain-containing protein	71.6	55.4	33.0
MGA_2271	LOCUS_22510	sequence2:2382717..2383730(+)	partial			WP_010989386.1	class 1 internalin InlH	61.7	32.7	28.0
MGA_2293	LOCUS_22730	sequence2:2402084..2402683(+)	partial			WP_003228938.1	exo-glucosaminidase LytG	97.5	70.6	43.0
MGA_2301	LOCUS_22810	sequence2:2410605..2411867(-)	partial			WP_012972628.1	competence system sensor histidine kinase ComD	50.5	50.8	27.0
MGA_2303	LOCUS_22830	sequence2:2413006..2415063(-)	partial			WP_009993840.1	GA module-containing protein	22.6	13.3	29.9
MGA_2304	LOCUS_22840	sequence2:2415095..2417329(-)	partial			WP_011254514.1	DUF1542 domain-containing protein	71.9	22.6	26.7
MGA_2315	LOCUS_22950	sequence2:2430004..2431362(-)	partial			WP_000056102.1	T7SS effector LXG polymorphic toxin	78.5	68.1	29.1
MGA_2320	LOCUS_23000	sequence2:2434342..2434800(+)	partial			WP_003723013.1	thioredoxin family protein	71.7	69.4	30.1
MGA_2329	LOCUS_23090	sequence2:2446850..2447281(-)	partial			WP_003723013.1	thioredoxin family protein	76.9	71.3	31.2
MGA_2331	LOCUS_23110	sequence2:2448530..2448979(+)	partial			WP_003641117.1	hypothetical protein	66.4	74.6	28.6
MGA_2365	LOCUS_23450	sequence2:2484817..2485962(+)	partial			WP_010879949.1	GGDEF domain-containing protein	44.9	38.5	39.9
MGA_2366	LOCUS_23460	sequence2:2486017..2486679(-)	partial			WP_003231267.1	3D domain-containing protein	45.0	30.7	45.5
MGA_2380	LOCUS_23600	sequence2:2499314..2501908(+)	partial			WP_010989363.1	LPXTG cell wall anchor domain-containing protein	70.8	73.9	28.1
MGA_2396	LOCUS_23760	sequence2:2516870..2519011(+)	partial			WP_180947112.1	hypothetical protein	69.6	54.9	22.1
MGA_2399	LOCUS_23790	sequence2:2520620..2520901(-)	partial			WP_010964215.1	shikimate dehydrogenase	88.2	22.3	42.7
MGA_2404	LOCUS_23840	sequence2:2523384..2523941(-)	internal_stop_codon	2523960..2523962(-)		WP_003731898.1	peptide ABC transporter substrate-binding protein	98.4	32.8	43.2
MGA_2405	LOCUS_23850	sequence2:2523960..2525063(-)	internal_stop_codon	2523960..2523962(-)		WP_003731898.1	peptide ABC transporter substrate-binding protein	98.1	64.0	46.7
MGA_2427	LOCUS_24070	sequence2:2548500..2549114(-)	partial			WP_011068637.1	YesL family protein	57.8	57.7	30.1
MGA_2442	LOCUS_24220	sequence2:2565763..2566098(-)	partial			WP_002385633.1	helix-turn-helix transcriptional regulator	58.6	59.1	47.7
MGA_2444	LOCUS_24240	sequence2:2567886..2568620(-)	partial			WP_011674101.1	GH25 family lysozyme	79.5	72.8	35.2
