# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_58	LOCUS_00480	sequence13:5317..5625(+)	internal_stop_codon	5623..5625(+)		WP_013530060.1	NAD(P)-dependent alcohol dehydrogenase	93.1	27.6	47.4
MGA_59	LOCUS_00490	sequence13:5671..6330(+)	internal_stop_codon	5623..5625(+)		WP_013094782.1	NAD(P)-dependent alcohol dehydrogenase	98.2	62.8	50.7
MGA_60	LOCUS_00500	sequence13:6282..6554(-)	partial			WP_167797511.1	transposase	64.4	27.1	94.8
MGA_75	LOCUS_00630	sequence16:8113..8379(+)	partial			WP_002438951.1	hypothetical protein	39.8	54.7	71.4
MGA_84	LOCUS_00720	sequence16:15459..15698(-)	partial			WP_083312988.1	terminase small subunit	96.2	47.2	47.4
MGA_89	LOCUS_00770	sequence16:18215..19009(-)	partial			WP_000148333.1	DnaD domain-containing protein	51.1	47.1	32.9
MGA_95	LOCUS_00830	sequence16:20569..21429(+)	partial			WP_095089160.1	helix-turn-helix transcriptional regulator	32.5	41.5	51.6
MGA_99	LOCUS_00870	sequence16:25266..28151(+)	partial			WP_000645791.1	LPXTG-anchored adenosine synthase AdsA	67.0	82.9	52.1
MGA_103	LOCUS_00910	sequence16:30581..30775(-)	partial			WP_000250823.1	glycine C-acetyltransferase	90.6	14.9	61.0
MGA_144	LOCUS_01320	sequence17:8025..8681(+)	partial			WP_011142031.1	hypothetical protein	81.2	72.1	30.2
MGA_154	LOCUS_01390	sequence21:1116..1856(+)	partial			WP_001831861.1	accessory Sec system glycosylation chaperone GtfB	76.4	42.4	42.3
MGA_192	LOCUS_01770	sequence21:32693..33196(+)	partial			WP_003721792.1	DUF805 domain-containing protein	55.7	74.6	32.1
MGA_249	LOCUS_02340	sequence21:90264..90641(+)	partial			WP_001832142.1	hypothetical protein	72.8	65.0	31.9
MGA_254	LOCUS_02390	sequence21:92988..93464(-)	partial			WP_001832119.1	hypothetical protein	95.6	68.6	64.5
MGA_399	LOCUS_03840	sequence21:230076..230693(-)	frameshift		230806	WP_002439040.1	FAD-dependent oxidoreductase	100.0	57.9	82.4
MGA_400	LOCUS_03850	sequence21:230804..231118(-)	frameshift		230806	WP_000794020.1	NAD(P)/FAD-dependent oxidoreductase	94.2	27.7	80.6
MGA_511	LOCUS_04960	sequence21:331660..332514(+)	partial			WP_011475651.1	Clp protease ClpP	69.7	81.6	34.5
MGA_523	LOCUS_05080	sequence21:344363..349867(+)	partial			WP_000582152.1	phage tail spike protein	35.0	51.3	53.2
MGA_525	LOCUS_05100	sequence21:350044..350343(+)	partial			WP_001262621.1	hypothetical protein	65.7	68.4	44.6
MGA_530	LOCUS_05150	sequence21:352623..353459(+)	partial			WP_001148136.1	SH3 domain-containing protein	92.1	51.4	40.2
MGA_535	LOCUS_05200	sequence21:357697..357909(-)	partial			WP_001788574.1	NINE protein	100.0	72.9	58.6
MGA_622	LOCUS_06070	sequence21:448870..449010(+)	partial			WP_011082549.1	IS1182-like element ISSep1 family transposase	95.7	8.0	72.7
MGA_636	LOCUS_06210	sequence21:463688..464302(-)	partial			WP_096810449.1	site-specific integrase	94.6	53.0	40.9
MGA_657	LOCUS_06420	sequence21:481806..482951(+)	partial			WP_002470268.1	FtsQ-type POTRA domain-containing protein	82.9	68.3	51.3
MGA_687	LOCUS_06720	sequence21:515437..515640(-)	partial			WP_001548522.1	TM2 domain-containing protein	100.0	72.8	68.7
MGA_693	LOCUS_06780	sequence21:520375..521415(+)	frameshift		521391	WP_001833032.1	Stk1 family PASTA domain-containing Ser/Thr kinase	96.0	50.2	65.6
MGA_694	LOCUS_06790	sequence21:521418..522371(+)	frameshift		521409	WP_001833032.1	Stk1 family PASTA domain-containing Ser/Thr kinase	100.0	45.9	49.8
MGA_717	LOCUS_07020	sequence21:543853..544137(-)	frameshift,internal_stop_codon	543679..543681(-)	543783,543855	WP_002494449.1	IS1182-like element ISSep1 family transposase	58.5	9.8	87.3
MGA_800	LOCUS_07850	sequence21:640386..640670(+)	internal_stop_codon	640668..640670(+)		WP_001829500.1	homoserine kinase	100.0	30.7	67.0
MGA_801	LOCUS_07860	sequence21:640857..641303(+)	internal_stop_codon	640668..640670(+)		WP_001829500.1	homoserine kinase	98.6	47.7	74.0
MGA_817	LOCUS_08020	sequence21:656575..656811(+)	internal_stop_codon	657031..657033(+),656809..656811(+)		WP_002494449.1	IS1182-like element ISSep1 family transposase	100.0	14.0	94.9
MGA_818	LOCUS_08030	sequence21:656830..657033(+)	internal_stop_codon	657031..657033(+),656809..656811(+)		WP_007083038.1	IS1182 family transposase	100.0	32.8	92.5
MGA_819	LOCUS_08040	sequence21:657082..657336(+)	internal_stop_codon	657334..657336(+),657031..657033(+),656809..656811(+)		WP_002494449.1	IS1182-like element ISSep1 family transposase	97.6	14.7	78.0
MGA_820	LOCUS_08050	sequence21:657394..657771(+)	frameshift,internal_stop_codon	657334..657336(+),658063..658065(+)	657693	WP_194313290.1	IS1182 family transposase	80.0	18.6	92.0
MGA_821	LOCUS_08060	sequence21:657876..658064(+)	frameshift,internal_stop_codon	658063..658065(+)	657693	WP_194313290.1	IS1182 family transposase	100.0	11.5	91.9
MGA_860	LOCUS_08450	sequence21:704772..705524(+)	frameshift,internal_stop_codon	704751..704753(+)	705512	WP_011082682.1	aspartate kinase	99.6	60.7	85.9
MGA_861	LOCUS_08460	sequence21:705482..705973(+)	frameshift		705518	WP_011082682.1	aspartate kinase	98.2	39.0	86.2
MGA_870	LOCUS_08550	sequence21:713862..714026(-)	frameshift		713903	WP_000269923.1	regulatory protein MsaA	75.9	40.2	68.3
MGA_1014	LOCUS_09990	sequence21:852995..853174(-)	partial			WP_000819532.1	diacylglycerol kinase	71.2	36.8	76.2
MGA_1020	LOCUS_10050	sequence21:857592..857768(-)	partial			WP_000048060.1	30S ribosomal protein S21	74.1	74.1	100.0
MGA_1065	LOCUS_10500	sequence21:900702..900845(-)	partial			WP_001830746.1	SAS049 family protein	74.5	74.5	91.4
MGA_1178	LOCUS_11630	sequence21:1028702..1029733(-)	frameshift		1029873,1029858,1029846,1029882,1029855	WP_001050566.1	LPXTG-anchored repetitive surface protein SasC	76.7	12.2	30.0
MGA_1179	LOCUS_11640	sequence21:1029817..1030845(-)	frameshift,internal_stop_codon	1030852..1030854(-)	1029873,1029825,1029876,1029879,1029882,1029870,1029855	WP_011082715.1	YSIRK signal domain/LPXTG anchor domain surface protein	92.4	8.6	35.1
MGA_1180	LOCUS_11650	sequence21:1030852..1032864(-)	frameshift,internal_stop_codon	1030852..1030854(-),1030851..1030853(-)	1033049,1033058,1033076	WP_001050566.1	LPXTG-anchored repetitive surface protein SasC	97.6	29.9	36.4
MGA_1181	LOCUS_11660	sequence21:1033038..1036208(-)	frameshift		1033088	WP_000468780.1	YSIRK signal domain/LPXTG anchor domain surface protein	88.7	74.5	30.1
MGA_1214	LOCUS_11990	sequence21:1067009..1067545(-)	frameshift		1067766	WP_002469574.1	protoporphyrinogen oxidase	100.0	38.3	76.4
MGA_1215	LOCUS_12000	sequence21:1067716..1068390(-)	frameshift		1067766	WP_002469574.1	protoporphyrinogen oxidase	92.4	44.5	84.1
MGA_1245	LOCUS_12280	sequence22:1..621(+)	partial			WP_000122374.1	MobV family relaxase	100.0	49.9	90.8
MGA_1263	LOCUS_12440	sequence23:15249..16193(-)	partial			WP_010921843.1	ABC transporter permease/substrate binding protein	96.8	50.6	30.6
MGA_1282	LOCUS_12630	sequence23:40042..40383(+)	frameshift		40368	WP_002438866.1	DUF1361 domain-containing protein	72.6	40.0	68.3
MGA_1283	LOCUS_12640	sequence23:40380..40652(+)	frameshift		40368	WP_002438866.1	DUF1361 domain-containing protein	96.7	42.4	62.1
MGA_1315	LOCUS_12950	sequence25:34993..35382(+)	internal_stop_codon	35380..35382(+)		WP_011476046.1	phosphatase PAP2 family protein	100.0	57.3	41.1
MGA_1322	LOCUS_13020	sequence25:42597..43214(+)	partial			WP_001829387.1	hypothetical protein	93.7	63.7	72.9
MGA_1361	LOCUS_13410	sequence25:80156..80293(-)	partial			WP_000240855.1	50S ribosomal protein L34	60.0	60.0	100.0
MGA_1388	LOCUS_13680	sequence25:114865..115002(-)	partial			WP_001836575.1	hypothetical protein	84.4	52.1	76.3
MGA_1397	LOCUS_13770	sequence25:123562..124482(+)	partial			WP_010957062.1	TIR domain-containing protein	76.1	55.5	31.3
MGA_1399	LOCUS_13790	sequence25:125084..125986(+)	partial			WP_074956823.1	hypothetical protein	66.7	44.2	27.8
MGA_1405	LOCUS_13850	sequence25:130095..130262(+)	partial			WP_002437601.1	heavy metal translocating P-type ATPase	100.0	8.0	92.7
MGA_1411	LOCUS_13910	sequence25:135883..136254(+)	frameshift		136185	WP_003227736.1	NAD(P)-dependent oxidoreductase	82.1	47.4	61.8
MGA_1412	LOCUS_13920	sequence25:136227..136523(+)	frameshift		136185	WP_003227736.1	NAD(P)-dependent oxidoreductase	100.0	46.0	59.2
MGA_1415	LOCUS_13950	sequence25:137923..139329(-)	partial			WP_002370472.1	glycosyltransferase family A protein	50.0	48.4	29.7
MGA_1416	LOCUS_13960	sequence25:139747..140301(+)	frameshift		140268	WP_001830488.1	SLC45 family MFS transporter	94.6	38.4	94.3
MGA_1417	LOCUS_13970	sequence25:140247..141101(+)	frameshift		140268	WP_001830488.1	SLC45 family MFS transporter	95.4	59.8	87.8
MGA_1424	LOCUS_14040	sequence25:146019..146138(-)	frameshift		146245	WP_000358995.1	thioredoxin-dependent arsenate reductase	97.4	30.5	65.0
MGA_1425	LOCUS_14050	sequence25:146213..146356(-)	frameshift		146245	WP_001830465.1	arsenate reductase (thioredoxin)	78.7	28.2	86.5
MGA_1431	LOCUS_14110	sequence25:151658..153778(+)	partial			WP_012775094.1	AAA family ATPase	49.4	60.2	54.1
MGA_1435	LOCUS_14150	sequence25:157968..158150(+)	internal_stop_codon	158148..158150(+)		WP_002438333.1	nitroreductase family protein	100.0	28.7	80.0
MGA_1436	LOCUS_14160	sequence25:158199..158588(+)	internal_stop_codon	158148..158150(+)		WP_002287459.1	nitroreductase family protein	100.0	61.7	58.1
MGA_1453	LOCUS_14330	sequence25:175628..175912(+)	partial			WP_186433708.1	arsenite efflux transporter membrane subunit ArsB	88.3	19.3	78.3
MGA_1455	LOCUS_14350	sequence25:177913..178269(+)	internal_stop_codon	178267..178269(+)		WP_002469307.1	(S)-acetoin forming diacetyl reductase	100.0	45.6	76.3
MGA_1456	LOCUS_14360	sequence25:178486..178692(+)	internal_stop_codon	178267..178269(+)		WP_002469307.1	(S)-acetoin forming diacetyl reductase	100.0	26.3	88.2
MGA_1496	LOCUS_14760	sequence25:214711..215433(+)	internal_stop_codon	214669..214671(+)		WP_001345592.1	alpha/beta hydrolase	100.0	78.8	39.8
MGA_1502	LOCUS_14820	sequence25:219374..219799(-)	partial			WP_000162810.1	DsbA family protein	100.0	70.9	46.8
MGA_1527	LOCUS_15070	sequence25:242626..243453(+)	partial			WP_009895228.1	CPBP family intramembrane metalloprotease	78.2	65.0	30.1
MGA_1530	LOCUS_15100	sequence25:245275..245901(-)	partial			WP_011728616.1	ABC transporter ATP-binding protein	87.5	34.6	36.2
MGA_1531	LOCUS_15110	sequence25:245888..246661(-)	partial			WP_015040087.1	ABC transporter ATP-binding protein	90.3	45.8	31.3
MGA_1555	LOCUS_15350	sequence25:270609..270803(-)	partial			WP_011987096.1	excinuclease ABC subunit UvrA	98.4	8.4	49.2
MGA_1571	LOCUS_15510	sequence25:286290..287936(+)	frameshift,internal_stop_codon	287934..287936(+)	288002,287939,288005,287942,288008,287912,287918,287921,287924,287990,288216,287993,287996,287933	WP_000044547.1	serine-rich repeat glycoprotein adhesin SasA	89.6	18.5	25.3
MGA_1603	LOCUS_15820	sequence26:32758..32907(+)	partial			WP_000034497.1	NAD(P)-dependent oxidoreductase	77.6	13.4	65.8
MGA_1659	LOCUS_16380	sequence26:87516..88499(-)	frameshift		87551	WP_001830386.1	radical SAM/CxCxxxxC motif protein YfkAB	94.8	81.6	86.5
MGA_1784	LOCUS_17620	sequence28:23370..23561(-)	internal_stop_codon	23370..23372(-),23304..23306(-),23208..23210(-)		WP_001792547.1	alpha/beta hydrolase	93.7	19.7	55.9
MGA_1862	LOCUS_18400	sequence28:81900..82754(-)	partial			WP_000131842.1	AraC family transcriptional regulator	94.4	40.2	35.1
MGA_1866	LOCUS_18440	sequence28:87492..88442(+)	partial			WP_000737705.1	CHAP domain-containing protein	35.4	68.7	66.7
MGA_1882	LOCUS_18600	sequence28:103265..103453(+)	partial			WP_000205307.1	hypothetical protein	72.6	73.8	51.1
MGA_1930	LOCUS_19080	sequence28:150171..152549(-)	partial			WP_080388512.1	hyperosmolarity resistance protein Ebh	83.2	6.8	26.0
MGA_1937	LOCUS_19140	sequence28:158369..158806(-)	partial			WP_000771368.1	spore coat protein	84.1	69.7	53.3
MGA_1954	LOCUS_19310	sequence28:169686..177884(-)	partial			WP_080388512.1	hyperosmolarity resistance protein Ebh	99.7	26.6	41.2
MGA_1955	LOCUS_19320	sequence28:178293..178547(-)	frameshift		178594	WP_002438356.1	GNAT family N-acetyltransferase	100.0	63.2	70.2
MGA_1960	LOCUS_19370	sequence28:181622..181906(-)	frameshift		181955	WP_001020016.1	YhgE/Pip domain-containing protein	100.0	22.6	55.2
MGA_2108	LOCUS_20850	sequence28:337587..340094(-)	partial			WP_010905630.1	CDP-glycerol glycerophosphotransferase family protein	69.2	71.7	38.9
MGA_2127	LOCUS_21040	sequence28:359669..360436(+)	partial			WP_005785152.1	bifunctional demethylmenaquinone methyltransferase/2-methoxy-6-polyprenyl-1,4-benzoquinol methylase UbiE	31.4	34.7	36.5
MGA_2130	LOCUS_21070	sequence28:360948..361691(+)	frameshift		360939	WP_011673979.1	DMT family transporter	96.8	82.6	46.4
MGA_2145	LOCUS_21220	sequence28:374663..375997(-)	partial			WP_124797038.1	putative glycoside hydrolase	79.5	74.9	39.2
MGA_2160	LOCUS_21370	sequence28:395072..395314(-)	partial			WP_002438015.1	hypothetical protein	75.0	59.4	45.0
MGA_2163	LOCUS_21400	sequence28:397367..398266(-)	frameshift		398229	WP_002438012.1	sulfate adenylyltransferase	96.0	73.2	90.6
MGA_2164	LOCUS_21410	sequence28:398179..398526(-)	frameshift		398229	WP_002438012.1	sulfate adenylyltransferase	80.0	23.5	78.3
MGA_2188	LOCUS_21620	sequence30:8983..10128(+)	partial			WP_012582960.1	glycosyltransferase family 4 protein	38.8	37.7	31.8
