# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_34	LOCUS_00340	sequence1:40491..40751(+)	partial			WP_011391916.1	helix-turn-helix domain-containing protein	93.0	65.0	53.8
MGA_60	LOCUS_00600	sequence1:67299..68243(+)	frameshift		68189	WP_002489776.1	MFS transporter	95.5	66.7	67.7
MGA_61	LOCUS_00610	sequence1:68285..68653(+)	frameshift		68189	WP_002489776.1	MFS transporter	100.0	26.9	76.2
MGA_64	LOCUS_00640	sequence1:70527..70679(-)	partial			WP_003642286.1	SDR family oxidoreductase	92.0	21.7	63.0
MGA_67	LOCUS_00670	sequence1:73014..73244(+)	internal_stop_codon	73242..73244(+)		WP_002288651.1	TMEM175 family protein	100.0	39.1	51.3
MGA_71	LOCUS_00710	sequence1:75418..76389(-)	frameshift		76420	WP_003971922.1	NAD(P)/FAD-dependent oxidoreductase	98.5	85.0	48.1
MGA_72	LOCUS_00720	sequence1:76409..76573(-)	frameshift		76420	WP_003971486.1	NAD(P)/FAD-dependent oxidoreductase	79.6	11.5	62.8
MGA_93	LOCUS_00930	sequence1:95162..95683(+)	internal_stop_codon	95060..95062(+),95681..95683(+)		WP_000598772.1	ABC transporter ATP-binding protein	100.0	69.5	80.9
MGA_98	LOCUS_00980	sequence1:101351..101998(+)	internal_stop_codon	101996..101998(+)		WP_000887022.1	BglG family transcription antiterminator	100.0	34.5	49.3
MGA_99	LOCUS_00990	sequence1:102230..103210(+)	internal_stop_codon	101996..101998(+)		WP_002437911.1	BglG family transcription antiterminator	98.5	52.2	50.2
MGA_104	LOCUS_01040	sequence1:108119..108727(+)	partial			WP_003581575.1	stage II sporulation protein M	71.8	69.6	27.2
MGA_122	LOCUS_01220	sequence1:128896..129516(-)	partial			WP_002906887.1	accessory Sec system protein Asp3	63.1	82.4	33.6
MGA_143	LOCUS_01430	sequence1:146994..147620(+)	partial			WP_011728616.1	ABC transporter ATP-binding protein	91.8	36.3	38.7
MGA_150	LOCUS_01500	sequence1:153307..153804(+)	frameshift		153792	WP_000159014.1	DNA/RNA non-specific endonuclease	98.8	25.9	69.3
MGA_155	LOCUS_01550	sequence1:157836..158048(+)	frameshift		158036	WP_000826312.1	tandem-type lipoprotein	94.3	25.9	63.6
MGA_156	LOCUS_01560	sequence1:158344..158541(+)	partial			WP_000972280.1	tandem-type lipoprotein	92.3	23.3	58.3
MGA_157	LOCUS_01570	sequence1:158609..159082(+)	partial			WP_001044255.1	membrane protein	78.3	32.4	46.2
MGA_160	LOCUS_01600	sequence1:161413..162030(+)	partial			WP_000836421.1	amidohydrolase family protein	100.0	60.4	42.9
MGA_188	LOCUS_01880	sequence1:189107..189433(+)	partial			WP_000731945.1	LPXTG cell wall anchor domain-containing protein	99.1	47.2	42.7
MGA_211	LOCUS_02110	sequence1:210308..211234(-)	partial			WP_010921843.1	ABC transporter permease/substrate binding protein	92.9	48.2	32.8
MGA_271	LOCUS_02710	sequence1:286020..287228(+)	partial			WP_124797038.1	putative glycoside hydrolase	87.8	73.0	40.2
MGA_287	LOCUS_02870	sequence1:304856..305740(+)	partial			WP_001830674.1	zinc ribbon domain-containing protein	94.9	63.2	28.2
MGA_365	LOCUS_03650	sequence1:381535..382413(-)	partial			WP_012256690.1	transcriptional regulator CynR	56.2	54.9	32.3
MGA_388	LOCUS_03880	sequence1:408911..410683(-)	partial			WP_002370472.1	glycosyltransferase family A protein	43.4	52.7	26.8
MGA_397	LOCUS_03970	sequence1:422366..423274(+)	frameshift		423262	WP_011031842.1	FAD-dependent monooxygenase	92.1	69.7	32.4
MGA_398	LOCUS_03980	sequence1:423274..423504(+)	frameshift		423262	WP_013226955.1	NAD(P)/FAD-dependent oxidoreductase	100.0	21.6	43.8
MGA_437	LOCUS_04370	sequence1:463736..464362(-)	internal_stop_codon	464396..464398(-)		WP_001185695.1	sodium:proton antiporter	98.6	24.1	36.6
MGA_438	LOCUS_04380	sequence1:464396..465919(-)	internal_stop_codon	464396..464398(-)		WP_001185695.1	sodium:proton antiporter	96.4	70.8	73.5
MGA_460	LOCUS_04600	sequence1:486081..487085(+)	partial			WP_000727772.1	zinc ABC transporter substrate-binding lipoprotein AdcA	96.4	63.5	64.8
MGA_471	LOCUS_04710	sequence1:496381..498135(+)	internal_stop_codon	498133..498135(+)		WP_000514408.1	nitrate reductase subunit alpha	100.0	47.5	86.1
MGA_473	LOCUS_04730	sequence1:498277..500064(+)	internal_stop_codon	498133..498135(+)		WP_000514408.1	nitrate reductase subunit alpha	99.7	48.3	87.7
MGA_514	LOCUS_05140	sequence1:541038..541781(+)	partial			WP_000827010.1	hypothetical protein	44.1	55.4	58.4
MGA_525	LOCUS_05250	sequence1:554854..555129(+)	internal_stop_codon	555127..555129(+)		WP_000238542.1	MarR family transcriptional regulator	100.0	60.3	74.7
MGA_544	LOCUS_05440	sequence1:571814..573124(-)	frameshift		573141	WP_002456635.1	ribulokinase	98.9	80.0	73.1
MGA_545	LOCUS_05450	sequence1:573121..573438(-)	frameshift		573141	WP_002456635.1	ribulokinase	94.3	18.5	64.6
MGA_569	LOCUS_05690	sequence1:597490..597672(-)	partial			WP_000205307.1	hypothetical protein	58.3	57.4	74.3
MGA_580	LOCUS_05800	sequence1:607650..608063(+)	partial			WP_001830043.1	LCP family protein	93.4	40.5	76.6
MGA_582	LOCUS_05820	sequence1:608863..609399(+)	partial			WP_001830043.1	LCP family protein	100.0	56.3	77.5
MGA_687	LOCUS_06870	sequence1:693200..693436(+)	internal_stop_codon	693434..693436(+)		WP_000047009.1	tagatose-bisphosphate aldolase	100.0	23.9	82.1
MGA_688	LOCUS_06880	sequence1:693758..694171(+)	partial			WP_000047009.1	tagatose-bisphosphate aldolase	100.0	42.0	93.4
MGA_750	LOCUS_07480	sequence1:763562..764038(+)	frameshift		763547	WP_000701483.1	DNA-directed RNA polymerase subunit delta	79.1	71.0	78.4
MGA_779	LOCUS_07770	sequence1:790947..791204(+)	partial			WP_126475239.1	IS1182 family transposase	97.6	15.2	88.0
MGA_824	LOCUS_08210	sequence1:837396..838286(-)	frameshift		838359	WP_001832478.1	AAA family ATPase	99.7	54.5	65.3
MGA_825	LOCUS_08220	sequence1:838357..839019(-)	frameshift		838362	WP_001832478.1	AAA family ATPase	90.9	37.2	54.0
MGA_840	LOCUS_08370	sequence1:852508..854124(+)	partial			WP_049387514.1	MSCRAMM-like protein SdrH	71.4	81.8	38.3
MGA_959	LOCUS_09540	sequence1:983332..983565(-)	partial			WP_001200542.1	fluoride efflux transporter CrcB	63.6	40.5	67.3
MGA_972	LOCUS_09670	sequence1:994295..995146(-)	frameshift		994222,994327	WP_001196362.1	proline dehydrogenase	96.5	82.0	79.5
MGA_981	LOCUS_09760	sequence1:1010032..1015581(+)	partial			WP_001048266.1	LPXTG-anchored DUF1542 repeat protein FmtB	84.3	63.0	35.1
MGA_997	LOCUS_09920	sequence1:1032626..1033261(+)	frameshift		1033216	WP_002484970.1	UDP-N-acetylmuramate--L-alanine ligase	95.3	46.0	89.1
MGA_998	LOCUS_09930	sequence1:1033462..1033938(+)	frameshift		1033219	WP_002484970.1	UDP-N-acetylmuramate--L-alanine ligase	100.0	36.2	86.1
MGA_1027	LOCUS_10220	sequence1:1064762..1065178(+)	frameshift		1065175	WP_001830758.1	tRNA 4-thiouridine(8) synthase ThiI	97.1	32.9	72.4
MGA_1028	LOCUS_10230	sequence1:1065166..1065984(+)	frameshift		1065175	WP_001830758.1	tRNA 4-thiouridine(8) synthase ThiI	98.9	66.1	80.3
MGA_1038	LOCUS_10330	sequence1:1074642..1074779(+)	frameshift		1074773	WP_001830890.1	DRTGG domain-containing protein	100.0	10.4	86.7
MGA_1083	LOCUS_10780	sequence1:1128661..1128810(+)	partial			WP_001830756.1	hypothetical protein	63.3	67.4	90.3
MGA_1103	LOCUS_10980	sequence1:1148756..1150273(+)	frameshift		1150219	WP_001830852.1	aspartate--tRNA ligase	96.6	83.0	90.8
MGA_1104	LOCUS_10990	sequence1:1150231..1150521(+)	frameshift		1150219	WP_000044799.1	aspartate--tRNA ligase	100.0	16.3	95.8
MGA_1108	LOCUS_11030	sequence1:1154012..1154161(+)	partial			WP_001830746.1	SAS049 family protein	65.3	68.1	84.4
MGA_1113	LOCUS_11080	sequence1:1158698..1160563(+)	frameshift		1160497	WP_001283312.1	ATP-dependent RecD-like DNA helicase	96.8	72.5	82.4
MGA_1114	LOCUS_11090	sequence1:1160605..1161168(+)	frameshift		1160494	WP_002484987.1	ATP-dependent RecD-like DNA helicase	100.0	21.9	70.1
MGA_1115	LOCUS_11100	sequence1:1161543..1162760(+)	frameshift		1162742	WP_000734075.1	alanine--tRNA ligase	99.0	45.8	88.8
MGA_1116	LOCUS_11110	sequence1:1162726..1164174(+)	frameshift		1162745	WP_000734075.1	alanine--tRNA ligase	98.8	54.3	80.7
MGA_1151	LOCUS_11460	sequence1:1193478..1194005(+)	frameshift		1193891	WP_012972447.1	molecular chaperone DnaJ	81.1	37.7	54.5
MGA_1152	LOCUS_11470	sequence1:1194479..1194613(+)	partial			WP_001119021.1	molecular chaperone DnaJ	100.0	11.6	79.5
MGA_1156	LOCUS_11510	sequence1:1197793..1197969(+)	partial			WP_000048060.1	30S ribosomal protein S21	74.1	74.1	100.0
MGA_1187	LOCUS_11820	sequence1:1225578..1226048(+)	frameshift		1226039	WP_000697220.1	competence type IV pilus ATPase ComGA	99.4	47.8	76.8
MGA_1188	LOCUS_11830	sequence1:1226045..1226551(+)	frameshift		1226042	WP_001831109.1	competence type IV pilus ATPase ComGA	100.0	51.9	77.4
MGA_1245	LOCUS_12400	sequence1:1276841..1277467(+)	frameshift		1277446	WP_002456188.1	helix-turn-helix domain-containing protein	97.1	63.1	61.4
MGA_1246	LOCUS_12410	sequence1:1277605..1277808(+)	frameshift		1277446	WP_001163801.1	helix-turn-helix domain-containing protein	91.0	19.2	52.5
MGA_1248	LOCUS_12430	sequence1:1279325..1281142(+)	partial			WP_107515759.1	elastin-binding protein EbpS	36.9	50.0	27.3
MGA_1285	LOCUS_12800	sequence1:1320459..1325864(+)	frameshift		1325828	WP_080388512.1	hyperosmolarity resistance protein Ebh	98.3	17.5	45.0
MGA_1286	LOCUS_12810	sequence1:1325861..1335952(+)	frameshift,internal_stop_codon	1335950..1335952(+),1329918..1329920(+),1335951..1335953(+)	1329537,1329874,1330275,1325828,1328456,1329965	WP_080388512.1	hyperosmolarity resistance protein Ebh	78.8	26.1	34.5
MGA_1287	LOCUS_12820	sequence1:1336046..1348969(+)	frameshift,internal_stop_codon	1346603..1346605(+),1335950..1335952(+),1348365..1348367(+)	1348433,1348339,1346590,1346617	WP_080388512.1	hyperosmolarity resistance protein Ebh	99.3	42.2	30.1
MGA_1308	LOCUS_13030	sequence1:1368572..1369411(+)	partial			WP_002984437.1	ABC transporter ATP-binding protein	61.3	76.7	32.0
MGA_1335	LOCUS_13300	sequence1:1395773..1397062(-)	frameshift		1397202	WP_000077571.1	oligoendopeptidase F	99.3	70.5	82.9
MGA_1336	LOCUS_13310	sequence1:1397164..1397583(-)	frameshift		1397193	WP_002439680.1	oligoendopeptidase F	93.5	21.6	56.2
MGA_1371	LOCUS_13660	sequence1:1438658..1439203(-)	frameshift		1439348	WP_002485803.1	SMC family ATPase	100.0	17.9	82.9
MGA_1372	LOCUS_13670	sequence1:1439316..1441688(-)	frameshift		1439348	WP_002485803.1	SMC family ATPase	100.0	78.3	39.1
MGA_1390	LOCUS_13850	sequence1:1456715..1457230(-)	frameshift		1457372,1457228	WP_001255461.1	threonine synthase	100.0	48.4	89.5
MGA_1391	LOCUS_13860	sequence1:1457197..1457355(-)	frameshift		1457372,1457228	WP_001255461.1	threonine synthase	80.8	11.9	85.7
MGA_1392	LOCUS_13870	sequence1:1457361..1457774(-)	frameshift		1457228,1457375	WP_001255461.1	threonine synthase	97.1	37.7	82.7
MGA_1393	LOCUS_13880	sequence1:1457791..1457982(-)	frameshift		1457801,1457987	WP_002439624.1	homoserine dehydrogenase	79.4	11.7	50.0
MGA_1394	LOCUS_13890	sequence1:1457946..1458554(-)	frameshift		1457800,1458586,1457986	WP_002439624.1	homoserine dehydrogenase	94.6	44.8	82.7
MGA_1395	LOCUS_13900	sequence1:1458584..1459057(-)	frameshift		1458586	WP_000735864.1	homoserine dehydrogenase	100.0	36.9	91.1
MGA_1403	LOCUS_13980	sequence1:1464383..1465306(-)	frameshift		1465314	WP_000670307.1	sensor histidine kinase	97.1	81.8	44.8
MGA_1410	LOCUS_14050	sequence1:1470287..1470646(-)	partial			WP_000354307.1	DUF4355 domain-containing protein	98.3	56.9	36.8
MGA_1411	LOCUS_14060	sequence1:1470923..1471903(-)	partial			WP_002485350.1	minor capsid protein	66.0	46.2	58.5
MGA_1446	LOCUS_14410	sequence1:1511485..1511631(-)	frameshift		1511635	WP_000052590.1	ribonuclease J	100.0	8.6	95.8
MGA_1494	LOCUS_14890	sequence1:1568537..1569115(-)	frameshift		1569159	WP_001151509.1	ATP-dependent DNA helicase RecG	100.0	28.0	84.4
MGA_1495	LOCUS_14900	sequence1:1569130..1570584(-)	frameshift		1569159	WP_001830069.1	ATP-dependent DNA helicase RecG	99.4	70.5	86.5
MGA_1555	LOCUS_15500	sequence1:1629938..1630306(-)	partial			WP_002485104.1	amidase	57.4	69.4	48.0
MGA_1556	LOCUS_15510	sequence1:1630697..1631278(-)	partial			WP_010922065.1	hypothetical protein	42.5	39.2	43.4
MGA_1557	LOCUS_15520	sequence1:1631347..1632294(-)	partial			WP_001148136.1	SH3 domain-containing protein	34.3	21.6	60.2
MGA_1590	LOCUS_15850	sequence1:1657278..1657415(-)	partial			WP_001065101.1	DUF1024 family protein	95.6	55.1	60.5
MGA_1619	LOCUS_16140	sequence1:1667507..1668262(-)	partial			WP_002286575.1	phage antirepressor	57.0	57.7	54.5
MGA_1731	LOCUS_17260	sequence1:1780251..1780463(+)	partial			WP_001788574.1	NINE protein	100.0	72.9	68.6
MGA_1824	LOCUS_18190	sequence1:1881642..1881977(-)	internal_stop_codon	1882008..1882010(-)		WP_002468866.1	D-glycerate dehydrogenase	100.0	34.4	65.8
MGA_1825	LOCUS_18200	sequence1:1882008..1882604(-)	internal_stop_codon	1882008..1882010(-)		WP_000239131.1	D-glycerate dehydrogenase	100.0	62.1	71.2
MGA_1873	LOCUS_18680	sequence1:1915182..1916183(+)	partial			WP_000070642.1	DUF4352 domain-containing protein	60.7	61.6	64.2
MGA_1886	LOCUS_18810	sequence1:1923549..1923866(-)	frameshift,internal_stop_codon	1923905..1923907(-),1923521..1923523(-),1923872..1923874(-)	1923865,1923577	WP_103167312.1	terminase small subunit	90.5	59.4	80.0
MGA_1902	LOCUS_18970	sequence1:1939703..1940386(-)	partial			WP_004199405.1	GIY-YIG nuclease family protein	24.7	20.8	48.4
MGA_1992	LOCUS_19870	sequence1:2037758..2038348(-)	partial			WP_014207607.1	MBL fold metallo-hydrolase	61.7	42.1	35.5
MGA_1997	LOCUS_19920	sequence1:2040698..2041168(-)	partial			WP_001832142.1	hypothetical protein	51.3	57.1	37.5
MGA_2100	LOCUS_20950	sequence1:2139618..2140556(-)	frameshift		2139620	WP_013530953.1	UDP-N-acetylmuramoylalanyl-D-glutamyl-2,6-diaminopimelate--D-alanyl-D-alanine ligase	68.3	44.5	32.6
MGA_2110	LOCUS_21050	sequence1:2149775..2152882(-)	partial			WP_000745891.1	MSCRAMM family adhesin clumping factor ClfB	45.6	53.4	38.9
MGA_2119	LOCUS_21140	sequence1:2160252..2162915(+)	partial			WP_000645787.1	LPXTG-anchored adenosine synthase AdsA	66.4	75.1	55.0
MGA_2120	LOCUS_21150	sequence1:2162972..2163637(-)	internal_stop_codon	2163707..2163709(-)		WP_001024371.1	SDR family oxidoreductase	100.0	78.6	84.2
MGA_2122	LOCUS_21170	sequence1:2165771..2165989(+)	internal_stop_codon	2165987..2165989(+)		WP_011476685.1	alcohol dehydrogenase catalytic domain-containing protein	97.2	19.6	58.6
MGA_2123	LOCUS_21180	sequence1:2166179..2166838(+)	internal_stop_codon	2165987..2165989(+)		WP_011476685.1	alcohol dehydrogenase catalytic domain-containing protein	99.5	61.3	45.9
MGA_2222	LOCUS_22120	sequence1:2283249..2283476(+)	frameshift		2283464	WP_001832460.1	glycosyltransferase	97.3	14.6	72.6
MGA_2223	LOCUS_22130	sequence1:2283610..2284746(+)	frameshift		2283464	WP_001832460.1	glycosyltransferase	99.2	75.2	53.8
MGA_2228	LOCUS_22180	sequence1:2288403..2290664(-)	internal_stop_codon	2290746..2290748(-)		WP_003147473.1	Ig-like domain-containing protein	75.2	22.1	38.5
MGA_2229	LOCUS_22190	sequence1:2290746..2294615(-)	frameshift,internal_stop_codon	2290745..2290747(-),2290746..2290748(-)	2293667,2293651	WP_003147473.1	Ig-like domain-containing protein	98.1	49.0	34.5
MGA_2231	LOCUS_22210	sequence1:2296081..2296953(-)	partial			WP_011082831.1	MSCRAMM family adhesin SdrF	65.5	12.5	31.1
MGA_2246	LOCUS_22360	sequence1:2308850..2309095(+)	frameshift,internal_stop_codon	2308792..2308794(+),2308813..2308815(+)	2308848	WP_001789536.1	hypothetical protein	98.8	58.0	60.0
MGA_2329	LOCUS_23190	sequence1:2393239..2396304(+)	partial			WP_000791146.1	M4 family metallopeptidase	33.3	38.9	26.1
MGA_2332	LOCUS_23220	sequence1:2397805..2398443(-)	partial			WP_002485581.1	hypothetical protein	54.2	53.7	60.0
MGA_2346	LOCUS_23360	sequence1:2410260..2410697(-)	frameshift		2410686	WP_002455937.1	hypothetical protein	90.3	81.4	49.6
MGA_2350	LOCUS_23400	sequence1:2415346..2415492(-)	frameshift,internal_stop_codon	2415744..2415746(-)	2415554	WP_001831756.1	ABC transporter ATP-binding protein	100.0	21.1	83.3
MGA_2351	LOCUS_23410	sequence1:2415516..2415695(-)	frameshift,internal_stop_codon	2415744..2415746(-)	2415554	WP_001831756.1	ABC transporter ATP-binding protein	79.7	20.6	80.9
MGA_2352	LOCUS_23420	sequence1:2415744..2416031(-)	frameshift,internal_stop_codon	2415744..2415746(-)	2415554	WP_001831756.1	ABC transporter ATP-binding protein	100.0	41.7	88.4
MGA_2355	LOCUS_23450	sequence1:2417608..2417826(+)	frameshift		2417808	WP_002455925.1	YIP1 family protein	77.8	26.8	64.3
MGA_2366	LOCUS_23560	sequence1:2426708..2426845(-)	partial			WP_000240855.1	50S ribosomal protein L34	60.0	60.0	100.0
