# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_4	LOCUS_00040	sequence1:3036..3443(+)	partial			WP_035213450.1	helix-turn-helix transcriptional regulator	56.3	62.6	45.1
MGA_18	LOCUS_00160	sequence1:31102..31680(+)	partial			WP_002263142.1	rod shape-determining protein MreC	99.0	71.0	30.1
MGA_83	LOCUS_00800	sequence1:95486..95830(+)	frameshift		95459	WP_011837044.1	AraC family transcriptional regulator	92.1	37.9	62.9
MGA_84	LOCUS_00810	sequence1:96002..96523(-)	partial			WP_002983552.1	PepSY domain-containing protein	39.3	45.3	50.0
MGA_107	LOCUS_01040	sequence1:127358..127807(-)	partial			WP_011475904.1	Ltp family lipoprotein	73.2	53.7	49.1
MGA_109	LOCUS_01060	sequence1:128221..128583(-)	partial			WP_010922480.1	XRE family transcriptional regulator	70.0	32.7	45.2
MGA_116	LOCUS_01130	sequence1:130915..131217(+)	partial			WP_011861119.1	DUF6017 domain-containing protein	60.0	18.5	43.3
MGA_132	LOCUS_01290	sequence1:137069..137383(+)	partial			WP_000052302.1	hypothetical protein	77.9	72.7	53.1
MGA_137	LOCUS_01340	sequence1:141560..143182(+)	partial			WP_010922076.1	phage minor capsid protein	74.4	80.7	65.4
MGA_151	LOCUS_01480	sequence1:148715..152092(+)	partial			WP_010922222.1	tape measure protein	34.9	32.5	51.8
MGA_153	LOCUS_01500	sequence1:153531..156311(+)	partial			WP_093649511.1	phage tail spike protein	41.3	34.9	49.9
MGA_160	LOCUS_01570	sequence1:161114..161347(+)	partial			WP_002986552.1	competence type IV pilus major pilin ComGC	98.7	70.4	68.4
MGA_187	LOCUS_01840	sequence1:185018..185449(-)	internal_stop_codon	185450..185452(-)		WP_002987812.1	tRNA dihydrouridine synthase DusB	100.0	44.0	93.0
MGA_188	LOCUS_01850	sequence1:185450..185995(-)	internal_stop_codon	185450..185452(-)		WP_002987812.1	tRNA dihydrouridine synthase DusB	100.0	55.7	97.8
MGA_211	LOCUS_02080	sequence1:211167..212666(+)	partial			WP_011029647.1	CehA/McbA family metallohydrolase	49.7	46.0	26.5
MGA_215	LOCUS_02120	sequence1:216194..216403(+)	frameshift,internal_stop_codon	216188..216190(+)	216349	WP_002262755.1	ABC transporter ATP-binding protein	75.4	21.8	61.5
MGA_218	LOCUS_02150	sequence1:219382..219720(+)	partial			WP_010865177.1	cupin domain-containing protein	53.6	34.1	41.7
MGA_265	LOCUS_02620	sequence1:263381..263575(+)	internal_stop_codon	263621..263623(+),263573..263575(+)		WP_027970603.1	transposase	100.0	66.0	75.0
MGA_288	LOCUS_02850	sequence1:281474..283087(-)	frameshift		283083	WP_011836385.1	bifunctional 2',3'-cyclic-nucleotide 2'-phosphodiesterase/3'-nucleotidase	99.8	66.3	66.4
MGA_289	LOCUS_02860	sequence1:283030..283950(-)	frameshift		283083	WP_011836385.1	bifunctional 2',3'-cyclic-nucleotide 2'-phosphodiesterase/3'-nucleotidase	81.4	31.9	54.8
MGA_295	LOCUS_02920	sequence1:290899..291564(+)	partial			WP_010963358.1	YiiX/YebB-like N1pC/P60 family cysteine hydrolase	55.7	49.8	44.4
MGA_312	LOCUS_03090	sequence1:309920..310822(-)	partial			WP_002198132.1	Ppx/GppA family phosphatase	97.7	56.9	30.1
MGA_321	LOCUS_03180	sequence1:319848..320246(+)	partial			WP_010922668.1	hypothetical protein	97.7	52.5	27.3
MGA_327	LOCUS_03240	sequence1:323680..323973(-)	frameshift		324157	WP_000022160.1	site-specific integrase	48.5	12.2	87.2
MGA_328	LOCUS_03250	sequence1:324125..324979(-)	frameshift		324160	WP_000022160.1	site-specific integrase	96.5	71.4	74.5
MGA_335	LOCUS_03320	sequence1:329197..329625(+)	partial			WP_011203101.1	TaqI-like C-terminal specificity domain-containing protein	69.0	8.0	42.6
MGA_336	LOCUS_03330	sequence1:329615..332371(+)	partial			WP_096040458.1	SIR2 family protein	28.3	51.5	26.8
MGA_349	LOCUS_03460	sequence1:343287..343712(+)	partial			WP_011109583.1	hypothetical protein	95.7	33.2	25.9
MGA_374	LOCUS_03700	sequence1:370880..371257(-)	partial			WP_002982833.1	mechanosensitive ion channel family protein	100.0	44.5	72.0
MGA_379	LOCUS_03750	sequence1:376596..377441(+)	partial			WP_000925394.1	sensor histidine kinase	85.4	41.5	51.7
MGA_403	LOCUS_03980	sequence1:407503..407991(+)	frameshift		407494	WP_010921894.1	sigma-70 family RNA polymerase sigma factor	94.4	83.6	52.3
MGA_412	LOCUS_04070	sequence1:414214..414603(+)	frameshift,internal_stop_codon	413929..413931(+),413981..413983(+)	413937,414118	WP_000859573.1	MerR family transcriptional regulator	99.2	53.8	56.2
MGA_414	LOCUS_04090	sequence1:415070..415456(+)	frameshift		415375	WP_002261950.1	SDR family oxidoreductase	83.6	38.6	50.5
MGA_415	LOCUS_04100	sequence1:415498..415911(+)	frameshift		415375	WP_002261950.1	SDR family oxidoreductase	97.8	48.4	54.5
MGA_422	LOCUS_04170	sequence1:421984..422982(-)	partial			WP_010921901.1	branched-chain amino acid transport system II carrier protein	100.0	72.8	66.9
MGA_458	LOCUS_04530	sequence1:456177..456326(+)	partial			WP_002262564.1	membrane protein insertion efficiency factor YidD	93.9	54.8	82.6
MGA_511	LOCUS_05060	sequence1:501668..502201(+)	partial			WP_002300997.1	bifunctional lysylphosphatidylglycerol flippase/synthetase MprF	68.9	14.4	47.6
MGA_543	LOCUS_05380	sequence1:529887..530840(+)	partial			WP_001017622.1	sensor histidine kinase	97.8	69.5	41.6
MGA_603	LOCUS_05980	sequence1:587345..587491(-)	partial			WP_002985576.1	SPJ_0845 family protein	68.8	68.6	71.4
MGA_648	LOCUS_06430	sequence1:630178..630465(+)	frameshift		630160,630421	WP_002295900.1	cation diffusion facilitator family transporter	86.3	26.4	62.2
MGA_649	LOCUS_06440	sequence1:630514..630717(+)	frameshift		630420	WP_002295900.1	cation diffusion facilitator family transporter	98.5	21.2	48.5
MGA_699	LOCUS_06940	sequence1:687221..687523(+)	frameshift,internal_stop_codon	687056..687058(+)	687657	WP_002262947.1	glycogen/starch/alpha-glucan phosphorylase	99.0	12.4	83.8
MGA_700	LOCUS_06950	sequence1:687520..687669(+)	frameshift		687888,687657	WP_002917496.1	glycogen/starch/alpha-glucan phosphorylase	91.8	5.6	82.2
MGA_701	LOCUS_06960	sequence1:687666..687914(+)	frameshift		687657,687894	WP_002917496.1	glycogen/starch/alpha-glucan phosphorylase	92.7	9.5	81.6
MGA_702	LOCUS_06970	sequence1:687919..688386(+)	frameshift,internal_stop_codon	688385..688387(+)	687657,687894	WP_002262947.1	glycogen/starch/alpha-glucan phosphorylase	100.0	19.4	74.8
MGA_703	LOCUS_06980	sequence1:688390..689259(+)	internal_stop_codon	688384..688386(+)		WP_002262947.1	glycogen/starch/alpha-glucan phosphorylase	98.3	35.6	76.4
MGA_727	LOCUS_07220	sequence1:715606..715782(+)	partial			WP_000048058.1	30S ribosomal protein S21	74.1	74.1	100.0
MGA_743	LOCUS_07380	sequence1:734778..736985(+)	partial			WP_002263335.1	GBS Bsp-like repeat-containing protein	68.3	51.5	40.9
MGA_758	LOCUS_07530	sequence1:748955..749368(-)	partial			WP_010922142.1	membrane protein	66.4	61.6	58.2
MGA_855	LOCUS_08500	sequence1:847291..851739(+)	partial			WP_012775357.1	S8 family serine peptidase	61.7	52.5	31.0
MGA_910	LOCUS_09050	sequence1:904813..907257(+)	partial			WP_010922709.1	pneumococcal-type histidine triad protein	61.7	57.2	47.9
MGA_921	LOCUS_09160	sequence1:919598..920554(+)	partial			WP_002261970.1	hypothetical protein	91.2	57.9	49.1
MGA_927	LOCUS_09220	sequence1:924832..926112(+)	partial			WP_003547453.1	ferric reductase	50.9	79.3	28.3
MGA_937	LOCUS_09320	sequence1:934276..934698(+)	partial			WP_011948039.1	cupin domain-containing protein	97.9	62.6	55.5
MGA_996	LOCUS_09910	sequence1:992035..992712(-)	partial			WP_010922359.1	phosphate ABC transporter permease subunit PstC	100.0	72.3	90.7
MGA_1059	LOCUS_10540	sequence1:1055133..1055675(-)	partial			WP_002294234.1	chorismate mutase	67.8	44.3	33.6
MGA_1062	LOCUS_10570	sequence1:1058014..1058940(-)	partial			WP_011250668.1	glycosyltransferase	67.5	68.4	33.0
MGA_1098	LOCUS_10930	sequence1:1092850..1094022(-)	partial			WP_034350357.1	alpha/beta hydrolase	58.2	68.5	29.8
MGA_1131	LOCUS_11260	sequence1:1128276..1129829(-)	partial			WP_000682783.1	G5 domain-containing protein	24.0	4.2	34.8
MGA_1138	LOCUS_11330	sequence1:1140120..1140434(-)	internal_stop_codon	1140492..1140494(-)		WP_010922238.1	thiamine pyrophosphate-dependent dehydrogenase E1 component subunit alpha	100.0	32.3	86.5
MGA_1139	LOCUS_11340	sequence1:1140492..1141088(-)	internal_stop_codon	1140492..1140494(-)		WP_010922238.1	thiamine pyrophosphate-dependent dehydrogenase E1 component subunit alpha	100.0	61.5	91.9
MGA_1172	LOCUS_11670	sequence1:1173766..1174353(-)	partial			WP_010922189.1	TDT family transporter	96.4	62.6	61.9
MGA_1191	LOCUS_11860	sequence1:1200404..1200562(-)	partial			WP_002984154.1	hypothetical protein	71.2	71.2	94.6
MGA_1194	LOCUS_11890	sequence1:1203886..1204803(+)	partial			WP_002682345.1	CorA family divalent cation transporter	61.6	61.3	37.4
MGA_1239	LOCUS_12340	sequence1:1251537..1251740(-)	partial			WP_164405755.1	DUF3272 family protein	74.6	74.6	64.0
MGA_1262	LOCUS_12570	sequence1:1279058..1279549(-)	frameshift		1279569	WP_011922181.1	pseudouridine synthase	99.4	68.1	64.2
MGA_1263	LOCUS_12580	sequence1:1279558..1279773(-)	frameshift		1279569	WP_038431436.1	pseudouridine synthase	100.0	29.8	45.1
MGA_1266	LOCUS_12610	sequence1:1281792..1282832(-)	partial			WP_011836681.1	serine hydrolase	83.5	74.9	70.2
MGA_1269	LOCUS_12640	sequence1:1284786..1285571(-)	partial			WP_010922436.1	DNA internalization-related competence protein ComEC/Rec2	96.9	33.9	60.1
MGA_1277	LOCUS_12720	sequence1:1294522..1295358(-)	partial			WP_038431655.1	hypothetical protein	48.2	24.2	33.3
MGA_1367	LOCUS_13620	sequence1:1386461..1387123(-)	partial			WP_000511719.1	hypothetical protein	28.6	82.9	41.3
MGA_1368	LOCUS_13630	sequence1:1387132..1388448(-)	partial			WP_000241584.1	hypothetical protein	51.6	76.6	40.3
MGA_1380	LOCUS_13750	sequence1:1400841..1402295(-)	partial			WP_000020814.1	T7SS effector LXG polymorphic toxin	42.1	44.0	29.9
MGA_1396	LOCUS_13910	sequence1:1419326..1420993(-)	partial			WP_000762954.1	DUF262 domain-containing protein	32.6	30.6	39.8
MGA_1409	LOCUS_14040	sequence1:1436027..1438138(-)	partial			WP_010932366.1	AAA family ATPase	77.2	73.1	22.9
MGA_1506	LOCUS_15000	sequence1:1548669..1548797(+)	frameshift,internal_stop_codon	1548925..1548927(+)	1548782	WP_088197863.1	IS3-like element ISSag2 family transposase	90.5	10.3	92.1
MGA_1507	LOCUS_15010	sequence1:1548988..1549317(-)	frameshift,internal_stop_codon	1549330..1549332(-)	1549002	WP_000556335.1	PTS sugar transporter subunit IIC	96.3	26.9	48.6
MGA_1588	LOCUS_15820	sequence1:1623769..1624107(-)	partial			WP_001830526.1	DsrE/DsrF/DrsH-like family protein	81.2	24.7	39.6
MGA_1615	LOCUS_16090	sequence1:1654493..1655218(-)	partial			WP_000704662.1	site-specific integrase	100.0	62.6	63.8
MGA_1665	LOCUS_16590	sequence1:1700957..1702018(-)	partial			WP_050984070.1	AbrB family transcriptional regulator	43.9	42.8	23.1
MGA_1671	LOCUS_16650	sequence1:1708099..1708308(-)	partial			WP_002286804.1	hypothetical protein	87.0	53.6	51.7
MGA_1672	LOCUS_16660	sequence1:1708458..1708706(-)	frameshift		1708490	WP_003243530.1	flavin reductase family protein	82.9	32.4	44.1
MGA_1678	LOCUS_16720	sequence1:1713493..1713786(-)	partial			WP_000503137.1	GNAT family protein	100.0	42.9	80.4
MGA_1679	LOCUS_16730	sequence1:1713798..1714211(-)	partial			WP_000908499.1	MFS transporter	92.7	31.9	52.0
MGA_1685	LOCUS_16790	sequence1:1718763..1719380(+)	partial			WP_006268963.1	hypothetical protein	65.9	66.7	42.2
MGA_1726	LOCUS_17200	sequence1:1758163..1758318(-)	partial			WP_002321387.1	BglG family transcription antiterminator	100.0	7.8	54.9
MGA_1779	LOCUS_17730	sequence1:1810093..1822710(-)	partial			WP_036095565.1	isopeptide-forming domain-containing fimbrial protein	7.2	78.2	25.5
MGA_1780	LOCUS_17740	sequence1:1822751..1825582(-)	partial			WP_011082576.1	accumulation-associated protein Aap	68.8	39.7	23.9
MGA_1854	LOCUS_18480	sequence1:1907891..1908751(+)	partial			WP_010922690.1	streptokinase	86.4	62.0	29.1
MGA_1867	LOCUS_18610	sequence1:1921608..1921988(-)	partial			WP_000402394.1	helix-turn-helix transcriptional regulator	100.0	64.0	44.4
MGA_1869	LOCUS_18630	sequence1:1923245..1925446(-)	partial			WP_012256402.1	PucR family transcriptional regulator	20.7	28.8	32.9
MGA_1878	LOCUS_18720	sequence1:1935818..1936087(-)	partial			WP_011222020.1	metalloregulator ArsR/SmtB family transcription factor	82.0	61.3	47.9
