# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_4	LOCUS_00040	sequence1:2858..3358(-)	partial			WP_001197951.1	YehR family lipoprotein	74.1	69.3	34.7
MGA_16	LOCUS_00160	sequence1:15418..16083(-)	frameshift		16127	WP_001155321.1	IS30-like element ISSpn8 family transposase	99.1	69.1	70.8
MGA_17	LOCUS_00170	sequence1:16047..16370(-)	frameshift		16127	WP_205010637.1	IS30 family transposase	88.8	30.0	60.0
MGA_35	LOCUS_00340	sequence1:42830..43801(+)	frameshift		42821	WP_011269088.1	SEC-C metal-binding domain-containing protein	83.3	74.8	26.0
MGA_95	LOCUS_00940	sequence1:101912..107770(+)	partial			WP_011068088.1	FctA domain-containing protein	53.1	44.7	32.1
MGA_124	LOCUS_01220	sequence1:138674..140071(+)	partial			WP_002358661.1	LPXTG cell wall anchor domain-containing protein	18.5	81.7	40.0
MGA_125	LOCUS_01230	sequence1:140097..145907(+)	partial			WP_011836823.1	GbpC/Spa domain-containing protein	24.8	34.9	35.7
MGA_152	LOCUS_01500	sequence1:174209..174646(-)	frameshift,internal_stop_codon	174208..174210(-),174649..174651(-)	174726	WP_012972561.1	IS110 family transposase	98.6	35.8	81.1
MGA_153	LOCUS_01510	sequence1:174706..174894(-)	frameshift,internal_stop_codon	174967..174969(-),174649..174651(-)	174726	WP_156875129.1	transposase	95.2	26.7	88.1
MGA_154	LOCUS_01520	sequence1:174967..175161(-)	frameshift,internal_stop_codon	174967..174969(-)	174726	WP_162038636.1	IS110 family transposase	100.0	14.9	90.6
MGA_155	LOCUS_01530	sequence1:175493..175756(+)	frameshift		175750	WP_000255098.1	LD-carboxypeptidase	100.0	25.4	71.3
MGA_156	LOCUS_01540	sequence1:175779..176516(+)	frameshift		175750	WP_120770826.1	LD-carboxypeptidase	98.0	69.8	74.6
MGA_185	LOCUS_01830	sequence1:211374..211991(+)	partial			WP_002902226.1	L-ascorbate 6-phosphate lactonase	90.2	51.0	95.1
MGA_194	LOCUS_01920	sequence1:221322..222161(-)	frameshift		222211	WP_115283723.1	IS3 family transposase	99.6	61.8	79.1
MGA_218	LOCUS_02160	sequence1:241260..241484(-)	frameshift,internal_stop_codon	241191..241193(-)	241232,241274	WP_011836381.1	DUF308 domain-containing protein	93.2	40.4	84.1
MGA_234	LOCUS_02320	sequence1:256245..256739(+)	frameshift,internal_stop_codon	256650..256652(+),256125..256127(+)	256610	WP_102777394.1	IS3 family transposase	74.4	32.4	80.3
MGA_302	LOCUS_02990	sequence1:328969..329808(-)	frameshift		329858	WP_115283723.1	IS3 family transposase	99.6	61.8	79.1
MGA_341	LOCUS_03380	sequence1:371444..371758(+)	partial			WP_002983650.1	DNA-directed RNA polymerase subunit omega	62.5	61.9	92.3
MGA_357	LOCUS_03540	sequence1:387759..387911(+)	internal_stop_codon	387909..387911(+)		WP_000355907.1	cytidine deaminase	98.0	34.0	81.6
MGA_358	LOCUS_03550	sequence1:387918..388244(+)	internal_stop_codon	387909..387911(+)		WP_000355907.1	cytidine deaminase	80.6	60.4	74.7
MGA_376	LOCUS_03710	sequence1:411364..411555(+)	frameshift,internal_stop_codon	411844..411846(+)	411184,411804,411549	WP_102777394.1	IS3 family transposase	98.4	30.3	47.4
MGA_407	LOCUS_04020	sequence1:441126..441374(+)	internal_stop_codon	441372..441374(+)		WP_002902601.1	GNAT family N-acetyltransferase	100.0	56.9	59.8
MGA_408	LOCUS_04030	sequence1:441390..441563(+)	internal_stop_codon	441372..441374(+)		WP_002902601.1	GNAT family N-acetyltransferase	96.5	38.2	56.4
MGA_443	LOCUS_04380	sequence1:479550..479783(+)	partial			WP_002262696.1	hypothetical protein	71.4	67.9	67.3
MGA_474	LOCUS_04690	sequence1:505296..505619(+)	frameshift		505281	WP_002287457.1	DUF2798 domain-containing protein	96.3	70.9	40.0
MGA_512	LOCUS_05070	sequence1:554441..555619(+)	partial			WP_002680450.1	TPM domain-containing protein	51.8	76.1	33.5
MGA_524	LOCUS_05190	sequence1:566124..566765(-)	frameshift,internal_stop_codon	566921..566923(-)	566788	WP_011836763.1	metallophosphoesterase	100.0	74.5	69.0
MGA_573	LOCUS_05680	sequence1:628152..628889(-)	partial			WP_003722868.1	YdcF family protein	95.5	70.1	44.7
MGA_587	LOCUS_05820	sequence1:640096..640224(+)	frameshift		640218	WP_001156530.1	UDP-glucose 4-epimerase GalE	97.6	12.1	80.5
MGA_588	LOCUS_05830	sequence1:640269..641114(+)	frameshift		640218	WP_001156530.1	UDP-glucose 4-epimerase GalE	99.6	82.6	83.2
MGA_616	LOCUS_06110	sequence1:673786..674070(+)	internal_stop_codon	674068..674070(+)		WP_001237212.1	YbaN family protein	100.0	79.0	73.4
MGA_626	LOCUS_06210	sequence1:686639..686779(-)	partial			WP_002897213.1	SPJ_0845 family protein	67.4	68.9	90.3
MGA_669	LOCUS_06640	sequence1:725865..726326(+)	partial			WP_011837046.1	hypothetical protein	99.3	71.0	63.2
MGA_675	LOCUS_06700	sequence1:731597..732025(-)	partial			WP_011836891.1	hypothetical protein	70.4	72.5	40.6
MGA_685	LOCUS_06800	sequence1:742454..749437(+)	partial			WP_207215633.1	MucBP domain-containing protein	34.6	72.6	35.1
MGA_691	LOCUS_06860	sequence1:753755..754057(+)	partial			WP_002680353.1	hypothetical protein	99.0	67.3	71.7
MGA_700	LOCUS_06950	sequence1:761290..762120(+)	frameshift		761997	WP_012775274.1	pneumococcal-type histidine triad protein	82.6	27.9	48.3
MGA_701	LOCUS_06960	sequence1:762099..763331(+)	frameshift,internal_stop_codon	763330..763332(+)	761997	WP_012775274.1	pneumococcal-type histidine triad protein	100.0	47.9	60.8
MGA_737	LOCUS_07320	sequence1:800584..801465(+)	partial			WP_003722212.1	LysR family transcriptional regulator	66.2	65.8	30.9
MGA_739	LOCUS_07340	sequence1:802328..802768(+)	internal_stop_codon	802301..802303(+)		WP_011202637.1	carboxymuconolactone decarboxylase family protein	95.2	50.0	58.3
MGA_747	LOCUS_07420	sequence1:808490..808945(+)	partial			WP_010964318.1	ASCH domain-containing protein	75.5	71.3	43.0
MGA_751	LOCUS_07460	sequence1:812178..812534(+)	partial			WP_000566988.1	GNAT family N-acetyltransferase	100.0	71.1	90.7
MGA_756	LOCUS_07500	sequence1:815443..815943(+)	frameshift,internal_stop_codon	815401..815403(+)	815360	WP_002262027.1	flavocytochrome c	100.0	21.0	74.0
MGA_762	LOCUS_07560	sequence1:821754..822146(+)	internal_stop_codon	821751..821753(+)		WP_011461573.1	alpha/beta hydrolase	99.2	48.5	29.8
MGA_776	LOCUS_07700	sequence1:834243..834614(+)	frameshift		834545	WP_011836679.1	DUF805 domain-containing protein	81.3	26.6	48.0
MGA_777	LOCUS_07710	sequence1:834545..834784(+)	frameshift		834545	WP_011836679.1	DUF805 domain-containing protein	67.1	14.6	60.4
MGA_801	LOCUS_07950	sequence1:856609..857289(+)	internal_stop_codon	857287..857289(+)		WP_002897353.1	GNAT family N-acetyltransferase	96.9	75.5	58.4
MGA_809	LOCUS_08030	sequence1:867153..867329(+)	partial			WP_000048054.1	30S ribosomal protein S21	74.1	74.1	100.0
MGA_844	LOCUS_08380	sequence1:902151..902342(-)	partial			WP_002310781.1	DUF3173 domain-containing protein	74.6	77.0	51.1
MGA_859	LOCUS_08530	sequence1:913223..915994(+)	partial			WP_010946812.1	DUF927 domain-containing protein	26.4	46.6	20.7
MGA_866	LOCUS_08600	sequence1:922063..922443(+)	partial			WP_000721684.1	ABC transporter ATP-binding protein	63.5	31.6	52.5
MGA_881	LOCUS_08750	sequence1:939087..939215(-)	frameshift		939306	WP_011836974.1	sugar O-acetyltransferase	92.9	20.9	87.2
MGA_882	LOCUS_08760	sequence1:939244..939633(-)	frameshift		939306	WP_011836974.1	sugar O-acetyltransferase	84.5	58.3	76.1
MGA_883	LOCUS_08770	sequence1:939863..940450(-)	internal_stop_codon	939863..939865(-)		WP_011836975.1	PRD domain-containing protein	100.0	69.6	69.7
MGA_990	LOCUS_09840	sequence1:1048190..1049029(-)	frameshift		1049079	WP_115283723.1	IS3 family transposase	99.6	61.8	79.1
MGA_1024	LOCUS_10180	sequence1:1077401..1077535(-)	partial			WP_011836809.1	GNAT family N-acetyltransferase	81.8	24.5	69.4
MGA_1051	LOCUS_10450	sequence1:1107497..1107667(+)	partial			WP_002895160.1	DUF3042 family protein	71.4	71.4	90.0
MGA_1059	LOCUS_10530	sequence1:1115609..1116028(-)	frameshift		1116002	WP_011105965.1	hypothetical protein	93.5	64.8	54.6
MGA_1060	LOCUS_10540	sequence1:1115964..1116194(-)	frameshift		1116002	WP_011105965.1	hypothetical protein	86.8	33.2	53.0
MGA_1082	LOCUS_10760	sequence1:1143996..1145231(-)	partial			WP_011388495.1	ComF family protein	18.7	32.1	43.0
MGA_1083	LOCUS_10770	sequence1:1145224..1146228(-)	partial			WP_164922340.1	DNA-processing protein DprA	62.9	49.3	35.2
MGA_1084	LOCUS_10780	sequence1:1146331..1147641(-)	partial			WP_000301254.1	recombinase family protein	84.2	69.8	52.3
MGA_1085	LOCUS_10790	sequence1:1147586..1148809(-)	partial			WP_041272556.1	recombinase family protein	81.3	63.3	42.6
MGA_1086	LOCUS_10800	sequence1:1148953..1149900(-)	partial			WP_010774154.1	GH25 family lysozyme	30.5	21.5	64.6
MGA_1090	LOCUS_10840	sequence1:1150865..1154158(-)	partial			WP_001880132.1	phage tail spike protein	50.4	41.8	47.6
MGA_1100	LOCUS_10940	sequence1:1161666..1162349(-)	partial			WP_225426975.1	Clp protease ClpP	76.7	73.1	38.5
MGA_1105	LOCUS_10990	sequence1:1166042..1166257(-)	partial			WP_041272555.1	DUF4314 domain-containing protein	85.9	37.7	49.2
MGA_1116	LOCUS_11100	sequence1:1173886..1176171(-)	partial			WP_010950564.1	phage/plasmid primase, P4 family	45.9	73.2	31.0
MGA_1124	LOCUS_11180	sequence1:1181866..1182816(+)	partial			WP_001303996.1	hypothetical protein	47.5	68.8	33.3
MGA_1151	LOCUS_11450	sequence1:1210942..1213761(-)	partial			WP_002900650.1	GBS Bsp-like repeat-containing protein	81.5	58.7	52.8
MGA_1178	LOCUS_11720	sequence1:1240930..1244739(-)	partial			WP_012775602.1	GbpC/Spa domain-containing protein	91.9	71.3	30.1
MGA_1184	LOCUS_11780	sequence1:1249696..1250631(-)	partial			WP_001132444.1	replication initiator protein A	53.1	51.4	42.4
MGA_1197	LOCUS_11910	sequence1:1263066..1263323(-)	internal_stop_codon	1263066..1263068(-)		WP_002263641.1	GrpB family protein	100.0	42.3	54.1
MGA_1219	LOCUS_12130	sequence1:1286728..1287504(-)	internal_stop_codon	1287595..1287597(-)		WP_002904591.1	zinc-binding alcohol dehydrogenase family protein	100.0	80.6	69.0
MGA_1227	LOCUS_12210	sequence1:1294278..1295999(-)	partial			WP_011963670.1	AAA family ATPase	59.2	49.8	26.3
MGA_1236	LOCUS_12300	sequence1:1306288..1306548(-)	internal_stop_codon	1306768..1306770(-),1306564..1306566(-)		WP_000730279.1	DUF3169 family protein	93.0	32.8	55.0
MGA_1239	LOCUS_12330	sequence1:1306937..1307212(-)	frameshift		1307234	WP_002900787.1	helix-turn-helix transcriptional regulator	75.8	63.9	79.7
MGA_1312	LOCUS_13060	sequence1:1381018..1381944(+)	frameshift		1381977,1381911	WP_002263312.1	aminoacyltransferase	97.1	72.7	57.2
MGA_1313	LOCUS_13070	sequence1:1382065..1382265(+)	frameshift		1381980,1381911	WP_002919288.1	aminoacyltransferase	100.0	16.1	72.7
MGA_1346	LOCUS_13400	sequence1:1410619..1411248(+)	partial			WP_002263013.1	hypothetical protein	24.9	24.6	51.9
MGA_1365	LOCUS_13590	sequence1:1429636..1429899(-)	internal_stop_codon	1429636..1429638(-),1430032..1430034(-)		WP_000276229.1	IS1182-like element ISSmi2 family transposase	75.9	11.8	42.4
MGA_1366	LOCUS_13600	sequence1:1430032..1430907(-)	frameshift,internal_stop_codon	1430031..1430033(-)	1431026	WP_095092556.1	IS1182 family transposase	100.0	52.8	45.1
MGA_1367	LOCUS_13610	sequence1:1430925..1431161(-)	partial			WP_000547417.1	transposase	57.7	55.6	73.3
MGA_1374	LOCUS_13670	sequence1:1443021..1443314(-)	frameshift		1443296,1443407	WP_012048283.1	SulP family inorganic anion transporter	94.8	17.0	57.4
MGA_1465	LOCUS_14580	sequence1:1544533..1544703(+)	frameshift,internal_stop_codon	1544701..1544703(+)	1544528,1544908	WP_100190734.1	IS3 family transposase	96.4	10.5	52.7
MGA_1469	LOCUS_14620	sequence1:1548804..1548953(-)	internal_stop_codon	1548954..1548956(-)		WP_012028519.1	pseudouridine synthase	100.0	20.2	71.4
MGA_1470	LOCUS_14630	sequence1:1548954..1549532(-)	internal_stop_codon	1548954..1548956(-)		WP_012028519.1	pseudouridine synthase	100.0	79.3	74.0
MGA_1480	LOCUS_14730	sequence1:1564254..1564658(-)	internal_stop_codon	1564254..1564256(-)		WP_003702501.1	flavodoxin	97.0	83.3	58.5
MGA_1482	LOCUS_14750	sequence1:1565717..1566025(-)	frameshift		1566108	WP_011101849.1	LacI family DNA-binding transcriptional regulator	99.0	32.7	36.9
MGA_1483	LOCUS_14760	sequence1:1566022..1566588(-)	frameshift,internal_stop_codon	1566634..1566636(-)	1566108	WP_000200830.1	LacI family DNA-binding transcriptional regulator	85.1	51.3	52.2
MGA_1484	LOCUS_14770	sequence1:1566802..1567155(-)	frameshift,internal_stop_codon	1567190..1567192(-)	1567174,1566855	WP_000153219.1	Cof-type HAD-IIB family hydrolase	88.9	38.7	52.9
MGA_1485	LOCUS_14780	sequence1:1567190..1567492(-)	frameshift,internal_stop_codon	1567190..1567192(-)	1567174	WP_000153219.1	Cof-type HAD-IIB family hydrolase	96.0	36.1	59.8
MGA_1500	LOCUS_14930	sequence1:1580119..1580349(+)	partial			WP_002934707.1	hypothetical protein	98.7	47.8	70.7
MGA_1504	LOCUS_14970	sequence1:1582644..1583378(-)	frameshift,internal_stop_codon	1583441..1583443(-)	1583611	WP_011102204.1	6-phospho-beta-glucosidase	97.1	48.3	65.8
MGA_1505	LOCUS_14980	sequence1:1583564..1584085(-)	frameshift,internal_stop_codon	1583440..1583442(-)	1583610,1584084	WP_009931832.1	glycoside hydrolase family 1 protein	92.5	32.5	63.4
MGA_1524	LOCUS_15170	sequence1:1605819..1609418(-)	partial			WP_002900650.1	GBS Bsp-like repeat-containing protein	49.8	44.9	42.0
MGA_1558	LOCUS_15510	sequence1:1646216..1646383(+)	internal_stop_codon	1646381..1646383(+)		WP_115270946.1	IS110 family transposase	96.4	13.2	96.2
MGA_1592	LOCUS_15850	sequence1:1677782..1678402(-)	internal_stop_codon	1678508..1678510(-)		WP_011101571.1	restriction endonuclease	100.0	71.7	39.7
MGA_1597	LOCUS_15900	sequence1:1683546..1684427(-)	frameshift		1684450	WP_002263364.1	zinc-dependent alcohol dehydrogenase family protein	99.7	83.7	76.7
MGA_1598	LOCUS_15910	sequence1:1684424..1684591(-)	frameshift		1684450	WP_002263364.1	zinc-dependent alcohol dehydrogenase family protein	85.5	13.5	59.6
MGA_1610	LOCUS_16030	sequence1:1694670..1695020(+)	partial			WP_002902079.1	hypothetical protein	100.0	71.6	44.8
MGA_1611	LOCUS_16040	sequence1:1695266..1701751(-)	partial			WP_011837563.1	Cna B-type domain-containing protein	52.2	67.0	33.2
MGA_1649	LOCUS_16420	sequence1:1724797..1726320(-)	partial			WP_000777402.1	SpaH/EbpB family LPXTG-anchored major pilin	75.9	72.0	33.0
MGA_1653	LOCUS_16460	sequence1:1734164..1734436(-)	internal_stop_codon	1734485..1734487(-)		WP_011836334.1	uridine kinase	94.4	40.1	58.8
MGA_1654	LOCUS_16470	sequence1:1734485..1734811(-)	internal_stop_codon	1734485..1734487(-)		WP_011836334.1	uridine kinase	95.4	48.6	67.0
MGA_1657	LOCUS_16500	sequence1:1737235..1737666(-)	frameshift		1737710	WP_011836331.1	kinase	98.6	83.5	68.3
MGA_1662	LOCUS_16550	sequence1:1743094..1745190(-)	partial			WP_000671444.1	fibronectin-binding SSURE repeat adhesin PavB	85.5	51.1	53.2
MGA_1663	LOCUS_16560	sequence1:1745342..1745671(+)	internal_stop_codon	1745669..1745671(+)		WP_001066185.1	histidine phosphatase family protein	100.0	59.7	50.5
MGA_1664	LOCUS_16570	sequence1:1745678..1745878(+)	internal_stop_codon	1745669..1745671(+)		WP_001066185.1	histidine phosphatase family protein	86.4	31.5	45.6
MGA_1668	LOCUS_16610	sequence1:1749927..1751351(+)	frameshift		1751336,1751339,1751342	WP_078232918.1	Ltp family lipoprotein	36.1	20.5	38.5
MGA_1669	LOCUS_16620	sequence1:1751369..1751584(+)	frameshift		1751336,1751339,1751342	WP_078232918.1	Ltp family lipoprotein	74.6	7.1	54.4
MGA_1670	LOCUS_16630	sequence1:1751765..1751941(-)	frameshift,internal_stop_codon	1752116..1752118(-),1751765..1751767(-),1751951..1751953(-)	1751701	WP_002263494.1	ISL3-like element ISSmu2 family transposase	94.8	13.2	72.7
MGA_1671	LOCUS_16640	sequence1:1752156..1752395(-)	internal_stop_codon	1752116..1752118(-),1751951..1751953(-)		WP_002263494.1	ISL3-like element ISSmu2 family transposase	50.6	9.6	65.0
MGA_1672	LOCUS_16650	sequence1:1753003..1755297(-)	partial			WP_011948400.1	class I SAM-dependent DNA methyltransferase	51.4	83.5	30.1
MGA_1684	LOCUS_16770	sequence1:1765795..1766472(-)	partial			WP_000231291.1	acyltransferase	70.7	77.3	37.9
MGA_1700	LOCUS_16930	sequence1:1781982..1782419(-)	partial			WP_002917849.1	SP_0198 family lipoprotein	69.7	63.5	47.5
MGA_1719	LOCUS_17120	sequence1:1798430..1798936(-)	partial			WP_167939813.1	virulence RhuM family protein	96.4	45.7	59.3
MGA_1721	LOCUS_17140	sequence1:1800231..1800857(-)	partial			WP_095089160.1	helix-turn-helix transcriptional regulator	80.8	71.2	33.5
MGA_1730	LOCUS_17230	sequence1:1803747..1804538(+)	partial			WP_010905350.1	phage replisome organiser protein	62.7	58.9	49.7
MGA_1733	LOCUS_17260	sequence1:1806621..1806812(+)	partial			WP_011020810.1	type II toxin-antitoxin system HicA family toxin	92.1	74.0	43.1
MGA_1757	LOCUS_17500	sequence1:1832706..1835576(-)	partial			WP_011962196.1	PorP/SprF family type IX secretion system membrane protein	32.3	25.3	27.5
MGA_1772	LOCUS_17650	sequence1:1848912..1849751(+)	frameshift		1848861	WP_115283723.1	IS3 family transposase	99.6	61.8	79.1
MGA_1779	LOCUS_17720	sequence1:1856011..1857006(+)	partial			WP_002262569.1	DUF1700 domain-containing protein	23.0	39.9	58.2
MGA_1781	LOCUS_17740	sequence1:1858008..1858325(-)	partial			WP_011837702.1	polyphosphate polymerase domain-containing protein	91.4	40.5	68.8
MGA_1799	LOCUS_17920	sequence1:1878238..1879077(-)	frameshift		1879127	WP_115283723.1	IS3 family transposase	99.6	61.8	79.1
MGA_1814	LOCUS_18070	sequence1:1892366..1893055(-)	partial			WP_011141042.1	triose-phosphate isomerase	65.9	63.8	30.6
