# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_1	LOCUS_00010	sequence1:303..1145(+)	frameshift,internal_stop_codon	1147..1149(+)	1139	WP_011674284.1	glutamate racemase	96.4	55.2	47.8
MGA_13	LOCUS_00130	sequence1:9990..12332(+)	partial			WP_011101641.1	translation initiation factor IF-2	77.1	69.6	72.0
MGA_41	LOCUS_00410	sequence1:43494..43853(-)	partial			WP_010906384.1	hypothetical protein	91.6	48.9	34.8
MGA_54	LOCUS_00540	sequence1:54457..54774(+)	partial			WP_003640811.1	YlbG family protein	74.3	78.0	39.7
MGA_80	LOCUS_00800	sequence1:77945..78307(+)	frameshift		77912	WP_002295936.1	ASCH domain-containing protein	99.2	78.9	44.2
MGA_82	LOCUS_00820	sequence1:78892..79110(-)	frameshift		79078	WP_003699994.1	GNAT family N-acetyltransferase	76.4	31.3	48.4
MGA_83	LOCUS_00830	sequence1:79073..79465(-)	frameshift		79078	WP_003699994.1	GNAT family N-acetyltransferase	96.9	64.1	44.5
MGA_98	LOCUS_00980	sequence1:95112..95582(+)	frameshift		95465	WP_003642591.1	amidophosphoribosyltransferase	69.9	22.3	68.8
MGA_99	LOCUS_00990	sequence1:95552..96529(+)	frameshift		95465	WP_002382407.1	amidophosphoribosyltransferase	99.7	67.4	64.2
MGA_103	LOCUS_01030	sequence1:99767..99982(+)	frameshift		99961	WP_000866776.1	phosphoribosylamine--glycine ligase	87.3	15.6	55.2
MGA_104	LOCUS_01040	sequence1:99979..101013(+)	frameshift		99958	WP_014570649.1	phosphoribosylamine--glycine ligase	98.0	82.0	49.6
MGA_106	LOCUS_01060	sequence1:102781..103413(+)	partial			WP_000469013.1	bifunctional 3,4-dihydroxy-2-butanone 4-phosphate synthase/GTP cyclohydrolase II	95.2	49.4	51.0
MGA_107	LOCUS_01070	sequence1:103642..104349(-)	partial			WP_003641460.1	helix-turn-helix transcriptional regulator	35.7	26.5	39.3
MGA_128	LOCUS_01280	sequence1:123874..124854(+)	partial			WP_011475804.1	membrane protein insertase YidC	69.9	73.6	45.2
MGA_142	LOCUS_01420	sequence1:139731..140228(+)	partial			WP_003565600.1	cell division regulator GpsB	68.5	81.7	49.1
MGA_165	LOCUS_01650	sequence1:162542..163102(+)	frameshift		162509	WP_010905789.1	GTP cyclohydrolase I FolE	96.2	51.6	58.3
MGA_183	LOCUS_01830	sequence1:183305..186772(-)	partial			WP_002852392.1	HAD-IA family hydrolase	28.6	30.3	31.5
MGA_184	LOCUS_01840	sequence1:186940..188121(-)	partial			WP_003645039.1	CDP-glycerol glycerophosphotransferase family protein	95.4	58.2	53.3
MGA_185	LOCUS_01850	sequence1:188225..191662(-)	partial			WP_002852392.1	HAD-IA family hydrolase	28.9	30.5	32.0
MGA_209	LOCUS_02090	sequence1:213071..214222(-)	partial			WP_011074562.1	serine hydrolase	64.5	69.9	26.0
MGA_211	LOCUS_02110	sequence1:215139..215636(-)	internal_stop_codon	215679..215681(-)		WP_011476037.1	PTS transporter subunit EIIC	97.0	35.6	49.4
MGA_212	LOCUS_02120	sequence1:215679..216410(-)	internal_stop_codon	215679..215681(-)		WP_011101275.1	PTS transporter subunit EIIC	99.6	57.7	23.8
MGA_214	LOCUS_02140	sequence1:217631..218491(-)	partial			WP_013531164.1	alpha/beta hydrolase	73.8	69.2	25.7
MGA_217	LOCUS_02170	sequence1:220193..220951(-)	frameshift,internal_stop_codon	220999..221001(-)	220224,221004	WP_002262583.1	D-alanyl-lipoteichoic acid biosynthesis protein DltB	96.4	57.9	63.8
MGA_218	LOCUS_02180	sequence1:220948..221343(-)	frameshift,internal_stop_codon	220999..221001(-)	221004	WP_009659556.1	D-alanyl-lipoteichoic acid biosynthesis protein DltB	87.8	27.8	50.4
MGA_220	LOCUS_02200	sequence1:223113..224267(-)	partial			WP_003594959.1	serine hydrolase domain-containing protein	72.9	71.8	27.8
MGA_237	LOCUS_02370	sequence1:241687..242967(+)	partial			WP_011101838.1	Ig-like domain-containing protein	80.8	60.5	31.2
MGA_239	LOCUS_02390	sequence1:245763..247034(+)	partial			WP_000582678.1	bifunctional glutamate--cysteine ligase GshA/glutathione synthetase GshB	96.5	52.9	34.0
MGA_280	LOCUS_02800	sequence1:287187..289964(-)	partial			WP_010964394.1	hypothetical protein	32.9	9.4	28.2
MGA_295	LOCUS_02950	sequence1:304944..305165(-)	partial			WP_010905450.1	TIGR00266 family protein	98.6	31.0	55.6
MGA_300	LOCUS_03000	sequence1:308777..309352(-)	partial			WP_010963779.1	TetR/AcrR family transcriptional regulator	35.6	36.4	41.2
MGA_336	LOCUS_03360	sequence1:344784..345149(-)	frameshift		344801	WP_003550049.1	DUF3290 domain-containing protein	97.5	79.2	30.5
MGA_366	LOCUS_03660	sequence1:373178..373501(+)	internal_stop_codon	373499..373501(+)		WP_002296572.1	transcriptional repressor LexA	96.3	50.2	47.2
MGA_367	LOCUS_03670	sequence1:373550..373789(+)	internal_stop_codon	373499..373501(+)		WP_003640747.1	transcriptional repressor LexA	94.9	35.7	49.3
MGA_373	LOCUS_03730	sequence1:378890..379822(-)	partial			WP_003640710.1	molecular chaperone DnaJ	53.9	43.9	58.9
MGA_390	LOCUS_03900	sequence1:395213..395947(-)	partial			WP_003642122.1	LysM domain-containing protein	94.7	72.3	19.0
MGA_394	LOCUS_03940	sequence1:400915..401400(-)	partial			WP_011101709.1	competence/damage-inducible protein A	92.5	36.2	53.3
MGA_401	LOCUS_04010	sequence1:408409..408612(-)	frameshift		408638	WP_010906368.1	gluconokinase	94.0	12.1	57.1
MGA_402	LOCUS_04020	sequence1:408576..409943(-)	frameshift		408638	WP_010906368.1	gluconokinase	95.2	81.9	63.4
MGA_411	LOCUS_04110	sequence1:418211..418801(-)	partial			WP_011837359.1	nucleoside-triphosphate diphosphatase	95.4	56.6	31.1
MGA_415	LOCUS_04150	sequence1:422633..423181(-)	partial			WP_011101268.1	Asp-tRNA(Asn)/Glu-tRNA(Gln) amidotransferase subunit GatA	99.5	37.6	70.5
MGA_418	LOCUS_04170	sequence1:424603..424752(-)	frameshift		424892	WP_011836815.1	RsmF rRNA methyltransferase first C-terminal domain-containing protein	83.7	9.4	46.3
MGA_419	LOCUS_04180	sequence1:424881..425972(-)	frameshift		424895	WP_003640460.1	RsmF rRNA methyltransferase first C-terminal domain-containing protein	98.9	78.9	53.3
MGA_484	LOCUS_04820	sequence1:483896..491050(-)	partial			WP_011254514.1	DUF1542 domain-containing protein	78.8	70.8	22.6
MGA_489	LOCUS_04870	sequence1:496902..497702(-)	frameshift		497746	WP_002289184.1	carboxypeptidase M32	98.5	52.6	54.2
MGA_490	LOCUS_04880	sequence1:497690..498268(-)	frameshift,internal_stop_codon	498278..498280(-)	497746	WP_002289184.1	carboxypeptidase M32	87.0	33.5	40.7
MGA_515	LOCUS_05130	sequence1:516695..517582(-)	partial			WP_003709392.1	DNA/RNA non-specific endonuclease	74.6	79.3	55.6
MGA_554	LOCUS_05500	sequence2:31592..31885(+)	internal_stop_codon	31502..31504(+)		WP_003131406.1	TVP38/TMEM64 family protein	99.0	48.8	46.9
MGA_564	LOCUS_05600	sequence2:42971..43711(-)	partial			WP_011476055.1	PBP1A family penicillin-binding protein	93.9	31.1	39.3
MGA_570	LOCUS_05660	sequence2:48593..50476(-)	partial			WP_000796600.1	heavy metal translocating P-type ATPase	92.3	73.7	55.8
MGA_580	LOCUS_05760	sequence2:58902..59768(+)	partial			WP_003569796.1	YihY/virulence factor BrkB family protein	84.4	73.4	24.2
MGA_586	LOCUS_05820	sequence2:65446..66114(-)	partial			WP_010880879.1	NAD(P)H-hydrate dehydratase	99.5	42.7	39.4
MGA_595	LOCUS_05910	sequence2:73917..74246(+)	partial			WP_002667298.1	PC4/YdbC family ssDNA-binding protein	57.8	82.9	57.1
MGA_602	LOCUS_05980	sequence2:79669..80916(+)	partial			WP_002286064.1	HAMP domain-containing sensor histidine kinase	67.2	63.5	33.2
MGA_611	LOCUS_06070	sequence2:87425..88546(+)	partial			WP_011475582.1	ATP-binding protein	69.7	67.1	50.4
MGA_653	LOCUS_06480	sequence2:131418..132131(+)	partial			WP_003643232.1	MucBP domain-containing protein	95.8	65.4	26.2
MGA_670	LOCUS_06650	sequence2:146740..146964(+)	partial			WP_003639224.1	F0F1 ATP synthase subunit C	71.6	75.7	69.8
MGA_688	LOCUS_06820	sequence2:169776..170609(+)	partial			WP_003660856.1	SAM-dependent methyltransferase	66.1	74.5	33.9
MGA_758	LOCUS_07520	sequence2:222092..223777(+)	partial			WP_002289023.1	NAD(P)/FAD-dependent oxidoreductase	87.7	73.3	45.3
MGA_772	LOCUS_07660	sequence2:236846..237385(-)	partial			WP_011109294.1	GNAT family N-acetyltransferase	86.0	32.5	34.8
MGA_774	LOCUS_07680	sequence2:239268..240062(-)	partial			WP_002359986.1	phage tail tip lysozyme	51.9	15.5	59.1
MGA_793	LOCUS_07860	sequence2:260915..264670(+)	partial			WP_011254514.1	DUF1542 domain-containing protein	39.1	17.6	27.7
MGA_794	LOCUS_07870	sequence2:265099..275235(+)	partial			WP_011836739.1	accessory Sec-dependent serine-rich glycoprotein adhesin	35.6	70.6	25.6
MGA_806	LOCUS_07990	sequence2:287517..288170(+)	partial			WP_002264906.1	CHAP domain-containing protein	80.2	73.9	36.8
MGA_807	LOCUS_08000	sequence2:288246..288788(+)	partial			WP_003549855.1	C40 family peptidase	68.3	40.8	29.3
MGA_831	LOCUS_08230	sequence2:314398..315105(+)	partial			WP_011254484.1	rhomboid family intramembrane serine protease	74.9	77.4	31.6
MGA_841	LOCUS_08330	sequence2:322358..322867(+)	partial			WP_003644309.1	dUTP diphosphatase	51.5	48.6	36.8
MGA_844	LOCUS_08350	sequence2:323794..324327(-)	partial			WP_003140884.1	TM2 domain-containing protein	43.5	71.2	43.8
MGA_849	LOCUS_08400	sequence2:326222..327121(+)	partial			WP_010989346.1	alpha/beta hydrolase	82.9	69.0	34.0
MGA_851	LOCUS_08420	sequence2:329481..331454(-)	partial			WP_103372260.1	CDP-glycerol glycerophosphotransferase family protein	55.6	42.3	31.1
MGA_867	LOCUS_08560	sequence2:342329..343120(+)	frameshift		343099	WP_003733179.1	DUF1254 domain-containing protein	97.3	56.4	39.5
MGA_868	LOCUS_08570	sequence2:343168..343689(+)	frameshift		343099	WP_003733179.1	DUF1254 domain-containing protein	100.0	38.4	50.0
MGA_879	LOCUS_08680	sequence2:353463..353666(+)	internal_stop_codon	353664..353666(+)		WP_010706547.1	PTS glucose transporter subunit IIA	97.0	39.6	51.5
MGA_880	LOCUS_08690	sequence2:353700..353960(+)	internal_stop_codon	353664..353666(+)		WP_013363031.1	PTS glucose transporter subunit IIA	96.5	48.2	44.0
MGA_881	LOCUS_08700	sequence2:353986..355491(+)	frameshift,internal_stop_codon	353958..353960(+)	353996	WP_011674207.1	PTS glucose transporter subunit IIABC	99.2	74.4	52.4
MGA_884	LOCUS_08730	sequence2:358557..359666(-)	partial			WP_011073890.1	diguanylate cyclase	45.5	26.2	35.6
MGA_885	LOCUS_08740	sequence2:359946..360317(+)	internal_stop_codon	360315..360317(+)		WP_001227915.1	bifunctional glycosyltransferase family 2/GtrA family protein	95.9	33.0	40.8
MGA_886	LOCUS_08750	sequence2:360357..361010(+)	internal_stop_codon	360315..360317(+)		WP_011016893.1	bifunctional glycosyltransferase family 2/GtrA family protein	98.6	60.8	40.2
MGA_887	LOCUS_08760	sequence2:361007..363010(+)	partial			WP_011861594.1	glycosyltransferase	82.6	71.4	37.1
MGA_893	LOCUS_08820	sequence2:366556..367167(+)	internal_stop_codon	367165..367167(+)		WP_027479748.1	3-hydroxyacyl-CoA dehydrogenase	100.0	68.6	52.7
MGA_894	LOCUS_08830	sequence2:367177..367443(+)	internal_stop_codon	367165..367167(+)		WP_027479748.1	3-hydroxyacyl-CoA dehydrogenase	100.0	29.4	52.8
MGA_911	LOCUS_09000	sequence2:383458..386268(+)	partial			WP_011860904.1	glycosylating toxin TcdA	52.1	20.8	24.9
MGA_913	LOCUS_09020	sequence2:386735..386887(-)	frameshift		386994	WP_011675075.1	threonine/serine exporter family protein	92.0	18.1	69.6
MGA_914	LOCUS_09030	sequence2:386977..387477(-)	frameshift		386994	WP_011675075.1	threonine/serine exporter family protein	89.8	58.7	49.0
MGA_926	LOCUS_09140	sequence2:397231..399117(-)	partial			WP_011102038.1	SH3 domain-containing protein	34.4	24.1	24.7
MGA_928	LOCUS_09160	sequence2:401052..403208(+)	frameshift		401014	WP_011101706.1	YfhO family protein	56.8	40.5	28.5
MGA_937	LOCUS_09250	sequence2:411826..412329(+)	partial			WP_003643457.1	YdcF family protein	92.8	44.3	36.2
MGA_940	LOCUS_09280	sequence2:413539..414447(+)	frameshift		414276,414669	WP_011674878.1	DUF2075 domain-containing protein	67.5	50.8	44.1
MGA_941	LOCUS_09290	sequence2:414363..414704(+)	frameshift		414276,414669	WP_011674878.1	DUF2075 domain-containing protein	89.4	24.6	48.5
MGA_942	LOCUS_09300	sequence2:414755..415891(+)	partial			WP_001816819.1	isochorismate synthase	70.6	65.5	39.9
MGA_1033	LOCUS_10180	sequence3:23194..23625(+)	partial			WP_003546774.1	DNA repair protein RadC	78.3	54.1	38.4
MGA_1060	LOCUS_10450	sequence3:48752..49807(+)	partial			WP_011101680.1	cell division protein FtsQ/DivIB	64.1	73.9	32.9
MGA_1063	LOCUS_10480	sequence3:52633..53070(+)	partial			WP_002286627.1	cell division protein SepF	73.8	49.2	39.3
MGA_1070	LOCUS_10550	sequence3:59386..62070(+)	partial			WP_011101675.1	ATP-dependent RecD-like DNA helicase	63.3	67.0	47.7
MGA_1104	LOCUS_10890	sequence3:97200..98231(+)	partial			WP_011674723.1	C40 family peptidase	69.1	57.5	26.1
MGA_1111	LOCUS_10960	sequence3:102204..102962(+)	partial			WP_000612272.1	competence protein CoiA family protein	39.3	23.7	41.4
MGA_1113	LOCUS_10980	sequence3:105019..105399(+)	partial			WP_003641537.1	DUF948 domain-containing protein	57.1	52.2	52.8
MGA_1141	LOCUS_11250	sequence3:130425..130610(+)	partial			WP_003638914.1	30S ribosomal protein S21	72.1	71.0	88.6
MGA_1154	LOCUS_11380	sequence3:142302..145067(+)	partial			WP_003700578.1	DNA translocase FtsK	57.8	68.1	53.9
MGA_1171	LOCUS_11540	sequence3:156436..156654(+)	partial			WP_010922480.1	XRE family transcriptional regulator	91.7	26.7	41.8
MGA_1194	LOCUS_11770	sequence3:165746..166204(+)	partial			WP_002356090.1	Asp23/Gls24 family envelope stress response protein	84.9	69.4	50.4
MGA_1206	LOCUS_11890	sequence3:175563..176675(+)	frameshift		176333	WP_011475652.1	phage major capsid protein	68.4	63.6	56.9
MGA_1207	LOCUS_11900	sequence3:176573..176800(+)	partial			WP_011475652.1	phage major capsid protein	85.3	16.1	82.8
MGA_1208	LOCUS_11910	sequence3:176861..177205(+)	partial			WP_010905932.1	head-tail connector protein	72.8	74.8	32.9
MGA_1290	LOCUS_12710	sequence4:58142..58915(-)	partial			WP_003644005.1	biotin--[acetyl-CoA-carboxylase] ligase	95.3	74.8	33.3
MGA_1302	LOCUS_12830	sequence4:74220..74786(-)	partial			WP_011475701.1	DNA-directed RNA polymerase subunit delta	60.6	58.2	67.5
MGA_1322	LOCUS_13030	sequence4:95478..95798(-)	internal_stop_codon	95802..95804(-)		WP_000029196.1	ribose transporter RbsU	91.5	33.4	52.0
MGA_1323	LOCUS_13040	sequence4:95802..96389(-)	internal_stop_codon	95802..95804(-)		WP_003641602.1	GRP family sugar transporter	100.0	63.6	41.0
MGA_1334	LOCUS_13150	sequence4:112113..112769(-)	frameshift		112831	WP_206819539.1	alpha/beta hydrolase	99.1	69.1	51.2
MGA_1335	LOCUS_13160	sequence4:112748..113041(-)	frameshift		112837	WP_008764889.1	alpha/beta hydrolase	68.0	19.5	37.3
MGA_1338	LOCUS_13190	sequence4:115296..117599(-)	frameshift		117655	WP_010714416.1	collagen-binding MSCRAMM adhesin Ace	58.0	64.1	34.9
MGA_1339	LOCUS_13200	sequence4:117602..118177(-)	frameshift		117655	WP_010714416.1	collagen-binding MSCRAMM adhesin Ace	87.4	24.9	39.9
MGA_1352	LOCUS_13330	sequence4:131266..133920(+)	partial			WP_012972584.1	accessory Sec-dependent serine-rich glycoprotein adhesin	39.8	21.3	20.6
MGA_1354	LOCUS_13350	sequence4:135447..136670(+)	partial			WP_011101709.1	competence/damage-inducible protein A	70.0	67.9	49.1
MGA_1359	LOCUS_13400	sequence4:141864..142943(-)	internal_stop_codon	142974..142976(-)		WP_003245322.1	catalase KatA	98.6	73.3	59.6
MGA_1360	LOCUS_13410	sequence4:142974..143327(-)	internal_stop_codon	142974..142976(-)		WP_002379460.1	catalase	97.4	23.8	73.7
MGA_1374	LOCUS_13520	sequence4:156824..157519(-)	partial			WP_000450003.1	gluconokinase	58.4	26.6	30.9
MGA_1416	LOCUS_13930	sequence5:40575..41372(-)	partial			WP_000721136.1	peptidylprolyl isomerase	75.1	74.5	59.8
MGA_1434	LOCUS_14110	sequence5:57874..58941(-)	partial			WP_003245529.1	small-conductance mechanosensitive channel protein MscY	76.6	73.3	30.1
MGA_1475	LOCUS_14470	sequence6:11591..12568(-)	partial			WP_003642085.1	tRNA lysidine(34) synthetase TilS	96.9	69.6	31.9
MGA_1530	LOCUS_15010	sequence7:17833..18663(-)	partial			WP_011475863.1	DNA internalization-related competence protein ComEC/Rec2	94.9	35.5	39.6
