# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_146	LOCUS_01370	sequence011:23457..24026(-)	partial			WP_002456715.1	DUF4064 domain-containing protein	74.1	71.9	31.8
MGA_150	LOCUS_01410	sequence011:26944..>29169(-)	partial			WP_003147473.1	Ig-like domain-containing protein	92.4	27.4	35.4
MGA_170	LOCUS_01550	sequence021:13357..14442(-)	partial			WP_001831714.1	DUF4064 domain-containing protein	71.2	78.3	48.7
MGA_227	LOCUS_02120	sequence021:71355..75773(+)	partial			WP_002485275.1	glucosaminidase domain-containing protein	69.6	74.6	38.7
MGA_238	LOCUS_02230	sequence021:86459..86854(-)	partial			WP_001240655.1	N-acetylmuramoyl-L-alanine amidase	79.4	55.1	44.2
MGA_252	LOCUS_02300	sequence028:803..1183(+)	frameshift		1162,1300	WP_029376395.1	tandem-type lipoprotein	85.7	44.0	46.9
MGA_254	LOCUS_02320	sequence028:1624..2247(+)	frameshift		2193	WP_001802015.1	tandem-type lipoprotein	87.0	72.2	46.6
MGA_258	LOCUS_02360	sequence028:3615..4151(+)	frameshift		3640,3547	WP_029376395.1	tandem-type lipoprotein	93.3	67.7	35.6
MGA_270	LOCUS_02480	sequence028:16091..16321(-)	partial			WP_001794540.1	twin-arginine translocase TatA/TatE family subunit	69.7	71.6	73.6
MGA_281	LOCUS_02590	sequence028:29239..29928(+)	partial			WP_002470184.1	YdcF family protein	96.5	69.8	43.9
MGA_363	LOCUS_03410	sequence029:28538..29320(+)	internal_stop_codon	29318..29320(+)		WP_000433354.1	M42 family metallopeptidase	99.2	75.2	72.1
MGA_370	LOCUS_03480	sequence029:34467..35453(+)	frameshift		35423	WP_001041351.1	tryptophan synthase subunit beta	96.0	78.0	85.1
MGA_371	LOCUS_03490	sequence029:35459..35695(+)	frameshift		35423	WP_001041351.1	tryptophan synthase subunit beta	93.6	18.1	72.6
MGA_445	LOCUS_04210	sequence032:35945..36550(-)	partial			WP_000070642.1	DUF4352 domain-containing protein	82.1	53.2	29.1
MGA_447	LOCUS_04230	sequence032:37446..38552(+)	partial			WP_004399048.1	endonuclease YokF	66.6	80.7	42.5
MGA_448	LOCUS_04240	sequence032:38651..39658(-)	partial			WP_000070642.1	DUF4352 domain-containing protein	43.3	43.8	57.9
MGA_526	LOCUS_05010	sequence033:17424..18692(+)	frameshift		18662	WP_002437845.1	YSIRK domain-containing triacylglycerol lipase GehC	85.5	45.2	22.0
MGA_527	LOCUS_05020	sequence033:18749..19861(+)	frameshift		18662	WP_002437845.1	YSIRK domain-containing triacylglycerol lipase GehC	100.0	53.6	68.6
MGA_579	LOCUS_05540	sequence034:49982..51772(-)	partial			WP_011015494.1	metallophosphoesterase family protein	71.0	63.3	25.7
MGA_601	LOCUS_05760	sequence034:78000..82079(-)	partial			WP_041814900.1	Rib/alpha-like domain-containing protein	58.5	49.2	32.8
MGA_615	LOCUS_05900	sequence034:90370..91740(-)	partial			WP_000736784.1	glycine-glycine endopeptidase LytM	32.7	46.2	39.6
MGA_621	LOCUS_05960	sequence034:95035..95907(-)	frameshift		95951	WP_005619903.1	acetamidase/formamidase family protein	98.6	69.5	63.8
MGA_622	LOCUS_05970	sequence034:95949..96227(-)	frameshift		95951	WP_003896733.1	acetamidase/formamidase family protein	100.0	22.2	59.8
MGA_630	LOCUS_06050	sequence035:6246..8357(-)	partial			WP_001830607.1	assimilatory sulfite reductase (NADPH) flavoprotein subunit	55.0	63.0	54.5
MGA_664	LOCUS_06390	sequence035:42335..42943(-)	partial			WP_000956137.1	hypothetical protein	95.5	58.5	67.9
MGA_719	LOCUS_06940	sequence036:44755..44922(-)	internal_stop_codon	44947..44949(-)		WP_002468316.1	class I mannose-6-phosphate isomerase	100.0	17.6	72.7
MGA_720	LOCUS_06950	sequence036:44947..45690(-)	internal_stop_codon	44947..44949(-)		WP_002468316.1	class I mannose-6-phosphate isomerase	100.0	79.5	54.6
MGA_818	LOCUS_07910	sequence039:11182..12084(+)	partial			WP_002470268.1	FtsQ-type POTRA domain-containing protein	94.7	61.6	51.9
MGA_894	LOCUS_08660	sequence040:39762..40691(-)	partial			WP_010921843.1	ABC transporter permease/substrate binding protein	98.1	51.0	32.5
MGA_904	LOCUS_08760	sequence040:51048..52211(-)	partial			WP_000673890.1	MFS transporter	48.1	45.6	27.9
MGA_909	LOCUS_08810	sequence040:57540..58232(+)	partial			WP_000176178.1	alpha/beta hydrolase-fold protein	75.2	74.8	31.1
MGA_934	LOCUS_09060	sequence042:15831..16166(-)	partial			WP_002440082.1	diacylglycerol kinase family protein	76.6	72.0	57.6
MGA_975	LOCUS_09440	sequence044:33915..35186(-)	partial			WP_107515759.1	elastin-binding protein EbpS	62.2	69.6	23.5
MGA_1091	LOCUS_10590	sequence046:43055..45088(-)	partial			WP_012583944.1	AraC family transcriptional regulator	14.6	34.5	35.4
MGA_1092	LOCUS_10600	sequence046:45553..46980(+)	partial			WP_002485785.1	YSIRK-type signal peptide-containing protein	93.1	62.4	23.3
MGA_1155	LOCUS_11230	sequence048:245..409(+)	partial			WP_011117494.1	RepB family plasmid replication initiator protein	100.0	19.7	85.2
MGA_1178	LOCUS_11450	sequence050:15100..15489(+)	internal_stop_codon	15487..15489(+)		WP_041272586.1	helix-turn-helix transcriptional regulator	93.8	33.2	33.6
MGA_1179	LOCUS_11460	sequence050:15559..16200(+)	partial			WP_000578732.1	helix-turn-helix transcriptional regulator	99.1	58.2	28.0
MGA_1268	LOCUS_12350	sequence051:92..331(-)	partial			WP_001548645.1	YneF family protein	70.9	58.9	64.3
MGA_1356	LOCUS_13230	sequence053:30912..31715(+)	partial			WP_002485467.1	NAD(P)H-binding protein	60.3	32.1	28.6
MGA_1361	LOCUS_13280	sequence053:36781..37377(+)	partial			WP_002468207.1	type II CAAX endopeptidase family protein	92.9	73.8	39.7
MGA_1390	LOCUS_13570	sequence053:69188..69391(-)	frameshift,internal_stop_codon	69394..69396(-)	69576	WP_001012225.1	FemA/FemB family glycyltransferase FmhA	89.6	14.4	80.0
MGA_1391	LOCUS_13580	sequence053:69388..70419(-)	frameshift,internal_stop_codon	69394..69396(-)	69576	WP_001012225.1	FemA/FemB family glycyltransferase FmhA	84.0	69.2	57.3
MGA_1438	LOCUS_14030	sequence055:10272..11240(+)	frameshift		10128	WP_012546117.1	ImmA/IrrE family metallo-endopeptidase	92.5	75.6	36.2
MGA_1440	LOCUS_14050	sequence055:11684..12502(-)	partial			WP_011101255.1	AraC family transcriptional regulator	48.2	39.3	27.6
MGA_1441	LOCUS_14060	sequence055:12864..24071(+)	partial			WP_220738881.1	DUF1542 domain-containing protein	49.2	77.3	20.0
MGA_1449	LOCUS_14140	sequence055:35443..36639(-)	partial			WP_124797038.1	putative glycoside hydrolase	86.4	72.6	34.4
MGA_1485	LOCUS_14500	sequence057:16665..17030(-)	partial			WP_011948529.1	Hsp20/alpha crystallin family protein	71.9	60.3	42.0
MGA_1490	LOCUS_14550	sequence058:35..694(+)	partial			WP_011117511.1	LPXTG cell wall anchor domain-containing protein	61.6	72.1	33.8
MGA_1509	LOCUS_14740	sequence058:25296..25433(+)	partial			WP_000240855.1	50S ribosomal protein L34	60.0	60.0	100.0
MGA_1534	LOCUS_14980	sequence061:2341..4719(+)	partial			WP_049387514.1	MSCRAMM-like protein SdrH	37.6	63.0	36.7
MGA_1538	LOCUS_15020	sequence061:8069..8440(+)	partial			WP_010989411.1	DUF1433 domain-containing protein	78.9	73.2	43.6
MGA_1541	LOCUS_15050	sequence061:9636..10436(+)	internal_stop_codon	9630..9632(+)		WP_011461029.1	Fic family protein	99.2	66.3	31.5
MGA_1592	LOCUS_15560	sequence061:59906..60250(-)	frameshift		60261	WP_000838159.1	carbonic anhydrase	96.5	58.8	59.1
MGA_1593	LOCUS_15570	sequence061:60217..60474(-)	frameshift		60261	WP_003423380.1	carbonic anhydrase	83.5	37.8	59.2
MGA_1675	LOCUS_16390	sequence062:68495..69322(-)	partial			WP_000070831.1	DUF4887 domain-containing protein	21.5	26.8	57.6
MGA_1683	LOCUS_16470	sequence062:75045..75374(-)	partial			WP_010922054.1	helix-turn-helix transcriptional regulator	68.8	29.6	64.0
MGA_1697	LOCUS_16600	sequence063:2373..3623(-)	partial			WP_003420541.1	replicative DNA helicase	76.0	73.3	36.0
MGA_1699	LOCUS_16620	sequence063:3977..4291(-)	partial			WP_000132051.1	helix-turn-helix domain-containing protein	85.6	36.6	62.9
MGA_1700	LOCUS_16630	sequence063:4410..4751(-)	partial			WP_000511415.1	DnaD domain protein	66.4	25.9	36.0
MGA_1703	LOCUS_16660	sequence063:5987..6658(-)	partial			WP_002383799.1	ERF family protein	77.1	72.5	33.3
MGA_1717	LOCUS_16780	sequence067:1089..1268(-)	partial			WP_001096113.1	LLM class flavin-dependent oxidoreductase	94.9	15.9	78.6
MGA_1730	LOCUS_16910	sequence068:3206..3841(-)	partial			WP_002485463.1	poly-gamma-glutamate hydrolase family protein	96.2	45.6	41.4
MGA_1755	LOCUS_17160	sequence070:10922..11437(-)	partial			WP_002456715.1	DUF4064 domain-containing protein	77.8	68.4	38.5
MGA_1762	LOCUS_17230	sequence070:18945..20681(-)	partial			WP_011100946.1	glycosyltransferase	83.2	53.5	24.1
MGA_1763	LOCUS_17240	sequence070:21227..21565(+)	frameshift		21517,21493	WP_000745891.1	MSCRAMM family adhesin clumping factor ClfB	86.6	10.3	38.8
MGA_1764	LOCUS_17250	sequence070:21447..24323(+)	frameshift		21517,21511	WP_000934467.1	MSCRAMM family adhesin SdrD	49.9	34.4	23.5
MGA_1772	LOCUS_17330	sequence070:29992..30417(-)	partial			WP_001198795.1	DUF805 domain-containing protein	72.3	83.3	40.6
MGA_1775	LOCUS_17360	sequence070:33100..34476(-)	frameshift,internal_stop_codon	34515..34517(-)	34502	WP_000181735.1	ATP-dependent helicase	97.6	74.2	31.9
MGA_1776	LOCUS_17370	sequence070:34515..34871(-)	frameshift,internal_stop_codon	34515..34517(-)	34502	WP_000181735.1	ATP-dependent helicase	88.1	17.6	45.7
MGA_1778	LOCUS_17390	sequence070:37594..37809(+)	frameshift,internal_stop_codon	37531..37533(+),37807..37809(+),37411..37413(+)	37370	WP_055164393.1	IS30 family transposase	95.8	22.0	71.0
MGA_1779	LOCUS_17400	sequence070:37849..38130(+)	internal_stop_codon	37807..37809(+),38128..38130(+)		WP_055164393.1	IS30 family transposase	96.8	28.7	61.1
MGA_1780	LOCUS_17410	sequence070:38309..39202(-)	partial			WP_035050627.1	site-specific DNA-methyltransferase	97.6	41.5	51.0
MGA_1781	LOCUS_17420	sequence071:165..341(-)	partial			WP_000048060.1	30S ribosomal protein S21	74.1	74.1	100.0
MGA_1821	LOCUS_17810	sequence073:4760..6040(+)	partial			WP_000676539.1	Glu-specific serine endopeptidase SspA	54.5	69.6	45.0
MGA_1822	LOCUS_17820	sequence073:6438..6725(-)	partial			WP_003246542.1	glucose starvation-inducible protein GsiB	100.0	66.7	55.2
MGA_1855	LOCUS_18130	sequence076:6674..8476(-)	partial			WP_011082576.1	accumulation-associated protein Aap	21.7	8.9	52.6
MGA_1856	LOCUS_18140	sequence076:8979..9605(-)	partial			WP_011082831.1	MSCRAMM family adhesin SdrF	95.2	12.1	30.0
MGA_1860	LOCUS_18180	sequence077:3644..4309(-)	partial			WP_002485581.1	hypothetical protein	71.0	73.8	36.4
MGA_1877	LOCUS_18340	sequence078:11685..12443(-)	internal_stop_codon	11685..11687(-)		WP_001033761.1	hypothetical protein	96.0	33.3	51.7
MGA_1882	LOCUS_18390	sequence079:4341..5357(-)	frameshift,internal_stop_codon	5378..5380(-)	5374	WP_000570687.1	alanine/glycine:cation symporter family protein	96.4	62.3	71.8
MGA_1883	LOCUS_18400	sequence079:5378..5932(-)	frameshift,internal_stop_codon	5378..5380(-)	5374	WP_000570687.1	alanine/glycine:cation symporter family protein	96.7	34.1	79.8
MGA_2005	LOCUS_19610	sequence083:2601..2951(+)	partial			WP_010965201.1	HNH endonuclease signature motif containing protein	66.4	73.8	53.2
MGA_2010	LOCUS_19660	sequence083:6747..7301(+)	partial			WP_137615044.1	phage major capsid protein	82.1	29.1	49.3
MGA_2011	LOCUS_19670	sequence083:7342..8682(+)	partial			WP_010905714.1	phage major capsid protein	66.8	75.8	43.7
MGA_2017	LOCUS_19730	sequence083:10943..11422(+)	partial			WP_001115046.1	Ig domain-containing protein	76.1	39.7	38.5
MGA_2022	LOCUS_19780	sequence083:17548..20079(+)	partial			WP_001795393.1	phage tail tape measure protein	19.9	11.1	36.6
MGA_2024	LOCUS_19800	sequence083:20651..22714(+)	partial			WP_000369014.1	hypothetical protein	17.2	19.7	32.0
MGA_2032	LOCUS_19880	sequence083:28194..28757(+)	partial			WP_011705890.1	ImmA/IrrE family metallo-endopeptidase	65.8	30.8	37.4
MGA_2125	LOCUS_20800	sequence084:102815..107281(+)	partial			WP_015704442.1	putative mucin/carbohydrate-binding domain-containing protein	47.1	69.8	25.9
MGA_2128	LOCUS_20830	sequence084:110467..111021(-)	partial			WP_003229340.1	RDD family protein	74.5	82.3	40.6
MGA_2169	LOCUS_21240	sequence086:604..2127(+)	partial			WP_002469217.1	CDP-glycerol glycerophosphotransferase family protein	95.9	66.0	26.9
MGA_2170	LOCUS_21250	sequence086:2130..2774(+)	partial			WP_009897033.1	YdcF family protein	58.4	52.4	33.6
MGA_2216	LOCUS_21660	sequence091:338..1642(-)	partial			WP_002489707.1	hypothetical protein	49.5	79.1	46.1
MGA_2224	LOCUS_21740	sequence091:8932..9387(+)	partial			WP_010989411.1	DUF1433 domain-containing protein	38.4	44.9	41.4
MGA_2261	LOCUS_22080	sequence096:1621..2400(-)	partial			WP_048065733.1	HNH endonuclease	52.9	57.3	42.7
MGA_2277	LOCUS_22230	sequence097:9647..11356(+)	internal_stop_codon	9638..9640(+)		WP_002470205.1	AraC family transcriptional regulator Rsp	97.9	79.7	21.9
MGA_2289	LOCUS_22320	sequence101:6395..8059(+)	partial			WP_011108297.1	FAD-dependent oxidoreductase	97.1	65.5	37.3
MGA_2292	LOCUS_22350	sequence101:9732..10073(+)	frameshift		9687	WP_000358995.1	thioredoxin-dependent arsenate reductase	97.3	84.0	85.5
MGA_2294	LOCUS_22370	sequence101:10552..11085(+)	frameshift,internal_stop_codon	11339..11341(+)	11067	WP_004554540.1	DUF5655 domain-containing protein	95.5	54.5	56.8
MGA_2298	LOCUS_22400	sequence102:1094..1366(-)	internal_stop_codon	1094..1096(-)		WP_003244896.1	thymidylate synthase	98.9	31.9	57.3
MGA_2301	LOCUS_22430	sequence102:3664..4221(-)	partial			WP_002322009.1	protein rep	76.8	46.4	56.3
MGA_2307	LOCUS_22470	sequence103:2821..3447(-)	partial			WP_004527343.1	DNA-3-methyladenine glycosylase	91.3	60.6	34.7
MGA_2331	LOCUS_22650	sequence112:219..941(+)	frameshift		905	WP_001830636.1	acyltransferase family protein	98.3	39.0	58.5
MGA_2332	LOCUS_22660	sequence112:896..2035(+)	frameshift		905	WP_001830636.1	acyltransferase family protein	98.2	62.1	51.5
MGA_2359	LOCUS_22930	sequence112:26607..26945(+)	partial			WP_001829897.1	SprT family protein	100.0	74.2	60.7
MGA_2361	LOCUS_22950	sequence113:640..>1222(-)	partial			WP_000801979.1	Abi family protein	100.0	59.9	59.1
MGA_2364	LOCUS_22980	sequence114:1509..1991(-)	partial			WP_010963585.1	TspO/MBR family protein	72.5	70.6	35.8
MGA_2374	LOCUS_23080	sequence114:10009..10818(+)	frameshift		10794	WP_002389992.1	IS30-like element IS6770 family transposase	98.1	82.8	58.3
