# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_3	LOCUS_00020	sequence001:1051..1839(-)	partial			WP_012775242.1	TPM domain-containing protein	63.4	64.3	59.6
MGA_88	LOCUS_00850	sequence002:5340..6218(-)	partial			WP_000998260.1	glycosyltransferase	99.7	42.1	38.3
MGA_89	LOCUS_00860	sequence002:6220..7965(-)	partial			WP_001263850.1	SP_1767 family glycosyltransferase	51.5	73.4	54.2
MGA_91	LOCUS_00880	sequence002:8946..9821(-)	partial			WP_000998260.1	glycosyltransferase	99.7	42.1	34.8
MGA_96	LOCUS_00920	sequence002:15229..17112(-)	partial			WP_010774274.1	phage tail tip lysozyme	99.4	68.5	40.2
MGA_102	LOCUS_00980	sequence002:22457..27124(-)	partial			WP_010989916.1	collagen binding domain-containing protein	33.0	31.8	24.4
MGA_128	LOCUS_01240	sequence002:53083..54159(-)	frameshift		54167	WP_012775277.1	FtsX-like permease family protein	95.8	52.0	41.4
MGA_129	LOCUS_01250	sequence002:54147..55094(-)	frameshift		54170	WP_012775277.1	FtsX-like permease family protein	98.1	46.2	53.1
MGA_132	LOCUS_01280	sequence002:57464..58033(-)	frameshift		57472	WP_012027525.1	response regulator transcription factor	97.9	82.8	75.0
MGA_142	LOCUS_01340	sequence005:150..1496(-)	partial			WP_012775522.1	GbpC/Spa domain-containing protein	95.8	27.3	53.0
MGA_158	LOCUS_01410	sequence011:464..988(-)	partial			WP_011837563.1	Cna B-type domain-containing protein	67.8	7.5	51.7
MGA_184	LOCUS_01640	sequence013:22068..22334(-)	partial			WP_008760854.1	bifunctional 3-deoxy-7-phosphoheptulonate synthase/chorismate mutase type II	96.6	24.1	32.9
MGA_202	LOCUS_01820	sequence013:44910..45659(+)	frameshift		45650	WP_002261920.1	GIY-YIG nuclease family protein	99.6	73.2	73.8
MGA_203	LOCUS_01830	sequence013:45667..45924(+)	frameshift		45656	WP_040804636.1	GIY-YIG nuclease family protein	92.9	23.2	75.9
MGA_224	LOCUS_01990	sequence016:5475..9380(-)	partial			WP_011837563.1	Cna B-type domain-containing protein	92.1	74.6	37.4
MGA_226	LOCUS_02010	sequence016:11998..14352(-)	partial			WP_012775593.1	ZmpA/ZmpB/ZmpC family metallo-endopeptidase	43.1	18.4	28.5
MGA_227	LOCUS_02020	sequence016:14518..20346(-)	partial			WP_000682783.1	G5 domain-containing protein	16.6	11.8	37.6
MGA_263	LOCUS_02380	sequence017:8990..9367(-)	partial			WP_074390220.1	IS630 family transposase	97.6	43.3	48.4
MGA_274	LOCUS_02490	sequence017:17330..18310(-)	partial			WP_000705149.1	O antigen biosynthesis rhamnosyltransferase RfbN	71.8	70.7	26.7
MGA_275	LOCUS_02500	sequence017:18303..19535(-)	partial			WP_223217130.1	glycosyltransferase family 1 protein	83.7	74.9	38.6
MGA_374	LOCUS_03480	sequence019:24690..25076(+)	frameshift		25055	WP_148255728.1	IS5 family transposase	97.7	46.8	72.0
MGA_375	LOCUS_03490	sequence019:25181..25495(+)	frameshift		25064	WP_224783972.1	IS5 family transposase	97.1	38.1	78.2
MGA_401	LOCUS_03740	sequence020:16035..16211(-)	partial			WP_000048054.1	30S ribosomal protein S21	74.1	74.1	100.0
MGA_405	LOCUS_03780	sequence020:20635..34047(-)	partial			WP_000515824.1	beta-N-acetylglucosaminidase domain-containing protein	33.7	54.2	55.3
MGA_430	LOCUS_04030	sequence021:13691..14140(+)	partial			WP_012775625.1	DUF6287 domain-containing protein	61.1	33.7	49.5
MGA_431	LOCUS_04040	sequence021:14407..14859(-)	partial			WP_000737133.1	helix-turn-helix transcriptional regulator	46.7	70.7	54.3
MGA_433	LOCUS_04060	sequence021:15899..16489(-)	partial			WP_011101082.1	helix-turn-helix transcriptional regulator	38.8	62.5	45.5
MGA_434	LOCUS_04070	sequence021:16742..17224(+)	partial			WP_001008113.1	hypothetical protein	58.8	62.9	28.1
MGA_448	LOCUS_04210	sequence021:30288..35441(+)	partial			WP_011836870.1	ZmpA/ZmpB/ZmpC family metallo-endopeptidase	50.5	28.3	50.3
MGA_462	LOCUS_04330	sequence022:2279..2854(+)	frameshift		2228	WP_002262670.1	hdrR negative regulator HdrM	79.1	65.8	24.2
MGA_496	LOCUS_04670	sequence022:36701..37342(-)	partial			WP_011837497.1	D-alanyl-D-alanine carboxypeptidase family protein	86.9	70.6	62.2
MGA_502	LOCUS_04730	sequence022:43327..44523(-)	partial			WP_011836924.1	ZmpA/ZmpB/ZmpC family metallo-endopeptidase	58.3	12.3	25.0
MGA_504	LOCUS_04750	sequence023:3499..4371(+)	partial			WP_011461245.1	MBOAT family protein	100.0	61.8	37.8
MGA_505	LOCUS_04760	sequence023:4389..5807(+)	partial			WP_016357000.1	alginate O-acetylation protein AlgJ	50.2	47.7	23.3
MGA_511	LOCUS_04820	sequence023:12520..13065(+)	partial			WP_002294234.1	chorismate mutase	61.3	40.0	42.0
MGA_512	LOCUS_04830	sequence023:13056..14009(+)	partial			WP_011922118.1	glycosyltransferase family 2 protein	71.9	65.3	36.1
MGA_515	LOCUS_04860	sequence023:16301..17092(+)	partial			WP_001058925.1	glycosyltransferase family 52 protein	85.6	71.7	40.7
MGA_533	LOCUS_05040	sequence023:35982..36620(-)	partial			WP_003596039.1	helix-turn-helix domain-containing protein	30.7	31.1	50.8
MGA_536	LOCUS_05070	sequence023:40911..42986(+)	partial			WP_011837563.1	Cna B-type domain-containing protein	95.7	41.3	36.6
MGA_545	LOCUS_05150	sequence024:9557..10612(-)	frameshift		10641	WP_005797442.1	glycosyltransferase family 8 protein	30.5	23.6	37.4
MGA_556	LOCUS_05260	sequence024:18899..22669(-)	partial			WP_011836823.1	GbpC/Spa domain-containing protein	45.5	39.5	28.6
MGA_576	LOCUS_05460	sequence024:49939..50124(-)	partial			WP_000704762.1	DNA topology modulation protein	93.4	31.6	54.4
MGA_577	LOCUS_05470	sequence024:50301..50546(-)	partial			WP_002897695.1	DNA topology modulation protein	91.4	43.4	57.3
MGA_612	LOCUS_05820	sequence024:88516..88917(+)	internal_stop_codon	88245..88247(+)		WP_140834349.1	DNA alkylation repair protein	98.5	60.1	61.8
MGA_653	LOCUS_06230	sequence025:41074..41313(-)	partial			WP_011254116.1	site-specific integrase	84.8	19.1	71.6
MGA_664	LOCUS_06330	sequence026:12888..13379(-)	frameshift,internal_stop_codon	13434..13436(-)	13488	WP_002262444.1	RpiB/LacA/LacB family sugar-phosphate isomerase	98.8	76.7	61.5
MGA_672	LOCUS_06410	sequence026:20636..21874(-)	partial			WP_010922066.1	AAA family ATPase	91.0	49.7	25.3
MGA_677	LOCUS_06460	sequence026:23428..24087(-)	partial			WP_000424672.1	Rha family transcriptional regulator	65.8	69.2	53.5
MGA_679	LOCUS_06480	sequence026:24530..25183(+)	partial			WP_012027034.1	XRE family transcriptional regulator	38.2	31.2	50.6
MGA_702	LOCUS_06700	sequence027:9671..10243(-)	frameshift		10364	WP_011836406.1	glycosyltransferase family 2 protein	93.7	61.6	29.4
MGA_703	LOCUS_06710	sequence027:10356..10568(-)	frameshift		10388	WP_002383750.1	glycosyltransferase	81.4	17.6	54.4
MGA_735	LOCUS_07020	sequence028:12577..13236(+)	partial			WP_012775187.1	CPBP family intramembrane metalloprotease	42.5	40.6	38.7
MGA_737	LOCUS_07040	sequence028:14044..15627(-)	partial			WP_011837107.1	ATP-binding protein	43.5	42.2	49.8
MGA_811	LOCUS_07760	sequence030:27372..27704(-)	partial			WP_000331954.1	hypothetical protein	73.6	82.2	50.6
MGA_833	LOCUS_07970	sequence031:13537..13890(-)	partial			WP_012775462.1	helix-turn-helix transcriptional regulator	64.1	63.0	58.7
MGA_851	LOCUS_08150	sequence032:1821..6356(+)	frameshift		1818	WP_013390242.1	Ig-like domain-containing protein	92.9	77.3	45.7
MGA_890	LOCUS_08530	sequence033:15345..16565(+)	partial			WP_000038635.1	helicase	12.3	38.2	56.0
MGA_916	LOCUS_08780	sequence034:15598..16473(-)	partial			WP_003895789.1	excalibur calcium-binding domain-containing protein	15.5	71.4	75.6
MGA_931	LOCUS_08920	sequence035:2433..2570(+)	partial			WP_000831905.1	50S ribosomal protein L34	57.8	59.1	92.3
MGA_935	LOCUS_08960	sequence035:5616..6323(+)	partial			WP_003547408.1	DNA/RNA non-specific endonuclease	47.7	36.7	35.4
MGA_960	LOCUS_09210	sequence035:37462..38142(-)	partial			WP_002359765.1	hypothetical protein	66.8	53.4	29.5
MGA_982	LOCUS_09430	sequence035:49905..50072(+)	partial			WP_000220553.1	hypothetical protein	98.2	41.8	64.3
MGA_986	LOCUS_09470	sequence035:50904..51308(+)	partial			WP_002399989.1	YopX family protein	58.2	53.8	41.0
MGA_989	LOCUS_09500	sequence035:51831..52058(+)	partial			WP_011109521.1	class I SAM-dependent methyltransferase	92.0	43.1	59.4
MGA_1011	LOCUS_09720	sequence035:64450..67521(+)	partial			WP_001795393.1	phage tail tape measure protein	84.2	60.3	18.4
MGA_1013	LOCUS_09740	sequence035:67883..70834(+)	partial			WP_010922449.1	gp58-like family protein	41.1	64.5	30.5
MGA_1020	LOCUS_09810	sequence035:73636..74361(+)	partial			WP_010922095.1	glucosaminidase domain-containing protein	99.6	60.8	70.4
MGA_1034	LOCUS_09940	sequence036:4810..15363(-)	partial			WP_000489923.1	alpha-like surface protein	37.2	78.5	31.5
MGA_1042	LOCUS_10020	sequence036:25622..26029(-)	frameshift		26111	WP_012775056.1	LD-carboxypeptidase LdcB/DacB	98.5	52.6	73.7
MGA_1043	LOCUS_10030	sequence036:26088..26483(-)	frameshift		26105	WP_012775056.1	LD-carboxypeptidase LdcB/DacB	63.4	33.5	41.7
MGA_1073	LOCUS_10320	sequence037:27022..27231(-)	partial			WP_100190734.1	IS3 family transposase	100.0	13.2	88.4
MGA_1110	LOCUS_10670	sequence039:13683..13949(-)	partial			WP_002938604.1	DUF6290 family protein	71.6	84.0	79.4
MGA_1127	LOCUS_10830	sequence040:5165..6409(+)	partial			WP_012061841.1	family 16 glycosylhydrolase	39.9	33.1	26.6
MGA_1132	LOCUS_10880	sequence040:12570..13340(+)	partial			WP_052846403.1	ABC transporter permease	75.8	69.8	23.5
MGA_1143	LOCUS_10990	sequence040:24899..25180(+)	frameshift		25114	WP_000749954.1	hypothetical protein	78.5	53.3	50.7
MGA_1190	LOCUS_11430	sequence043:10772..11077(+)	partial			WP_010964944.1	DUF4176 domain-containing protein	79.2	59.4	51.2
MGA_1233	LOCUS_11850	sequence045:15434..15724(+)	partial			WP_012775696.1	preprotein translocase subunit YajC	81.2	72.0	79.5
MGA_1315	LOCUS_12650	sequence047:3291..3563(-)	partial			WP_001254394.1	YiaA/YiaB family inner membrane protein	73.3	84.6	53.0
MGA_1371	LOCUS_13180	sequence049:17871..18446(+)	partial			WP_002903684.1	DUF4352 domain-containing protein	76.4	74.9	61.0
MGA_1372	LOCUS_13190	sequence049:18807..19166(-)	partial			WP_011921671.1	HAD-IA family hydrolase	99.2	55.9	58.5
MGA_1384	LOCUS_13310	sequence050:14513..14980(+)	internal_stop_codon	14978..14980(+)		WP_011100919.1	ABC-F family ATP-binding cassette domain-containing protein	100.0	30.6	45.8
MGA_1404	LOCUS_13490	sequence052:1..1590(+)	partial			WP_013399748.1	Rib/alpha-like domain-containing protein	93.6	16.1	28.8
MGA_1420	LOCUS_13640	sequence053:1786..2772(-)	partial			WP_012775182.1	MFS transporter	96.0	74.5	51.1
MGA_1423	LOCUS_13670	sequence053:3405..3617(-)	frameshift,internal_stop_codon	3405..3407(-)	3248,3238	WP_001105159.1	IS5 family transposase	92.9	24.3	52.3
MGA_1424	LOCUS_13680	sequence053:3640..3918(-)	partial			WP_012775182.1	MFS transporter	95.7	20.8	72.7
MGA_1432	LOCUS_13760	sequence053:14043..15086(-)	partial			WP_003549759.1	LPXTG cell wall anchor domain-containing protein	91.6	69.9	29.2
MGA_1443	LOCUS_13860	sequence054:4032..4460(-)	partial			WP_100190734.1	IS3 family transposase	97.2	26.4	67.4
MGA_1472	LOCUS_14140	sequence056:189..938(-)	partial			WP_011142015.1	ABC transporter permease	69.1	46.9	28.5
MGA_1476	LOCUS_14180	sequence056:3755..4282(-)	partial			WP_010947583.1	endopeptidase La	64.6	14.7	33.1
MGA_1486	LOCUS_14280	sequence056:12496..13014(-)	frameshift		13030	WP_000452107.1	Cof-type HAD-IIB family hydrolase	100.0	37.6	65.5
MGA_1487	LOCUS_14290	sequence056:13001..13867(-)	frameshift		13030	WP_002901047.1	Cof-type HAD-IIB family hydrolase	96.2	59.3	54.2
MGA_1533	LOCUS_14740	sequence057:49042..50334(-)	partial			WP_004083337.1	radical SAM protein	74.4	72.2	27.5
MGA_1550	LOCUS_14910	sequence057:66464..68524(-)	partial			WP_011964235.1	N-6 DNA methylase	66.6	59.8	26.1
MGA_1555	LOCUS_14960	sequence058:873..1310(+)	partial			WP_010879839.1	hypothetical protein	53.1	76.2	46.8
MGA_1559	LOCUS_15000	sequence058:3291..4709(+)	frameshift		4664	WP_002399687.1	DNA polymerase	97.2	71.5	50.2
MGA_1560	LOCUS_15010	sequence058:4682..5227(+)	frameshift		4667	WP_002399687.1	DNA polymerase	100.0	27.7	47.3
MGA_1561	LOCUS_15020	sequence058:5238..6623(+)	partial			WP_010714181.1	VapE family protein	98.7	57.8	44.3
MGA_1562	LOCUS_15030	sequence058:6606..7112(-)	frameshift		7212	WP_115265112.1	IS630 family transposase	100.0	48.0	79.8
MGA_1563	LOCUS_15040	sequence058:7144..7650(-)	frameshift		7158	WP_148255720.1	IS630 family transposase	98.8	47.6	49.4
MGA_1575	LOCUS_15150	sequence059:6822..13574(-)	partial			WP_025189858.1	glycoside hydrolase family 31 protein	57.2	69.5	45.5
MGA_1595	LOCUS_15320	sequence062:706..1437(+)	partial			WP_010922334.1	PASTA domain-containing protein	52.3	79.4	40.2
MGA_1618	LOCUS_15530	sequence063:8930..9367(-)	partial			WP_011837153.1	GNAT family N-acetyltransferase	62.1	64.1	47.3
MGA_1625	LOCUS_15590	sequence064:582..992(+)	frameshift		570	WP_011254576.1	peptide cleavage/export ABC transporter	98.5	18.9	32.8
MGA_1641	LOCUS_15740	sequence065:5593..10752(-)	partial			WP_199567761.1	glycoside hydrolase family 2 TIM barrel-domain containing protein	34.7	25.1	51.5
MGA_1642	LOCUS_15750	sequence066:1..678(+)	partial			WP_013061396.1	tyrosine-type recombinase/integrase	85.8	61.3	40.9
MGA_1668	LOCUS_16000	sequence068:13312..13986(+)	partial			WP_011921718.1	competence type IV pilus ATPase ComGA	54.9	38.9	73.2
MGA_1672	LOCUS_16040	sequence068:15713..15904(+)	partial			WP_011921722.1	competence type IV pilus minor pilin ComGE	81.0	52.6	51.0
MGA_1674	LOCUS_16060	sequence068:16297..16731(+)	partial			WP_000265622.1	competence type IV pilus minor pilin ComGG	41.7	43.8	48.3
MGA_1703	LOCUS_16350	sequence068:38558..41641(+)	partial			WP_010922451.1	phage tail spike protein	42.0	69.5	41.3
MGA_1709	LOCUS_16410	sequence068:43211..43942(+)	partial			WP_010922095.1	glucosaminidase domain-containing protein	99.6	60.8	59.2
MGA_1713	LOCUS_16450	sequence068:46941..47267(+)	partial			WP_010922083.1	minor capsid protein	94.4	73.7	31.4
MGA_1749	LOCUS_16780	sequence071:1071..1769(-)	partial			WP_010989918.1	class B sortase	78.4	72.4	32.1
MGA_1754	LOCUS_16830	sequence071:6846..7298(-)	partial			WP_011101497.1	alcohol dehydrogenase catalytic domain-containing protein	97.3	42.1	84.9
MGA_1755	LOCUS_16840	sequence071:7210..7755(-)	partial			WP_011101497.1	alcohol dehydrogenase catalytic domain-containing protein	84.0	43.8	75.0
MGA_1766	LOCUS_16930	sequence074:6553..>7917(-)	partial			WP_000527121.1	YSIRK signal domain/LPXTG anchor domain surface protein	93.4	18.2	33.0
MGA_1784	LOCUS_17080	sequence077:208..1449(-)	partial			WP_168549381.1	SAG1250 family conjugative relaxase	96.9	63.9	55.1
MGA_1786	LOCUS_17100	sequence077:1804..3291(-)	partial			WP_002484399.1	type IA DNA topoisomerase	65.7	47.9	33.9
MGA_1889	LOCUS_18030	sequence087:241..3483(+)	partial			WP_000795191.1	bacterial Ig-like domain-containing protein	90.5	59.3	45.3
MGA_1909	LOCUS_18190	sequence090:3371..3952(+)	partial			WP_010933538.1	restriction endonuclease subunit S	98.4	40.1	47.9
MGA_1915	LOCUS_18250	sequence090:13288..13926(+)	partial			WP_003577315.1	phospholipase A2 family protein	75.0	74.4	28.7
MGA_1950	LOCUS_18600	sequence090:52209..52898(+)	partial			WP_000511719.1	hypothetical protein	25.3	76.3	46.6
MGA_1961	LOCUS_18710	sequence090:61293..61427(-)	partial			WP_012774985.1	cysteine synthase A	90.9	13.0	92.5
MGA_1971	LOCUS_18780	sequence092:1409..2089(+)	partial			WP_011222005.1	protein rep	100.0	74.3	45.6
MGA_1995	LOCUS_18970	sequence098:1547..1747(+)	partial			WP_002225616.1	hemagglutinin repeat-containing protein	75.8	1.8	62.0
MGA_2067	LOCUS_19650	sequence102:387..2636(-)	partial			WP_002903447.1	hypothetical protein	26.0	43.2	40.1
MGA_2080	LOCUS_19750	sequence106:1052..2035(+)	partial			WP_000792779.1	bacterial Ig-like domain-containing protein	93.0	17.6	47.1
