# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_16	LOCUS_00160	sequence01:15345..15590(-)	partial			WP_002658367.1	rhodanese-like domain-containing protein	100.0	65.9	98.8
MGA_21	LOCUS_00210	sequence01:20051..20482(-)	frameshift		20477	WP_010957235.1	tRNA preQ1(34) S-adenosylmethionine ribosyltransferase-isomerase QueA	96.5	39.2	55.8
MGA_22	LOCUS_00220	sequence01:20445..21083(-)	frameshift		20477	WP_010957235.1	tRNA preQ1(34) S-adenosylmethionine ribosyltransferase-isomerase QueA	97.6	62.2	38.4
MGA_198	LOCUS_01980	sequence01:203345..204088(+)	partial			WP_002656686.1	hemolysin family protein	100.0	60.0	100.0
MGA_219	LOCUS_02190	sequence01:228542..228895(-)	partial			WP_010890332.1	SIMPL domain-containing protein	99.1	50.2	56.0
MGA_263	LOCUS_02630	sequence01:281314..281577(-)	partial			WP_010889722.1	RNA chaperone Hfq	100.0	54.7	100.0
MGA_298	LOCUS_02980	sequence01:310559..311185(-)	partial			WP_014023546.1	putative lipid II flippase FtsW	100.0	57.1	88.9
MGA_365	LOCUS_03650	sequence01:383395..383925(-)	partial			WP_010889737.1	hypothetical protein	100.0	69.0	100.0
MGA_400	LOCUS_04000	sequence01:422471..423058(+)	partial			WP_011964510.1	DNA/RNA non-specific endonuclease	89.7	64.3	39.4
MGA_495	LOCUS_04930	sequence01:516090..516473(+)	frameshift,internal_stop_codon	516004..516006(+),516007..516009(+),516034..516036(+)	515929,515978,516042,516097	WP_002675739.1	HAD family hydrolase	86.6	49.8	31.4
MGA_505	LOCUS_05030	sequence01:532851..533606(+)	partial			WP_011392090.1	NAD+ synthase	98.0	42.6	47.2
MGA_511	LOCUS_05090	sequence01:539367..540020(-)	frameshift		540025	WP_012870308.1	TIGR02757 family protein	91.2	77.5	34.0
MGA_657	LOCUS_06550	sequence01:712204..712926(-)	partial			WP_002657405.1	hypothetical protein	90.4	62.4	91.7
MGA_728	LOCUS_07260	sequence01:790807..791283(-)	partial			WP_010889814.1	ABC transporter permease	100.0	48.5	93.7
MGA_825	LOCUS_08230	sequence01:909915..910058(-)	frameshift		910144,910117,909913,910075,910174	WP_010883928.1	hypothetical protein	97.9	41.5	65.3
MGA_845	LOCUS_08430	sequence04:2387..2542(+)	frameshift,internal_stop_codon	2339..2341(+)	2527	WP_010883949.1	plasmid maintenance protein	100.0	41.8	70.6
MGA_846	LOCUS_08440	sequence04:3141..3605(+)	frameshift		3105	WP_010883946.1	plasmid maintenance protein	99.4	42.4	83.3
MGA_847	LOCUS_08450	sequence04:3598..3819(+)	partial			WP_010890331.1	lipoprotein P35	93.2	25.9	57.4
MGA_863	LOCUS_08610	sequence05:15349..15813(+)	partial			WP_010883946.1	plasmid maintenance protein	98.7	41.3	76.3
MGA_866	LOCUS_08640	sequence05:16603..16800(+)	partial			WP_010883946.1	plasmid maintenance protein	95.4	16.8	100.0
MGA_871	LOCUS_08690	sequence06:5377..5529(+)	frameshift,internal_stop_codon	5574..5576(+),5586..5588(+)	5377,5524	WP_010890335.1	S2/P23 family protein	98.0	17.4	57.1
MGA_872	LOCUS_08700	sequence06:6182..6355(-)	partial			WP_002657094.1	5'-methylthioadenosine/adenosylhomocysteine nucleosidase	86.0	18.5	71.4
MGA_882	LOCUS_08800	sequence06:16915..17097(+)	frameshift,internal_stop_codon	16831..16833(+),16885..16887(+),17095..17097(+),16861..16863(+),16891..16893(+)	17130,16772	WP_010890263.1	chromosome replication/partitioning protein	100.0	31.1	90.0
MGA_883	LOCUS_08810	sequence06:19935..20150(+)	frameshift,internal_stop_codon	20172..20174(+),19830..19832(+),19661..19663(+)	20129,19762,20237	WP_010883927.1	DNA methyltransferase	91.5	6.1	66.7
MGA_885	LOCUS_08830	sequence06:23508..23723(-)	frameshift		23519	WP_010883945.1	hypothetical protein	94.4	57.3	64.2
MGA_920	LOCUS_09160	sequence08:4027..4182(+)	frameshift		4000	WP_010890349.1	hypothetical protein	100.0	70.8	96.1
MGA_922	LOCUS_09180	sequence08:5953..6375(-)	internal_stop_codon	6421..6423(-),5953..5955(-)		WP_010890312.1	chromosome replication/partitioning protein	97.9	67.0	53.6
MGA_928	LOCUS_09240	sequence08:10033..10179(-)	frameshift,internal_stop_codon	10357..10359(-),10415..10417(-),10348..10350(-)	10344,10217,10279	WP_014023152.1	RNA-guided endonuclease TnpB family protein	100.0	12.7	79.2
MGA_937	LOCUS_09330	sequence08:17551..17805(-)	frameshift		17512	WP_183221031.1	DUF226 domain-containing protein	71.4	34.6	68.8
MGA_938	LOCUS_09340	sequence08:18427..18822(-)	frameshift		18872	WP_075552700.1	variable large family protein	93.9	41.5	40.4
MGA_939	LOCUS_09350	sequence08:18870..19979(-)	frameshift		18872,20029	WP_075552700.1	variable large family protein	61.8	65.7	39.5
MGA_940	LOCUS_09360	sequence08:20027..21319(-)	frameshift,internal_stop_codon	21476..21478(-)	20029	WP_075552700.1	variable large family protein	53.0	65.7	41.3
MGA_941	LOCUS_09370	sequence08:21476..26584(-)	internal_stop_codon	21476..21478(-)		WP_075552700.1	variable large family protein	13.8	68.6	39.8
MGA_945	LOCUS_09410	sequence09:2311..2616(+)	frameshift		2187,2343	WP_014023153.1	P13 family porin	96.0	57.5	85.6
MGA_946	LOCUS_09420	sequence09:2891..3649(-)	frameshift		3675	WP_014023152.1	RNA-guided endonuclease TnpB family protein	95.6	63.9	90.0
MGA_947	LOCUS_09430	sequence09:3661..4056(-)	frameshift		3675	WP_014023152.1	RNA-guided endonuclease TnpB family protein	96.2	33.4	90.5
MGA_952	LOCUS_09480	sequence09:7483..10779(-)	partial			WP_055166304.1	tape measure protein	16.6	16.6	24.2
MGA_956	LOCUS_09520	sequence09:12309..12518(-)	partial			WP_010256673.1	hypothetical protein	100.0	46.9	100.0
MGA_974	LOCUS_09700	sequence09:26657..27085(+)	partial			WP_010890289.1	DUF226 domain-containing protein	90.1	74.9	96.1
MGA_982	LOCUS_09780	sequence10:3136..3348(-)	partial			WP_010258957.1	DUF226 domain-containing protein	100.0	36.4	41.4
MGA_989	LOCUS_09850	sequence10:15136..15345(+)	frameshift		14913,15155,14961	WP_010890299.1	right-handed parallel beta-helix repeat-containing protein	76.8	6.0	52.8
MGA_997	LOCUS_09930	sequence10:23189..23383(-)	frameshift,internal_stop_codon	23530..23532(-),23386..23388(-)	23553	WP_010890288.1	plasmid maintenance protein	71.9	10.2	64.0
MGA_1000	LOCUS_09960	sequence10:26978..27445(-)	partial			WP_014023152.1	RNA-guided endonuclease TnpB family protein	87.7	36.1	89.7
MGA_1005	LOCUS_10000	sequence11:1618..1863(+)	partial			WP_010883946.1	plasmid maintenance protein	100.0	22.0	95.1
MGA_1008	LOCUS_10030	sequence11:3923..4315(+)	frameshift,internal_stop_codon	3880..3882(+)	3948	WP_010890343.1	lipoprotein	93.1	47.2	60.3
MGA_1010	LOCUS_10050	sequence11:6603..6833(+)	partial			WP_010890330.1	virulence associated lipoprotein	94.7	32.6	72.2
MGA_1011	LOCUS_10060	sequence11:7183..8538(+)	partial			WP_010890325.1	virulence associated lipoprotein	45.9	45.9	99.0
MGA_1017	LOCUS_10120	sequence11:17093..17272(-)	frameshift		17337	WP_010890325.1	virulence associated lipoprotein	94.9	12.4	66.1
MGA_1018	LOCUS_10130	sequence11:17302..17874(-)	frameshift		17337	WP_010890325.1	virulence associated lipoprotein	61.6	25.9	63.2
MGA_1026	LOCUS_10210	sequence11:25524..25805(+)	internal_stop_codon	25446..25448(+)		WP_010890312.1	chromosome replication/partitioning protein	95.7	42.6	73.0
MGA_1029	LOCUS_10240	sequence11:26881..27069(-)	partial			WP_014023068.1	NINE protein	80.6	53.2	92.0
MGA_1116	LOCUS_11110	sequence14:1306..1458(+)	internal_stop_codon	1456..1458(+)		WP_010883890.1	DUF1357 domain-containing protein	88.0	19.1	90.9
MGA_1117	LOCUS_11120	sequence14:1462..2001(+)	internal_stop_codon	1456..1458(+)		WP_010883890.1	DUF1357 domain-containing protein	99.4	77.4	93.3
MGA_1149	LOCUS_11440	sequence14:21974..22252(+)	internal_stop_codon	22250..22252(+)		WP_010883737.1	Bdr family repetitive protein	98.9	40.0	68.1
MGA_1287	LOCUS_12820	sequence18:3379..3828(+)	frameshift		3798	WP_010883929.1	DUF228 domain-containing protein	100.0	78.0	90.6
MGA_1288	LOCUS_12830	sequence18:3825..3953(+)	frameshift		3798	WP_010883929.1	DUF228 domain-containing protein	100.0	22.0	97.6
MGA_1289	LOCUS_12840	sequence18:3975..4487(+)	frameshift		4466	WP_010883814.1	hypothetical protein	96.5	51.4	100.0
MGA_1290	LOCUS_12850	sequence18:4507..4938(+)	frameshift		4463	WP_010883774.1	hypothetical protein	100.0	44.8	100.0
MGA_1297	LOCUS_12920	sequence18:8380..8745(+)	frameshift		8378	WP_010883794.1	DUF1473 family protein	100.0	80.1	97.5
MGA_1301	LOCUS_12960	sequence18:10558..11037(+)	frameshift		10447	WP_010883770.1	DUF792 family protein	100.0	70.0	96.2
MGA_1303	LOCUS_12980	sequence18:12009..12152(+)	internal_stop_codon	12150..12152(+)		WP_010883798.1	DUF777 family protein	100.0	25.5	97.9
MGA_1306	LOCUS_13010	sequence18:13807..14244(+)	frameshift		14232	WP_010883801.1	DUF735 family protein	97.9	70.6	100.0
MGA_1314	LOCUS_13090	sequence18:17773..18120(-)	internal_stop_codon	18163..18165(-),18253..18255(-)		WP_014017690.1	ERF family protein	100.0	33.9	94.8
MGA_1315	LOCUS_13100	sequence18:18253..18714(-)	internal_stop_codon	18163..18165(-),18769..18771(-),18253..18255(-)		WP_010883781.1	ERF family protein	100.0	45.5	77.1
MGA_1323	LOCUS_13180	sequence18:25003..25479(-)	internal_stop_codon	25558..25560(-)		WP_010883864.1	site-specific integrase	100.0	61.2	94.3
MGA_1324	LOCUS_13190	sequence18:25558..25779(-)	internal_stop_codon	25558..25560(-)		WP_010883864.1	site-specific integrase	100.0	28.3	74.0
MGA_1331	LOCUS_13260	sequence19:1210..2223(-)	partial			WP_010890314.1	class I SAM-dependent DNA methyltransferase	97.6	25.8	74.2
MGA_1332	LOCUS_13270	sequence19:2818..3222(-)	frameshift		3232,2824,3421	WP_010890314.1	class I SAM-dependent DNA methyltransferase	88.1	9.2	70.3
MGA_1333	LOCUS_13280	sequence19:3225..3413(-)	frameshift		3232,3421	WP_010890314.1	class I SAM-dependent DNA methyltransferase	91.9	4.5	64.9
MGA_1334	LOCUS_13290	sequence19:3416..3583(-)	frameshift		3232,3421	WP_010890314.1	class I SAM-dependent DNA methyltransferase	98.2	4.2	94.4
MGA_1337	LOCUS_13320	sequence19:6804..6983(-)	frameshift		6930,6812	WP_010890314.1	class I SAM-dependent DNA methyltransferase	71.2	3.4	72.7
MGA_1348	LOCUS_13430	sequence19:18973..19173(+)	frameshift,internal_stop_codon	19173..19175(+),18776..18778(+),18846..18848(+),18762..18764(+)	18878,18839	WP_010890314.1	class I SAM-dependent DNA methyltransferase	100.0	5.2	80.3
MGA_1352	LOCUS_13470	sequence19:23073..23657(-)	partial			WP_010890334.1	immunogenic protein P37	70.6	42.5	41.1
MGA_1354	LOCUS_13490	sequence19:24293..24670(+)	frameshift		24240,24303	WP_010890362.1	hypothetical protein	96.8	52.1	39.2
MGA_1360	LOCUS_13550	sequence19:28586..29212(-)	internal_stop_codon	28586..28588(-)		WP_010890341.1	hypothetical protein	100.0	73.6	49.1
MGA_1367	LOCUS_13620	sequence19:36389..36577(-)	partial			WP_014023068.1	NINE protein	80.6	53.2	90.0
MGA_1368	LOCUS_13630	sequence20:482..667(+)	frameshift		664,679	WP_010890261.1	virulence associated lipoprotein	96.7	24.7	86.7
MGA_1369	LOCUS_13640	sequence20:927..1211(+)	frameshift		664,679	WP_010890261.1	virulence associated lipoprotein	98.9	37.9	73.1
MGA_1372	LOCUS_13670	sequence20:7270..7476(+)	frameshift,internal_stop_codon	7227..7229(+),7224..7226(+)	7268	WP_010890339.1	Bdr family repetitive protein	85.3	31.5	60.3
MGA_1410	LOCUS_14050	sequence21:8266..8445(+)	partial			WP_010258115.1	BlyA family holin	66.1	66.1	92.3
MGA_1451	LOCUS_14460	sequence21:39873..40112(-)	partial			WP_010890394.1	hypothetical protein	69.6	69.6	76.4
MGA_1460	LOCUS_14550	sequence21:48584..49222(-)	partial			WP_010890326.1	complement regulator-acquiring protein	90.6	66.2	34.9
MGA_1461	LOCUS_14560	sequence21:49447..49860(-)	partial			WP_010890397.1	complement regulator-acquiring protein	54.7	32.3	40.7
MGA_1468	LOCUS_14630	sequence22:1467..1814(+)	frameshift		1811	WP_010890262.1	S2/P23 family protein	100.0	40.1	87.8
MGA_1469	LOCUS_14640	sequence22:1726..2268(+)	frameshift		1811	WP_010890262.1	S2/P23 family protein	98.3	61.7	85.3
MGA_1475	LOCUS_14700	sequence22:6336..6674(-)	partial			WP_010890315.1	plasmid maintenance protein	62.5	23.5	54.3
MGA_1480	LOCUS_14750	sequence22:9238..9435(+)	internal_stop_codon	9433..9435(+)		WP_002658432.1	hypothetical protein	100.0	50.4	98.5
MGA_1481	LOCUS_14760	sequence22:9439..9627(+)	internal_stop_codon	9433..9435(+)		WP_002658432.1	hypothetical protein	100.0	48.1	100.0
MGA_1510	LOCUS_15050	sequence22:29937..30974(+)	partial			WP_010883925.1	laminin-binding protein ErpX	44.3	44.3	94.1
MGA_1514	LOCUS_15090	sequence22:33873..34358(+)	internal_stop_codon	34356..34358(+)		WP_010883851.1	DUF1073 domain-containing protein	100.0	39.6	100.0
MGA_1515	LOCUS_15100	sequence22:34371..34751(+)	frameshift,internal_stop_codon	34356..34358(+)	34733	WP_010883789.1	DUF1073 domain-containing protein	100.0	31.0	89.7
MGA_1516	LOCUS_15110	sequence22:34940..35098(+)	frameshift		34739	WP_010883789.1	DUF1073 domain-containing protein	100.0	12.8	100.0
MGA_1523	LOCUS_15180	sequence22:39802..39933(-)	frameshift,internal_stop_codon	39739..39741(-),39550..39552(-)	39819,39582	WP_010890294.1	hypothetical protein	90.7	21.5	92.3
MGA_1524	LOCUS_15190	sequence22:39959..40186(-)	partial			WP_010890295.1	DUF1073 domain-containing protein	100.0	22.0	97.3
MGA_1527	LOCUS_15220	sequence22:43915..44196(-)	frameshift,internal_stop_codon	44456..44458(-)	44368,44233,43903,44056	WP_002665626.1	type I restriction endonuclease	89.2	21.1	56.6
MGA_1528	LOCUS_15230	sequence22:44714..44983(+)	internal_stop_codon	44981..44983(+)		WP_010890322.1	MFS transporter	87.6	19.9	78.2
MGA_1530	LOCUS_15250	sequence22:47784..48131(-)	internal_stop_codon	48252..48254(-)		WP_010890331.1	lipoprotein P35	100.0	43.7	75.7
MGA_1531	LOCUS_15260	sequence22:48432..48626(-)	frameshift,internal_stop_codon	48251..48253(-)	48415	WP_010890325.1	virulence associated lipoprotein	46.9	6.7	73.3
MGA_1533	LOCUS_15280	sequence22:50395..50550(-)	frameshift,internal_stop_codon	50596..50598(-)	50409	WP_010883949.1	plasmid maintenance protein	100.0	41.8	70.6
