# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_1	LOCUS_00010	sequence1:1..1060(+)	partial			WP_011117009.1	replication initiation protein	69.9	73.7	25.6
MGA_3	LOCUS_00030	sequence1:1480..2754(+)	partial			WP_010880625.1	exonuclease subunit SbcC	95.8	42.3	22.1
MGA_6	LOCUS_00060	sequence1:4829..6103(+)	partial			WP_010880625.1	exonuclease subunit SbcC	95.8	42.3	22.1
MGA_7	LOCUS_00070	sequence1:6698..7738(+)	partial			WP_011117009.1	replication initiation protein	71.1	73.7	25.6
MGA_9	LOCUS_00090	sequence1:8158..9432(+)	partial			WP_010880625.1	exonuclease subunit SbcC	95.8	42.3	22.1
MGA_22	LOCUS_00200	sequence2:6495..12293(+)	partial			WP_011860792.1	DEAD/DEAH box helicase family protein	81.9	53.2	34.2
MGA_29	LOCUS_00270	sequence2:16969..18195(+)	partial			WP_001141540.1	DUF5710 domain-containing protein	90.7	28.5	31.2
MGA_41	LOCUS_00390	sequence2:26347..26904(+)	partial			WP_010622329.1	Rha family transcriptional regulator	54.1	37.9	42.0
MGA_50	LOCUS_00480	sequence2:31884..33062(+)	partial			WP_011264002.1	type IV secretion system protein VirB10	59.7	56.3	40.6
MGA_58	LOCUS_00560	sequence3:5502..5873(+)	frameshift		5849	WP_003112948.1	FAD-binding oxidoreductase	81.3	21.1	35.0
MGA_84	LOCUS_00820	sequence3:43436..46225(-)	partial			WP_011038245.1	ATP-binding protein	35.7	30.9	36.3
MGA_87	LOCUS_00850	sequence3:50352..51650(+)	partial			WP_002837927.1	translation elongation factor 4	25.7	19.1	87.7
MGA_90	LOCUS_00880	sequence3:54356..55897(+)	partial			WP_002788173.1	pentapeptide repeat-containing protein	90.1	73.7	75.8
MGA_129	LOCUS_01270	sequence3:96009..96632(-)	partial			WP_012257162.1	Crp/Fnr family transcriptional regulator	79.2	73.5	27.1
MGA_172	LOCUS_01700	sequence3:135184..135732(+)	frameshift		135720	WP_126621964.1	hemagglutinin repeat-containing protein	65.4	3.2	50.8
MGA_173	LOCUS_01710	sequence3:135732..137888(+)	partial			WP_022819412.1	hemagglutinin repeat-containing protein	89.8	22.3	24.0
MGA_174	LOCUS_01720	sequence3:137852..140593(+)	frameshift		137822	WP_022819412.1	hemagglutinin repeat-containing protein	89.3	32.4	21.8
MGA_192	LOCUS_01900	sequence3:155342..155545(-)	frameshift,internal_stop_codon	155624..155626(-)	155359	WP_002853178.1	bacteriohemerythrin	95.5	32.2	60.9
MGA_256	LOCUS_02540	sequence3:218401..218751(+)	frameshift		218342	WP_002851141.1	MerR family transcriptional regulator	98.3	79.7	93.9
MGA_257	LOCUS_02550	sequence3:218760..219206(-)	frameshift		219217,219338	WP_014206515.1	ACR3 family arsenite efflux transporter	94.6	40.7	50.0
MGA_258	LOCUS_02560	sequence3:219858..220202(-)	frameshift		219863	WP_011476020.1	arsenate reductase ArsC	99.1	80.3	53.5
MGA_259	LOCUS_02570	sequence3:220199..220516(-)	partial			WP_000230181.1	metalloregulator ArsR/SmtB family transcription factor	69.5	22.0	46.6
MGA_309	LOCUS_03060	sequence3:271755..273995(-)	partial			WP_000874574.1	vacuolating cytotoxin domain-containing protein	96.8	28.9	21.6
MGA_336	LOCUS_03330	sequence3:300808..301452(-)	partial			WP_003358861.1	WG repeat-containing protein	55.1	31.8	37.8
MGA_376	LOCUS_03730	sequence3:338791..341358(+)	partial			WP_000694256.1	CDP-glycerol glycerophosphotransferase family protein	99.5	65.9	30.1
MGA_377	LOCUS_03740	sequence3:342005..343765(+)	partial			WP_002858440.1	capsule biosynthesis protein CapA	19.1	17.9	50.9
MGA_385	LOCUS_03820	sequence3:352420..354588(+)	partial			WP_002858440.1	capsule biosynthesis protein CapA	15.1	17.4	49.5
MGA_388	LOCUS_03850	sequence3:356079..357194(+)	partial			WP_010979546.1	amidophosphoribosyltransferase	72.0	62.1	28.6
MGA_390	LOCUS_03870	sequence3:357830..358819(+)	partial			WP_011461003.1	aldolase catalytic domain-containing protein	94.2	57.0	25.1
MGA_393	LOCUS_03900	sequence3:361480..362019(+)	frameshift		361974	WP_002857981.1	capsule polysaccharide modification protein KpsS	88.8	40.4	86.8
MGA_394	LOCUS_03910	sequence3:362156..362662(+)	frameshift		361977	WP_002857981.1	capsule polysaccharide modification protein KpsS	99.4	42.4	83.8
MGA_408	LOCUS_04050	sequence3:374792..375610(-)	frameshift		375668	WP_002865443.1	ferrous iron transport protein B	100.0	44.4	86.4
MGA_409	LOCUS_04060	sequence3:375591..376208(-)	frameshift		375668,376182	WP_002865443.1	ferrous iron transport protein B	81.0	27.1	84.3
MGA_410	LOCUS_04070	sequence3:376162..376626(-)	frameshift		376182	WP_002865443.1	ferrous iron transport protein B	96.8	24.3	85.2
MGA_411	LOCUS_04080	sequence3:376712..376846(-)	frameshift		376738	WP_002779147.1	ferrous iron transport protein A	90.9	54.1	75.0
MGA_462	LOCUS_04590	sequence3:432522..433106(+)	frameshift		433082	WP_002864247.1	DUF2920 family protein	97.4	45.8	94.7
MGA_463	LOCUS_04600	sequence3:433103..433762(+)	frameshift		433088	WP_002864247.1	DUF2920 family protein	94.5	50.1	95.2
MGA_471	LOCUS_04680	sequence3:446609..446791(-)	frameshift		446623	WP_010891922.1	motility associated factor glycosyltransferase family protein	98.3	9.1	94.9
MGA_496	LOCUS_04930	sequence3:472972..473091(+)	frameshift		473064	WP_002856137.1	hypothetical protein	66.7	7.3	100.0
MGA_497	LOCUS_04940	sequence3:473114..473410(+)	frameshift,internal_stop_codon	473408..473410(+)	473064	WP_002856137.1	hypothetical protein	100.0	27.5	95.9
MGA_498	LOCUS_04950	sequence3:473426..474043(+)	internal_stop_codon	473408..473410(+)		WP_002856137.1	hypothetical protein	100.0	57.6	99.5
MGA_500	LOCUS_04970	sequence3:474269..474988(-)	partial			WP_015444193.1	amino acid adenylation domain-containing protein	69.0	12.1	29.9
MGA_504	LOCUS_05010	sequence3:478499..479155(+)	frameshift		479077	WP_010891921.1	DUF2920 family protein	95.4	51.4	92.3
MGA_505	LOCUS_05020	sequence3:479076..479717(+)	frameshift		479086	WP_010891921.1	DUF2920 family protein	98.1	51.6	97.6
MGA_513	LOCUS_05100	sequence3:484910..485848(-)	frameshift		486063	WP_002878575.1	DUF4910 domain-containing protein	100.0	71.7	93.9
MGA_514	LOCUS_05110	sequence3:486043..486219(-)	frameshift		486063	WP_002878575.1	DUF4910 domain-containing protein	89.7	12.0	96.2
MGA_592	LOCUS_05890	sequence3:559971..563306(+)	partial			WP_011461428.1	InlB B-repeat-containing protein	24.0	8.5	30.3
MGA_593	LOCUS_05900	sequence3:563394..564392(+)	frameshift		564329,564425	WP_010891897.1	hypothetical protein	89.2	39.5	35.2
MGA_594	LOCUS_05910	sequence3:564559..564732(+)	frameshift		564329,564425,564716	WP_010891897.1	hypothetical protein	89.5	6.7	49.0
MGA_595	LOCUS_05920	sequence3:564698..565714(+)	frameshift		564714	WP_010891897.1	hypothetical protein	97.3	42.3	32.4
MGA_599	LOCUS_05960	sequence3:567975..568151(+)	frameshift		567919	WP_002864120.1	ShlB/FhaC/HecB family hemolysin secretion/activation protein	82.8	8.4	50.0
MGA_638	LOCUS_06350	sequence3:604978..605688(-)	frameshift		605710	WP_002852850.1	cation:dicarboxylase symporter family transporter	100.0	51.5	96.2
MGA_639	LOCUS_06360	sequence3:605645..606295(-)	frameshift		605695	WP_002852850.1	cation:dicarboxylase symporter family transporter	90.7	42.8	87.8
MGA_678	LOCUS_06750	sequence3:642016..642771(+)	partial			WP_001263320.1	glycosyltransferase family 25 protein	79.3	72.9	31.9
MGA_684	LOCUS_06810	sequence3:646937..647380(+)	partial			WP_005771390.1	WxcM-like domain-containing protein	92.5	43.0	64.7
MGA_685	LOCUS_06820	sequence3:647444..648385(+)	partial			WP_013097856.1	glycosyltransferase family 2 protein	69.3	63.9	26.1
MGA_690	LOCUS_06870	sequence3:652641..653171(+)	partial			WP_000763834.1	hypothetical protein	84.1	64.5	38.4
MGA_731	LOCUS_07280	sequence3:693749..694939(-)	partial			WP_010891834.1	hypothetical protein	51.5	76.3	50.0
MGA_732	LOCUS_07290	sequence3:695017..695235(-)	frameshift		695318	WP_013530311.1	SDR family oxidoreductase	61.1	16.9	61.4
MGA_733	LOCUS_07300	sequence3:695310..695777(-)	frameshift		695318	WP_000653653.1	glucose 1-dehydrogenase	85.2	54.4	40.9
MGA_786	LOCUS_07830	sequence3:749690..751132(+)	partial			WP_083500625.1	restriction endonuclease subunit S	36.9	40.8	35.6
MGA_793	LOCUS_07900	sequence3:755611..755952(+)	frameshift		755940	WP_002857952.1	ATP-binding protein	97.3	38.5	84.5
MGA_794	LOCUS_07910	sequence3:755954..756466(+)	frameshift		755940	WP_002857952.1	ATP-binding protein	98.8	59.4	80.4
MGA_810	LOCUS_08070	sequence3:774731..775048(+)	partial			WP_002852929.1	flagellar assembly protein FlgQ	100.0	70.5	77.1
MGA_835	LOCUS_08320	sequence3:802042..802434(+)	partial			WP_002853058.1	rhomboid family intramembrane serine protease	97.7	73.8	74.8
MGA_859	LOCUS_08560	sequence3:823519..824442(-)	partial			WP_004080141.1	KAP family P-loop domain protein	91.9	39.7	28.1
MGA_860	LOCUS_08570	sequence3:824454..824870(-)	partial			WP_004080141.1	KAP family P-loop domain protein	78.3	15.0	35.2
MGA_875	LOCUS_08720	sequence3:835551..836219(-)	partial			WP_050716666.1	Rha family transcriptional regulator	50.9	57.4	41.9
MGA_899	LOCUS_08960	sequence3:852055..852789(+)	partial			WP_001031454.1	XRE family transcriptional regulator	43.4	41.4	34.0
MGA_917	LOCUS_09140	sequence3:861124..861831(+)	partial			WP_050716666.1	Rha family transcriptional regulator	45.5	54.5	43.2
MGA_958	LOCUS_09550	sequence3:895155..895448(-)	frameshift,internal_stop_codon	895451..895453(-)	895540	WP_002852438.1	hypothetical protein	92.8	60.3	69.1
MGA_1012	LOCUS_10090	sequence3:954865..956457(-)	partial			WP_002865311.1	methyl-accepting chemotaxis protein	66.2	59.1	25.5
MGA_1049	LOCUS_10460	sequence3:986257..987099(-)	partial			WP_002871823.1	metallophosphoesterase	99.6	74.6	78.1
MGA_1105	LOCUS_11020	sequence3:1043915..1044496(-)	partial			WP_000572325.1	LysE family translocator	67.9	65.7	29.0
MGA_1142	LOCUS_11390	sequence3:1080604..1080861(-)	frameshift		1080880,1080606	WP_011861238.1	IS200/IS605 family element RNA-guided endonuclease TnpB	89.4	21.2	36.7
MGA_1194	LOCUS_11910	sequence3:1136530..1136967(+)	frameshift		1136931	WP_002857879.1	class I SAM-dependent methyltransferase	92.4	52.1	85.8
MGA_1195	LOCUS_11920	sequence3:1137108..1137302(+)	frameshift		1136925	WP_002857879.1	class I SAM-dependent methyltransferase	100.0	24.9	92.2
MGA_1241	LOCUS_12380	sequence3:1180725..1180913(+)	internal_stop_codon	1180911..1180913(+)		WP_010940103.1	type I restriction enzyme HsdR N-terminal domain-containing protein	100.0	17.4	53.2
MGA_1242	LOCUS_12390	sequence3:1180917..1181768(+)	internal_stop_codon	1180911..1180913(+)		WP_011962872.1	type I restriction endonuclease	98.9	81.1	36.9
MGA_1293	LOCUS_12900	sequence3:1239252..1240190(-)	partial			WP_002852607.1	tyrosine-type recombinase/integrase	73.1	65.3	32.3
MGA_1319	LOCUS_13160	sequence3:1252997..1253704(-)	partial			WP_102756879.1	BspA family leucine-rich repeat surface protein	81.7	32.7	50.3
MGA_1325	LOCUS_13220	sequence3:1256454..1256912(-)	partial			WP_015777138.1	single-stranded DNA-binding protein	73.7	66.3	36.1
MGA_1329	LOCUS_13260	sequence3:1260859..1261419(+)	partial			WP_057801863.1	Rha family transcriptional regulator	55.9	40.0	41.3
MGA_1331	LOCUS_13280	sequence3:1262258..1262998(+)	partial			WP_010922216.1	phage antirepressor KilAC domain-containing protein	58.9	55.2	32.4
MGA_1333	LOCUS_13300	sequence3:1264373..1266778(+)	partial			WP_164930439.1	HD domain-containing protein	38.5	52.5	23.5
MGA_1335	LOCUS_13320	sequence3:1267068..1267508(+)	partial			WP_010942768.1	lytic transglycosylase domain-containing protein	78.1	67.9	42.2
MGA_1339	LOCUS_13360	sequence3:1268887..1269792(+)	frameshift		1269780	WP_002864485.1	type II CRISPR RNA-guided endonuclease Cas9	98.7	31.8	42.1
MGA_1340	LOCUS_13370	sequence3:1269849..1271783(+)	frameshift		1269780	WP_002864485.1	type II CRISPR RNA-guided endonuclease Cas9	99.8	66.1	44.1
MGA_1346	LOCUS_13430	sequence3:1274124..1274969(-)	partial			WP_102756879.1	BspA family leucine-rich repeat surface protein	50.5	23.9	42.3
MGA_1368	LOCUS_13650	sequence3:1288640..1289314(+)	partial			WP_013087341.1	TraU family protein	89.7	35.2	25.5
MGA_1369	LOCUS_13660	sequence3:1289331..1290329(+)	partial			WP_013087341.1	TraU family protein	90.1	54.9	40.7
MGA_1384	LOCUS_13810	sequence3:1302020..1304185(-)	partial			WP_013087340.1	conjugal transfer protein TraN	16.4	18.4	50.8
MGA_1387	LOCUS_13840	sequence3:1304851..1306041(-)	partial			WP_013087339.1	conjugal transfer protein TraN	57.1	37.7	25.7
MGA_1388	LOCUS_13850	sequence3:1306050..1307516(-)	partial			WP_001200841.1	IncHI-type conjugal transfer protein TrhH	39.5	42.0	27.2
MGA_1389	LOCUS_13860	sequence3:1307504..1308040(-)	partial			WP_013087344.1	S26 family signal peptidase	71.9	75.9	34.1
MGA_1410	LOCUS_14070	sequence3:1325371..1325520(-)	frameshift		1325572,1325254,1325391	WP_002864507.1	MATE family efflux transporter	91.8	10.2	68.9
MGA_1411	LOCUS_14080	sequence3:1325513..1326517(-)	frameshift		1325572,1325254,1325391	WP_002864507.1	MATE family efflux transporter	94.9	71.7	85.5
MGA_1414	LOCUS_14110	sequence3:1329053..1329307(+)	frameshift,internal_stop_codon	1329005..1329007(+)	1329256,1329428	WP_002864506.1	FUSC family protein	89.3	20.8	48.0
MGA_1415	LOCUS_14120	sequence3:1329553..1330047(+)	frameshift		1329428	WP_002864506.1	FUSC family protein	97.6	45.4	58.5
MGA_1443	LOCUS_14400	sequence3:1356979..1358787(-)	partial			WP_002669793.1	Na/Pi cotransporter family protein	57.0	62.5	28.6
MGA_1481	LOCUS_14780	sequence3:1395643..1395906(-)	frameshift		1395648,1395626	WP_003245409.1	UxaA family hydrolase	88.5	16.3	44.4
MGA_1518	LOCUS_15150	sequence3:1433389..1433628(-)	frameshift		1433611	WP_011267473.1	CoA ester lyase	78.5	22.5	45.2
MGA_1519	LOCUS_15160	sequence3:1433558..1433998(-)	frameshift		1433592,1434117	WP_015064995.1	CoA ester lyase	74.0	39.1	40.4
MGA_1523	LOCUS_15200	sequence3:1436264..1436746(-)	partial			WP_009888596.1	SLC13 family permease	82.5	31.7	25.9
MGA_1673	LOCUS_16700	sequence3:1579526..1579822(+)	frameshift		1579969,1579807	WP_000955756.1	phosphoglycerate transporter PgtP	95.9	20.3	51.1
MGA_1674	LOCUS_16710	sequence3:1579813..1580016(+)	frameshift,internal_stop_codon	1580111..1580113(+)	1579969,1579807	WP_000955756.1	phosphoglycerate transporter PgtP	79.1	11.4	60.4
MGA_1676	LOCUS_16730	sequence3:1580529..1580897(+)	internal_stop_codon	1580331..1580333(+),1580463..1580465(+)		WP_000955756.1	phosphoglycerate transporter PgtP	95.9	25.7	53.3
MGA_1679	LOCUS_16760	sequence3:1582558..1582875(+)	frameshift		1582857	WP_002851967.1	cytolethal distending toxin subunit Cj-CdtC	94.3	52.4	59.6
MGA_1714	LOCUS_17110	sequence3:1615023..1615421(+)	partial			WP_002858737.1	DUF2393 domain-containing protein	94.7	71.0	70.4
MGA_1764	LOCUS_17610	sequence3:1666536..1667153(+)	partial			WP_010940294.1	methyl-accepting chemotaxis protein	72.7	23.9	45.0
MGA_1766	LOCUS_17630	sequence3:1667566..1668276(+)	partial			WP_010891944.1	methyl-accepting chemotaxis protein	100.0	35.6	88.1
MGA_1804	LOCUS_18010	sequence3:1698915..1699445(-)	frameshift,internal_stop_codon	1699699..1699701(-)	1699686	WP_012545276.1	MFS transporter	95.5	44.1	39.8
MGA_1826	LOCUS_18230	sequence3:1717900..1718532(-)	frameshift		1718581	WP_002888535.1	McrB family protein	100.0	21.3	57.8
MGA_1827	LOCUS_18240	sequence3:1718579..1720075(-)	frameshift		1718581	WP_002888535.1	McrB family protein	98.6	62.8	38.7
MGA_1845	LOCUS_18420	sequence3:1735212..1736450(-)	partial			WP_002851870.1	hypothetical protein	43.0	72.5	46.9
MGA_1888	LOCUS_18850	sequence3:1765865..1767004(-)	partial			WP_012545721.1	site-specific integrase	58.3	62.9	26.3
MGA_1919	LOCUS_19160	sequence3:1789219..1789626(-)	partial			WP_002851214.1	50S ribosomal protein L22	73.3	70.2	98.0
MGA_1931	LOCUS_19280	sequence3:1798974..1799543(+)	frameshift,internal_stop_codon	1799541..1799543(+)	1799552	WP_011963742.1	glycosyl transferase family 90	93.7	56.5	39.7
MGA_1932	LOCUS_19290	sequence3:1799525..1799938(+)	frameshift,internal_stop_codon	1799541..1799543(+)	1799552	WP_011108791.1	glycosyl transferase family 90	86.9	36.7	54.5
MGA_1955	LOCUS_19510	sequence4:2838..3278(+)	frameshift		2744,3275,2836,2823	WP_000655392.1	type IA DNA topoisomerase	97.3	21.0	50.0
MGA_1956	LOCUS_19520	sequence4:3476..4630(+)	frameshift		3275	WP_000655392.1	type IA DNA topoisomerase	99.5	57.9	37.3
MGA_1968	LOCUS_19640	sequence4:10372..11196(-)	partial			WP_011117494.1	RepB family plasmid replication initiator protein	68.2	65.0	24.5
MGA_1973	LOCUS_19690	sequence4:16131..17363(+)	partial			WP_000323332.1	hypothetical protein	66.6	56.0	32.9
MGA_1993	LOCUS_19890	sequence4:30643..31764(+)	partial			WP_010920280.1	type IV secretion system protein VirB10	45.0	43.6	35.3
MGA_2015	LOCUS_20100	sequence5:1045..1728(+)	partial			WP_005813668.1	Fic family protein	68.7	71.3	39.1
MGA_2021	LOCUS_20160	sequence5:3906..6062(-)	partial			WP_009938884.1	relaxase/mobilization nuclease domain-containing protein	72.6	78.7	26.3
MGA_2022	LOCUS_20170	sequence5:6025..6408(-)	partial			WP_015039733.1	conjugal transfer transcriptional regulator TraJ	47.2	48.8	36.7
MGA_2028	LOCUS_20230	sequence5:10946..11242(+)	partial			WP_011970255.1	TrbC/VirB2 family protein	91.8	71.4	44.4
MGA_2031	LOCUS_20260	sequence5:13993..14577(+)	partial			WP_034165349.1	Rha family phage regulatory protein	53.6	33.7	47.2
MGA_2033	LOCUS_20280	sequence5:15452..15907(+)	partial			WP_000129024.1	Rha family phage regulatory protein	69.5	30.4	46.7
MGA_2034	LOCUS_20290	sequence5:15904..16458(+)	partial			WP_010922216.1	phage antirepressor KilAC domain-containing protein	58.7	41.5	40.7
MGA_2042	LOCUS_20370	sequence5:23188..23733(+)	partial			WP_011970881.1	type IV secretion system lytic transglycosylase VirB1	77.3	58.7	30.5
MGA_2043	LOCUS_20380	sequence5:23830..24192(+)	partial			WP_007339883.1	single-stranded DNA-binding protein	74.2	55.6	37.2
MGA_2045	LOCUS_20400	sequence5:24324..26537(+)	partial			WP_011263960.1	zincin-like metallopeptidase domain-containing protein	38.3	83.2	39.0
