# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_1	LOCUS_00010	sequence1:1..1131(+)	partial			WP_001141540.1	DUF5710 domain-containing protein	94.9	28.2	31.5
MGA_9	LOCUS_00090	sequence1:8724..9344(+)	partial			WP_002286562.1	phage regulatory protein	50.0	38.4	44.7
MGA_16	LOCUS_00160	sequence1:13025..14173(+)	partial			WP_011264002.1	type IV secretion system protein VirB10	57.1	53.3	42.2
MGA_22	LOCUS_00220	sequence1:18558..18968(+)	partial			WP_000776464.1	type IV secretion system apparatus protein CagT	77.9	38.9	40.9
MGA_27	LOCUS_00270	sequence1:21298..21540(+)	partial			WP_011264006.1	DNA topoisomerase III	85.0	10.1	45.6
MGA_30	LOCUS_00300	sequence1:22447..23040(+)	frameshift		22352,22337	WP_011264003.1	P-type DNA transfer ATPase VirB11	95.4	57.3	56.0
MGA_35	LOCUS_00350	sequence1:25850..26260(+)	partial			WP_000776464.1	type IV secretion system apparatus protein CagT	77.9	38.9	40.9
MGA_56	LOCUS_00560	sequence1:40560..41294(+)	partial			WP_004116510.1	DNA-binding protein	89.8	70.9	34.1
MGA_62	LOCUS_00620	sequence2:4536..5768(+)	partial			WP_011143795.1	AAA family ATPase	65.4	47.8	24.9
MGA_93	LOCUS_00930	sequence2:27783..29135(+)	partial			WP_011460692.1	HipA domain-containing protein	70.7	79.3	31.0
MGA_97	LOCUS_00970	sequence2:29863..31233(+)	partial			WP_010948074.1	lpg2370 family Dot/Icm T4SS effector	55.7	82.4	29.5
MGA_100	LOCUS_01000	sequence2:32320..34155(+)	partial			WP_010946195.1	type IVB secretion system protein IcmO/DotL	79.2	64.2	22.5
MGA_104	LOCUS_01040	sequence2:38592..46487(+)	partial			WP_011861367.1	DEAD/DEAH box helicase family protein	51.5	42.7	27.2
MGA_105	LOCUS_01050	sequence2:46572..47117(+)	partial			WP_005490290.1	hypothetical protein	72.4	74.9	36.1
MGA_106	LOCUS_01060	sequence2:47107..47997(+)	partial			WP_011068063.1	nucleotidyl transferase AbiEii/AbiGii toxin family protein	77.7	74.8	31.2
MGA_158	LOCUS_01580	sequence3:5540..5902(+)	frameshift		5385	WP_011108791.1	glycosyl transferase family 90	85.8	31.8	60.2
MGA_172	LOCUS_01720	sequence3:24521..25441(+)	partial			WP_209021411.1	Dam family site-specific DNA-(adenine-N6)-methyltransferase	95.8	42.0	36.9
MGA_200	LOCUS_02000	sequence3:57769..58173(+)	partial			WP_002851214.1	50S ribosomal protein L22	77.6	73.8	96.2
MGA_229	LOCUS_02290	sequence3:75252..76487(+)	partial			WP_035050627.1	site-specific DNA-methyltransferase	46.5	26.2	37.5
MGA_298	LOCUS_02970	sequence3:133590..133988(-)	partial			WP_034260979.1	DEAD/DEAH box helicase family protein	96.2	12.6	30.5
MGA_303	LOCUS_03020	sequence3:137903..138922(+)	partial			WP_002857891.1	capsular polysaccharide biosynthesis protein	97.3	48.6	62.1
MGA_340	LOCUS_03380	sequence3:173744..174208(-)	frameshift		173803	WP_010891936.1	ATP-grasp fold amidoligase family protein	95.5	18.6	55.1
MGA_341	LOCUS_03390	sequence3:174205..174450(-)	partial			WP_002858210.1	UDP-galactopyranose mutase	93.8	20.1	52.5
MGA_353	LOCUS_03510	sequence3:183981..185039(+)	partial			WP_010891936.1	ATP-grasp fold amidoligase family protein	92.6	40.2	43.7
MGA_356	LOCUS_03540	sequence3:187976..189460(-)	partial			WP_010891935.1	glycosyltransferase family 2 protein	23.1	25.6	42.1
MGA_368	LOCUS_03660	sequence3:201141..201641(+)	partial			WP_001052085.1	DUF3883 domain-containing protein	95.8	64.3	36.8
MGA_380	LOCUS_03780	sequence3:213183..214367(-)	partial			WP_002858443.1	DUF2972 domain-containing protein	99.2	65.2	28.9
MGA_402	LOCUS_04000	sequence3:233357..234127(+)	partial			WP_011458963.1	hypothetical protein	87.9	53.3	29.3
MGA_442	LOCUS_04400	sequence3:268742..269068(+)	partial			WP_002851686.1	hypothetical protein	99.1	73.6	53.3
MGA_464	LOCUS_04620	sequence3:290743..294156(+)	frameshift		294132	WP_002864285.1	N-6 DNA methylase	99.3	80.0	64.4
MGA_465	LOCUS_04630	sequence3:294165..294851(+)	partial			WP_000187233.1	restriction endonuclease subunit S	83.3	36.4	45.3
MGA_518	LOCUS_05160	sequence3:354699..355037(-)	frameshift		355027	WP_010891922.1	motility associated factor glycosyltransferase family protein	90.2	15.9	38.8
MGA_519	LOCUS_05170	sequence3:355004..356641(-)	frameshift		355045	WP_010891922.1	motility associated factor glycosyltransferase family protein	94.3	80.4	45.2
MGA_524	LOCUS_05220	sequence3:362343..362699(-)	partial			WP_002859309.1	hypothetical protein	97.5	70.7	51.7
MGA_526	LOCUS_05240	sequence3:362942..365653(+)	partial			WP_000604593.1	glutamine-hydrolyzing GMP synthase	36.0	62.4	71.7
MGA_642	LOCUS_06400	sequence3:489477..489833(+)	partial			WP_003130078.1	sugar O-acetyltransferase	92.4	53.5	39.4
MGA_645	LOCUS_06430	sequence3:490664..491200(+)	partial			WP_000146565.1	CatB-related O-acetyltransferase	47.2	44.8	44.3
MGA_647	LOCUS_06450	sequence3:492211..493011(+)	partial			WP_011203397.1	formyltransferase family protein	86.5	58.0	42.7
MGA_648	LOCUS_06460	sequence3:493008..493643(+)	partial			WP_003020709.1	glycosyltransferase family 2 protein	55.5	34.6	37.6
MGA_652	LOCUS_06500	sequence3:496162..497346(+)	partial			WP_011707827.1	glycosyltransferase family 8 protein	56.1	56.3	27.9
MGA_666	LOCUS_06640	sequence3:511265..512254(-)	frameshift		512352	WP_010891876.1	DUF2972 domain-containing protein	87.2	66.2	37.9
MGA_667	LOCUS_06650	sequence3:512206..512634(-)	frameshift		512352	WP_010891876.1	DUF2972 domain-containing protein	59.9	20.2	51.6
MGA_674	LOCUS_06720	sequence3:519016..519330(+)	partial			WP_002852929.1	flagellar assembly protein FlgQ	99.0	70.5	62.9
MGA_685	LOCUS_06830	sequence3:530419..532779(+)	partial			WP_002852780.1	undecaprenyl-diphosphooligosaccharide--protein glycotransferase	50.5	55.7	66.0
MGA_698	LOCUS_06960	sequence3:543268..544170(-)	partial			WP_014659976.1	hypothetical protein	100.0	33.0	41.0
MGA_701	LOCUS_06990	sequence3:544787..546508(-)	partial			WP_014659976.1	hypothetical protein	98.3	57.3	51.1
MGA_748	LOCUS_07460	sequence3:591298..591948(-)	partial			WP_001262061.1	glycosyltransferase family 25 protein	72.2	62.3	35.8
MGA_761	LOCUS_07590	sequence3:604799..605215(-)	partial			WP_002864362.1	hypothetical protein	84.1	40.8	71.6
MGA_771	LOCUS_07690	sequence3:611205..611432(-)	partial			WP_002214609.1	type II toxin-antitoxin system RelE/ParE family toxin	96.0	66.1	40.3
MGA_772	LOCUS_07700	sequence3:611619..612401(-)	partial			WP_002852607.1	tyrosine-type recombinase/integrase	91.5	68.1	29.6
MGA_780	LOCUS_07780	sequence3:622804..624741(-)	partial			WP_048653110.1	lipase family protein	20.6	28.8	35.3
MGA_814	LOCUS_08120	sequence3:659834..660085(+)	frameshift		660055	WP_013368641.1	ParA family partition ATPase	74.7	28.6	53.2
MGA_840	LOCUS_08380	sequence3:682700..683494(-)	partial			WP_005449458.1	type IVB secretion system protein IcmH/DotU	68.9	68.4	29.7
MGA_854	LOCUS_08520	sequence3:693651..695009(-)	partial			WP_010948074.1	lpg2370 family Dot/Icm T4SS effector	56.2	82.4	29.5
MGA_863	LOCUS_08610	sequence3:701056..701232(-)	frameshift		701246	WP_005772654.1	BrnT family toxin	94.8	57.7	57.1
MGA_864	LOCUS_08620	sequence3:701411..702034(-)	partial			WP_011249728.1	tyrosine recombinase XerA	86.0	60.3	29.9
MGA_870	LOCUS_08680	sequence3:710970..712889(+)	partial			WP_000350101.1	class I SAM-dependent DNA methyltransferase	76.8	64.4	52.2
MGA_912	LOCUS_09100	sequence3:755509..755757(-)	frameshift,internal_stop_codon	755880..755882(-)	755925,755560,755834,755755,755901	WP_002864285.1	N-6 DNA methylase	70.7	5.5	41.3
MGA_914	LOCUS_09120	sequence3:755908..756180(-)	frameshift,internal_stop_codon	755880..755882(-)	755834,755755,755925,755901	WP_002864285.1	N-6 DNA methylase	94.4	5.8	50.6
MGA_942	LOCUS_09400	sequence3:781231..782268(-)	frameshift		781239	WP_002858443.1	DUF2972 domain-containing protein	95.7	55.1	26.1
MGA_960	LOCUS_09580	sequence3:797903..798373(-)	partial			WP_011202294.1	site-specific DNA-methyltransferase	37.8	9.1	62.7
MGA_961	LOCUS_09590	sequence3:798339..799400(-)	partial			WP_211204934.1	site-specific DNA-methyltransferase	82.4	57.0	30.8
MGA_973	LOCUS_09710	sequence3:807307..807756(+)	partial			WP_196835716.1	adenine-specific methyltransferase EcoRI family protein	59.7	20.3	39.8
MGA_974	LOCUS_09720	sequence3:808038..808550(+)	partial			WP_196835716.1	adenine-specific methyltransferase EcoRI family protein	84.1	37.5	36.0
MGA_975	LOCUS_09730	sequence3:808563..809738(+)	partial			WP_025163903.1	DUF262 domain-containing protein	34.3	37.2	28.3
MGA_981	LOCUS_09790	sequence3:813787..815148(+)	partial			WP_000162279.1	ATP-binding protein	90.1	72.8	32.1
MGA_1032	LOCUS_10300	sequence3:861178..862080(-)	frameshift		862181	WP_000467025.1	anaerobic C4-dicarboxylate transporter DcuC	98.3	59.3	36.8
MGA_1033	LOCUS_10310	sequence3:862137..862631(-)	frameshift		862184	WP_011705380.1	C4-dicarboxylate transporter DcuC	82.9	29.7	40.4
MGA_1038	LOCUS_10360	sequence3:865457..866080(-)	partial			WP_000345576.1	protein-disulfide oxidoreductase DsbI	72.0	70.7	42.1
MGA_1048	LOCUS_10460	sequence3:874126..874347(-)	partial			WP_004523495.1	YqaE/Pmp3 family membrane protein	72.6	82.8	66.0
MGA_1066	LOCUS_10640	sequence3:891708..892430(+)	partial			WP_002722128.1	site-specific DNA-methyltransferase	91.7	65.6	23.1
MGA_1082	LOCUS_10800	sequence3:909965..910543(+)	frameshift		910531	WP_002857950.1	DUF2920 family protein	94.3	44.8	45.9
MGA_1083	LOCUS_10810	sequence3:910485..911192(+)	frameshift		910534	WP_002857950.1	DUF2920 family protein	92.3	53.5	53.5
MGA_1088	LOCUS_10860	sequence3:914640..916373(-)	partial			WP_010891944.1	methyl-accepting chemotaxis protein	71.8	62.2	68.2
MGA_1122	LOCUS_11200	sequence3:944365..945306(-)	partial			WP_011249728.1	tyrosine recombinase XerA	56.9	60.3	29.9
MGA_1170	LOCUS_11680	sequence3:970977..971396(-)	partial			WP_002865738.1	single-stranded DNA-binding protein	74.8	56.8	46.2
MGA_1177	LOCUS_11750	sequence3:978651..980903(+)	partial			WP_164930439.1	HD domain-containing protein	38.0	47.7	26.9
MGA_1179	LOCUS_11770	sequence3:981215..981646(+)	partial			WP_010942768.1	lytic transglycosylase domain-containing protein	82.5	70.2	44.2
MGA_1185	LOCUS_11830	sequence3:983863..984465(-)	partial			WP_002853387.1	thermonuclease family protein	73.0	80.0	43.8
MGA_1206	LOCUS_12040	sequence3:997262..998953(-)	partial			WP_013389859.1	phage antirepressor Ant	18.7	38.6	39.0
MGA_1219	LOCUS_12170	sequence3:1007678..1009846(-)	partial			WP_013087340.1	conjugal transfer protein TraN	15.4	18.4	46.2
MGA_1220	LOCUS_12180	sequence3:1010129..1011316(-)	partial			WP_013087339.1	conjugal transfer protein TraN	60.0	38.3	25.7
MGA_1221	LOCUS_12190	sequence3:1011328..1012794(-)	partial			WP_001200841.1	IncHI-type conjugal transfer protein TrhH	29.3	30.1	25.9
MGA_1222	LOCUS_12200	sequence3:1012782..1013318(-)	partial			WP_013087344.1	S26 family signal peptidase	50.0	54.2	36.7
MGA_1244	LOCUS_12420	sequence3:1030152..1030556(-)	frameshift		1030573	WP_002857589.1	molybdate ABC transporter substrate-binding protein	100.0	53.8	65.7
MGA_1245	LOCUS_12430	sequence3:1030514..1030897(-)	frameshift		1030853,1030573	WP_002857589.1	molybdate ABC transporter substrate-binding protein	97.6	50.2	56.0
MGA_1288	LOCUS_12860	sequence3:1068436..1070028(-)	partial			WP_000057937.1	methyl-accepting chemotaxis protein	64.0	58.7	27.4
MGA_1315	LOCUS_13130	sequence3:1099480..1100265(+)	partial			WP_013389859.1	phage antirepressor Ant	31.8	31.8	37.6
MGA_1316	LOCUS_13140	sequence3:1101323..1102531(-)	partial			WP_000323332.1	hypothetical protein	69.9	58.8	30.0
MGA_1340	LOCUS_13380	sequence3:1121988..1125284(-)	frameshift		1122026	WP_164930803.1	IGHMBP2 family helicase	38.2	83.5	24.6
MGA_1357	LOCUS_13550	sequence3:1145879..1146208(+)	partial			WP_002852445.1	hypothetical protein	100.0	73.3	61.8
MGA_1364	LOCUS_13620	sequence3:1152593..1152892(+)	partial			WP_002852583.1	hypothetical protein	75.8	74.3	64.0
MGA_1365	LOCUS_13630	sequence3:1152879..1153502(-)	frameshift		1153521	WP_002857950.1	DUF2920 family protein	98.1	52.2	42.7
MGA_1366	LOCUS_13640	sequence3:1153510..1154070(-)	frameshift		1153539	WP_002857950.1	DUF2920 family protein	96.2	44.6	44.2
MGA_1394	LOCUS_13920	sequence3:1185418..1186071(-)	partial			WP_012258297.1	DUF305 domain-containing protein	67.3	73.1	28.8
MGA_1402	LOCUS_14000	sequence3:1192226..1192849(-)	partial			WP_002858405.1	DUF2972 domain-containing protein	95.2	30.7	33.0
MGA_1415	LOCUS_14130	sequence3:1202924..1203724(-)	partial			WP_002858405.1	DUF2972 domain-containing protein	74.4	30.9	30.0
MGA_1435	LOCUS_14330	sequence3:1219879..1220916(-)	frameshift		1220944	WP_010883927.1	DNA methyltransferase	100.0	32.6	29.6
MGA_1436	LOCUS_14340	sequence3:1220921..1223068(-)	frameshift		1220947	WP_010883927.1	DNA methyltransferase	95.4	63.7	35.2
MGA_1489	LOCUS_14870	sequence3:1276267..1276554(+)	frameshift		1276752,1276524,1276806	WP_002864507.1	MATE family efflux transporter	89.5	19.9	59.1
MGA_1490	LOCUS_14880	sequence3:1276527..1276793(+)	frameshift		1276752,1276524,1276806,1276872	WP_002864507.1	MATE family efflux transporter	84.1	16.7	55.4
MGA_1491	LOCUS_14890	sequence3:1276967..1277377(+)	frameshift		1276808,1276874,1276763	WP_002864507.1	MATE family efflux transporter	93.4	28.7	43.3
MGA_1499	LOCUS_14970	sequence3:1284606..1285202(-)	frameshift		1285272	WP_002857976.1	class I SAM-dependent methyltransferase	100.0	78.3	87.4
MGA_1500	LOCUS_14980	sequence3:1285249..1285389(-)	frameshift		1285272	WP_002857976.1	class I SAM-dependent methyltransferase	84.8	15.4	82.1
MGA_1506	LOCUS_15040	sequence3:1290162..1291604(+)	internal_stop_codon	1291602..1291604(+)		WP_209611508.1	FAD-binding and (Fe-S)-binding domain-containing protein	99.2	51.5	53.0
MGA_1507	LOCUS_15050	sequence3:1291641..1292951(+)	internal_stop_codon	1291602..1291604(+)		WP_209611508.1	FAD-binding and (Fe-S)-binding domain-containing protein	98.9	45.9	47.1
MGA_1567	LOCUS_15650	sequence3:1359095..1360687(-)	frameshift		1360796	WP_010891905.1	LTA synthase family protein	99.2	81.4	47.7
MGA_1568	LOCUS_15660	sequence3:1360776..1361039(-)	frameshift		1360796	WP_010891905.1	LTA synthase family protein	88.5	12.0	57.0
MGA_1644	LOCUS_16420	sequence3:1432431..1433015(-)	frameshift		1433058	WP_002857950.1	DUF2920 family protein	98.5	49.0	37.9
MGA_1645	LOCUS_16430	sequence3:1433056..1433607(-)	frameshift		1433073	WP_010891921.1	DUF2920 family protein	95.6	44.0	46.1
MGA_1659	LOCUS_16570	sequence3:1443339..1443521(-)	partial			WP_002851842.1	cytochrome c	83.3	36.2	56.9
MGA_1701	LOCUS_16990	sequence3:1481766..1481921(-)	frameshift,internal_stop_codon	1481948..1481950(-)	1481950	WP_001024629.1	site-specific DNA-methyltransferase	78.4	13.9	70.0
MGA_1702	LOCUS_17000	sequence3:1481930..1482478(-)	frameshift,internal_stop_codon	1481948..1481950(-)	1481950,1482479	WP_001024629.1	site-specific DNA-methyltransferase	94.5	62.7	68.3
MGA_1703	LOCUS_17010	sequence3:1482453..1482665(-)	frameshift		1482479	WP_001024629.1	site-specific DNA-methyltransferase	70.0	17.1	65.3
MGA_1715	LOCUS_17130	sequence3:1491472..1491978(-)	partial			WP_011578509.1	restriction endonuclease subunit S	91.1	40.7	30.1
MGA_1716	LOCUS_17140	sequence3:1492065..1494455(-)	frameshift		1494414	WP_011476616.1	N-6 DNA methylase	41.6	47.0	53.7
MGA_1717	LOCUS_17150	sequence3:1494388..1495452(-)	frameshift		1494411	WP_001045361.1	N-6 DNA methylase	98.9	51.1	37.7
MGA_1758	LOCUS_17560	sequence3:1533012..1534202(-)	partial			WP_010891922.1	motility associated factor glycosyltransferase family protein	98.5	60.4	47.0
MGA_1759	LOCUS_17570	sequence3:1534174..1534515(-)	frameshift		1534510	WP_010891924.1	flagellin modification protein PseD	95.6	16.5	61.1
MGA_1760	LOCUS_17580	sequence3:1534499..1535041(-)	frameshift		1534501	WP_010891922.1	motility associated factor glycosyltransferase family protein	99.4	29.0	44.1
MGA_1825	LOCUS_18230	sequence3:1594113..1594472(-)	frameshift		1594545	WP_002788888.1	methyltransferase domain-containing protein	100.0	53.1	59.7
MGA_1826	LOCUS_18240	sequence3:1594519..1594785(-)	frameshift		1594545	WP_002788888.1	methyltransferase domain-containing protein	98.9	38.8	67.8
MGA_1863	LOCUS_18610	sequence3:1627126..1627425(-)	partial			WP_002851255.1	hypothetical protein	74.7	70.5	45.9
MGA_1867	LOCUS_18650	sequence3:1633969..1634193(-)	partial			WP_002859764.1	DUF4492 domain-containing protein	85.1	70.8	52.4
MGA_1883	LOCUS_18810	sequence3:1651224..1652504(+)	partial			WP_010874555.1	adenine-specific methyltransferase EcoRI family protein	41.5	49.8	31.1
MGA_1893	LOCUS_18910	sequence3:1660418..1661308(+)	partial			WP_002805290.1	flagellar basal body rod modification protein	74.3	74.5	74.5
MGA_1921	LOCUS_19190	sequence3:1684310..1684621(-)	frameshift		1684672,1684786,1684735	WP_002851996.1	manganese efflux pump MntP family protein	98.1	54.5	67.6
MGA_1941	LOCUS_19390	sequence3:1706027..1706596(+)	partial			WP_012870274.1	restriction endonuclease subunit S	95.8	49.5	37.1
MGA_1942	LOCUS_19400	sequence3:1706636..1707223(+)	partial			WP_010933538.1	restriction endonuclease subunit S	99.5	40.9	54.6
MGA_1985	LOCUS_19830	sequence3:1751293..1751793(-)	partial			WP_011263153.1	NAD(P)H-dependent oxidoreductase	87.3	72.2	39.2
MGA_1990	LOCUS_19880	sequence3:1754827..1755876(+)	frameshift,internal_stop_codon	1755874..1755876(+)	1755897	WP_209021411.1	Dam family site-specific DNA-(adenine-N6)-methyltransferase	98.9	45.3	38.0
MGA_1991	LOCUS_19890	sequence3:1755873..1756805(+)	frameshift,internal_stop_codon	1755874..1755876(+)	1755897	WP_209021411.1	Dam family site-specific DNA-(adenine-N6)-methyltransferase	94.8	40.9	32.2
MGA_2010	LOCUS_20060	sequence5:1423..1662(-)	frameshift		1425	WP_013368641.1	ParA family partition ATPase	78.5	28.6	53.2
