# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_25	LOCUS_00250	sequence01:26251..26838(-)	frameshift		26962	WP_000014003.1	type I restriction-modification system specificity subunit	94.9	40.0	23.7
MGA_26	LOCUS_00260	sequence01:26936..27541(-)	frameshift		26950	WP_081447092.1	restriction endonuclease subunit S	97.0	49.1	31.3
MGA_27	LOCUS_00270	sequence01:27541..29460(-)	partial			WP_000350101.1	class I SAM-dependent DNA methyltransferase	85.4	71.5	48.7
MGA_38	LOCUS_00380	sequence01:42318..42530(+)	partial			WP_002852798.1	cbb3-type cytochrome oxidase assembly protein CcoS	74.3	76.5	75.0
MGA_46	LOCUS_00460	sequence01:48910..50424(-)	frameshift		50644	WP_002858405.1	DUF2972 domain-containing protein	99.8	82.1	29.7
MGA_88	LOCUS_00880	sequence01:88976..90697(+)	partial			WP_014659976.1	hypothetical protein	98.3	57.3	49.6
MGA_91	LOCUS_00910	sequence01:91315..92199(+)	partial			WP_014659976.1	hypothetical protein	99.0	32.5	42.4
MGA_111	LOCUS_01110	sequence01:108883..111240(-)	partial			WP_002852780.1	undecaprenyl-diphosphooligosaccharide--protein glycotransferase	54.4	59.7	64.2
MGA_120	LOCUS_01200	sequence01:119767..120939(+)	frameshift,internal_stop_codon	120937..120939(+)	120942	WP_002858148.1	glycosyltransferase	99.7	75.7	62.6
MGA_121	LOCUS_01210	sequence01:120932..121297(+)	frameshift,internal_stop_codon	120937..120939(+)	120942	WP_002858148.1	glycosyltransferase	94.2	22.1	62.3
MGA_123	LOCUS_01230	sequence01:122359..122673(-)	partial			WP_002852929.1	flagellar assembly protein FlgQ	99.0	70.5	61.9
MGA_144	LOCUS_01440	sequence01:144312..145496(-)	partial			WP_011707827.1	glycosyltransferase family 8 protein	56.1	56.3	27.4
MGA_177	LOCUS_01770	sequence01:177821..179239(-)	partial			WP_002852900.1	hypothetical protein	45.1	38.7	50.5
MGA_191	LOCUS_01910	sequence01:192612..192932(+)	frameshift		192586,192610,192919	WP_002864548.1	inorganic phosphate transporter	98.1	20.5	88.5
MGA_192	LOCUS_01920	sequence01:192989..193537(+)	frameshift		193520,192917,193638	WP_002864548.1	inorganic phosphate transporter	98.4	36.4	73.5
MGA_193	LOCUS_01930	sequence01:193655..194017(+)	frameshift		193640,193525,193967	WP_002864548.1	inorganic phosphate transporter	83.3	19.7	92.0
MGA_201	LOCUS_02010	sequence01:200663..204592(+)	partial			WP_001034100.1	serine protease autotransporter EspP	54.2	54.3	31.6
MGA_245	LOCUS_02430	sequence02:6810..7049(-)	frameshift,internal_stop_codon	7055..7057(-)	7057	WP_002852402.1	DUF234 domain-containing protein	100.0	27.1	64.6
MGA_246	LOCUS_02440	sequence02:7004..7630(-)	frameshift,internal_stop_codon	7055..7057(-)	7057	WP_002852402.1	DUF234 domain-containing protein	93.3	67.5	53.8
MGA_256	LOCUS_02540	sequence02:14499..14918(-)	frameshift		15022	WP_011266513.1	hypothetical protein	98.6	65.2	39.4
MGA_273	LOCUS_02710	sequence02:30035..30880(+)	partial			WP_013224688.1	hypothetical protein	73.0	74.1	28.8
MGA_298	LOCUS_02960	sequence02:52551..54509(-)	partial			WP_147373209.1	methionyl-tRNA formyltransferase	35.1	75.2	32.3
MGA_333	LOCUS_03300	sequence03:24256..24822(+)	frameshift		24813	WP_002852070.1	sodium-dependent transporter	100.0	42.1	80.9
MGA_334	LOCUS_03310	sequence03:24819..25289(+)	frameshift		25272,25416,24813	WP_002852070.1	sodium-dependent transporter	91.7	32.2	83.3
MGA_335	LOCUS_03320	sequence03:25377..25580(+)	frameshift		25415,25271	WP_002852070.1	sodium-dependent transporter	94.0	14.1	58.7
MGA_346	LOCUS_03430	sequence03:34663..34824(-)	frameshift		34997	WP_002858595.1	hypothetical protein	98.1	36.1	61.5
MGA_394	LOCUS_03890	sequence04:17287..17982(+)	frameshift,internal_stop_codon	17914..17916(+)	17907	WP_002858290.1	alpha-2,3-sialyltransferase	89.2	72.4	48.1
MGA_396	LOCUS_03910	sequence04:19204..19962(+)	frameshift		19878,19983	WP_002858400.1	UDP-N-acetylglucosamine 2-epimerase	93.3	63.1	74.5
MGA_398	LOCUS_03930	sequence04:20323..20994(+)	partial			WP_002864821.1	acylneuraminate cytidylyltransferase	96.0	39.7	73.4
MGA_416	LOCUS_04110	sequence04:37654..39984(-)	partial			WP_011964266.1	DUF262 domain-containing protein	47.3	46.7	33.0
MGA_419	LOCUS_04140	sequence05:414..1163(+)	partial			WP_002858405.1	DUF2972 domain-containing protein	96.4	33.8	31.7
MGA_420	LOCUS_04150	sequence05:1144..1779(+)	partial			WP_002858405.1	DUF2972 domain-containing protein	94.8	32.0	29.1
MGA_453	LOCUS_04480	sequence05:33722..33979(+)	partial			WP_002851511.1	ABC-type transport auxiliary lipoprotein family protein	96.5	42.2	40.7
MGA_472	LOCUS_04650	sequence06:6064..7572(+)	partial			WP_002858440.1	capsule biosynthesis protein CapA	17.5	17.4	41.6
MGA_490	LOCUS_04830	sequence06:24892..25308(-)	frameshift		25388	WP_209611508.1	FAD-binding and (Fe-S)-binding domain-containing protein	100.0	14.8	47.1
MGA_491	LOCUS_04840	sequence06:25359..25580(-)	frameshift		25594,25390	WP_209611508.1	FAD-binding and (Fe-S)-binding domain-containing protein	86.3	6.8	56.2
MGA_493	LOCUS_04860	sequence06:25849..26103(-)	frameshift		26104,25905	WP_209611508.1	FAD-binding and (Fe-S)-binding domain-containing protein	81.0	10.1	46.9
MGA_494	LOCUS_04870	sequence06:26048..26323(-)	frameshift,internal_stop_codon	26408..26410(-)	26104,25908	WP_002851210.1	FAD-binding and (Fe-S)-binding domain-containing protein	75.8	7.7	52.1
MGA_495	LOCUS_04880	sequence06:26408..27130(-)	internal_stop_codon	26408..26410(-)		WP_209611508.1	FAD-binding and (Fe-S)-binding domain-containing protein	91.7	24.0	47.6
MGA_496	LOCUS_04890	sequence06:27130..27378(-)	partial			WP_209611508.1	FAD-binding and (Fe-S)-binding domain-containing protein	86.6	7.5	59.2
MGA_504	LOCUS_04970	sequence06:33389..33985(+)	frameshift		33306	WP_002857976.1	class I SAM-dependent methyltransferase	100.0	78.3	86.9
MGA_515	LOCUS_05080	sequence07:3641..4867(-)	partial			WP_001141540.1	DUF5710 domain-containing protein	88.7	27.5	29.5
MGA_521	LOCUS_05140	sequence07:8889..14696(-)	partial			WP_011861367.1	DEAD/DEAH box helicase family protein	77.8	48.8	34.0
MGA_535	LOCUS_05280	sequence07:24299..24997(-)	partial			WP_010622329.1	Rha family transcriptional regulator	38.8	37.0	37.8
MGA_546	LOCUS_05390	sequence07:31975..32535(-)	partial			WP_000129024.1	Rha family phage regulatory protein	65.6	35.9	40.2
MGA_556	LOCUS_05490	sequence08:5842..6204(-)	partial			WP_001052085.1	DUF3883 domain-containing protein	57.5	27.4	43.5
MGA_560	LOCUS_05530	sequence08:8662..9024(-)	partial			WP_002857889.1	FkbM family methyltransferase	99.2	43.8	51.6
MGA_561	LOCUS_05540	sequence08:8991..9338(-)	partial			WP_002857889.1	FkbM family methyltransferase	92.2	38.2	38.0
MGA_565	LOCUS_05580	sequence08:12450..12812(-)	partial			WP_002864204.1	hypothetical protein	77.5	30.2	57.0
MGA_574	LOCUS_05670	sequence08:23625..24110(+)	partial			WP_209611440.1	DNA cytosine methyltransferase	93.2	46.1	58.9
MGA_582	LOCUS_05750	sequence08:31437..32489(+)	partial			WP_010891936.1	ATP-grasp fold amidoligase family protein	91.7	40.2	44.3
MGA_586	LOCUS_05780	sequence09:1..548(+)	partial			WP_009881803.1	methyl-accepting chemotaxis protein	100.0	27.5	85.1
MGA_595	LOCUS_05870	sequence09:8627..9619(+)	partial			WP_002858440.1	capsule biosynthesis protein CapA	33.6	19.1	38.3
MGA_603	LOCUS_05950	sequence09:14419..15084(-)	partial			WP_000346779.1	site-specific DNA-methyltransferase	93.2	57.7	54.6
MGA_625	LOCUS_06150	sequence10:3357..3632(-)	frameshift,internal_stop_codon	3610..3612(-)	3640,3579,3758	WP_000046401.1	HAAAP family serine/threonine permease	74.7	16.5	57.4
MGA_626	LOCUS_06160	sequence10:3747..4178(-)	frameshift,internal_stop_codon	3610..3612(-)	3640,3761,3582	WP_000046401.1	HAAAP family serine/threonine permease	96.5	33.2	50.7
MGA_627	LOCUS_06170	sequence10:4211..4588(-)	partial			WP_002215443.1	HAAAP family serine/threonine permease	78.4	22.6	54.1
MGA_631	LOCUS_06210	sequence10:7667..8359(+)	frameshift		8385,8499	WP_002864082.1	Na+/H+ antiporter family protein	99.1	52.4	71.5
MGA_655	LOCUS_06450	sequence10:25519..25854(+)	partial			WP_002858833.1	DNA topoisomerase (ATP-hydrolyzing) subunit B	88.3	12.7	85.7
MGA_657	LOCUS_06460	sequence11:1258..1449(-)	frameshift		1263	WP_009881974.1	methyl-accepting chemotaxis protein	85.7	8.1	53.7
MGA_668	LOCUS_06570	sequence11:8346..8594(+)	partial			WP_002670476.1	hemerythrin family protein	76.8	47.4	38.5
MGA_676	LOCUS_06650	sequence11:14863..15264(+)	frameshift		14867,15243	WP_012775452.1	adenylate kinase	98.5	77.1	45.1
MGA_678	LOCUS_06670	sequence11:15588..16028(+)	frameshift		16019	WP_164979579.1	AAA domain-containing protein	77.4	12.7	50.0
MGA_679	LOCUS_06680	sequence11:16031..17581(+)	frameshift		17561,17733,16022	WP_164979579.1	AAA domain-containing protein	100.0	58.0	39.3
MGA_680	LOCUS_06690	sequence11:17719..17901(+)	frameshift,internal_stop_codon	17899..17901(+)	17732,17557	WP_164979579.1	AAA domain-containing protein	90.0	5.9	48.1
MGA_684	LOCUS_06730	sequence11:22643..23128(-)	partial			WP_002857889.1	FkbM family methyltransferase	98.8	56.9	44.1
MGA_718	LOCUS_07050	sequence12:27772..28791(-)	partial			WP_002857891.1	capsular polysaccharide biosynthesis protein	97.3	48.6	63.0
MGA_739	LOCUS_07250	sequence12:48101..48436(-)	frameshift,internal_stop_codon	48534..48536(-)	48530	WP_002852073.1	YafY family protein	96.4	36.9	72.0
MGA_740	LOCUS_07260	sequence12:48534..48983(-)	frameshift,internal_stop_codon	48534..48536(-)	48530	WP_002852073.1	YafY family protein	100.0	51.4	75.2
MGA_744	LOCUS_07300	sequence12:50569..53589(-)	partial			WP_121523862.1	DUF87 domain-containing protein	56.1	53.5	33.1
MGA_748	LOCUS_07340	sequence12:55216..56607(-)	frameshift		56807	WP_000258489.1	hypothetical protein	98.7	57.2	36.4
MGA_749	LOCUS_07350	sequence12:56796..57455(-)	frameshift		56807	WP_000258489.1	hypothetical protein	93.6	25.6	38.2
MGA_751	LOCUS_07370	sequence12:58288..59511(-)	partial			WP_051618796.1	GTP pyrophosphokinase family protein	65.1	65.5	28.7
MGA_762	LOCUS_07480	sequence12:69326..69502(-)	frameshift		69561,69661	WP_002864362.1	hypothetical protein	100.0	20.4	89.7
MGA_763	LOCUS_07490	sequence12:69803..70162(-)	frameshift,internal_stop_codon	69803..69805(-)	69561,69661	WP_002864362.1	hypothetical protein	100.0	41.9	77.3
MGA_767	LOCUS_07530	sequence12:72042..72980(+)	partial			WP_010891834.1	hypothetical protein	41.0	66.1	28.2
MGA_797	LOCUS_07830	sequence12:103005..103598(+)	partial			WP_012870274.1	restriction endonuclease subunit S	92.9	51.1	35.4
MGA_798	LOCUS_07840	sequence12:103601..104179(+)	frameshift		103553	WP_002352261.1	restriction endonuclease subunit S	98.4	31.2	51.3
MGA_827	LOCUS_08130	sequence12:121280..121684(-)	partial			WP_002851214.1	50S ribosomal protein L22	77.6	73.8	94.2
MGA_852	LOCUS_08380	sequence12:142459..143355(+)	partial			WP_209021411.1	Dam family site-specific DNA-(adenine-N6)-methyltransferase	97.3	41.6	37.3
MGA_859	LOCUS_08450	sequence12:148609..150789(-)	partial			WP_002852395.1	flagellin A	42.8	54.0	50.5
MGA_862	LOCUS_08480	sequence12:154044..154214(-)	frameshift		154049	WP_002216166.1	GIY-YIG nuclease family protein	91.1	54.3	54.9
MGA_867	LOCUS_08530	sequence12:162683..163642(+)	partial			WP_002858440.1	capsule biosynthesis protein CapA	55.2	27.0	29.6
MGA_874	LOCUS_08600	sequence12:173603..174652(+)	frameshift,internal_stop_codon	174650..174652(+)	174679	WP_209021411.1	Dam family site-specific DNA-(adenine-N6)-methyltransferase	98.9	45.3	38.3
MGA_875	LOCUS_08610	sequence12:174649..175581(+)	frameshift,internal_stop_codon	174650..174652(+)	174679	WP_209021411.1	Dam family site-specific DNA-(adenine-N6)-methyltransferase	94.8	40.9	32.9
MGA_882	LOCUS_08680	sequence13:1..1030(+)	partial			WP_002858032.1	AMP-binding protein	98.8	67.3	69.4
MGA_911	LOCUS_08960	sequence14:6075..6626(+)	partial			WP_209612115.1	hypothetical protein	45.9	30.5	38.8
MGA_960	LOCUS_09410	sequence17:6353..8416(-)	partial			WP_083774549.1	restriction endonuclease subunit S	50.1	79.1	28.5
MGA_961	LOCUS_09420	sequence17:8409..10502(-)	partial			WP_011071650.1	N-6 DNA methylase	71.0	78.7	26.0
MGA_963	LOCUS_09430	sequence18:841..1128(-)	partial			WP_010891893.1	DNA translocase FtsK	97.9	10.1	51.0
MGA_978	LOCUS_09550	sequence20:3749..4639(+)	partial			WP_039851149.1	hypothetical protein	71.3	81.7	34.0
MGA_1025	LOCUS_09970	sequence23:35199..35870(+)	partial			WP_048065707.1	AzlC family ABC transporter permease	77.1	62.0	43.6
MGA_1043	LOCUS_10150	sequence23:51874..52191(+)	frameshift		52176	WP_006995241.1	dipeptidase PepE	59.0	25.6	56.5
MGA_1044	LOCUS_10160	sequence23:52184..52687(+)	frameshift		52176	WP_006995241.1	dipeptidase PepE	100.0	70.5	54.2
MGA_1046	LOCUS_10180	sequence23:53405..54028(-)	partial			WP_000511506.1	protein-disulfide oxidoreductase DsbI	72.0	71.3	42.1
MGA_1087	LOCUS_10590	sequence23:93333..94376(-)	partial			WP_011578509.1	restriction endonuclease subunit S	44.7	39.4	37.3
MGA_1088	LOCUS_10600	sequence23:94366..96294(-)	partial			WP_011476616.1	N-6 DNA methylase	72.7	57.2	24.6
MGA_1093	LOCUS_10650	sequence23:100416..100598(-)	partial			WP_002852403.1	lipoprotein	88.3	74.7	58.9
MGA_1121	LOCUS_10930	sequence23:126348..126557(-)	partial			WP_000233875.1	site-specific DNA-methyltransferase	69.6	17.3	68.8
MGA_1130	LOCUS_11020	sequence23:132660..133493(+)	frameshift		133412	WP_011962872.1	type I restriction endonuclease	92.4	71.5	43.0
MGA_1134	LOCUS_11060	sequence23:134322..135683(-)	partial			WP_000162279.1	ATP-binding protein	90.3	73.0	31.1
MGA_1140	LOCUS_11120	sequence23:139738..140913(-)	partial			WP_025163903.1	DUF262 domain-containing protein	34.3	37.2	28.3
MGA_1141	LOCUS_11130	sequence23:140926..141438(-)	partial			WP_196835716.1	adenine-specific methyltransferase EcoRI family protein	76.5	33.8	38.2
MGA_1142	LOCUS_11140	sequence23:141720..142169(-)	partial			WP_196835716.1	adenine-specific methyltransferase EcoRI family protein	59.7	20.3	40.9
MGA_1162	LOCUS_11340	sequence23:156311..156772(-)	frameshift		156833	WP_002816243.1	DUF452 family protein	98.7	76.4	51.6
MGA_1163	LOCUS_11350	sequence23:156887..157420(-)	frameshift		157592,157433	WP_002816245.1	pyridoxal phosphate-dependent aminotransferase family protein	99.4	47.1	65.9
MGA_1164	LOCUS_11360	sequence23:157360..157563(-)	frameshift		157592,157433	WP_002816245.1	pyridoxal phosphate-dependent aminotransferase family protein	64.2	11.3	55.8
MGA_1165	LOCUS_11370	sequence23:157539..158009(-)	frameshift		157595,157436	WP_002816245.1	pyridoxal phosphate-dependent aminotransferase family protein	88.5	36.6	67.6
MGA_1178	LOCUS_11450	sequence29:340..918(-)	frameshift		348	WP_002864247.1	DUF2920 family protein	99.0	45.8	47.1
MGA_1198	LOCUS_11630	sequence34:16413..18878(-)	partial			WP_052729532.1	DNA methyltransferase	24.8	22.4	30.9
MGA_1290	LOCUS_12550	sequence34:112087..113343(+)	partial			WP_080803342.1	DNA cytosine methyltransferase	29.4	36.3	43.5
MGA_1302	LOCUS_12670	sequence34:124954..126423(-)	frameshift		126643	WP_002858443.1	DUF2972 domain-containing protein	99.2	83.0	41.0
MGA_1317	LOCUS_12820	sequence34:140320..140610(+)	partial			WP_002864146.1	hypothetical protein	76.0	20.2	59.3
MGA_1396	LOCUS_13570	sequence38:68658..70151(-)	partial			WP_000057937.1	methyl-accepting chemotaxis protein	55.7	47.9	28.8
MGA_1405	LOCUS_13660	sequence38:81786..82691(+)	partial			WP_011017006.1	sugar phosphate nucleotidyltransferase	98.3	53.6	41.1
MGA_1476	LOCUS_14360	sequence39:22366..22731(+)	partial			WP_005466243.1	glycosyltransferase family 25 protein	88.4	38.1	35.5
MGA_1490	LOCUS_14500	sequence39:38888..39169(+)	frameshift		39160	WP_003245409.1	UxaA family hydrolase	82.8	16.3	48.1
MGA_1522	LOCUS_14820	sequence39:76172..76660(-)	frameshift		76671	WP_002858642.1	putative metalloprotease CJM1_0395 family protein	95.7	63.2	60.6
MGA_1526	LOCUS_14860	sequence39:77890..78573(-)	partial			WP_002858716.1	membrane protein	99.1	71.4	46.3
MGA_1528	LOCUS_14880	sequence39:80821..81150(-)	frameshift		81091,81149	WP_010891922.1	motility associated factor glycosyltransferase family protein	77.1	12.9	40.5
MGA_1529	LOCUS_14890	sequence39:81117..82763(-)	frameshift,internal_stop_codon	82773..82775(-)	81091,81149	WP_010891922.1	motility associated factor glycosyltransferase family protein	95.6	82.4	46.1
MGA_1537	LOCUS_14970	sequence39:90625..91233(+)	partial			WP_011964364.1	DNA (cytosine-5-)-methyltransferase	78.2	38.1	59.9
MGA_1542	LOCUS_15020	sequence39:92602..93156(-)	partial			WP_209612115.1	hypothetical protein	44.6	29.4	41.5
MGA_1552	LOCUS_15110	sequence40:8438..8941(-)	frameshift		9066	WP_002857950.1	DUF2920 family protein	98.2	42.3	35.7
MGA_1553	LOCUS_15120	sequence40:9022..9615(-)	frameshift		9090	WP_010891921.1	DUF2920 family protein	91.9	48.1	46.0
MGA_1557	LOCUS_15160	sequence40:10582..10854(-)	frameshift		10868	WP_011460936.1	cytochrome b/b6 domain-containing protein	88.9	31.9	56.2
MGA_1558	LOCUS_15170	sequence40:10842..11252(-)	frameshift		10868	WP_011460936.1	cytochrome b/b6 domain-containing protein	95.6	51.8	46.9
MGA_1560	LOCUS_15190	sequence40:11376..12185(-)	frameshift		11522,11390	WP_011460935.1	4Fe-4S dicluster domain-containing protein	71.0	57.6	55.1
MGA_1601	LOCUS_15600	sequence40:48559..48741(+)	partial			WP_002851842.1	cytochrome c	80.0	34.8	61.2
MGA_1634	LOCUS_15930	sequence40:77458..78993(+)	partial			WP_002851181.1	DNA primase	85.5	71.9	35.6
MGA_1679	LOCUS_16370	sequence41:34858..36138(-)	partial			WP_010874555.1	adenine-specific methyltransferase EcoRI family protein	48.1	58.6	30.2
MGA_1693	LOCUS_16510	sequence41:51954..52484(-)	partial			WP_002864362.1	hypothetical protein	93.8	58.1	77.0
MGA_1697	LOCUS_16550	sequence41:55207..55431(+)	partial			WP_002859764.1	DUF4492 domain-containing protein	85.1	70.8	58.7
MGA_1701	LOCUS_16590	sequence41:62022..62282(+)	partial			WP_002851255.1	hypothetical protein	86.0	70.5	41.9
MGA_1751	LOCUS_17080	sequence42:44257..44487(+)	frameshift,internal_stop_codon	44485..44487(+)	44607	WP_010964898.1	anion permease	98.7	15.8	58.7
MGA_1752	LOCUS_17090	sequence42:44615..44842(+)	frameshift,internal_stop_codon	44485..44487(+)	44824,44876,45110,44598	WP_003689366.1	DASS family sodium-coupled anion symporter	68.0	10.5	56.9
MGA_1762	LOCUS_17190	sequence42:53571..54119(+)	partial			WP_002858405.1	DUF2972 domain-containing protein	98.9	28.0	30.0
