# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_11	LOCUS_00100	sequence001:8467..8937(-)	frameshift		8978	WP_010891841.1	class I SAM-dependent methyltransferase	99.4	62.8	60.6
MGA_12	LOCUS_00110	sequence001:8958..9161(-)	frameshift		8978	WP_010891841.1	class I SAM-dependent methyltransferase	100.0	27.1	74.6
MGA_30	LOCUS_00280	sequence002:1..840(+)	partial			WP_012258754.1	NADH-quinone oxidoreductase subunit NuoG	30.5	9.0	45.3
MGA_31	LOCUS_00290	sequence002:837..2111(+)	partial			WP_011964314.1	NADH-quinone oxidoreductase subunit NuoH	69.3	83.1	40.5
MGA_37	LOCUS_00350	sequence002:6660..8066(+)	partial			WP_010941019.1	NADH-quinone oxidoreductase subunit N	73.5	72.7	33.1
MGA_55	LOCUS_00530	sequence003:5181..6146(-)	partial			WP_010891843.1	putative transporter	83.8	70.1	61.2
MGA_69	LOCUS_00670	sequence003:16057..17616(-)	partial			WP_002229415.1	class I SAM-dependent methyltransferase	70.7	71.0	35.2
MGA_80	LOCUS_00780	sequence004:5048..5251(+)	partial			WP_012047923.1	hydroxylamine reductase	85.1	9.8	49.1
MGA_96	LOCUS_00940	sequence004:16505..17131(+)	frameshift		17122	WP_004525821.1	tyrosine-type recombinase/integrase	86.1	45.5	31.0
MGA_97	LOCUS_00950	sequence004:17290..17508(+)	partial			WP_013530181.1	integrase arm-type DNA-binding domain-containing protein	93.1	15.9	46.3
MGA_109	LOCUS_01050	sequence005:4949..6292(-)	partial			WP_002865311.1	methyl-accepting chemotaxis protein	74.0	55.9	26.9
MGA_117	LOCUS_01130	sequence005:14935..15069(-)	partial			WP_002776864.1	50S ribosomal protein L34	72.7	72.7	90.6
MGA_120	LOCUS_01150	sequence006:1..541(+)	partial			WP_002857707.1	multidrug effflux MFS transporter	97.2	43.5	50.6
MGA_125	LOCUS_01200	sequence006:4678..6159(+)	partial			WP_010891831.1	flagellar hook-length control protein FliK	93.3	69.2	30.7
MGA_128	LOCUS_01230	sequence006:8686..9021(+)	partial			WP_003813638.1	MGMT family protein	72.1	75.5	50.0
MGA_133	LOCUS_01280	sequence006:15145..>16116(-)	partial			WP_002853102.1	CTP synthase	99.4	59.1	69.8
MGA_148	LOCUS_01410	sequence008:1..2904(+)	partial			WP_002858452.1	S8 family serine peptidase	52.4	46.4	45.6
MGA_151	LOCUS_01440	sequence008:4542..5345(+)	partial			WP_011201897.1	glycosyltransferase family 2 protein	82.8	62.6	39.8
MGA_177	LOCUS_01680	sequence009:12045..>12574(-)	partial			WP_000716331.1	substrate-binding domain-containing protein	96.6	58.7	48.3
MGA_178	LOCUS_01690	sequence010:1..554(+)	partial			WP_005481251.1	GGDEF domain-containing protein	80.9	31.1	26.4
MGA_183	LOCUS_01740	sequence010:5891..6493(+)	partial			WP_011704306.1	putative metalloprotease CJM1_0395 family protein	70.0	53.2	41.5
MGA_191	LOCUS_01820	sequence010:11429..>12172(-)	partial			WP_002864614.1	excinuclease ABC subunit UvrC	98.8	40.7	57.0
MGA_204	LOCUS_01950	sequence011:10947..11471(-)	partial			WP_003863794.1	TIGR00730 family Rossman fold protein	98.3	68.0	42.5
MGA_205	LOCUS_01960	sequence011:11468..>12135(-)	partial			WP_010891948.1	bifunctional diaminohydroxyphosphoribosylaminopyrimidine deaminase/5-amino-6-(5-phosphoribosylamino)uracil reductase RibD	91.9	59.8	41.0
MGA_240	LOCUS_02280	sequence013:9347..9895(+)	partial			WP_000345576.1	protein-disulfide oxidoreductase DsbI	84.1	70.2	42.4
MGA_256	LOCUS_02400	sequence015:332..751(-)	partial			WP_002855217.1	hypothetical protein	95.0	73.6	39.4
MGA_258	LOCUS_02420	sequence015:1034..3193(-)	partial			WP_010891893.1	DNA translocase FtsK	79.6	61.4	65.1
MGA_283	LOCUS_02640	sequence017:7850..9256(-)	partial			WP_102756879.1	BspA family leucine-rich repeat surface protein	55.8	40.8	36.3
MGA_321	LOCUS_02970	sequence021:5247..5456(+)	partial			WP_010989439.1	zinc ribbon domain-containing protein YjdM	97.1	60.4	61.2
MGA_343	LOCUS_03160	sequence023:4334..4804(-)	partial			WP_002852972.1	flagellar assembly lipoprotein FlgP	79.5	72.5	68.5
MGA_357	LOCUS_03290	sequence024:8628..9596(-)	partial			WP_012546793.1	2-isopropylmalate synthase	94.7	59.9	52.8
MGA_375	LOCUS_03460	sequence027:1..589(+)	partial			WP_010891825.1	RluA family pseudouridine synthase	99.5	56.3	43.8
MGA_389	LOCUS_03590	sequence028:4728..4955(-)	partial			WP_002851307.1	cytochrome c oxidase, cbb3-type, CcoQ subunit	74.7	64.4	53.6
MGA_394	LOCUS_03640	sequence029:1..809(+)	partial			WP_002919663.1	flagellar hook-length control protein FliK	88.4	33.9	35.1
MGA_409	LOCUS_03780	sequence030:8194..>8877(-)	partial			WP_010879949.1	GGDEF domain-containing protein	78.9	43.2	35.8
MGA_426	LOCUS_03940	sequence032:2777..3451(-)	partial			WP_004188272.1	CDP-alcohol phosphatidyltransferase family protein	41.1	41.0	31.6
MGA_431	LOCUS_03990	sequence032:7987..>8498(-)	partial			WP_011706120.1	bifunctional 2-methylcitrate dehydratase/aconitate hydratase	97.6	34.3	63.0
MGA_439	LOCUS_04060	sequence033:6447..8165(+)	partial			WP_005478689.1	EAL domain-containing protein	33.7	25.5	31.9
MGA_453	LOCUS_04160	sequence035:261..506(-)	partial			WP_002852414.1	AtpZ/AtpI family protein	97.5	72.5	58.2
MGA_481	LOCUS_04390	sequence038:31..828(-)	partial			WP_002856962.1	molybdopterin molybdotransferase MoeA	97.7	66.6	52.1
MGA_497	LOCUS_04540	sequence039:5254..>7423(-)	partial			WP_002858661.1	carbamoyl-phosphate synthase large subunit	99.9	66.7	67.9
MGA_567	LOCUS_05150	sequence047:5951..6346(+)	internal_stop_codon	6344..6346(+)		WP_002852492.1	Holliday junction branch migration protein RuvA	100.0	72.1	60.6
MGA_575	LOCUS_05210	sequence048:5103..5678(+)	frameshift,internal_stop_codon	5676..5678(+)	5759	WP_000775280.1	DUF3519 domain-containing protein	41.9	7.5	43.8
MGA_582	LOCUS_05270	sequence049:3531..3860(+)	partial			WP_002026021.1	arsenical resistance operon transcriptional regulator ArsR	68.8	74.3	46.7
MGA_587	LOCUS_05310	sequence050:32..1183(+)	partial			WP_011038245.1	ATP-binding protein	65.8	23.6	30.4
MGA_588	LOCUS_05320	sequence050:1370..1708(+)	frameshift		1712,1800,1834,1702	WP_000080564.1	DEAD/DEAH box helicase	98.2	10.1	31.0
MGA_589	LOCUS_05330	sequence050:1744..2169(+)	frameshift		2149,1702	WP_011268772.1	ATP-binding protein	73.0	10.0	35.5
MGA_590	LOCUS_05340	sequence050:2210..2500(+)	frameshift		2148	WP_011038245.1	ATP-binding protein	68.8	6.3	48.5
MGA_614	LOCUS_05550	sequence052:5864..>6697(-)	partial			WP_002851328.1	paralyzed flagella protein PflA	98.2	34.4	26.3
MGA_623	LOCUS_05630	sequence053:6047..>6598(-)	partial			WP_010943208.1	serine O-acetyltransferase	88.5	74.2	52.1
MGA_634	LOCUS_05730	sequence055:2196..4067(+)	partial			WP_011035470.1	site-specific DNA-methyltransferase	56.3	68.1	41.9
MGA_645	LOCUS_05810	sequence057:1484..2233(-)	partial			WP_002793288.1	ABC transporter ATP-binding protein	85.5	65.0	43.3
MGA_684	LOCUS_06130	sequence063:4696..5052(+)	partial			WP_116269310.1	tetratricopeptide repeat protein	81.4	22.3	49.0
MGA_694	LOCUS_06210	sequence064:5874..6323(-)	partial			WP_002853680.1	RdgB/HAM1 family non-canonical purine NTP pyrophosphatase	91.9	68.0	55.5
MGA_701	LOCUS_06270	sequence065:5608..6156(-)	partial			WP_005693201.1	HugZ family heme oxygenase	95.6	69.6	37.1
MGA_702	LOCUS_06280	sequence066:313..1218(-)	partial			WP_012584100.1	diguanylate cyclase	59.1	18.4	33.3
MGA_717	LOCUS_06420	sequence067:5537..>6209(-)	partial			WP_002852087.1	lytic transglycosylase domain-containing protein	76.7	48.7	41.2
MGA_725	LOCUS_06480	sequence069:11..1885(-)	partial			WP_002858440.1	capsule biosynthesis protein CapA	69.4	72.9	28.2
MGA_728	LOCUS_06510	sequence069:3884..5236(-)	partial			WP_010891936.1	ATP-grasp fold amidoligase family protein	98.2	56.3	51.1
MGA_729	LOCUS_06520	sequence069:5237..>6060(-)	partial			WP_002858210.1	UDP-galactopyranose mutase	98.5	73.1	72.1
MGA_731	LOCUS_06530	sequence070:531..1124(-)	frameshift,internal_stop_codon	531..533(-)	518	WP_002864247.1	DUF2920 family protein	99.5	46.0	36.6
MGA_736	LOCUS_06580	sequence070:5287..>6024(-)	partial			WP_002852810.1	FAD-linked oxidase C-terminal domain-containing protein	99.6	53.3	71.0
MGA_737	LOCUS_06590	sequence071:1..623(+)	partial			WP_002857221.1	DNA adenine methylase	99.0	55.6	58.3
MGA_745	LOCUS_06660	sequence072:1..195(+)	partial			WP_002779353.1	30S ribosomal protein S10	100.0	62.1	95.3
MGA_765	LOCUS_06840	sequence073:4396..>5860(-)	partial			WP_002858134.1	preprotein translocase subunit SecA	100.0	57.9	67.5
MGA_773	LOCUS_06900	sequence075:1..855(+)	partial			WP_002852404.1	periplasmic nitrate reductase subunit alpha	100.0	30.7	81.0
MGA_785	LOCUS_07010	sequence076:1928..3442(-)	partial			WP_012545463.1	type III-A CRISPR-associated protein Cas10/Csm1	50.4	32.5	27.7
MGA_787	LOCUS_07030	sequence076:4251..5477(-)	partial			WP_010871198.1	TIGR02221 family CRISPR-associated protein	99.8	67.4	33.0
MGA_814	LOCUS_07230	sequence080:3540..4013(+)	partial			WP_002853278.1	hypothetical protein	94.9	61.9	31.6
MGA_817	LOCUS_07250	sequence081:1..755(+)	partial			WP_002853860.1	M23 family metallopeptidase	100.0	62.2	57.6
MGA_827	LOCUS_07330	sequence082:4573..>5553(-)	partial			WP_002852456.1	murein biosynthesis integral membrane protein MurJ	98.8	67.3	41.3
MGA_835	LOCUS_07410	sequence083:4930..>5497(-)	partial			WP_002856044.1	AI-2E family transporter	98.4	53.3	49.7
MGA_854	LOCUS_07550	sequence087:39..479(-)	partial			WP_147367330.1	ABC transporter ATP-binding protein	95.2	53.3	37.3
MGA_856	LOCUS_07570	sequence087:1468..3522(-)	partial			WP_011963613.1	TonB-dependent receptor	24.0	23.0	33.1
MGA_857	LOCUS_07580	sequence087:3534..4493(-)	partial			WP_005810403.1	ABC transporter substrate-binding protein	49.2	43.2	37.3
MGA_883	LOCUS_07760	sequence092:610..1050(+)	partial			WP_002857391.1	molybdate ABC transporter permease subunit	97.9	63.8	58.0
MGA_891	LOCUS_07820	sequence093:3061..3195(+)	internal_stop_codon	3193..3195(+),3205..3207(+)		WP_001853304.1	ATP-dependent Clp endopeptidase proteolytic subunit ClpP	97.7	21.9	76.7
MGA_892	LOCUS_07830	sequence093:3262..3642(+)	internal_stop_codon	3193..3195(+),3205..3207(+)		WP_002806309.1	ATP-dependent Clp endopeptidase proteolytic subunit ClpP	100.0	64.9	74.6
MGA_907	LOCUS_07950	sequence096:35..310(+)	partial			WP_000163893.1	methionyl-tRNA formyltransferase	92.3	25.4	34.5
MGA_925	LOCUS_08090	sequence099:180..530(+)	partial			WP_001862740.1	preprotein translocase subunit SecG	79.3	46.2	58.7
MGA_937	LOCUS_08190	sequence100:2033..2344(+)	partial			WP_011390607.1	hypothetical protein	74.8	36.2	41.6
MGA_956	LOCUS_08340	sequence104:1..195(+)	partial			WP_002776330.1	hydrogenase nickel incorporation protein HypB	98.4	25.5	54.0
MGA_968	LOCUS_08440	sequence105:3968..4747(-)	partial			WP_002826316.1	molecular chaperone DnaK	100.0	41.6	80.3
MGA_969	LOCUS_08450	sequence106:1..557(+)	partial			WP_011072825.1	AI-2E family transporter	99.5	49.7	44.0
MGA_973	LOCUS_08490	sequence107:127..864(+)	partial			WP_002853029.1	tRNA guanosine(34) transglycosylase Tgt	99.6	65.4	73.4
MGA_978	LOCUS_08530	sequence108:1..776(+)	partial			WP_011020981.1	histidine--tRNA ligase	54.1	39.5	23.9
MGA_981	LOCUS_08560	sequence108:2461..2976(+)	partial			WP_001226637.1	MotE family protein	80.7	68.0	31.5
MGA_992	LOCUS_08640	sequence110:1..569(+)	partial			WP_000885323.1	2-oxoglutarate ferredoxin oxidoreductase subunit beta	95.2	65.6	67.6
MGA_999	LOCUS_08700	sequence111:120..431(+)	partial			WP_011390131.1	PAS domain-containing protein	59.2	35.1	45.9
MGA_1012	LOCUS_08790	sequence114:8..397(+)	partial			WP_002857891.1	capsular polysaccharide biosynthesis protein	88.4	17.9	47.2
MGA_1018	LOCUS_08840	sequence115:67..2304(-)	partial			WP_002858440.1	capsule biosynthesis protein CapA	57.4	73.5	23.2
MGA_1019	LOCUS_08850	sequence115:2360..>4474(-)	partial			WP_000694256.1	CDP-glycerol glycerophosphotransferase family protein	93.8	55.4	29.4
MGA_1031	LOCUS_08950	sequence117:3779..>4338(-)	partial			WP_002851769.1	glutamate 5-kinase	98.4	72.5	59.3
MGA_1043	LOCUS_09050	sequence119:3578..>4246(-)	partial			WP_010951065.1	DUF2163 domain-containing protein	68.9	54.6	28.0
MGA_1080	LOCUS_09330	sequence126:3186..>4004(-)	partial			WP_002858735.1	ABC-F family ATP-binding cassette domain-containing protein	96.7	49.7	69.6
MGA_1103	LOCUS_09490	sequence131:2921..3880(-)	partial			WP_002853182.1	polyribonucleotide nucleotidyltransferase	99.7	44.2	76.2
MGA_1108	LOCUS_09530	sequence132:3331..3828(-)	partial			WP_002853346.1	YaaA family protein	98.2	65.9	49.1
MGA_1116	LOCUS_09580	sequence134:1600..1839(-)	partial			WP_014208348.1	septation protein IspZ	100.0	45.5	46.2
MGA_1126	LOCUS_09670	sequence135:3199..>3797(-)	partial			WP_002852516.1	D-alanine--D-alanine ligase	98.0	56.1	55.9
MGA_1130	LOCUS_09710	sequence136:3107..>3773(-)	partial			WP_002864546.1	tRNA uridine-5-carboxymethylaminomethyl(34) synthesis enzyme MnmG	98.2	35.1	60.8
MGA_1131	LOCUS_09720	sequence137:1..593(+)	partial			WP_223294596.1	RtcB family protein	91.3	45.9	45.1
MGA_1144	LOCUS_09820	sequence140:1..1562(+)	partial			WP_002907389.1	isoleucine--tRNA ligase	99.4	55.9	63.1
MGA_1154	LOCUS_09890	sequence143:1..2514(+)	partial			WP_002858508.1	DNA-directed RNA polymerase subunit beta'	99.9	55.2	76.7
MGA_1158	LOCUS_09920	sequence144:1..621(+)	partial			WP_002857605.1	Ppx/GppA phosphatase family protein	99.0	40.1	43.5
MGA_1163	LOCUS_09950	sequence145:2231..3553(-)	partial			WP_002858598.1	penicillin-binding protein 2	95.9	69.6	48.4
MGA_1169	LOCUS_10000	sequence147:3079..>3584(-)	partial			WP_010891842.1	ABC transporter ATP-binding protein	96.4	53.0	47.2
MGA_1172	LOCUS_10020	sequence148:3363..3563(-)	partial			WP_002858451.1	sodium-dependent transporter	87.9	13.1	41.4
MGA_1180	LOCUS_10080	sequence150:2871..>3504(-)	partial			WP_011071660.1	integrase domain-containing protein	90.5	45.8	32.0
MGA_1194	LOCUS_10160	sequence154:153..1445(+)	partial			WP_011201896.1	glycosyltransferase family 8 protein	59.5	78.1	26.6
MGA_1198	LOCUS_10200	sequence154:2869..>3398(-)	partial			WP_002851858.1	COG3014 family protein	98.9	38.6	37.7
MGA_1214	LOCUS_10310	sequence159:1306..2283(-)	partial			WP_011202928.1	alpha-1,2-fucosyltransferase	55.4	64.2	25.3
MGA_1215	LOCUS_10320	sequence159:2276..>3282(-)	partial			WP_004597670.1	glycosyltransferase	21.6	26.1	45.2
MGA_1221	LOCUS_10360	sequence161:1..537(+)	partial			WP_002858051.1	lipid A biosynthesis lauroyl acyltransferase HtrB	98.9	58.6	40.9
MGA_1223	LOCUS_10380	sequence161:1631..2635(+)	partial			WP_012545557.1	glycosyltransferase family 4 protein	62.3	56.1	28.0
MGA_1225	LOCUS_10390	sequence162:342..2747(-)	partial			WP_000874574.1	vacuolating cytotoxin domain-containing protein	82.6	26.1	21.5
MGA_1236	LOCUS_10460	sequence166:750..1736(-)	partial			WP_014207550.1	sulfite reductase flavoprotein subunit alpha	79.3	31.9	25.3
MGA_1237	LOCUS_10470	sequence166:1973..2440(-)	frameshift		2466	WP_010891841.1	class I SAM-dependent methyltransferase	100.0	62.8	72.9
MGA_1238	LOCUS_10480	sequence166:2461..2664(-)	frameshift		2466	WP_010891841.1	class I SAM-dependent methyltransferase	100.0	27.1	89.6
MGA_1247	LOCUS_10530	sequence169:531..2918(-)	partial			WP_005478977.1	EAL domain-containing protein	52.6	51.2	27.7
MGA_1259	LOCUS_10610	sequence172:2514..>3063(-)	partial			WP_002852712.1	flagellar biosynthetic protein FliR	91.8	65.5	50.3
MGA_1265	LOCUS_10640	sequence174:2058..>3019(-)	partial			WP_002858054.1	UDP-N-acetylglucosamine 4,6-dehydratase (configuration-retaining)	99.7	53.6	63.0
MGA_1288	LOCUS_10780	sequence179:1982..2368(-)	partial			WP_012545648.1	response regulator	85.2	30.2	41.3
MGA_1296	LOCUS_10840	sequence181:1498..2727(-)	partial			WP_055064620.1	acyltransferase	41.3	79.0	32.9
MGA_1302	LOCUS_10880	sequence183:1..524(+)	partial			WP_002853221.1	bifunctional tRNA (5-methylaminomethyl-2-thiouridine)(34)-methyltransferase MnmD/FAD-dependent 5-carboxymethylaminomethyl-2-thiouridine(34) oxidoreductase MnmC	96.0	27.1	42.9
MGA_1305	LOCUS_10910	sequence184:81..434(-)	frameshift		495	WP_000659810.1	GDP-mannose 4,6-dehydratase	100.0	30.7	52.1
MGA_1306	LOCUS_10920	sequence184:858..1520(+)	frameshift		1514	WP_002858413.1	D-glycero-D-manno-heptose 7-phosphate kinase	99.1	64.3	87.6
MGA_1307	LOCUS_10930	sequence184:1544..1876(+)	frameshift		1514	WP_002858413.1	D-glycero-D-manno-heptose 7-phosphate kinase	100.0	32.4	78.2
MGA_1310	LOCUS_10950	sequence185:3..827(+)	partial			WP_010891860.1	DNA-directed RNA polymerase subunit beta	100.0	19.9	80.7
MGA_1313	LOCUS_10970	sequence186:515..1534(-)	partial			WP_002864146.1	hypothetical protein	57.8	48.8	27.6
MGA_1324	LOCUS_11060	sequence189:1..965(+)	partial			WP_000775280.1	DUF3519 domain-containing protein	96.6	32.2	31.5
MGA_1325	LOCUS_11070	sequence189:878..1234(-)	partial			WP_008768057.1	DNA polymerase IV	76.3	22.3	38.9
MGA_1326	LOCUS_11080	sequence189:1239..>2778(-)	partial			WP_011861457.1	heavy metal translocating P-type ATPase	98.6	61.9	39.8
MGA_1342	LOCUS_11190	sequence194:1887..2708(+)	partial			WP_002900389.1	FTR1 family iron permease	92.3	44.2	33.1
MGA_1359	LOCUS_11300	sequence198:1909..>2652(-)	partial			WP_002853235.1	serine protease HtrA	100.0	52.1	51.4
MGA_1371	LOCUS_11390	sequence202:1289..>2570(-)	partial			WP_012546013.1	type IV-A pilus assembly ATPase PilB	85.0	67.4	45.4
MGA_1377	LOCUS_11420	sequence205:1..781(+)	partial			WP_002852436.1	pitrilysin family protein	98.8	61.5	51.2
MGA_1382	LOCUS_11450	sequence206:304..768(-)	partial			WP_000444659.1	glycosyltransferase family 2 protein	67.5	34.1	47.1
MGA_1383	LOCUS_11460	sequence206:968..1702(+)	partial			WP_002858013.1	glycosyltransferase family 2 protein	59.8	38.2	34.2
MGA_1391	LOCUS_11500	sequence208:1543..>2508(-)	partial			WP_002858588.1	ATP-dependent DNA helicase RecG	97.2	52.2	58.8
