# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_3	LOCUS_0020	sequence001:1923..2498(-)	partial			WP_011963937.1	T9SS C-terminal target domain-containing protein	62.3	15.5	32.0
MGA_4	LOCUS_0030	sequence001:2810..3652(+)	partial			Q64N02	aminotransferase	83.9	40.1	34.9
MGA_5	LOCUS_0040	sequence001:3720..4850(+)	partial			P55648	hypothetical protein	94.1	57.3	33.3
MGA_6	LOCUS_0050	sequence001:4850..5494(+)	partial			WP_004522420.1	phosphatidyltransferase	57.0	41.7	36.8
MGA_14	LOCUS_0130	sequence002:1..532(+)	partial			WP_016361986.1	protein of unknown function precursor; adhesin	69.3	5.0	35.5
MGA_29	LOCUS_0280	sequence003:9312..9851(-)	partial			WP_011962330.1	Xaa-Pro aminopeptidase	90.5	37.9	57.7
MGA_36	LOCUS_0340	sequence004:7594..>8987(-)	partial			Q56307	beta-galactosidase	98.1	39.7	31.7
MGA_43	LOCUS_0400	sequence005:4227..6881(-)	partial			WP_011963634.1	histidine kinase	33.7	30.5	36.0
MGA_71	LOCUS_0610	sequence009:5205..6239(+)	partial			WP_011962354.1	T9SS C-terminal target domain-containing protein	25.9	24.5	40.0
MGA_79	LOCUS_0680	sequence010:5818..6408(+)	partial			WP_011964201.1	NifU family protein	96.9	63.8	42.0
MGA_107	LOCUS_0900	sequence015:1729..2499(+)	partial			WP_005784340.1	PASTA domain-containing protein	66.0	79.3	31.4
MGA_111	LOCUS_0940	sequence015:5298..>5824(-)	partial			Q74G11	aminodeoxyfutalosine synthase	100.0	48.2	48.3
MGA_115	LOCUS_0970	sequence016:2712..3815(+)	partial			WP_012583084.1	O-antigen polymerase	74.1	35.6	25.1
MGA_123	LOCUS_1030	sequence017:4765..>5556(-)	partial			Q64YK6	GTPase HflX	100.0	65.0	66.8
MGA_138	LOCUS_1140	sequence020:1..1484(+)	partial			WP_011962267.1	glycosyl hydrolase	77.7	33.5	34.6
MGA_140	LOCUS_1160	sequence020:2370..3731(-)	partial			WP_011962200.1	lytic transglycosylase	89.2	69.2	37.0
MGA_160	LOCUS_1300	sequence024:1..862(+)	partial			WP_011202207.1	beta-glucosidase	99.0	30.2	44.9
MGA_196	LOCUS_1600	sequence030:3920..4153(+)	partial			WP_010888716.1	NrdH-redoxin	71.4	67.9	47.3
MGA_201	LOCUS_1630	sequence031:2888..3634(-)	internal_stop_codon	3692..3694(-)		WP_011963439.1	hypothetical protein	99.6	81.2	56.7
MGA_204	LOCUS_1650	sequence032:1..1060(+)	partial			WP_011962469.1	membrane protein	81.5	27.0	31.2
MGA_206	LOCUS_1670	sequence032:1667..2443(-)	partial			YP_001704094.1	hypothetical protein	71.3	69.6	34.6
MGA_224	LOCUS_1800	sequence035:1..1371(+)	partial			A6GY25	UvrABC system protein B	99.1	68.5	64.5
MGA_228	LOCUS_1840	sequence035:4120..4506(+)	partial			WP_011461621.1	transcriptional regulator	70.3	77.8	28.3
MGA_231	LOCUS_1850	sequence036:343..1326(-)	partial			WP_008760378.1	hybrid sensor histidine kinase/response regulator	91.7	24.8	21.2
MGA_234	LOCUS_1880	sequence036:3798..>4593(-)	partial			WP_011962300.1	T9SS C-terminal target domain-containing protein	36.7	30.6	35.0
MGA_237	LOCUS_1910	sequence037:1345..2151(-)	partial			Q87KB5	L-threonine dehydratase	94.8	49.1	26.4
MGA_257	LOCUS_2040	sequence041:1914..2393(-)	internal_stop_codon	1914..1916(-)		Q8A754	endonuclease III	97.5	68.9	60.6
MGA_267	LOCUS_2110	sequence043:2343..>4259(-)	partial			WP_010933213.1	peptidase M16	100.0	66.9	45.4
MGA_286	LOCUS_2230	sequence048:3297..>4105(-)	partial			WP_011964075.1	gliding motility lipoprotein GldK	97.4	53.2	51.1
MGA_295	LOCUS_2290	sequence050:3522..>4040(-)	partial			A6GYZ5	Sec-independent protein translocase protein TatC	97.7	61.3	48.8
MGA_309	LOCUS_2390	sequence053:2666..3814(-)	partial			WP_011405119.1	glycosyl transferase	40.1	39.0	37.9
MGA_314	LOCUS_2430	sequence055:1..480(+)	partial			WP_011203690.1	rhomboid family intramembrane serine protease	97.5	62.1	49.4
MGA_316	LOCUS_2450	sequence055:1610..2419(+)	partial			WP_011963288.1	endonuclease	91.8	70.7	35.9
MGA_345	LOCUS_2630	sequence061:1..1620(+)	partial			WP_010883237.1	peptide ABC transporter substrate-binding protein	42.9	32.1	31.3
MGA_346	LOCUS_2640	sequence061:1636..3114(+)	partial			WP_010942081.1	peptide ABC transporter permease	51.4	76.7	42.1
MGA_348	LOCUS_2650	sequence062:1..294(+)	partial			WP_011963945.1	DUF4835 domain-containing protein	89.7	29.5	35.6
MGA_353	LOCUS_2690	sequence063:1..863(+)	partial			WP_008760901.1	phospholipase	60.8	47.9	24.6
MGA_356	LOCUS_2720	sequence063:2621..3118(-)	frameshift		3171	WP_011071290.1	methionine synthase	97.6	12.9	60.9
MGA_357	LOCUS_2730	sequence063:3148..>3853(-)	frameshift		3171	WP_002212080.1	methionine synthase	99.1	18.8	51.1
MGA_359	LOCUS_2740	sequence064:954..2093(+)	partial			WP_011021764.1	surface antigen gene	29.0	10.0	34.5
MGA_398	LOCUS_2970	sequence073:1549..2427(+)	partial			WP_010989425.1	cell wall surface anchor protein	72.3	30.3	39.8
MGA_406	LOCUS_3020	sequence075:180..1292(-)	partial			WP_011023149.1	zinc metalloprotease	67.6	73.1	29.4
MGA_409	LOCUS_3030	sequence076:151..1992(+)	partial			WP_011120805.1	hypothetical protein	55.8	48.9	29.0
MGA_415	LOCUS_3070	sequence077:2767..>3636(-)	partial			WP_011964521.1	membrane protein	99.7	69.8	26.6
MGA_416	LOCUS_3080	sequence078:1..866(+)	partial			B5YL60	aspartyl/glutamyl-tRNA(Asn/Gln) amidotransferase subunit B	97.9	58.9	44.1
MGA_418	LOCUS_3100	sequence078:1660..>3626(-)	partial			WP_011023149.1	zinc metalloprotease	13.1	22.8	42.4
MGA_442	LOCUS_3260	sequence083:2014..2739(-)	partial			WP_012546266.1	uroporphyrinogen III methyltransferase	95.9	50.1	25.5
MGA_458	LOCUS_3370	sequence087:1..551(+)	partial			WP_014206395.1	phenylacetic acid degradation protein	100.0	58.3	63.7
MGA_465	LOCUS_3420	sequence088:282..764(-)	partial			WP_011962362.1	NAD metabolism ATPase/kinase	96.9	23.6	39.1
MGA_482	LOCUS_3530	sequence092:1..564(+)	partial			WP_005477139.1	patatin family protein	87.2	57.4	26.4
MGA_497	LOCUS_3630	sequence096:1..606(+)	partial			Q8EYF0	phosphoribosylglycinamide formyltransferase 2	99.0	51.7	65.7
MGA_522	LOCUS_3810	sequence101:1098..2291(+)	partial			WP_010902857.1	membrane protein	57.2	57.3	30.3
MGA_537	LOCUS_3900	sequence105:1..848(+)	partial			WP_011962462.1	DNA polymerase I	97.2	28.8	57.9
MGA_543	LOCUS_3950	sequence106:423..824(-)	partial			WP_011266746.1	NAD-dependent dehydratase	99.2	43.7	40.9
MGA_545	LOCUS_3970	sequence106:2623..>3214(-)	partial			Q8AA40	replicative DNA helicase	80.6	30.8	69.2
MGA_546	LOCUS_3980	sequence107:1..891(+)	partial			A6GZF0	UDP-N-acetylmuramoyl-tripeptide--D-alanyl-D-alanine ligase	100.0	71.2	46.4
MGA_548	LOCUS_4000	sequence107:1930..>3207(-)	partial			WP_011202650.1	capsule polysaccharide transporter	97.2	57.0	27.4
MGA_558	LOCUS_4080	sequence109:2640..>3196(-)	partial			WP_011963149.1	peptidase M1	76.1	25.6	41.1
MGA_565	LOCUS_4130	sequence111:2279..>3175(-)	partial			WP_010932712.1	DEAD/DEAH box family ATP-dependent RNA helicase	92.6	66.9	59.2
MGA_567	LOCUS_4140	sequence112:1059..2087(-)	partial			WP_011119574.1	porin	98.8	70.0	30.7
MGA_588	LOCUS_4240	sequence119:2265..>3110(-)	partial			A6GYX7	glyceraldehyde-3-phosphate dehydrogenase	100.0	58.3	63.0
MGA_589	LOCUS_4250	sequence120:30..452(-)	partial			A6H1P9	50S ribosomal protein L21	72.1	47.9	71.3
MGA_605	LOCUS_4350	sequence124:1..2568(+)	partial			WP_011037954.1	peptidase	52.6	79.5	27.8
MGA_608	LOCUS_4360	sequence125:995..1438(+)	partial			WP_011963864.1	hypothetical protein	85.0	69.8	47.2
MGA_635	LOCUS_4560	sequence131:116..1195(+)	partial			WP_011963209.1	bifunctional UDP-N-acetylmuramoyl-tripeptide:D-alanyl-D-alanine ligase/alanine racemase	98.6	44.4	42.1
MGA_637	LOCUS_4580	sequence131:2354..>3023(-)	partial			WP_008765353.1	peptidase S41	98.2	38.9	41.4
MGA_640	LOCUS_4600	sequence132:492..803(-)	partial			WP_011101594.1	NADH oxidase	73.8	13.3	36.8
MGA_650	LOCUS_4670	sequence134:331..1890(+)	partial			WP_011964073.1	gliding motility protein GldM	49.9	51.3	23.4
MGA_675	LOCUS_4810	sequence142:1..564(+)	partial			WP_011963220.1	phosphate starvation protein PhoH	100.0	59.5	71.8
MGA_682	LOCUS_4860	sequence143:2253..2621(+)	partial			Q97MF2	UPF0721 transmembrane protein	71.3	72.5	40.2
MGA_687	LOCUS_4890	sequence144:1867..2634(-)	frameshift,internal_stop_codon	1890..1892(-)	1908	WP_011963344.1	DUF2279 domain-containing protein	95.3	80.3	29.1
MGA_708	LOCUS_5010	sequence151:2253..>2796(-)	partial			Q7UIR2	enolase	86.7	36.4	75.6
MGA_718	LOCUS_5060	sequence154:1582..>2773(-)	partial			WP_016362020.1	protein of unknown function precursor; adhesin	98.0	12.8	23.9
MGA_727	LOCUS_5120	sequence156:1446..>2768(-)	partial			WP_011962187.1	T9SS C-terminal target domain-containing protein	77.7	41.8	26.2
MGA_731	LOCUS_5150	sequence158:1..2300(+)	partial			WP_012256611.1	peptidase S8	25.2	28.3	34.0
MGA_765	LOCUS_5320	sequence168:2119..>2654(-)	partial			Q8P6Q4	copper homeostasis protein CutC	83.6	62.1	36.2
MGA_771	LOCUS_5360	sequence170:1949..2464(-)	internal_stop_codon	1949..1951(-)		WP_011962258.1	iron-dependent repressor	98.8	77.9	56.8
MGA_787	LOCUS_5480	sequence174:1206..>2587(-)	partial			A6GY22	threonine--tRNA ligase	99.1	70.5	70.9
MGA_811	LOCUS_5570	sequence183:1..660(+)	partial			Q64ZR4	translation initiation factor IF-2	99.5	21.5	68.8
MGA_822	LOCUS_5640	sequence186:1..1681(+)	partial			WP_011963634.1	histidine kinase	85.2	48.1	23.4
MGA_824	LOCUS_5650	sequence187:1..1121(+)	partial			WP_011964220.1	cell surface protein SprA	97.8	14.7	38.0
MGA_838	LOCUS_5740	sequence191:1..506(+)	partial			A6GXG2	serine hydroxymethyltransferase	99.4	39.2	63.9
MGA_841	LOCUS_5750	sequence192:326..838(+)	partial			WP_008762996.1	thiol:disulfide interchange protein	72.4	32.2	52.8
MGA_845	LOCUS_5770	sequence193:134..448(-)	internal_stop_codon	494..496(-)		A6H0Z9	urocanate hydratase	96.2	15.2	74.0
MGA_846	LOCUS_5780	sequence193:494..2137(-)	internal_stop_codon	494..496(-)		A6H0Z9	urocanate hydratase	99.3	81.8	70.0
MGA_850	LOCUS_5800	sequence194:618..1166(+)	partial			WP_002858643.1	colicin V biosynthesis protein	70.9	69.0	27.8
MGA_854	LOCUS_5840	sequence195:1176..1412(-)	partial			WP_011462228.1	ATP synthase epsilon chain	97.4	56.8	39.5
MGA_855	LOCUS_5850	sequence195:1420..>2403(-)	partial			A6GVV9	ATP synthase subunit beta	99.4	64.6	85.8
MGA_865	LOCUS_5900	sequence199:1..510(+)	partial			WP_011962187.1	T9SS C-terminal target domain-containing protein	91.7	18.4	32.1
MGA_886	LOCUS_6000	sequence207:1663..>2331(-)	partial			WP_011122293.1	ABC transporter ATP-binding protein	97.7	32.7	56.2
MGA_901	LOCUS_6080	sequence213:2..298(+)	partial			A6GXW5	histidine ammonia-lyase	95.9	19.0	65.3
MGA_904	LOCUS_6110	sequence213:1705..>2291(-)	partial			WP_005813680.1	phosphoenolpyruvate carboxykinase (ATP)	97.9	36.8	61.1
MGA_915	LOCUS_6180	sequence217:1..812(+)	partial			A6GY98	3-hydroxyacyl-[acyl-carrier-protein] dehydratase FabZ	100.0	58.2	56.1
MGA_935	LOCUS_6290	sequence223:760..>2227(-)	partial			A6GYG2	phenylalanine--tRNA ligase beta subunit	99.4	60.0	52.6
MGA_939	LOCUS_6320	sequence225:1..595(+)	partial			WP_008761007.1	TIGR01212 family radical SAM protein	99.5	60.5	47.7
MGA_944	LOCUS_6350	sequence226:1406..>2212(-)	partial			WP_011964419.1	lipid-A-disaccharide synthase	98.5	72.9	51.1
MGA_959	LOCUS_6440	sequence230:390..1685(+)	partial			WP_010956698.1	hypothetical protein	58.9	43.2	33.0
MGA_973	LOCUS_6490	sequence235:1422..>2143(-)	partial			Q64PY9	1-deoxy-D-xylulose 5-phosphate reductoisomerase	99.6	61.3	65.5
MGA_974	LOCUS_6500	sequence236:3..845(+)	partial			Q64TM7	DNA ligase	98.2	41.5	57.2
MGA_981	LOCUS_6530	sequence238:1051..>2091(-)	partial			WP_014207643.1	two-component sensor histidine kinase	61.3	57.2	26.6
MGA_983	LOCUS_6540	sequence239:475..>2087(-)	partial			Q2RIS7	putative K(+)-stimulated pyrophosphate-energized sodium pump	69.8	51.6	56.6
MGA_1008	LOCUS_6660	sequence248:1..693(+)	partial			Q8A6N7	histidine--tRNA ligase	98.7	50.9	52.6
MGA_1016	LOCUS_6680	sequence251:1453..>2018(-)	partial			Q8A0C2	1-deoxy-D-xylulose-5-phosphate synthase	95.7	27.8	53.3
MGA_1025	LOCUS_6710	sequence256:1..875(+)	partial			A5I0U1	aldehyde dehydrogenase	100.0	63.4	47.9
MGA_1028	LOCUS_6720	sequence257:838..>1990(-)	partial			A6GXZ5	DNA helicase	99.7	51.4	48.5
MGA_1032	LOCUS_6740	sequence259:1..541(+)	partial			WP_010940160.1	amidohydrolase	89.4	42.4	29.6
MGA_1041	LOCUS_6780	sequence262:605..>1972(-)	partial			WP_011035510.1	nuclease	88.6	67.0	32.8
MGA_1055	LOCUS_6830	sequence268:1..822(+)	partial			WP_011963922.1	MBL fold metallo-hydrolase	100.0	57.9	47.1
MGA_1081	LOCUS_6940	sequence279:1636..1896(-)	partial			WP_011964474.1	hypothetical protein	100.0	51.2	34.9
MGA_1091	LOCUS_7000	sequence283:783..1880(-)	partial			WP_011405586.1	T9SS C-terminal target domain-containing protein	30.4	9.2	32.4
MGA_1096	LOCUS_7020	sequence285:604..1275(-)	partial			Q8R6H4	demethylmenaquinone methyltransferase	71.3	73.2	27.9
MGA_1100	LOCUS_7040	sequence286:311..1114(-)	partial			YP_001700844.1	putative oxidoreductase EphD	72.7	69.7	36.4
MGA_1101	LOCUS_7050	sequence286:1127..>1869(-)	partial			WP_011963836.1	acyl-CoA dehydrogenase	100.0	41.4	58.1
MGA_1105	LOCUS_7080	sequence288:1..1278(+)	partial			WP_005791499.1	HDIG domain-containing protein	98.1	60.7	41.2
MGA_1114	LOCUS_7120	sequence292:3..413(+)	partial			WP_011964286.1	hypothetical protein	100.0	32.6	47.8
MGA_1122	LOCUS_7170	sequence294:1..807(+)	partial			WP_013096762.1	bifunctional aldehyde dehydrogenase/enoyl-CoA hydratase	98.1	38.7	49.4
MGA_1129	LOCUS_7210	sequence296:1106..>1825(-)	partial			WP_008765466.1	signal peptide peptidase SppA	99.6	40.2	48.1
MGA_1137	LOCUS_7250	sequence300:1..659(+)	partial			WP_011962845.1	phosphoribosylformylglycinamidine cyclo-ligase	100.0	55.9	73.1
MGA_1143	LOCUS_7300	sequence302:295..750(+)	partial			A6H1N2	7-carboxy-7-deazaguanine synthase	100.0	71.4	50.3
MGA_1145	LOCUS_7310	sequence303:1..826(+)	partial			Q64MG4	leucine--tRNA ligase	99.6	28.8	53.5
MGA_1153	LOCUS_7340	sequence307:165..827(+)	internal_stop_codon	57..59(+)		Q8A451	primosomal protein N'	100.0	26.9	50.0
MGA_1155	LOCUS_7350	sequence308:1..588(+)	partial			WP_011118862.1	glycosyl transferase	96.4	73.7	46.8
MGA_1165	LOCUS_7390	sequence312:285..917(-)	partial			WP_005790934.1	acetyltransferase	100.0	71.8	36.9
MGA_1167	LOCUS_7400	sequence313:694..>1757(-)	partial			WP_005420148.1	sodium-independent anion transporter	96.0	66.4	57.3
MGA_1170	LOCUS_7420	sequence315:1..997(+)	partial			WP_011038080.1	lipase	74.3	67.0	31.6
MGA_1177	LOCUS_7460	sequence317:1198..1713(-)	partial			WP_011962545.1	molybdopterin oxidoreductase	100.0	36.5	71.9
MGA_1180	LOCUS_7480	sequence319:1..901(+)	partial			Q64N34	4-hydroxy-3-methylbut-2-en-1-yl diphosphate synthase (flavodoxin)	90.0	42.8	45.0
MGA_1190	LOCUS_7510	sequence323:861..>1692(-)	partial			WP_011962586.1	DUF5103 domain-containing protein	96.0	63.8	32.7
MGA_1191	LOCUS_7520	sequence324:1..774(+)	partial			WP_000557282.1	membrane protein	48.6	20.8	37.2
MGA_1208	LOCUS_7600	sequence331:696..>1676(-)	partial			WP_005791861.1	ATP-dependent DNA helicase RecQ	100.0	44.9	43.0
MGA_1209	LOCUS_7610	sequence332:1..1119(+)	partial			WP_011962850.1	collagen-binding protein	99.7	49.2	33.3
MGA_1219	LOCUS_7650	sequence336:1166..1462(-)	internal_stop_codon	1508..1510(-)		WP_011963430.1	sugar transporter	79.6	9.6	42.3
MGA_1225	LOCUS_7670	sequence338:232..1371(+)	partial			WP_011987113.1	acyl-CoA dehydrogenase	100.0	59.7	50.4
MGA_1234	LOCUS_7710	sequence341:378..1073(+)	partial			WP_011962268.1	SCO family protein	61.9	59.8	40.3
MGA_1239	LOCUS_7740	sequence342:858..>1639(-)	partial			WP_011964202.1	thioredoxin	96.9	36.4	42.6
MGA_1250	LOCUS_7800	sequence347:1..507(+)	partial			WP_005788741.1	23S rRNA (guanosine(2251)-2'-O)-methyltransferase RlmB	98.2	67.1	57.6
MGA_1261	LOCUS_7870	sequence352:3..1304(+)	partial			WP_011964423.1	competence protein ComEC	99.3	62.3	32.0
MGA_1266	LOCUS_7880	sequence355:1..833(+)	partial			A6H128	carbamoyl-phosphate synthase (glutamine-hydrolyzing)	100.0	29.1	70.7
MGA_1269	LOCUS_7900	sequence356:55..1593(-)	partial			WP_011404998.1	amino acid transporter	84.0	57.1	25.3
MGA_1273	LOCUS_7920	sequence358:1..657(+)	partial			A6H1G3	Holliday junction ATP-dependent DNA helicase RuvB	100.0	64.1	73.9
MGA_1277	LOCUS_7950	sequence359:1..1311(+)	partial			WP_000557282.1	membrane protein	79.8	54.1	28.7
MGA_1281	LOCUS_7960	sequence361:586..1575(-)	partial			WP_008760476.1	sodium:proton antiporter	98.5	68.2	47.8
MGA_1285	LOCUS_7970	sequence363:316..1329(-)	partial			WP_010907889.1	hydrolase	73.0	80.3	33.6
MGA_1313	LOCUS_8060	sequence375:669..1334(-)	partial			WP_012061515.1	sulfotransferase	69.7	53.9	28.6
MGA_1321	LOCUS_8080	sequence378:454..>1515(-)	partial			WP_011963906.1	membrane protein	96.3	42.7	43.8
