# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_80	LOCUS_00790	sequence001:85196..87436(-)	partial			Q87LP4	histidine kinase	90.1	73.6	30.1
MGA_115	LOCUS_01140	sequence001:125478..125837(-)	partial			WP_005766452.1	preprotein translocase subunit SecG	64.7	61.1	49.4
MGA_146	LOCUS_01450	sequence001:155230..156003(-)	partial			Q9HVU1	cell shape-determining protein MreC	95.7	74.5	45.9
MGA_152	LOCUS_01510	sequence001:161716..162699(+)	partial			WP_011122223.1	deoxyribodipyrimidine photo-lyase	96.6	40.1	34.4
MGA_155	LOCUS_01540	sequence001:164188..>164944(-)	partial			WP_003134747.1	acyl-CoA dehydrogenase	98.8	65.1	69.8
MGA_156	LOCUS_01550	sequence002:1..1399(+)	partial			WP_010938022.1	PAS domain-containing sensor histidine kinase	60.4	30.0	34.8
MGA_165	LOCUS_01640	sequence002:9094..9948(-)	partial			Q4ZPK7	iron-sulfur cluster carrier protein	90.5	70.6	62.3
MGA_178	LOCUS_01770	sequence002:21861..22634(-)	partial			Q74GW4	methionyl-tRNA formyltransferase	36.2	29.0	37.6
MGA_210	LOCUS_02090	sequence002:54067..55947(+)	partial			WP_003113915.1	two-component sensor CbrA	98.4	63.1	37.1
MGA_219	LOCUS_02180	sequence002:63547..63834(+)	internal_stop_codon	63832..63834(+)		O68562	outer membrane protein assembly factor BamE	89.5	48.3	47.1
MGA_245	LOCUS_02440	sequence002:91110..92384(-)	partial			WP_005796268.1	aminopeptidase	29.2	40.5	30.7
MGA_246	LOCUS_02450	sequence002:92489..92845(-)	partial			WP_010971130.1	membrane protein	95.8	46.9	35.4
MGA_258	LOCUS_02570	sequence002:103761..104549(+)	partial			WP_011125484.1	SAM-dependent methyltransferase	80.9	74.9	27.5
MGA_266	LOCUS_02640	sequence003:1..1004(+)	partial			WP_011121854.1	sulfatase	74.5	38.9	40.3
MGA_272	LOCUS_02700	sequence003:7241..8008(+)	partial			WP_002682266.1	glycerophosphoryl diester phosphodiesterase	64.7	68.4	31.8
MGA_282	LOCUS_02800	sequence003:15588..16880(-)	partial			Q9KVQ7	DNA recombination protein RmuC	87.2	74.5	44.2
MGA_286	LOCUS_02840	sequence003:24373..24906(+)	partial			WP_011087915.1	molecular chaperone DnaJ	97.2	71.8	36.1
MGA_316	LOCUS_03140	sequence003:56905..57210(-)	partial			Q8EE15	YcgL domain-containing protein	74.3	81.5	42.7
MGA_327	LOCUS_03250	sequence003:69152..69652(-)	partial			WP_003318487.1	colicin V production protein CvpA	83.1	70.3	47.9
MGA_347	LOCUS_03450	sequence003:90060..90581(-)	partial			WP_003106488.1	hypothetical protein	69.9	77.1	45.5
MGA_398	LOCUS_03950	sequence004:39015..39620(+)	partial			WP_003406491.1	rhomboid family intramembrane serine protease	74.1	51.4	42.7
MGA_413	LOCUS_04100	sequence004:58534..58857(-)	partial			WP_005458022.1	hypothetical protein	66.4	81.6	57.7
MGA_424	LOCUS_04210	sequence004:74172..76370(+)	partial			WP_011120368.1	N-acetylgalactosamine-6-sulfatase	55.1	76.6	30.3
MGA_434	LOCUS_04310	sequence005:1..666(+)	partial			Q9I719	protoheme IX farnesyltransferase 1	95.0	69.1	60.5
MGA_450	LOCUS_04470	sequence005:16644..16805(-)	internal_stop_codon	16848..16850(-)		F0KJ86	adenosylhomocysteinase	98.1	11.3	78.8
MGA_451	LOCUS_04480	sequence005:16848..18020(-)	internal_stop_codon	16848..16850(-)		Q4ZZ92	adenosylhomocysteinase	98.2	83.6	75.3
MGA_564	LOCUS_05590	sequence006:67220..67819(-)	partial			WP_012066941.1	pseudoazurin	51.3	70.1	48.5
MGA_602	LOCUS_05960	sequence007:29431..30165(+)	partial			Q8P8M7	segregation and condensation protein B	90.2	55.9	49.3
MGA_623	LOCUS_06170	sequence007:56699..57166(+)	partial			A0A0H3CFV4	30S ribosomal protein S6	67.1	79.4	71.2
MGA_685	LOCUS_06770	sequence009:1..802(+)	partial			WP_005458380.1	proton/glutamate symporter	95.1	58.3	61.3
MGA_700	LOCUS_06920	sequence009:14728..15759(-)	partial			Q9I6C1	signal recognition particle receptor FtsY	90.1	68.4	62.6
MGA_705	LOCUS_06970	sequence009:18553..19506(+)	partial			WP_003118763.1	hypothetical protein	79.5	74.0	37.9
MGA_728	LOCUS_07200	sequence009:45450..46520(+)	partial			F0KJG3	ATP synthase subunit a	68.5	84.2	56.2
MGA_729	LOCUS_07210	sequence009:46558..46797(+)	partial			Q8E8B5	ATP synthase subunit c	60.8	57.8	68.8
MGA_776	LOCUS_07660	sequence010:39922..41688(-)	partial			WP_011035768.1	cytochrome c biogenesis protein	91.8	74.5	37.4
MGA_777	LOCUS_07670	sequence010:41917..42387(+)	partial			WP_010971644.1	hypothetical protein	75.6	36.7	32.8
MGA_814	LOCUS_08020	sequence011:34965..35309(+)	partial			WP_011705378.1	arsenate reductase	98.2	45.0	52.7
MGA_818	LOCUS_08060	sequence011:39534..40190(+)	partial			WP_005478460.1	TetR family transcriptional regulator	71.6	65.6	25.0
MGA_838	LOCUS_08240	sequence012:12148..13620(-)	partial			WP_010918645.1	PAS domain-containing sensor histidine kinase	72.0	71.0	22.3
MGA_862	LOCUS_08480	sequence012:36599..37075(+)	partial			WP_011071554.1	sigma E factor positive regulatory protein RseC	50.0	48.4	35.4
MGA_876	LOCUS_08600	sequence013:3837..4250(-)	partial			WP_012640167.1	DUF1330 domain-containing protein	86.1	73.0	33.1
MGA_902	LOCUS_08860	sequence013:27344..28384(-)	partial			WP_003104128.1	hypothetical protein	75.1	74.5	51.7
MGA_913	LOCUS_08970	sequence013:36332..39139(+)	partial			Q9HZM8	ribonuclease E	60.1	53.3	65.1
MGA_919	LOCUS_09030	sequence014:5169..5585(-)	partial			WP_011104999.1	hypothetical protein	100.0	41.8	55.7
MGA_953	LOCUS_09350	sequence015:11390..12352(-)	partial			WP_003405098.1	cupin	87.5	72.9	53.9
MGA_1019	LOCUS_09990	sequence017:20041..20508(-)	partial			WP_011103347.1	molybdenum cofactor sulfurase	61.9	57.5	33.0
MGA_1025	LOCUS_10040	sequence018:1..547(+)	partial			WP_024265814.1	MFS transporter	69.1	25.2	37.6
MGA_1031	LOCUS_10100	sequence018:5255..6766(-)	partial			WP_011072834.1	hypothetical protein	50.3	30.5	34.2
MGA_1032	LOCUS_10110	sequence018:6753..7964(-)	partial			WP_011962729.1	cytochrome-c peroxidase	72.7	49.6	37.7
MGA_1037	LOCUS_10160	sequence018:12771..14966(-)	partial			WP_010969896.1	ligand-gated channel	80.0	64.1	39.3
MGA_1038	LOCUS_10170	sequence018:15366..16910(-)	partial			WP_011205191.1	DNA polymerase/helicase	53.9	72.4	37.9
MGA_1042	LOCUS_10210	sequence018:20237..20887(-)	partial			WP_013528658.1	TetR family transcriptional regulator	34.3	31.5	45.9
MGA_1049	LOCUS_10260	sequence019:2425..3192(-)	partial			WP_000981084.1	AraC family transcriptional regulator	51.8	35.2	36.4
MGA_1078	LOCUS_10530	sequence020:12034..12561(+)	partial			NP_274216.1	sulfite reductase flavoprotein subunit alpha	83.4	24.3	37.4
MGA_1093	LOCUS_10670	sequence021:1..585(+)	partial			WP_013230940.1	3-oxoacyl-ACP reductase	100.0	43.7	54.1
MGA_1095	LOCUS_10690	sequence021:1603..4872(+)	partial			WP_011118116.1	cellulosome anchoring protein	42.9	23.8	26.3
MGA_1132	LOCUS_11050	sequence022:20781..22709(+)	partial			WP_010865031.1	laminarinase	37.1	38.6	48.8
MGA_1133	LOCUS_11060	sequence022:22758..23591(+)	partial			WP_011405546.1	beta-glucanase	81.6	59.0	41.4
MGA_1139	LOCUS_11110	sequence023:632..886(+)	partial			WP_011262876.1	hypothetical protein	64.3	65.1	46.3
MGA_1162	LOCUS_11340	sequence023:23820..>24821(-)	partial			WP_003815250.1	MFS transporter	89.8	72.0	40.5
MGA_1175	LOCUS_11470	sequence024:13668..14759(+)	partial			WP_011103023.1	DNA protecting protein DprA	80.4	72.1	47.6
MGA_1181	LOCUS_11530	sequence024:18297..18539(+)	partial			WP_003083624.1	hypothetical protein	70.0	63.7	55.2
MGA_1191	LOCUS_11610	sequence025:1278..1661(-)	partial			A0KL22	UPF0225 protein	95.3	63.4	43.1
MGA_1193	LOCUS_11630	sequence025:2229..2597(-)	partial			Q8EE02	peptide methionine sulfoxide reductase MsrA	93.4	37.9	65.8
MGA_1194	LOCUS_11640	sequence025:2597..3376(-)	partial			WP_010956937.1	choline kinase	69.1	36.0	25.4
MGA_1275	LOCUS_12420	sequence028:21561..>22259(-)	partial			Q8F7S5	aldehyde dehydrogenase	98.7	46.8	46.1
MGA_1308	LOCUS_12720	sequence030:8246..8851(-)	partial			WP_005457970.1	hypothetical protein	73.1	78.0	38.5
MGA_1312	LOCUS_12760	sequence030:12117..12626(+)	partial			O31820	thioredoxin-like protein YneN	69.8	69.4	38.0
MGA_1320	LOCUS_12840	sequence030:19455..>20204(-)	partial			WP_015775991.1	glycine cleavage system protein T	96.8	60.7	45.3
MGA_1362	LOCUS_13220	sequence033:5552..5983(+)	partial			Q8EGR4	tRNA sulfurtransferase	59.4	17.4	43.5
MGA_1404	LOCUS_13610	sequence035:17292..17495(+)	partial			WP_003123689.1	hypothetical protein	95.5	62.1	43.8
MGA_1423	LOCUS_13780	sequence036:16618..>17285(-)	partial			WP_012583217.1	beta-glucosidase	94.1	27.2	45.7
MGA_1428	LOCUS_13820	sequence037:3099..4214(-)	partial			WP_013096327.1	DNA primase	67.7	53.9	35.3
MGA_1433	LOCUS_13870	sequence037:8827..10122(-)	partial			WP_001269640.1	integrase	55.9	61.9	27.2
MGA_1446	LOCUS_14000	sequence038:6936..7520(-)	partial			WP_011404018.1	CIA30 family protein	61.3	68.2	28.2
MGA_1448	LOCUS_14020	sequence038:7957..9096(+)	partial			WP_005810429.1	serine hydrolase	67.8	72.5	32.2
MGA_1456	LOCUS_14090	sequence039:3197..5395(+)	partial			Q5NGJ7	protein TolB	29.2	49.4	25.5
MGA_1459	LOCUS_14120	sequence039:7796..8650(-)	partial			WP_011104810.1	tol-pal system protein YbgF	74.3	71.7	28.0
MGA_1462	LOCUS_14150	sequence039:10634..11380(-)	partial			WP_004406115.1	protein TolA	77.0	55.1	32.0
MGA_1484	LOCUS_14350	sequence041:2416..2652(+)	partial			WP_003091178.1	hypothetical protein	71.8	65.3	53.6
MGA_1498	LOCUS_14470	sequence042:196..987(-)	partial			Q87JP5	cryptochrome DASH	98.5	58.2	62.5
MGA_1505	LOCUS_14540	sequence042:6138..6851(+)	partial			WP_011338219.1	DNA mismatch repair protein MutT	39.7	45.3	35.5
MGA_1516	LOCUS_14640	sequence043:1..1518(+)	partial			WP_011120142.1	acriflavine resistance protein B	95.8	45.7	30.7
MGA_1538	LOCUS_14850	sequence044:9416..9868(+)	partial			Q9HUB2	ribosomal RNA small subunit methyltransferase E	98.7	63.0	59.5
MGA_1539	LOCUS_14860	sequence044:9856..10323(-)	partial			WP_011405502.1	N-acetyltransferase	94.2	63.7	51.4
MGA_1541	LOCUS_14880	sequence044:12038..13630(-)	partial			WP_003091724.1	ATP-dependent DNA helicase RecQ	98.9	74.3	60.2
MGA_1563	LOCUS_15080	sequence046:12030..13094(-)	partial			WP_011083637.1	serine hydrolase	74.0	60.2	26.5
MGA_1586	LOCUS_15290	sequence048:6928..8079(+)	partial			WP_010926041.1	(2Fe-2S)-binding protein	48.3	50.1	32.7
MGA_1593	LOCUS_15360	sequence049:2492..2803(-)	partial			WP_005772089.1	FmdB family transcriptional regulator	57.3	64.8	59.3
MGA_1605	LOCUS_15470	sequence050:1..802(+)	partial			Q4ZV05	UvrABC system protein B	99.6	39.6	69.0
MGA_1612	LOCUS_15540	sequence050:8536..9261(+)	partial			WP_010973329.1	histidine utilization repressor	96.7	70.9	42.1
MGA_1641	LOCUS_15790	sequence053:1..2900(+)	partial			WP_011070585.1	GlyGly-CTERM sorting domain-containing protein	94.5	36.7	27.3
MGA_1655	LOCUS_15920	sequence054:9240..10358(+)	partial			WP_011727945.1	alkane 1-monooxygenase	72.3	68.8	32.2
MGA_1658	LOCUS_15940	sequence055:1144..2127(+)	partial			WP_004540034.1	DNA internalization-related competence protein ComEC/Rec2	87.8	32.5	35.7
MGA_1675	LOCUS_16100	sequence056:9500..>10433(-)	partial			WP_014207710.1	terpene utilization protein AtuA	97.4	49.3	39.0
MGA_1695	LOCUS_16260	sequence059:3453..5531(+)	partial			WP_000180345.1	hypothetical protein	29.0	73.5	33.0
MGA_1697	LOCUS_16280	sequence059:5794..6603(+)	partial			WP_011056967.1	hypothetical protein	49.4	30.0	33.8
MGA_1702	LOCUS_16310	sequence060:540..1277(-)	partial			WP_005762447.1	hypothetical protein	70.6	84.5	36.2
MGA_1711	LOCUS_16390	sequence061:1..791(+)	partial			WP_001093009.1	4-aminobutyrate--2-oxoglutarate transaminase	67.2	38.5	38.6
MGA_1718	LOCUS_16450	sequence062:32..2161(+)	partial			Q2RWN5	bifunctional protein PutA	98.4	55.8	42.2
MGA_1728	LOCUS_16530	sequence063:643..2004(-)	partial			WP_011262221.1	MFS transporter	96.2	69.3	43.6
MGA_1733	LOCUS_16580	sequence063:4928..5449(-)	internal_stop_codon	5531..5533(-)		WP_010918217.1	molybdate ABC transporter substrate-binding protein	98.8	67.9	43.7
MGA_1734	LOCUS_16590	sequence063:5774..6160(-)	partial			WP_010972117.1	membrane protein	93.0	71.6	41.2
MGA_1742	LOCUS_16650	sequence064:5151..6452(+)	partial			WP_001012297.1	carboxylic ester hydrolase	42.5	45.0	28.2
MGA_1766	LOCUS_16850	sequence067:6745..6954(+)	partial			K0MPK7	Sec-independent protein translocase protein TatA	58.0	52.0	70.0
MGA_1767	LOCUS_16860	sequence067:6988..7281(+)	partial			Q4ZZG9	sec-independent protein translocase protein TatB	71.1	43.7	56.5
MGA_1776	LOCUS_16930	sequence069:1..1059(+)	partial			Q8E8C0	ATP synthase subunit beta	99.1	73.9	86.0
MGA_1794	LOCUS_17080	sequence071:1311..2279(+)	partial			WP_064496935.1	serralysin	64.0	68.1	29.6
MGA_1825	LOCUS_17340	sequence076:153..866(+)	partial			WP_011388356.1	phosphate ABC transporter substrate-binding protein	68.4	46.8	52.5
MGA_1847	LOCUS_17530	sequence079:4665..5690(+)	partial			NP_268633.1	possibly involved in regulation of genetic competence	73.9	67.6	27.1
MGA_1848	LOCUS_17540	sequence080:148..588(+)	partial			WP_000860837.1	transcriptional regulator	62.3	79.8	51.6
MGA_1857	LOCUS_17620	sequence081:2491..3516(-)	partial			WP_010967763.1	AraC family transcriptional regulator	75.4	73.8	26.3
MGA_1859	LOCUS_17640	sequence081:4620..>5690(-)	partial			WP_011970080.1	putrescine-ornithine antiporter	91.9	74.1	24.5
MGA_1860	LOCUS_17650	sequence082:3..491(+)	partial			WP_011388877.1	MBL fold metallo-hydrolase	94.4	47.4	42.2
MGA_1867	LOCUS_17710	sequence083:1..973(+)	partial			WP_011120974.1	solute:sodium symporter family transporter	80.5	49.6	31.2
MGA_1876	LOCUS_17800	sequence085:1..921(+)	partial			WP_012709055.1	aldehyde dehydrogenase	99.3	63.7	69.7
MGA_1880	LOCUS_17840	sequence085:4403..>5084(-)	partial			WP_011087559.1	NADH oxidoreductase	99.6	58.7	60.9
MGA_1885	LOCUS_17890	sequence086:4126..>4923(-)	partial			Q4ZTG0	error-prone DNA polymerase	100.0	25.7	38.5
MGA_1889	LOCUS_17920	sequence087:2118..2768(-)	partial			WP_000680175.1	nucleoside-diphosphate sugar epimerase	91.2	70.9	39.1
MGA_1895	LOCUS_17970	sequence088:4008..>4755(-)	partial			WP_012640427.1	glutathione S-transferase	99.2	69.5	44.3
MGA_1902	LOCUS_18030	sequence089:3214..>4351(-)	partial			Q5E0C6	histidine ammonia-lyase	99.2	73.7	56.0
MGA_1905	LOCUS_18050	sequence090:1518..3320(+)	partial			WP_010921047.1	carbamoyl-phosphate-synthetase	97.7	54.4	53.2
MGA_1918	LOCUS_18140	sequence093:1254..1898(+)	frameshift		1856	WP_013228899.1	cyclase	80.4	55.5	30.5
MGA_1919	LOCUS_18150	sequence093:1850..2248(+)	frameshift		1844	WP_011729508.1	cyclase	98.5	40.7	36.8
MGA_1946	LOCUS_18330	sequence100:2925..>3761(-)	partial			WP_011074059.1	class V aminotransferase	98.9	72.5	50.2
MGA_1956	LOCUS_18400	sequence102:2786..>3460(-)	partial			WP_004185551.1	acyl-CoA dehydrogenase	100.0	57.5	56.8
MGA_1961	LOCUS_18440	sequence103:2914..>3459(-)	partial			WP_003089998.1	acyl-CoA dehydrogenase	98.9	43.8	68.2
MGA_1977	LOCUS_18530	sequence108:1..616(+)	partial			Q886X6	inosine-5'-monophosphate dehydrogenase	99.0	41.5	80.3
MGA_1979	LOCUS_18550	sequence108:2382..2696(+)	partial			WP_001129562.1	integrase	98.1	24.7	62.7
MGA_1983	LOCUS_18570	sequence110:1..1097(+)	partial			Q9I137	glycine dehydrogenase (decarboxylating) 1	99.7	37.6	71.9
MGA_1990	LOCUS_18610	sequence113:1..916(+)	partial			WP_014207705.1	3-methylcrotonyl-CoA carboxylase subunit alpha	97.4	43.0	33.0
MGA_1993	LOCUS_18630	sequence114:1..578(+)	partial			WP_010920963.1	TonB-dependent receptor	100.0	25.6	33.3
MGA_1995	LOCUS_18650	sequence114:1871..>2398(-)	partial			A6UBH7	L-carnitine dehydrogenase	100.0	37.7	33.2
MGA_1996	LOCUS_18660	sequence115:1..638(+)	partial			Q8F7S5	aldehyde dehydrogenase	98.6	42.5	45.2
MGA_2001	LOCUS_18690	sequence117:1..693(+)	partial			WP_013530403.1	short-chain dehydrogenase	77.0	74.2	37.6
MGA_2014	LOCUS_18760	sequence120:1365..>1917(-)	partial			WP_011388726.1	4-diphosphocytidyl-2C-methyl-D-erythritol kinase	94.0	33.7	30.8
MGA_2015	LOCUS_18770	sequence121:1..593(+)	partial			A0A0H3END7	agmatinase	95.4	61.1	61.5
