# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_2	LOCUS_0020	sequence1:439..723(-)	partial			WP_011123567.1	DUF1080 domain-containing protein	70.2	26.7	39.5
MGA_3	LOCUS_0030	sequence1:1056..1970(-)	frameshift		2016,1009,1064	WP_011118384.1	hypothetical protein	99.3	59.6	68.0
MGA_4	LOCUS_0040	sequence1:2008..2388(-)	frameshift		2016	WP_011118384.1	hypothetical protein	90.5	24.6	39.2
MGA_5	LOCUS_0050	sequence1:2458..3144(-)	frameshift		2520,3262	WP_164922507.1	arylsulfatase	92.1	40.9	61.9
MGA_6	LOCUS_0060	sequence1:3245..3940(-)	frameshift		3265	WP_164922507.1	arylsulfatase	97.8	44.4	67.1
MGA_8	LOCUS_0080	sequence1:5712..6449(-)	frameshift		6618,6468,6582,6522,6654	WP_011121087.1	sulfatase	91.8	45.8	62.3
MGA_9	LOCUS_0090	sequence1:6436..6777(-)	frameshift,internal_stop_codon	6853..6855(-)	6913,6465,6819,6762,6768,6579,6615,6651,6519	WP_011121087.1	sulfatase	84.1	19.4	38.1
MGA_14	LOCUS_0140	sequence1:11532..12131(-)	frameshift		12156	WP_164921691.1	sulfatase	100.0	40.9	42.6
MGA_15	LOCUS_0150	sequence1:12133..12516(-)	frameshift		12156	WP_164921691.1	sulfatase	93.7	23.8	56.3
MGA_16	LOCUS_0160	sequence1:13084..13764(-)	frameshift,internal_stop_codon	13834..13836(-)	13852	WP_005785070.1	sulfatase	88.5	38.6	34.6
MGA_20	LOCUS_0200	sequence1:15088..15726(-)	frameshift		14979,15012,14847,15918,14928,15252,14901,15771,15708,15967	WP_011117793.1	sulfatase	73.6	26.9	60.5
MGA_21	LOCUS_0210	sequence1:15749..15928(-)	frameshift		15923,16024,15770,15707,15966,16063	WP_011117793.1	sulfatase	84.7	9.5	66.7
MGA_22	LOCUS_0220	sequence1:16824..17090(-)	frameshift		17286,17255,17159,17195,16846,17362,17332,17174,16699	WP_164921694.1	DUF1501 domain-containing protein	90.9	16.7	83.8
MGA_23	LOCUS_0230	sequence1:19322..19660(-)	frameshift,internal_stop_codon	19317..19319(-)	19749,19782,19112,19689,19659,19572,19509,19834,19229	WP_236615801.1	PSD1 and planctomycete cytochrome C domain-containing protein	88.4	10.7	42.7
MGA_24	LOCUS_0240	sequence1:19829..20596(-)	frameshift		19744,19777,19684,20133,19654,20331,19567,20562,20052,19829,20061,19998	WP_236615801.1	PSD1 and planctomycete cytochrome C domain-containing protein	91.4	24.5	35.7
MGA_29	LOCUS_0290	sequence1:27541..28161(-)	partial			WP_008669493.1	DUF1080 domain-containing protein	85.9	39.0	33.0
MGA_31	LOCUS_0310	sequence1:29761..30975(-)	frameshift		31155,31179,31197	WP_011122548.1	PA14 domain-containing protein	93.3	46.7	33.8
MGA_33	LOCUS_0330	sequence1:32641..32916(-)	frameshift,internal_stop_codon	32638..32640(-)	32856,32935,32878,33007	WP_011071153.1	DUF2238 domain-containing protein	97.8	44.3	58.4
MGA_35	LOCUS_0350	sequence1:35633..36244(-)	frameshift		35692,35517,35412,35575	WP_164922487.1	sulfatase	94.6	39.5	78.6
MGA_37	LOCUS_0370	sequence1:37084..38352(-)	partial			WP_008666312.1	arylsulfatase	86.3	62.6	35.4
MGA_43	LOCUS_0430	sequence1:42878..43573(-)	frameshift		43808,43703	WP_164922898.1	FAD-dependent oxidoreductase	97.0	27.5	53.5
MGA_48	LOCUS_0480	sequence1:49437..49736(+)	frameshift,internal_stop_codon	49956..49958(+),49734..49736(+)	49922,49883,49892,49970	WP_164921311.1	ThuA domain-containing protein	61.6	4.1	49.2
MGA_49	LOCUS_0490	sequence1:50137..50808(+)	frameshift,internal_stop_codon	49954..49956(+),50815..50817(+)	49920,49968,50805,50904,50124	WP_090339627.1	ThuA domain-containing protein	96.9	18.4	58.3
MGA_50	LOCUS_0500	sequence1:50975..51355(+)	frameshift		50847,50754,50838,50907,51276,51453,50799	WP_164921311.1	ThuA domain-containing protein	65.1	5.1	58.5
MGA_53	LOCUS_0530	sequence1:52556..53107(+)	frameshift		53104,53167	WP_007329925.1	Gfo/Idh/MocA family oxidoreductase	100.0	49.3	57.9
MGA_54	LOCUS_0540	sequence1:53133..53486(+)	frameshift,internal_stop_codon	53486..53488(+)	53104,53569,53521,53641,53563,53167	WP_007329925.1	Gfo/Idh/MocA family oxidoreductase	74.4	23.5	60.9
MGA_55	LOCUS_0550	sequence1:53938..54978(+)	frameshift		54969,55081	WP_011120799.1	sulfatase	95.4	62.4	35.1
MGA_57	LOCUS_0570	sequence1:56113..56304(+)	partial			WP_011404337.1	plastocyanin/azurin family copper-binding protein	92.1	30.7	37.9
MGA_58	LOCUS_0580	sequence1:56599..59514(+)	frameshift		56563,56687	WP_164921683.1	FG-GAP-like repeat-containing protein	51.4	34.2	42.7
MGA_69	LOCUS_0680	sequence2:2036..2260(-)	partial			WP_003115035.1	2-hydroxychromene-2-carboxylate isomerase	85.1	32.3	34.9
MGA_74	LOCUS_0730	sequence2:6213..6797(-)	frameshift,internal_stop_codon	6360..6362(-),6159..6161(-)	6380	WP_010969025.1	aquaglyceroporin AqpS	67.0	56.2	45.0
MGA_75	LOCUS_0740	sequence2:6798..7097(-)	frameshift		7128,7101	WP_010938935.1	arsenate reductase ArsC	94.9	61.2	46.8
MGA_86	LOCUS_0850	sequence2:13504..16584(+)	partial			WP_011038525.1	TonB-dependent receptor	39.8	45.1	28.0
MGA_87	LOCUS_0860	sequence2:16663..17994(+)	partial			WP_011403217.1	hypothetical protein	82.2	62.2	40.8
MGA_89	LOCUS_0880	sequence2:19914..20630(+)	partial			WP_011266767.1	glycosyltransferase family 1 protein	98.3	57.9	37.7
MGA_96	LOCUS_0950	sequence2:26189..27823(+)	partial			WP_011791822.1	phosphate ABC transporter permease subunit PstC	46.9	84.8	42.9
MGA_98	LOCUS_0970	sequence2:28753..29499(+)	partial			WP_010939749.1	phosphate ABC transporter permease PstA	96.4	74.8	49.0
MGA_101	LOCUS_1000	sequence2:33316..33555(-)	frameshift,internal_stop_codon	33340..33342(-)	33357,33588,33813,33750	WP_007327912.1	DUF1501 domain-containing protein	100.0	18.4	42.5
MGA_103	LOCUS_1020	sequence2:37257..37670(-)	frameshift,internal_stop_codon	37257..37259(-)	37007,37202,37067,37106	WP_236616031.1	sulfatase-like hydrolase/transferase	97.8	16.8	52.6
MGA_104	LOCUS_1030	sequence2:38380..38577(-)	frameshift,internal_stop_codon	38801..38803(-),38378..38380(-)	38635,38587	WP_164922306.1	sulfatase	100.0	13.9	53.8
MGA_106	LOCUS_1050	sequence3:5036..5419(-)	frameshift,internal_stop_codon	5498..5500(-),5489..5491(-),5447..5449(-),5450..5452(-)	5536,5136,5479,5341,5581,5359	WP_164921596.1	DUF1588 domain-containing protein	74.8	11.4	55.8
MGA_108	LOCUS_1070	sequence3:9278..10486(+)	frameshift		10282	WP_002724194.1	tripartite tricarboxylate transporter permease	83.6	67.5	43.5
MGA_109	LOCUS_1080	sequence3:11303..11632(+)	frameshift		11626,11645,11790	WP_164922709.1	sulfatase	95.4	20.2	38.3
MGA_112	LOCUS_1110	sequence3:13655..13801(-)	frameshift,internal_stop_codon	13652..13654(-)	13968,13841,14083,13798,13863,13822	WP_164922453.1	Gfo/Idh/MocA family oxidoreductase	91.7	9.5	65.9
MGA_115	LOCUS_1140	sequence3:18085..18594(-)	frameshift		18704,18755,18566	WP_011261760.1	DUF1679 domain-containing protein	94.7	50.2	57.4
MGA_122	LOCUS_1210	sequence3:22699..23505(-)	partial			WP_011203533.1	sulfatase	87.7	46.5	31.7
MGA_127	LOCUS_1260	sequence3:27774..28397(-)	frameshift		28416,28468	WP_013368537.1	dehydrogenase	98.6	26.1	35.1
MGA_131	LOCUS_1300	sequence3:31721..32611(-)	partial			WP_011120859.1	SGNH/GDSL hydrolase family protein	16.6	19.6	51.0
MGA_132	LOCUS_1310	sequence3:33739..34074(-)	frameshift		33777,33506,33491,33717	WP_007326881.1	DUF1552 domain-containing protein	76.6	18.8	56.8
MGA_133	LOCUS_1320	sequence4:384..803(+)	frameshift		995,776,968,394,301,175,400,433,463,1043,214,343,502,379,1055	WP_236615908.1	sulfatase	82.7	23.7	54.2
MGA_134	LOCUS_1330	sequence4:809..994(+)	frameshift		1124,1034,1229,767,1046,986,1211,959	WP_236615908.1	sulfatase	73.8	9.3	63.0
MGA_136	LOCUS_1350	sequence4:7085..8257(+)	frameshift		8353,8404,8221	WP_011118026.1	arylsulfatase	91.8	63.8	60.4
MGA_137	LOCUS_1360	sequence4:8874..12203(+)	partial			WP_164922491.1	PSD1 and planctomycete cytochrome C domain-containing protein	49.4	56.1	36.0
MGA_138	LOCUS_1370	sequence4:12252..13025(+)	frameshift		13016,12265,13022	WP_011122120.1	DUF1501 domain-containing protein	93.4	50.4	54.7
MGA_139	LOCUS_1380	sequence4:13030..13608(+)	frameshift		13428,13461,13022,13359	WP_007329353.1	DUF1501 domain-containing protein	99.0	39.8	56.0
MGA_147	LOCUS_1460	sequence4:20095..21684(+)	partial			WP_011118382.1	dienelactone hydrolase family protein	95.1	44.6	23.5
MGA_149	LOCUS_1480	sequence5:1673..1945(-)	frameshift		1967	WP_011203637.1	GDSL-type esterase/lipase family protein	84.4	8.9	35.5
MGA_150	LOCUS_1490	sequence5:2450..4165(-)	partial			WP_011203637.1	GDSL-type esterase/lipase family protein	99.5	66.8	39.6
MGA_152	LOCUS_1510	sequence5:5722..6198(-)	frameshift,internal_stop_codon	5722..5724(-)	5493	WP_011118540.1	hypothetical protein	86.7	22.9	35.0
MGA_155	LOCUS_1540	sequence5:7304..7690(-)	frameshift		7106,7076,7686,7338,7277	WP_011119041.1	glycerophosphodiester phosphodiesterase	91.4	40.4	51.7
MGA_156	LOCUS_1550	sequence5:7830..9419(-)	partial			WP_011121181.1	L-sorbosone dehydrogenase	69.8	30.8	29.0
MGA_157	LOCUS_1560	sequence5:9976..11256(-)	partial			WP_011121181.1	L-sorbosone dehydrogenase	85.9	31.0	54.9
MGA_158	LOCUS_1570	sequence5:11278..11718(-)	partial			WP_011120148.1	aquaporin	69.2	21.2	41.6
MGA_161	LOCUS_1600	sequence6:666..2099(-)	partial			WP_164921368.1	sulfatase-like hydrolase/transferase	87.8	60.7	49.4
MGA_164	LOCUS_1630	sequence6:5141..5362(-)	frameshift,internal_stop_codon	5528..5530(-)	5512,5395	WP_164921573.1	Gfo/Idh/MocA family oxidoreductase	95.9	15.7	45.7
MGA_166	LOCUS_1650	sequence6:5986..6444(-)	frameshift		5922,5891,5798,5994,5819,5756	WP_007328455.1	Gfo/Idh/MocA family oxidoreductase	96.7	31.2	41.9
MGA_167	LOCUS_1660	sequence6:7384..8652(-)	partial			WP_236615476.1	NPCBM/NEW2 domain-containing protein	77.3	51.2	36.1
MGA_168	LOCUS_1670	sequence6:8936..10396(+)	partial			WP_008659530.1	metallophosphoesterase	27.8	27.5	35.8
MGA_171	LOCUS_1700	sequence6:14023..14382(+)	frameshift		14342,14630,13769,14573,13875,14456,14011,14140,14333,14110	WP_008666725.1	GDSL-type esterase/lipase family protein	72.3	6.7	40.2
