# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_2	LOCUS_00010	sequence1:5529..6278(-)	partial			WP_010918711.1	class I SAM-dependent DNA methyltransferase	57.0	16.2	37.5
MGA_135	LOCUS_01340	sequence1:146592..147383(+)	partial			WP_011336832.1	light-harvesting protein	24.3	24.3	100.0
MGA_137	LOCUS_01360	sequence1:148994..150337(-)	partial			WP_011840243.1	2-dehydropantoate 2-reductase	55.9	77.2	99.6
MGA_198	LOCUS_01970	sequence1:215060..215509(-)	partial			WP_013389859.1	phage antirepressor Ant	65.8	33.0	40.8
MGA_217	LOCUS_02160	sequence1:235040..235414(-)	partial			WP_108221498.1	hypothetical protein	72.6	70.3	98.9
MGA_243	LOCUS_02420	sequence1:251967..253136(+)	frameshift		253364,253085	WP_011339454.1	ParB/RepB/Spo0J family partition protein	95.9	61.6	89.0
MGA_244	LOCUS_02430	sequence1:253034..253432(+)	frameshift		253085,253367	WP_011339454.1	ParB/RepB/Spo0J family partition protein	83.3	18.6	86.7
MGA_245	LOCUS_02440	sequence1:253510..253785(+)	frameshift		253366	WP_011339454.1	ParB/RepB/Spo0J family partition protein	100.0	15.0	98.9
MGA_365	LOCUS_03640	sequence1:362975..364252(+)	frameshift		362922,362916	WP_014537447.1	tetratricopeptide repeat protein	95.5	72.2	41.8
MGA_552	LOCUS_05510	sequence1:553274..553609(-)	frameshift,internal_stop_codon	553599..553601(-)	553556	WP_010975401.1	IS66 family insertion sequence element accessory protein TnpB	82.0	77.8	79.1
MGA_554	LOCUS_05530	sequence1:554841..555140(+)	partial			WP_188789631.1	GyrI-like domain-containing protein	98.0	59.5	56.6
MGA_555	LOCUS_05540	sequence1:555297..555593(-)	partial			WP_011337116.1	hypothetical protein	100.0	67.6	92.9
MGA_575	LOCUS_05740	sequence1:573933..574565(-)	frameshift		574569,574578	WP_012256609.1	deoxyribodipyrimidine photo-lyase	83.3	39.2	35.5
MGA_602	LOCUS_06010	sequence1:608379..609002(-)	frameshift		608323,608260	WP_011337151.1	GcrA family cell cycle regulator	46.9	46.9	100.0
MGA_631	LOCUS_06300	sequence1:632514..632711(+)	partial			WP_011338352.1	sigma-70 family RNA polymerase sigma factor	100.0	22.7	60.0
MGA_640	LOCUS_06390	sequence1:643521..644180(+)	partial			WP_092685457.1	ThiF family adenylyltransferase	100.0	36.5	48.9
MGA_660	LOCUS_06590	sequence1:659725..660159(-)	partial			WP_011337206.1	hypothetical protein	38.9	38.9	100.0
MGA_776	LOCUS_07750	sequence1:779476..780159(-)	frameshift		780209	WP_037391726.1	4-aminobutyrate--2-oxoglutarate transaminase	99.1	53.3	72.0
MGA_777	LOCUS_07760	sequence1:780048..780752(-)	frameshift		780212	WP_010975708.1	4-aminobutyrate--2-oxoglutarate transaminase	73.5	40.8	75.6
MGA_834	LOCUS_08330	sequence1:844088..844618(-)	partial			WP_011037563.1	hybrid sensor histidine kinase/response regulator	61.9	20.2	43.1
MGA_961	LOCUS_09600	sequence1:972001..972381(+)	partial			WP_041669283.1	DUF192 domain-containing protein	100.0	73.7	99.2
MGA_1095	LOCUS_10940	sequence1:1113297..1113815(+)	partial			WP_002719629.1	gene transfer agent family protein	41.9	68.6	84.7
MGA_1120	LOCUS_11190	sequence1:1141261..1141686(-)	frameshift		1141709	WP_011971012.1	IS21-like element helper ATPase IstB	100.0	57.8	85.8
MGA_1121	LOCUS_11200	sequence1:1141575..1141988(-)	frameshift		1141709	WP_011971012.1	IS21-like element helper ATPase IstB	67.9	38.1	79.6
MGA_1122	LOCUS_11210	sequence1:1141921..1143006(-)	partial			WP_128955176.1	IS21 family transposase	93.4	67.5	76.6
MGA_1123	LOCUS_11220	sequence1:1143069..1144271(+)	partial			WP_131002207.1	TniQ family protein	95.0	61.3	27.6
MGA_1162	LOCUS_11610	sequence1:1184387..1184863(+)	partial			WP_002719691.1	Sec-independent protein translocase protein TatB	57.6	57.6	86.8
MGA_1256	LOCUS_12550	sequence1:1275639..1276265(+)	frameshift		1275619	WP_003528003.1	2-(1,2-epoxy-1,2-dihydrophenyl)acetyl-CoA isomerase PaaG	100.0	79.8	51.0
MGA_1268	LOCUS_12670	sequence1:1287811..1288704(-)	frameshift		1288717	WP_014538199.1	phosphogluconate dehydratase	100.0	49.2	72.7
MGA_1270	LOCUS_12690	sequence1:1289905..1290078(+)	partial			WP_002719795.1	hypothetical protein	73.7	73.7	100.0
MGA_1310	LOCUS_13090	sequence1:1328782..1329012(-)	partial			WP_011337658.1	DUF1289 domain-containing protein	72.4	72.4	100.0
MGA_1330	LOCUS_13290	sequence1:1351453..1352802(-)	frameshift		1352869	WP_013532331.1	ABC transporter substrate-binding protein	99.8	81.6	53.8
MGA_1331	LOCUS_13300	sequence1:1352792..1353082(-)	frameshift		1352869	WP_013532331.1	ABC transporter substrate-binding protein	71.9	12.8	40.0
MGA_1655	LOCUS_16540	sequence1:1698257..1698649(-)	partial			WP_069332664.1	IS66 family transposase	76.9	21.3	39.7
MGA_1663	LOCUS_16620	sequence1:1706177..1706467(-)	partial			WP_013368588.1	pirin family protein	62.5	18.8	66.7
MGA_1704	LOCUS_17030	sequence1:1744979..1745167(+)	partial			WP_011337946.1	hypothetical protein	67.7	67.7	100.0
MGA_1766	LOCUS_17650	sequence1:1809216..1811264(-)	frameshift,internal_stop_codon	1809216..1809218(-),1809117..1809119(-)	1811288	WP_011337993.1	TRAP transporter large permease subunit	78.7	78.7	91.4
MGA_1805	LOCUS_18040	sequence1:1849610..1851049(+)	partial			WP_011090968.1	phage/plasmid primase, P4 family	59.5	60.0	62.1
MGA_1808	LOCUS_18070	sequence1:1853527..1854537(+)	partial			WP_011338020.1	30S ribosomal protein S6	31.5	80.3	100.0
MGA_1852	LOCUS_18510	sequence1:1898504..1898803(-)	frameshift		1898867	WP_012066592.1	ABC transporter ATP-binding protein	100.0	37.6	85.9
MGA_1853	LOCUS_18520	sequence1:1898820..1899305(-)	frameshift		1898867	WP_014537570.1	ABC transporter ATP-binding protein	85.1	53.3	74.5
MGA_2010	LOCUS_20090	sequence1:2057118..2058452(-)	partial			WP_011970097.1	hypothetical protein	47.3	28.1	31.4
MGA_2031	LOCUS_20300	sequence1:2083519..2083941(+)	partial			WP_112311416.1	error-prone DNA polymerase	73.6	8.9	62.1
MGA_2044	LOCUS_20430	sequence1:2097708..2098334(+)	partial			WP_011338185.1	preprotein translocase subunit SecG	57.7	57.7	79.2
MGA_2167	LOCUS_21660	sequence1:2223852..2224604(+)	frameshift		2223832	WP_037396064.1	sugar kinase	99.6	81.7	45.2
MGA_2264	LOCUS_22630	sequence1:2323412..2323774(+)	partial			WP_011338334.1	pyridoxamine 5'-phosphate oxidase family protein	100.0	73.2	99.2
MGA_2287	LOCUS_22860	sequence1:2344764..2346443(-)	partial			WP_091704098.1	CRISPR-associated helicase/endonuclease Cas3	82.1	52.6	36.3
MGA_2300	LOCUS_22990	sequence1:2355083..2355265(-)	partial			WP_011336913.1	phage major capsid protein	80.0	10.8	64.6
MGA_2304	LOCUS_23030	sequence1:2362032..2362214(-)	partial			WP_002720789.1	DNA gyrase inhibitor YacG	68.3	68.3	100.0
MGA_2353	LOCUS_23520	sequence1:2411472..2412716(-)	partial			WP_017139941.1	cell envelope integrity/translocation protein TolA	68.8	68.8	67.0
MGA_2414	LOCUS_24130	sequence1:2471779..2471997(+)	partial			WP_011338441.1	hypothetical protein	72.2	72.2	88.5
MGA_2428	LOCUS_24270	sequence1:2484382..2484567(-)	partial			WP_011338454.1	aa3-type cytochrome c oxidase subunit IV	72.1	72.1	100.0
MGA_2535	LOCUS_25340	sequence1:2594091..2595059(+)	frameshift		2594089	WP_063172931.1	tetratricopeptide repeat-containing sulfotransferase family protein	94.4	56.6	39.9
MGA_2897	LOCUS_28960	sequence1:2965128..2965505(-)	internal_stop_codon	2965527..2965529(-)		WP_193365317.1	carbon-nitrogen hydrolase family protein	97.6	44.4	65.3
MGA_2898	LOCUS_28970	sequence1:2965527..2965958(-)	internal_stop_codon	2965527..2965529(-)		WP_193365317.1	carbon-nitrogen hydrolase family protein	99.3	50.2	54.2
MGA_2903	LOCUS_29020	sequence1:2969160..2969336(-)	partial			WP_009563233.1	hypothetical protein	72.4	72.4	81.0
MGA_2916	LOCUS_29150	sequence1:2981425..2981985(-)	frameshift		2982037	WP_013385459.1	threonine ammonia-lyase IlvA	100.0	44.8	68.3
MGA_3110	LOCUS_31090	sequence1:3180599..3180940(+)	partial			WP_011338933.1	hypothetical protein	47.8	47.8	90.7
MGA_3129	LOCUS_31270	sequence2:14324..14662(-)	internal_stop_codon	14669..14671(-)		WP_011339202.1	tyrosine-type recombinase/integrase	38.4	10.0	72.1
MGA_3147	LOCUS_31450	sequence2:28573..28827(+)	partial			WP_017140305.1	hypothetical protein	63.1	63.1	100.0
MGA_3157	LOCUS_31540	sequence2:39958..40566(+)	frameshift,internal_stop_codon	40631..40633(+),39691..39693(+)	40518	WP_046463617.1	hypothetical protein	90.1	27.1	47.8
MGA_3159	LOCUS_31560	sequence2:42204..42785(-)	partial			WP_013653377.1	IS481 family transposase	99.0	54.9	81.7
MGA_3161	LOCUS_31580	sequence2:43479..43826(-)	frameshift		43843	WP_010975540.1	IS66-like element ISRm14 family transposase	83.5	17.5	80.2
MGA_3162	LOCUS_31590	sequence2:43757..44923(-)	frameshift		43843	WP_010975540.1	IS66-like element ISRm14 family transposase	57.0	40.9	75.1
MGA_3296	LOCUS_32930	sequence2:189858..190262(-)	frameshift		189896,189953,189865	WP_024311089.1	DUF2243 domain-containing protein	77.6	65.6	48.6
MGA_3378	LOCUS_33750	sequence2:275623..277722(-)	partial			WP_011391239.1	hybrid sensor histidine kinase/response regulator	96.9	67.3	35.2
MGA_3467	LOCUS_34640	sequence2:370899..371384(+)	internal_stop_codon	370890..370892(+)		WP_012582696.1	glucose 1-dehydrogenase	98.8	68.3	53.5
MGA_3576	LOCUS_35720	sequence2:481353..482357(-)	frameshift		481344	WP_162829286.1	iron ABC transporter permease	93.7	80.1	81.8
MGA_3579	LOCUS_35750	sequence2:486089..486238(-)	frameshift		486417	WP_010967926.1	AraC family transcriptional regulator	71.4	11.7	65.7
MGA_3580	LOCUS_35760	sequence2:486190..487008(-)	frameshift		486420	WP_010967926.1	AraC family transcriptional regulator	71.7	65.6	42.9
MGA_3584	LOCUS_35800	sequence2:491037..491330(+)	partial			WP_011339297.1	hypothetical protein	100.0	51.6	96.9
MGA_3673	LOCUS_36690	sequence2:589406..589759(+)	partial			WP_011339371.1	PepSY domain-containing protein	71.8	71.8	95.2
MGA_3702	LOCUS_36980	sequence2:631145..633103(+)	frameshift		632980	WP_197642299.1	hypothetical protein	80.5	74.8	64.4
MGA_3703	LOCUS_36990	sequence2:633553..634533(+)	partial			WP_004554541.1	DEAD/DEAH box helicase family protein	79.1	27.1	26.4
MGA_3705	LOCUS_37010	sequence2:635369..635578(+)	partial			WP_235841049.1	hypothetical protein	100.0	22.8	82.6
MGA_3706	LOCUS_37020	sequence2:635633..636163(-)	partial			WP_023004221.1	toll/interleukin-1 receptor domain-containing protein	100.0	73.9	99.4
MGA_3744	LOCUS_37400	sequence2:675343..675486(-)	partial			WP_011339431.1	hypothetical protein	100.0	63.5	95.7
MGA_3777	LOCUS_37730	sequence2:709836..710168(-)	partial			WP_014537628.1	S24 family peptidase	63.6	33.2	45.7
MGA_3794	LOCUS_37900	sequence2:728568..728723(+)	partial			WP_011339468.1	hypothetical protein	100.0	64.6	98.0
MGA_3796	LOCUS_37920	sequence2:729592..729828(+)	internal_stop_codon	729826..729828(+)		WP_011337191.1	M15 family metallopeptidase	42.3	12.3	97.0
MGA_3797	LOCUS_37930	sequence2:729883..730194(+)	internal_stop_codon	729826..729828(+)		WP_011336894.1	M15 family metallopeptidase	100.0	38.3	99.0
MGA_3810	LOCUS_38060	sequence2:738680..739411(+)	partial			WP_011339612.1	phage portal protein	88.5	43.3	97.7
MGA_3833	LOCUS_38290	sequence2:758278..759075(-)	frameshift		758358	WP_011339453.1	recombinase family protein	91.3	44.9	89.3
MGA_3834	LOCUS_38300	sequence2:759100..759972(+)	partial			WP_069332403.1	phage portal protein	96.6	68.1	91.8
MGA_3839	LOCUS_38350	sequence2:762951..763361(-)	frameshift		763497	WP_021706804.1	IS5-like element ISVpa3 family transposase	97.8	42.2	36.3
MGA_3953	LOCUS_39490	sequence2:899871..900368(+)	partial			WP_217991922.1	YbjQ family protein	58.2	82.1	49.0
MGA_3992	LOCUS_39880	sequence2:926494..926811(-)	partial			WP_011339636.1	universal stress protein	100.0	74.5	99.0
MGA_3993	LOCUS_39890	sequence2:926696..929575(-)	partial			WP_067553987.1	TRAP transporter permease	68.9	75.8	55.6
MGA_4064	LOCUS_40600	sequence3:64513..64938(+)	partial			WP_011331303.1	aromatic ring-hydroxylating dioxygenase subunit alpha	90.1	31.0	96.9
MGA_4065	LOCUS_40610	sequence3:65085..66020(+)	frameshift		65071	WP_011331489.1	conjugal transfer protein TraG N-terminal domain-containing protein	98.1	26.8	96.7
MGA_4069	LOCUS_40650	sequence3:67149..67745(-)	partial			WP_066867479.1	IS110 family transposase	93.9	47.4	64.0
MGA_4092	LOCUS_40870	sequence3:91161..91490(+)	frameshift		90999	WP_011339201.1	ISNCY family transposase	100.0	23.8	99.1
MGA_4114	LOCUS_41090	sequence4:621..1421(+)	frameshift		655,607	WP_011339201.1	ISNCY family transposase	95.9	55.7	100.0
MGA_4134	LOCUS_41290	sequence4:25750..25962(+)	partial			WP_005766716.1	class II fumarate hydratase	92.9	14.0	56.9
MGA_4219	LOCUS_42130	sequence5:44..373(-)	frameshift		424,646	WP_011339201.1	ISNCY family transposase	100.0	23.8	99.1
MGA_4220	LOCUS_42140	sequence5:327..602(-)	frameshift		424,646	WP_011339201.1	ISNCY family transposase	64.8	12.9	100.0
MGA_4221	LOCUS_42150	sequence5:503..1423(-)	frameshift		424,646	WP_011339201.1	ISNCY family transposase	84.6	56.6	96.5
MGA_4222	LOCUS_42160	sequence5:1785..2156(-)	partial			WP_012258143.1	MBL fold metallo-hydrolase	54.5	15.3	43.3
MGA_4236	LOCUS_42300	sequence5:14239..14508(-)	partial			WP_011339028.1	methyl-accepting chemotaxis protein	97.8	16.8	53.2
MGA_4261	LOCUS_42550	sequence5:35431..35577(+)	partial			WP_003526659.1	Hsp20/alpha crystallin family protein	91.7	25.1	56.8
MGA_4262	LOCUS_42560	sequence5:35883..37913(-)	partial			WP_106459194.1	tetratricopeptide repeat protein	87.9	69.3	36.7
MGA_4271	LOCUS_42650	sequence5:47345..47476(-)	partial			WP_003816713.1	DUF1153 domain-containing protein	79.1	32.7	70.6
MGA_4273	LOCUS_42670	sequence5:49257..49529(+)	frameshift		49236,49479	WP_014466931.1	IS630 family transposase	82.2	20.4	63.5
MGA_4274	LOCUS_42680	sequence5:49550..50038(+)	frameshift		49478	WP_011085265.1	IS630-like element ISBj5 family transposase	96.3	42.3	56.4
MGA_4275	LOCUS_42690	sequence5:52627..52980(-)	partial			WP_106356446.1	acyltransferase	95.7	57.7	58.0
MGA_4278	LOCUS_42720	sequence5:55599..56489(-)	frameshift		56629	WP_011035783.1	IS5-like element IS1478 family transposase	88.2	57.8	53.8
MGA_4279	LOCUS_42730	sequence5:56618..56944(-)	frameshift		56629	WP_014497842.1	IS5 family transposase	90.7	21.7	53.1
MGA_4293	LOCUS_42870	sequence5:69304..69504(+)	frameshift,internal_stop_codon	69298..69300(+)	69248	WP_011836225.1	MobF family relaxase	93.9	5.6	77.4
MGA_4294	LOCUS_42880	sequence5:69547..70071(-)	partial			WP_069331744.1	DNA-binding transcriptional regulator	59.2	52.5	67.2
MGA_4303	LOCUS_42970	sequence5:80153..80488(+)	partial			WP_011331396.1	ferredoxin-type protein NapF	100.0	69.4	100.0
MGA_4320	LOCUS_43140	sequence5:98305..98679(-)	partial			WP_011331409.1	hypothetical protein	63.7	42.9	45.6
MGA_4340	LOCUS_43340	sequence6:8711..9229(+)	partial			WP_017140531.1	hypothetical protein	41.3	60.7	46.5
MGA_4344	LOCUS_43380	sequence6:11583..12386(+)	partial			WP_083079845.1	plasmid pRiA4b ORF-3 family protein	51.7	73.0	69.2
MGA_4345	LOCUS_43390	sequence6:12450..12770(+)	partial			WP_167540391.1	IS66 family transposase	100.0	18.9	59.4
MGA_4362	LOCUS_43560	sequence6:26991..27248(-)	partial			WP_040425865.1	IS66 family transposase	95.3	24.8	60.5
MGA_4363	LOCUS_43570	sequence6:27549..27764(+)	frameshift		27874	WP_114196139.1	IS3 family transposase	88.7	16.9	54.0
MGA_4369	LOCUS_43630	sequence6:32103..32222(+)	internal_stop_codon	32220..32222(+),32406..32408(+)		WP_010975401.1	IS66 family insertion sequence element accessory protein TnpB	100.0	33.3	82.1
MGA_4370	LOCUS_43640	sequence6:32226..32408(+)	internal_stop_codon	32220..32222(+),32406..32408(+)		WP_010975539.1	IS66 family insertion sequence element accessory protein TnpB	100.0	51.3	78.3
MGA_4371	LOCUS_43650	sequence6:32568..32870(+)	internal_stop_codon	32868..32870(+),32526..32528(+)		WP_010975540.1	IS66-like element ISRm14 family transposase	100.0	18.2	75.0
MGA_4372	LOCUS_43660	sequence6:32976..33932(+)	frameshift,internal_stop_codon	32868..32870(+)	33440,33468,33920	WP_010975400.1	IS66-like element ISRm14 family transposase	99.1	62.9	73.1
MGA_4373	LOCUS_43670	sequence6:33947..34093(+)	frameshift		33920	WP_010975400.1	IS66-like element ISRm14 family transposase	70.8	6.2	85.3
MGA_4384	LOCUS_43780	sequence6:44851..45153(+)	partial			WP_011331451.1	methanogen output domain 1-containing protein	100.0	54.3	99.0
MGA_4395	LOCUS_43890	sequence6:53956..54378(+)	frameshift,internal_stop_codon	53918..53920(+),54377..54379(+)	53947	WP_011974570.1	aconitate hydratase AcnA	97.1	16.6	44.8
MGA_4402	LOCUS_43960	sequence6:61699..61959(-)	partial			WP_167540391.1	IS66 family transposase	87.2	13.6	68.0
MGA_4403	LOCUS_43970	sequence6:62194..62571(+)	partial			WP_011970910.1	IS110 family transposase	72.8	23.9	56.0
MGA_4405	LOCUS_43990	sequence6:63079..63309(-)	frameshift		63082,63484,63454	WP_164925630.1	IS3-like element ISSod2 family transposase	97.4	21.2	57.9
MGA_4453	LOCUS_44470	sequence7:6242..6412(+)	frameshift		6406	WP_011836225.1	MobF family relaxase	100.0	7.1	68.4
MGA_4454	LOCUS_44480	sequence7:6409..6831(+)	frameshift		6406	WP_011836225.1	MobF family relaxase	48.6	6.1	97.1
MGA_4474	LOCUS_44680	sequence7:25268..25591(-)	frameshift		25671	WP_069332664.1	IS66 family transposase	89.7	17.4	78.1
MGA_4480	LOCUS_44740	sequence7:33153..33665(-)	frameshift,internal_stop_codon	33731..33733(-)	33664	WP_207464355.1	IS1182 family transposase	60.6	21.5	82.5
MGA_4481	LOCUS_44750	sequence7:33731..33946(-)	frameshift,internal_stop_codon	33731..33733(-)	33664	WP_207464355.1	IS1182 family transposase	100.0	14.8	87.3
MGA_4482	LOCUS_44760	sequence7:34646..35152(-)	partial			WP_011836253.1	MerR family transcriptional regulator	53.0	65.9	96.7
MGA_4483	LOCUS_44770	sequence7:35259..35474(-)	partial			WP_011836222.1	hypothetical protein	81.7	35.6	86.2
MGA_4484	LOCUS_44780	sequence7:35612..36631(+)	partial			WP_011339201.1	ISNCY family transposase	89.1	65.3	89.1
