# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_158	LOCUS_01570	sequence01:162917..163597(+)	partial			WP_001881747.1	DNA polymerase III subunit delta'	100.0	69.8	100.0
MGA_322	LOCUS_03210	sequence01:351744..352031(+)	frameshift		352022	WP_001091290.1	tol-pal system-associated acyl-CoA thioesterase	89.5	63.0	100.0
MGA_352	LOCUS_03510	sequence01:381869..382126(+)	frameshift		381716	WP_011071640.1	inovirus Gp2 family protein	98.8	37.3	40.5
MGA_355	LOCUS_03540	sequence01:384292..384753(-)	partial			WP_078219576.1	helix-turn-helix transcriptional regulator	42.5	58.6	55.4
MGA_369	LOCUS_03680	sequence01:393086..394126(+)	partial			WP_011072643.1	tape measure protein	97.4	60.9	65.6
MGA_461	LOCUS_04580	sequence02:110256..112391(+)	frameshift		112364	WP_172626063.1	metal-dependent phosphohydrolase	96.2	71.1	98.0
MGA_462	LOCUS_04590	sequence02:112388..113200(+)	frameshift		112364	WP_172626063.1	metal-dependent phosphohydrolase	100.0	28.1	98.9
MGA_523	LOCUS_05200	sequence02:174495..175280(+)	frameshift		175274	WP_000981402.1	DUF3541 domain-containing protein	99.6	64.7	100.0
MGA_524	LOCUS_05210	sequence02:175277..175699(+)	frameshift		175274	WP_000981402.1	DUF3541 domain-containing protein	100.0	34.8	100.0
MGA_539	LOCUS_05360	sequence02:190806..192353(-)	partial			WP_011104387.1	methyl-accepting chemotaxis protein	68.2	54.4	29.3
MGA_777	LOCUS_07730	sequence03:124250..124861(-)	frameshift		125136	WP_001005173.1	AAA family ATPase	100.0	37.6	100.0
MGA_778	LOCUS_07740	sequence03:125074..125871(-)	frameshift		125130	WP_001005173.1	AAA family ATPase	95.5	46.9	98.0
MGA_779	LOCUS_07750	sequence03:125872..126366(-)	partial			WP_085304998.1	retron St85 family RNA-directed DNA polymerase	97.0	50.8	59.4
MGA_957	LOCUS_09530	sequence04:280..903(-)	partial			WP_000453414.1	dicarboxylate/amino acid:cation symporter	88.9	44.0	96.7
MGA_1146	LOCUS_11420	sequence04:225285..226826(-)	internal_stop_codon	226863..226865(-)		WP_000425792.1	Hsp70 family protein	100.0	81.3	95.7
MGA_1147	LOCUS_11430	sequence04:226863..227180(-)	internal_stop_codon	226863..226865(-)		WP_000425792.1	Hsp70 family protein	100.0	16.6	100.0
MGA_1148	LOCUS_11440	sequence04:227180..227599(-)	frameshift		227619	WP_001017942.1	DUF2760 domain-containing protein	100.0	66.2	99.3
MGA_1149	LOCUS_11450	sequence04:227503..227811(-)	frameshift		227619	WP_001017942.1	DUF2760 domain-containing protein	68.6	33.3	55.7
MGA_1181	LOCUS_11770	sequence05:1..1134(+)	partial			WP_000098688.1	transketolase	100.0	56.7	98.1
MGA_1331	LOCUS_13270	sequence05:179451..180350(+)	frameshift		179326	WP_010895430.1	peptide chain release factor 2	100.0	81.9	99.7
MGA_1383	LOCUS_13790	sequence06:9851..10159(+)	frameshift		10141	WP_000562056.1	exopolysaccharide biosynthesis flippase VpsE	98.0	21.3	84.0
MGA_1384	LOCUS_13800	sequence06:10174..11256(+)	frameshift		10141	WP_000562056.1	exopolysaccharide biosynthesis flippase VpsE	100.0	76.8	98.3
MGA_1455	LOCUS_14510	sequence06:91606..95073(+)	partial			WP_001880813.1	polar hub landmark protein HubP	88.0	62.7	87.3
MGA_1456	LOCUS_14520	sequence06:94974..95885(+)	partial			WP_001880813.1	polar hub landmark protein HubP	100.0	18.7	98.3
MGA_1506	LOCUS_15020	sequence06:147785..148024(+)	partial			WP_001880857.1	YbaN family protein	100.0	59.8	97.5
MGA_1526	LOCUS_15220	sequence06:165757..166647(+)	internal_stop_codon	166645..166647(+)		WP_172626045.1	glycosyl hydrolase family 18 protein	100.0	27.6	89.9
MGA_1527	LOCUS_15230	sequence06:166660..168942(+)	internal_stop_codon	166645..166647(+)		WP_172626045.1	glycosyl hydrolase family 18 protein	100.0	71.0	98.8
MGA_1557	LOCUS_15530	sequence06:201246..201719(-)	internal_stop_codon	201741..201743(-)		WP_001880887.1	tRNA dihydrouridine(16) synthase DusC	100.0	48.6	99.4
MGA_1558	LOCUS_15540	sequence06:201741..202217(-)	internal_stop_codon	201741..201743(-)		WP_001880887.1	tRNA dihydrouridine(16) synthase DusC	100.0	48.9	98.7
MGA_1608	LOCUS_16030	sequence07:36379..39828(+)	partial			WP_011036642.1	DEAD/DEAH box helicase	45.3	75.4	36.1
MGA_1609	LOCUS_16040	sequence07:39959..40372(-)	frameshift,internal_stop_codon	40432..40434(-)	40419	WP_001107728.1	integrase domain-containing protein	89.8	29.1	93.5
MGA_1648	LOCUS_16430	sequence07:88742..89074(-)	frameshift		89112	WP_000373561.1	Lrp/AsnC family transcriptional regulator	100.0	74.8	99.1
MGA_1709	LOCUS_17040	sequence07:159250..160914(-)	frameshift		160919	WP_000009926.1	M9 family metallopeptidase	100.0	69.2	95.1
MGA_1710	LOCUS_17050	sequence07:160911..161669(-)	frameshift		160919	WP_000009926.1	M9 family metallopeptidase	99.2	30.6	100.0
MGA_1738	LOCUS_17330	sequence07:197159..203572(+)	partial			WP_011073976.1	retention module-containing protein	98.8	72.9	42.8
MGA_1770	LOCUS_17640	sequence08:25085..26614(+)	frameshift		26470	WP_000096405.1	VWA domain-containing protein	86.6	68.3	95.2
MGA_1771	LOCUS_17650	sequence08:26730..27017(+)	frameshift		26482	WP_000096405.1	VWA domain-containing protein	100.0	14.7	94.7
MGA_1815	LOCUS_18090	sequence08:81300..81821(-)	frameshift		81302	WP_001882971.1	type VI secretion system membrane subunit TssM	100.0	14.6	97.7
MGA_1821	LOCUS_18150	sequence08:88915..89460(-)	frameshift		89450	WP_000458007.1	type VI secretion system baseplate subunit TssK	98.9	40.3	99.4
MGA_1822	LOCUS_18160	sequence08:89346..90251(-)	frameshift		89441	WP_000458007.1	type VI secretion system baseplate subunit TssK	89.7	60.8	100.0
MGA_1829	LOCUS_18230	sequence08:96929..97240(-)	frameshift		97262	WP_000031391.1	type VI secretion system contractile sheath small subunit	100.0	61.3	100.0
MGA_1830	LOCUS_18240	sequence08:97260..97436(-)	frameshift		97262	WP_000031391.1	type VI secretion system contractile sheath small subunit	100.0	34.5	100.0
MGA_1943	LOCUS_19350	sequence09:33407..33895(-)	partial			WP_032468650.1	ComF family protein	100.0	56.6	91.4
MGA_1961	LOCUS_19530	sequence09:56165..58408(-)	frameshift		58362	WP_206819303.1	pullulanase-type alpha-1,6-glucosidase	97.6	53.8	58.9
MGA_1962	LOCUS_19540	sequence09:58315..59805(-)	frameshift		58365	WP_005482097.1	pullulanase-type alpha-1,6-glucosidase	58.5	22.6	30.4
MGA_2089	LOCUS_20800	sequence10:3211..3525(-)	internal_stop_codon	3733..3735(-)		WP_001183929.1	hypothetical protein	100.0	31.5	100.0
MGA_2090	LOCUS_20810	sequence10:3733..4206(-)	internal_stop_codon	3733..3735(-)		WP_001183929.1	hypothetical protein	100.0	47.6	94.9
MGA_2107	LOCUS_20980	sequence10:25172..25405(+)	partial			WP_011070746.1	AlpA family phage regulatory protein	79.2	73.2	62.3
MGA_2151	LOCUS_21410	sequence10:77504..77908(-)	frameshift,internal_stop_codon	77504..77506(-)	77906	WP_000027427.1	ISAs1-like element ISEc26 family transposase	100.0	34.4	49.3
MGA_2152	LOCUS_21420	sequence10:77895..78122(-)	frameshift,internal_stop_codon	78207..78209(-)	77909	WP_000027427.1	ISAs1-like element ISEc26 family transposase	85.3	16.4	60.9
MGA_2153	LOCUS_21430	sequence10:78207..78404(-)	internal_stop_codon	78207..78209(-)		WP_000420971.1	ISAs1-like element ISEc1 family transposase	86.2	14.8	67.9
MGA_2276	LOCUS_22650	sequence11:49250..49447(+)	partial			WP_005477197.1	hypothetical protein	72.3	66.2	59.6
MGA_2392	LOCUS_23810	sequence12:12658..16806(-)	internal_stop_codon	16903..16905(-)		WP_000126926.1	NAD-glutamate dehydrogenase	99.1	84.9	98.8
MGA_2393	LOCUS_23820	sequence12:16903..17499(-)	internal_stop_codon	16903..16905(-)		WP_000126926.1	NAD-glutamate dehydrogenase	100.0	12.3	100.0
MGA_2492	LOCUS_24810	sequence12:128251..128838(+)	frameshift		128228	WP_000340058.1	diguanylate cyclase	100.0	55.2	99.5
MGA_2508	LOCUS_24970	sequence12:142870..143091(-)	partial			WP_001095833.1	23S rRNA (adenine(1618)-N(6))-methyltransferase RlmF	100.0	20.2	98.6
MGA_2510	LOCUS_24980	sequence13:9..434(-)	partial			WP_102964529.1	IS481 family transposase	100.0	43.4	97.9
MGA_2515	LOCUS_25030	sequence13:7431..8135(+)	partial			WP_010888392.1	nuclease-related domain-containing protein	88.5	61.9	33.5
MGA_2627	LOCUS_26150	sequence14:30009..30587(+)	frameshift		30473	WP_000086312.1	type II secretion system protein	91.1	68.4	86.9
MGA_2628	LOCUS_26160	sequence14:30584..30778(+)	frameshift		30473	WP_000086312.1	type II secretion system protein	100.0	25.0	98.4
MGA_2868	LOCUS_28530	sequence17:21936..22556(-)	frameshift		22630	WP_001104009.1	TDT family transporter	100.0	64.4	97.1
MGA_2869	LOCUS_28540	sequence17:22559..22897(-)	frameshift		22630	WP_001104009.1	TDT family transporter	79.5	27.8	91.0
MGA_2977	LOCUS_29610	sequence19:594..1019(+)	partial			WP_102964529.1	IS481 family transposase	100.0	43.4	97.9
MGA_2978	LOCUS_29620	sequence19:1045..1482(-)	internal_stop_codon	1507..1509(-)		WP_021706804.1	IS5-like element ISVpa3 family transposase	49.7	23.5	98.6
MGA_2979	LOCUS_29630	sequence19:1507..1725(-)	internal_stop_codon	1507..1509(-)		WP_021706804.1	IS5-like element ISVpa3 family transposase	100.0	23.5	93.1
MGA_2983	LOCUS_29670	sequence19:8634..11522(+)	partial			WP_011263458.1	beta/gamma crystallin-related protein	7.8	44.3	44.9
MGA_3004	LOCUS_29880	sequence19:31711..32367(+)	partial			WP_001880634.1	M23 family metallopeptidase	100.0	72.2	100.0
MGA_3006	LOCUS_29900	sequence19:33190..33456(+)	frameshift		33432	WP_000702220.1	accessory colonization factor AcfD	92.0	5.3	100.0
MGA_3008	LOCUS_29920	sequence19:38384..38620(-)	frameshift,internal_stop_codon	38327..38329(-),38622..38624(-),38715..38717(-),38685..38687(-)	38384,38804,38669	WP_000002768.1	tyrosine-type recombinase/integrase	100.0	19.0	78.2
MGA_3009	LOCUS_29930	sequence19:38790..38948(-)	frameshift,internal_stop_codon	39003..39005(-),38715..38717(-),39108..39110(-),38685..38687(-),38622..38624(-)	38672,39162,38804	WP_000002768.1	tyrosine-type recombinase/integrase	98.1	12.4	82.4
MGA_3061	LOCUS_30440	sequence20:32851..34356(-)	frameshift		34333	WP_001125273.1	cytolysin VCC	98.4	66.5	99.0
MGA_3062	LOCUS_30450	sequence20:34331..34996(-)	frameshift		34333	WP_001125273.1	cytolysin VCC	100.0	29.8	99.5
MGA_3077	LOCUS_30590	sequence21:1971..9854(-)	partial			WP_172625977.1	MARTX multifunctional-autoprocessing repeats-in-toxin holotoxin RtxA	100.0	57.8	98.0
MGA_3078	LOCUS_30600	sequence21:10023..11129(+)	partial			WP_149560561.1	RTX toxin T1SS ABC transporter subunit RtxB	94.6	49.6	97.1
MGA_3156	LOCUS_31350	sequence23:48..806(+)	partial			WP_000453414.1	dicarboxylate/amino acid:cation symporter	88.9	53.6	100.0
MGA_3195	LOCUS_31730	sequence24:9..434(-)	partial			WP_102964529.1	IS481 family transposase	100.0	43.4	97.9
MGA_3276	LOCUS_32510	sequence26:58..279(+)	partial			WP_001217709.1	GMP reductase	100.0	21.0	100.0
MGA_3296	LOCUS_32710	sequence26:13154..13831(+)	partial			WP_011262463.1	Bro-N domain-containing protein	46.2	56.6	57.7
MGA_3317	LOCUS_32920	sequence26:28797..30635(+)	partial			WP_013097383.1	phage tail protein	48.5	44.8	38.2
MGA_3324	LOCUS_32980	sequence27:2533..3774(+)	partial			WP_015038871.1	SIR2 family protein	40.9	37.9	35.6
MGA_3325	LOCUS_32990	sequence27:3778..5589(+)	partial			WP_011084726.1	DUF87 domain-containing protein	28.4	26.2	35.9
MGA_3326	LOCUS_33000	sequence27:5848..7224(-)	partial			WP_009889821.1	UvrD-helicase domain-containing protein	41.7	48.7	28.3
MGA_3327	LOCUS_33010	sequence27:7221..8918(-)	partial			WP_011963675.1	ATP-dependent endonuclease	75.0	69.8	26.1
MGA_3330	LOCUS_33040	sequence27:9839..10603(-)	partial			WP_011262056.1	type II toxin-antitoxin system HipA family toxin	96.9	56.3	44.4
MGA_3344	LOCUS_33180	sequence28:1156..2814(+)	partial			WP_023003660.1	recombinase family protein	37.7	36.1	30.6
MGA_3375	LOCUS_33480	sequence29:5189..5497(-)	internal_stop_codon	5660..5662(-)		WP_000373826.1	cupin domain-containing protein	100.0	60.0	99.0
MGA_3435	LOCUS_34030	sequence31:14847..15083(+)	partial			WP_014164108.1	hypothetical protein	98.7	67.5	64.6
MGA_3446	LOCUS_34140	sequence32:7726..8115(-)	partial			WP_001894072.1	translation initiation factor IF-3	100.0	70.5	90.7
MGA_3451	LOCUS_34190	sequence32:12665..13780(-)	frameshift		12748	WP_010895476.1	hypothetical protein	89.5	81.6	99.4
MGA_3453	LOCUS_34200	sequence33:132..272(+)	frameshift		93	WP_000415750.1	hypothetical protein	100.0	32.6	100.0
MGA_3470	LOCUS_34370	sequence33:13094..13816(-)	partial			WP_000019370.1	IS5-like element ISVch5 family transposase	100.0	73.6	100.0
MGA_3487	LOCUS_34530	sequence34:11448..12686(+)	partial			WP_011072650.1	SGNH/GDSL hydrolase family protein	69.9	49.7	27.1
MGA_3491	LOCUS_34560	sequence35:1056..1559(-)	frameshift		1690	WP_011072631.1	phage protease	100.0	52.0	53.9
MGA_3492	LOCUS_34570	sequence35:1595..2011(-)	frameshift		1690	WP_011072631.1	phage protease	74.6	32.3	73.8
MGA_3495	LOCUS_34600	sequence35:3260..3772(-)	partial			WP_000785540.1	tail needle knob protein	84.7	50.0	40.3
MGA_3507	LOCUS_34720	sequence35:10830..11246(-)	partial			WP_011070977.1	Mor transcription activator family protein	79.7	74.8	30.1
MGA_3532	LOCUS_34950	sequence38:4941..5306(+)	partial			WP_011072604.1	Mu phage protein Kil	62.8	67.9	40.8
MGA_3572	LOCUS_35290	sequence42:484..726(-)	partial			WP_014164108.1	hypothetical protein	100.0	68.4	98.8
MGA_3583	LOCUS_35400	sequence43:58..279(+)	partial			WP_001217709.1	GMP reductase	100.0	21.0	100.0
MGA_3596	LOCUS_35520	sequence44:5628..5849(+)	internal_stop_codon	5592..5594(+)		WP_080033391.1	DUF1289 domain-containing protein	98.6	77.4	95.8
MGA_3603	LOCUS_35580	sequence46:1..1134(+)	partial			WP_000098688.1	transketolase	100.0	56.7	98.4
MGA_3609	LOCUS_35620	sequence47:1129..1680(-)	partial			WP_053407642.1	helix-turn-helix domain-containing protein	45.9	38.8	45.2
MGA_3617	LOCUS_35690	sequence48:1511..2254(-)	partial			WP_001268534.1	minor coat protein pIII	100.0	62.5	84.6
MGA_3643	LOCUS_35900	sequence58:73..381(+)	frameshift		330	WP_094958998.1	IS3 family transposase	88.2	23.0	96.7
