# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_203	LOCUS_02030	sequence1:227721..228533(+)	frameshift		228710	WP_003117234.1	energy transducer TonB	35.6	35.6	100.0
MGA_258	LOCUS_02580	sequence1:283529..284398(-)	partial			WP_011103200.1	lipid II-degrading bacteriocin	54.7	55.8	40.3
MGA_393	LOCUS_03930	sequence1:425591..425761(-)	partial			WP_005482461.1	DUF167 family protein YggU	87.5	51.0	53.1
MGA_449	LOCUS_04490	sequence1:495372..495776(+)	frameshift		495261	WP_003121770.1	hotdog domain-containing protein	100.0	74.9	100.0
MGA_481	LOCUS_04810	sequence1:529800..530489(-)	frameshift		530487	WP_003113260.1	LysR family transcriptional regulator	100.0	72.5	96.5
MGA_536	LOCUS_05360	sequence1:580889..581152(-)	partial			WP_003118870.1	hypothetical protein	100.0	51.8	100.0
MGA_561	LOCUS_05610	sequence1:604946..605371(-)	partial			WP_003121808.1	nuclear transport factor 2 family protein	100.0	64.7	100.0
MGA_578	LOCUS_05780	sequence1:618984..619169(-)	partial			WP_046463959.1	site-specific integrase	70.5	11.7	86.0
MGA_627	LOCUS_06270	sequence1:669659..670099(+)	partial			WP_010895512.1	phage tail assembly chaperone	76.7	73.7	42.9
MGA_791	LOCUS_07910	sequence1:851454..852044(+)	internal_stop_codon	852042..852044(+)		WP_023187660.1	LysE family translocator	100.0	79.0	95.4
MGA_806	LOCUS_08060	sequence1:869717..871147(-)	frameshift		869504,869561	WP_010895670.1	cytochrome c oxidase accessory protein CcoG	100.0	83.1	93.7
MGA_838	LOCUS_08380	sequence1:905809..906213(+)	partial			WP_003088835.1	DUF2790 domain-containing protein	45.5	76.2	49.2
MGA_947	LOCUS_09470	sequence1:1014652..1015218(+)	internal_stop_codon	1015216..1015218(+)		WP_003114092.1	alpha/beta hydrolase	100.0	63.5	97.9
MGA_948	LOCUS_09480	sequence1:1015252..1015542(+)	internal_stop_codon	1015216..1015218(+)		WP_003114092.1	alpha/beta hydrolase	100.0	32.4	93.8
MGA_1099	LOCUS_10990	sequence1:1176964..1177098(+)	partial			WP_004528349.1	DUF2165 domain-containing protein	68.2	18.4	80.0
MGA_1121	LOCUS_11210	sequence1:1200927..1201802(-)	frameshift,internal_stop_codon	1202039..1202041(-)	1201828	WP_089600859.1	IS3 family transposase	100.0	75.9	61.5
MGA_1122	LOCUS_11220	sequence1:1201799..1202026(-)	frameshift,internal_stop_codon	1202039..1202041(-)	1201831	WP_157861812.1	IS3 family transposase	96.0	18.8	59.7
MGA_1258	LOCUS_12580	sequence1:1349787..1350689(+)	frameshift		1349665	WP_010895661.1	peptide chain release factor 2	100.0	82.4	96.3
MGA_1595	LOCUS_15930	sequence1:1709342..1710133(+)	partial			WP_010895620.1	RHS repeat protein	88.2	71.5	77.7
MGA_1598	LOCUS_15960	sequence1:1713425..1713700(-)	partial			WP_003109297.1	hypothetical protein	79.1	64.3	98.6
MGA_1668	LOCUS_16650	sequence1:1796793..1798097(+)	frameshift		1798046	WP_003091643.1	long-chain-fatty-acid--CoA ligase FadD1	96.3	74.4	100.0
MGA_1669	LOCUS_16660	sequence1:1798136..1798480(+)	frameshift		1798046	WP_003091643.1	long-chain-fatty-acid--CoA ligase FadD1	100.0	20.3	100.0
MGA_1676	LOCUS_16730	sequence1:1808735..1808992(+)	frameshift,internal_stop_codon	1809006..1809008(+),1809005..1809007(+)	1809089,1808741,1809079,1808936,1808941	WP_003114072.1	DUF3304 domain-containing protein	83.5	24.9	91.5
MGA_1679	LOCUS_16760	sequence1:1811149..1812489(+)	partial			WP_010895654.1	DUF2235 domain-containing protein	100.0	50.6	91.9
MGA_1741	LOCUS_17380	sequence1:1875107..1875265(+)	partial			WP_003109182.1	DUF3309 family protein	73.1	73.1	81.6
MGA_1817	LOCUS_18140	sequence1:1952731..1953267(+)	partial			WP_197524122.1	glycosyltransferase family 4 protein	96.1	64.2	36.8
MGA_1985	LOCUS_19810	sequence1:2148162..2151353(-)	partial			WP_010895645.1	ribonuclease E	57.2	57.5	94.7
MGA_2005	LOCUS_20000	sequence1:2168434..2169225(-)	partial			WP_003112560.1	IS3 family transposase	72.2	67.9	97.9
MGA_2012	LOCUS_20070	sequence1:2176044..2176457(+)	partial			WP_011035718.1	virulence RhuM family protein	59.1	24.1	48.1
MGA_2037	LOCUS_20320	sequence1:2204559..2204690(+)	partial			WP_010895643.1	hypothetical protein	100.0	27.0	100.0
MGA_2079	LOCUS_20740	sequence1:2245583..2246173(+)	partial			WP_003091000.1	hypothetical protein	54.6	76.4	100.0
MGA_2113	LOCUS_21080	sequence1:2282017..2282334(+)	partial			WP_003119864.1	hypothetical protein	100.0	71.9	100.0
MGA_2156	LOCUS_21500	sequence1:2324329..2324466(-)	partial			WP_003090889.1	PA2816 family glutamine-rich protein	66.7	23.8	100.0
MGA_2204	LOCUS_21980	sequence1:2365801..2366022(+)	partial			WP_003143767.1	hypothetical protein	100.0	55.3	94.5
MGA_2223	LOCUS_22170	sequence1:2379306..2379608(+)	partial			WP_003122559.1	hypothetical protein	100.0	69.4	98.0
MGA_2251	LOCUS_22450	sequence1:2397662..2397970(-)	frameshift,internal_stop_codon	2398018..2398020(-)	2397981	WP_164689163.1	IS3 family transposase	80.4	23.2	37.8
MGA_2252	LOCUS_22460	sequence1:2398483..2400189(+)	partial			WP_011459236.1	DUF3578 domain-containing protein	62.7	34.7	34.3
MGA_2253	LOCUS_22470	sequence1:2400186..2401763(+)	partial			WP_010876141.1	DUF2357 domain-containing protein	52.8	50.3	28.3
MGA_2254	LOCUS_22480	sequence1:2401749..2405675(-)	partial			WP_052729532.1	DNA methyltransferase	36.9	57.9	34.4
MGA_2255	LOCUS_22490	sequence1:2405861..2406445(+)	partial			WP_012583655.1	DEAD/DEAH box helicase family protein	91.2	16.1	35.0
MGA_2257	LOCUS_22510	sequence1:2406745..2407926(-)	partial			WP_167355291.1	hypothetical protein	39.4	23.7	26.8
MGA_2259	LOCUS_22530	sequence1:2408410..2408811(+)	frameshift		2408643	WP_003112560.1	IS3 family transposase	56.4	26.8	100.0
MGA_2260	LOCUS_22540	sequence1:2408747..2409262(+)	frameshift		2408643	WP_003112560.1	IS3 family transposase	100.0	61.1	95.9
MGA_2263	LOCUS_22570	sequence1:2411224..2417520(-)	partial			WP_046463281.1	WGR domain-containing protein	25.8	29.0	31.4
MGA_2329	LOCUS_23230	sequence1:2484949..2485215(-)	partial			WP_011035581.1	YfeK family protein	97.7	69.6	50.6
MGA_2502	LOCUS_24960	sequence1:2686497..2687411(-)	frameshift		2687301	WP_010895622.1	LysR substrate-binding domain-containing protein	88.5	77.5	98.1
MGA_2504	LOCUS_24980	sequence1:2688791..2689459(-)	partial			WP_003113001.1	TolC family protein	98.2	46.3	93.6
MGA_2534	LOCUS_25280	sequence1:2720532..2721323(-)	partial			WP_010895620.1	RHS repeat protein	88.2	71.5	76.4
MGA_2563	LOCUS_25570	sequence1:2755414..2756427(+)	partial			WP_011263060.1	GNAT family N-acetyltransferase	57.3	63.7	51.3
MGA_2568	LOCUS_25620	sequence1:2773064..2773576(-)	partial			WP_010895615.1	Bro-N domain-containing protein	100.0	64.4	94.1
MGA_2598	LOCUS_25890	sequence1:2803656..2816066(+)	partial			WP_010895613.1	non-ribosomal peptide synthetase	74.0	59.3	69.1
MGA_2641	LOCUS_26320	sequence1:2884043..2884309(+)	partial			WP_010895608.1	hypothetical protein	100.0	68.2	100.0
MGA_2780	LOCUS_27710	sequence1:3045511..3047097(-)	partial			WP_003102337.1	DUF1302 domain-containing protein	63.6	59.3	31.8
MGA_2792	LOCUS_27830	sequence1:3061668..3062588(+)	partial			WP_011976361.1	NAD(P)-dependent oxidoreductase	49.0	51.4	34.7
MGA_2829	LOCUS_28200	sequence1:3102536..3102748(-)	partial			WP_003113684.1	cyanide-forming glycine dehydrogenase subunit HcnA	100.0	67.3	98.6
MGA_2831	LOCUS_28220	sequence1:3103086..3103313(+)	partial			WP_011102274.1	alpha-glucosidase	68.0	10.5	57.9
MGA_2891	LOCUS_28820	sequence1:3162320..3162709(-)	partial			WP_003120287.1	response regulator	100.0	72.5	99.2
MGA_2959	LOCUS_29500	sequence1:3235117..3235392(-)	partial			WP_003114860.1	nitrilase family protein	71.4	24.1	81.5
MGA_3091	LOCUS_30820	sequence1:3385193..3385327(+)	partial			WP_010895590.1	hypothetical protein	100.0	57.9	97.7
MGA_3111	LOCUS_31020	sequence1:3415335..3415481(+)	partial			WP_011389030.1	anaerobic ribonucleoside-triphosphate reductase	68.8	56.9	63.6
MGA_3144	LOCUS_31350	sequence1:3449501..3449872(-)	partial			WP_003118964.1	hypothetical protein	89.4	33.6	100.0
MGA_3291	LOCUS_32820	sequence1:3620110..3620394(-)	partial			WP_003132845.1	GNAT family N-acetyltransferase	100.0	58.4	98.9
MGA_3345	LOCUS_33360	sequence1:3666383..3666781(+)	partial			WP_010895580.1	type III secretion system needle length determinant PscP	100.0	35.8	87.1
MGA_3382	LOCUS_33730	sequence1:3702944..3703267(-)	partial			WP_003413692.1	PAAR domain-containing protein	52.3	31.0	78.6
MGA_3462	LOCUS_34530	sequence1:3789759..3790019(-)	partial			WP_003104388.1	succinate dehydrogenase, cytochrome b556 subunit	100.0	67.2	83.7
MGA_3465	LOCUS_34560	sequence1:3792637..3792825(-)	partial			WP_003087397.1	YkgJ family cysteine cluster protein	100.0	73.8	100.0
MGA_3571	LOCUS_35620	sequence1:3906288..3906464(-)	partial			WP_003083136.1	heme exporter protein CcmD	65.5	65.5	100.0
MGA_3657	LOCUS_36480	sequence1:3995274..3995603(+)	partial			WP_003112412.1	adenylyl-sulfate kinase	100.0	55.6	97.2
MGA_3680	LOCUS_36710	sequence1:4023490..4023891(-)	partial			WP_011035672.1	efflux transporter outer membrane subunit	98.5	26.7	71.8
MGA_3692	LOCUS_36830	sequence1:4037174..4037698(-)	partial			WP_003082855.1	RNA polymerase sigma factor	100.0	70.7	99.4
MGA_3700	LOCUS_36910	sequence1:4043745..4044014(-)	partial			WP_010895554.1	MoaD/ThiS family protein	100.0	70.6	87.6
MGA_3707	LOCUS_36980	sequence1:4049234..4049572(-)	partial			WP_003082789.1	hypothetical protein	100.0	47.7	80.4
MGA_3827	LOCUS_38180	sequence1:4180934..4181122(-)	partial			WP_003082517.1	DUF1656 domain-containing protein	71.0	67.7	79.5
MGA_3870	LOCUS_38610	sequence1:4223661..4224707(-)	partial			WP_010895519.1	phage coat protein A	89.7	73.8	67.1
MGA_3879	LOCUS_38700	sequence1:4228349..4229326(-)	partial			WP_011016192.1	retron St85 family RNA-directed DNA polymerase	63.7	58.2	24.6
MGA_3919	LOCUS_39100	sequence1:4273800..4275518(+)	partial			WP_164929046.1	AIPR family protein	24.1	23.1	29.8
MGA_3923	LOCUS_39140	sequence1:4277984..4278328(-)	frameshift		4278452,4278470	WP_003100853.1	hypothetical protein	57.0	52.8	73.8
MGA_3925	LOCUS_39160	sequence1:4279108..4280964(-)	partial			WP_003112476.1	S-type pyocin domain-containing protein	89.5	72.4	71.8
MGA_3942	LOCUS_39330	sequence1:4299277..4299690(+)	frameshift		4299274	WP_010895540.1	thiol-disulfide oxidoreductase DCC family protein	88.3	69.9	86.8
MGA_3986	LOCUS_39770	sequence1:4340815..4341201(-)	partial			WP_003112502.1	flagellar protein FlaG	58.6	61.0	56.0
MGA_3989	LOCUS_39800	sequence1:4346317..4347396(-)	partial			WP_011460782.1	FkbM family methyltransferase	53.8	53.9	33.0
MGA_3991	LOCUS_39820	sequence1:4348091..4349221(-)	partial			WP_010926041.1	aromatic ring-hydroxylating dioxygenase subunit alpha	49.7	48.3	33.9
MGA_4085	LOCUS_40760	sequence1:4441896..4442273(+)	frameshift		4442189	WP_003108614.1	multiple virulence factor transcriptional regulator MvfR	77.6	29.2	94.8
MGA_4086	LOCUS_40770	sequence1:4442239..4442877(+)	frameshift		4442189	WP_003108614.1	multiple virulence factor transcriptional regulator MvfR	100.0	63.9	98.1
MGA_4098	LOCUS_40890	sequence1:4456117..4456494(-)	partial			WP_003114318.1	transporter substrate-binding domain-containing protein	87.2	9.0	44.0
MGA_4120	LOCUS_41110	sequence1:4473547..4473975(-)	partial			WP_003123219.1	HIT domain-containing protein	100.0	67.9	100.0
MGA_4218	LOCUS_42090	sequence1:4575397..4575570(+)	partial			WP_011969604.1	XapX domain-containing protein	96.5	64.9	57.4
MGA_4282	LOCUS_42730	sequence1:4640583..4640879(-)	partial			WP_003118646.1	DUF3649 domain-containing protein	100.0	55.4	86.7
MGA_4377	LOCUS_43680	sequence1:4736463..4738751(+)	partial			WP_003113198.1	phage tail protein	45.1	50.2	66.0
MGA_4382	LOCUS_43730	sequence1:4741546..4744260(+)	partial			WP_001390260.1	phage tail tape measure protein	71.9	67.1	31.3
MGA_4412	LOCUS_44030	sequence1:4764392..4764634(-)	frameshift		4764442	WP_010895518.1	hypothetical protein	68.8	44.0	96.4
MGA_4449	LOCUS_44400	sequence1:4811020..4812231(-)	partial			WP_010895515.1	type II secretion system protein GspL	70.2	74.3	86.2
MGA_4475	LOCUS_44660	sequence1:4851188..4851439(+)	partial			WP_003120837.1	hypothetical protein	100.0	36.4	98.8
MGA_4735	LOCUS_47260	sequence1:5131618..5131902(+)	partial			WP_005769278.1	PP0621 family protein	84.0	73.1	44.3
MGA_4776	LOCUS_47670	sequence1:5174336..5174713(+)	partial			WP_003107850.1	hypothetical protein	68.8	68.8	90.7
MGA_5005	LOCUS_49960	sequence1:5427616..5427948(+)	partial			WP_010895518.1	hypothetical protein	71.8	63.2	98.7
MGA_5087	LOCUS_50770	sequence1:5518564..5518854(-)	partial			WP_003095479.1	PsiF family protein	99.0	70.3	88.7
MGA_5234	LOCUS_52240	sequence1:5690173..5691015(+)	frameshift		5690937	WP_003114559.1	phosphodiesterase DipA	91.8	28.6	98.4
MGA_5235	LOCUS_52250	sequence1:5691069..5692874(+)	frameshift		5690937	WP_003114559.1	phosphodiesterase DipA	100.0	66.9	99.0
MGA_5278	LOCUS_52680	sequence1:5749938..5750867(-)	frameshift,internal_stop_codon	5750725..5750727(-),5749809..5749811(-),5749938..5749940(-)	5749936,5750880,5749955,5750631,5750457,5750715,5749902	WP_003146415.1	phasin family protein	44.7	44.7	94.9
MGA_5287	LOCUS_52770	sequence1:5755994..5756422(+)	partial			WP_003115042.1	Sec-independent protein translocase protein TatB	63.4	63.8	95.6
MGA_5335	LOCUS_53250	sequence1:5812211..5812702(+)	partial			WP_003114472.1	helix-turn-helix domain-containing protein	49.7	57.4	92.6
MGA_5448	LOCUS_54380	sequence1:5935019..5935228(+)	partial			WP_003123689.1	TIGR02449 family protein	100.0	67.0	92.8
MGA_5477	LOCUS_54670	sequence1:5966297..5967406(-)	frameshift		5966052,5966199,5966332,5966205,5966335	WP_003115263.1	alginate regulator AlgP	36.0	37.8	95.5
MGA_5488	LOCUS_54780	sequence1:5977430..5978053(-)	partial			WP_003120367.1	hypothetical protein	100.0	64.1	97.6
MGA_5510	LOCUS_55000	sequence1:6001331..6001648(-)	partial			WP_003098240.1	transcriptional regulator SutA	70.5	70.5	94.6
MGA_5787	LOCUS_57770	sequence1:6305882..6306139(-)	partial			WP_003097235.1	F0F1 ATP synthase subunit C	74.1	74.1	95.2
MGA_5794	LOCUS_57840	sequence1:6312317..6312541(-)	partial			WP_003146853.1	hypothetical protein	100.0	58.3	95.9
