# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_1	LOCUS_00010	sequence01:1..605(+)	partial			WP_011267592.1	RHS repeat-associated core domain-containing protein	41.0	8.7	57.3
MGA_3	LOCUS_00030	sequence01:1141..1416(-)	partial			WP_003109297.1	hypothetical protein	79.1	64.3	98.6
MGA_73	LOCUS_00720	sequence01:84509..85813(+)	frameshift		85762	WP_003091643.1	long-chain-fatty-acid--CoA ligase FadD1	96.3	74.4	100.0
MGA_74	LOCUS_00730	sequence01:85852..86196(+)	frameshift		85762	WP_003091643.1	long-chain-fatty-acid--CoA ligase FadD1	100.0	20.3	100.0
MGA_81	LOCUS_00800	sequence01:96451..96708(+)	frameshift,internal_stop_codon	96722..96724(+),96721..96723(+)	96657,96805,96457,96795,96652	WP_003114072.1	DUF3304 domain-containing protein	83.5	24.9	91.5
MGA_84	LOCUS_00830	sequence01:98865..100205(+)	partial			WP_010895654.1	DUF2235 domain-containing protein	100.0	50.6	91.9
MGA_146	LOCUS_01450	sequence01:162823..162981(+)	partial			WP_003109182.1	DUF3309 family protein	73.1	73.1	81.6
MGA_194	LOCUS_01910	sequence02:510..842(-)	partial			WP_010895518.1	hypothetical protein	71.8	63.2	98.7
MGA_322	LOCUS_03180	sequence03:10405..11325(-)	partial			WP_011976361.1	NAD(P)-dependent oxidoreductase	49.0	51.4	34.7
MGA_334	LOCUS_03300	sequence03:25896..27482(+)	partial			WP_003102337.1	DUF1302 domain-containing protein	63.6	59.3	31.8
MGA_449	LOCUS_04430	sequence04:43937..44071(+)	partial			WP_010895590.1	hypothetical protein	100.0	57.9	97.7
MGA_469	LOCUS_04630	sequence04:74079..74225(+)	partial			WP_011389030.1	anaerobic ribonucleoside-triphosphate reductase	68.8	56.9	63.6
MGA_620	LOCUS_06090	sequence07:578..820(-)	frameshift		628	WP_010895518.1	hypothetical protein	68.8	44.0	96.4
MGA_657	LOCUS_06460	sequence07:47206..48417(-)	partial			WP_010895515.1	type II secretion system protein GspL	70.2	74.3	86.2
MGA_709	LOCUS_06950	sequence11:15990..18704(-)	partial			WP_001390260.1	phage tail tape measure protein	71.9	67.1	31.3
MGA_715	LOCUS_07010	sequence11:21499..23787(-)	partial			WP_003113198.1	phage tail protein	45.1	50.2	66.0
MGA_810	LOCUS_07960	sequence11:119371..119667(+)	partial			WP_003118646.1	DUF3649 domain-containing protein	100.0	55.4	86.7
MGA_874	LOCUS_08600	sequence11:184680..184853(-)	partial			WP_011969604.1	XapX domain-containing protein	96.5	64.9	57.4
MGA_972	LOCUS_09580	sequence11:286275..286703(+)	partial			WP_003123219.1	HIT domain-containing protein	100.0	67.9	100.0
MGA_994	LOCUS_09800	sequence11:303756..304133(+)	partial			WP_003114318.1	transporter substrate-binding domain-containing protein	87.2	9.0	44.0
MGA_1006	LOCUS_09920	sequence11:317373..318011(-)	frameshift		318060	WP_003108614.1	multiple virulence factor transcriptional regulator MvfR	100.0	63.9	98.1
MGA_1007	LOCUS_09930	sequence11:317977..318354(-)	frameshift		318060	WP_003108614.1	multiple virulence factor transcriptional regulator MvfR	77.6	29.2	94.8
MGA_1101	LOCUS_10870	sequence11:411029..412159(+)	partial			WP_010926041.1	aromatic ring-hydroxylating dioxygenase subunit alpha	49.7	48.3	33.9
MGA_1103	LOCUS_10890	sequence11:412851..413933(+)	partial			WP_011460782.1	FkbM family methyltransferase	53.6	53.9	33.0
MGA_1106	LOCUS_10920	sequence11:419049..419435(+)	partial			WP_003112502.1	flagellar protein FlaG	58.6	61.0	56.0
MGA_1150	LOCUS_11360	sequence11:460560..460973(-)	frameshift		460975	WP_010895540.1	thiol-disulfide oxidoreductase DCC family protein	88.3	69.9	86.8
MGA_1167	LOCUS_11530	sequence11:479286..481142(+)	partial			WP_003112476.1	S-type pyocin domain-containing protein	89.5	72.4	71.8
MGA_1169	LOCUS_11550	sequence11:481922..482266(+)	frameshift		481779,481797	WP_003100853.1	hypothetical protein	57.0	52.8	73.8
MGA_1173	LOCUS_11590	sequence11:484732..486450(-)	partial			WP_164929046.1	AIPR family protein	24.1	23.1	29.8
MGA_1213	LOCUS_11990	sequence11:530924..531901(+)	partial			WP_011016192.1	retron St85 family RNA-directed DNA polymerase	63.7	58.2	24.6
MGA_1222	LOCUS_12080	sequence11:535519..536589(+)	partial			WP_010895519.1	phage coat protein A	87.6	73.8	67.6
MGA_1265	LOCUS_12510	sequence11:579128..579316(+)	partial			WP_003082517.1	DUF1656 domain-containing protein	71.0	67.7	79.5
MGA_1386	LOCUS_13720	sequence11:710678..711016(+)	partial			WP_003082789.1	hypothetical protein	100.0	47.7	80.4
MGA_1393	LOCUS_13790	sequence11:716236..716505(+)	partial			WP_010895554.1	MoaD/ThiS family protein	100.0	70.6	87.6
MGA_1401	LOCUS_13870	sequence11:722552..723076(+)	partial			WP_003082855.1	RNA polymerase sigma factor	100.0	70.7	99.4
MGA_1413	LOCUS_13990	sequence11:736359..736760(+)	partial			WP_011035672.1	efflux transporter outer membrane subunit	98.5	26.7	71.8
MGA_1436	LOCUS_14220	sequence11:764647..764976(-)	partial			WP_003112412.1	adenylyl-sulfate kinase	100.0	55.6	97.2
MGA_1522	LOCUS_15080	sequence11:853786..853962(+)	partial			WP_003083136.1	heme exporter protein CcmD	65.5	65.5	100.0
MGA_1627	LOCUS_16130	sequence11:967425..967613(+)	partial			WP_003087397.1	YkgJ family cysteine cluster protein	100.0	73.8	100.0
MGA_1710	LOCUS_16960	sequence11:1056983..1057306(+)	partial			WP_003413692.1	PAAR domain-containing protein	52.3	31.0	78.6
MGA_1747	LOCUS_17330	sequence11:1093469..1093867(-)	partial			WP_010895580.1	type III secretion system needle length determinant PscP	100.0	35.8	87.1
MGA_1801	LOCUS_17870	sequence11:1139856..1140140(+)	partial			WP_003132845.1	GNAT family N-acetyltransferase	100.0	58.4	98.9
MGA_1948	LOCUS_19340	sequence11:1310378..1310749(+)	partial			WP_003118964.1	hypothetical protein	89.4	33.6	100.0
MGA_2001	LOCUS_19780	sequence19:26594..27034(-)	partial			WP_010895512.1	phage tail assembly chaperone	76.7	73.7	42.9
MGA_2050	LOCUS_20270	sequence19:77524..77709(+)	partial			WP_046463959.1	site-specific integrase	70.5	11.7	86.0
MGA_2067	LOCUS_20440	sequence19:91322..91747(+)	partial			WP_003121808.1	nuclear transport factor 2 family protein	100.0	64.7	100.0
MGA_2092	LOCUS_20690	sequence19:115541..115804(+)	partial			WP_003118870.1	hypothetical protein	100.0	51.8	100.0
MGA_2148	LOCUS_21250	sequence19:166204..166893(+)	frameshift		166205	WP_003113260.1	LysR family transcriptional regulator	100.0	72.5	96.5
MGA_2180	LOCUS_21570	sequence19:200917..201321(-)	frameshift		201431	WP_003121770.1	hotdog domain-containing protein	100.0	74.9	100.0
MGA_2236	LOCUS_22130	sequence19:270932..271102(+)	partial			WP_005482461.1	DUF167 family protein YggU	87.5	51.0	53.1
MGA_2372	LOCUS_23490	sequence19:412295..413164(+)	partial			WP_011103200.1	lipid II-degrading bacteriocin	54.7	55.8	40.3
MGA_2427	LOCUS_24040	sequence19:468160..468972(-)	frameshift		467982	WP_003117234.1	energy transducer TonB	35.6	35.6	100.0
MGA_2634	LOCUS_26110	sequence19:701202..701426(+)	partial			WP_003146853.1	hypothetical protein	100.0	58.3	95.9
MGA_2641	LOCUS_26180	sequence19:707604..707861(+)	partial			WP_003097235.1	F0F1 ATP synthase subunit C	74.1	74.1	95.2
MGA_2869	LOCUS_28420	sequence24:34777..35313(+)	partial			WP_197524122.1	glycosyltransferase family 4 protein	96.1	64.2	36.8
MGA_3037	LOCUS_30090	sequence24:230208..233399(-)	partial			WP_010895645.1	ribonuclease E	57.2	57.5	94.7
MGA_3057	LOCUS_30280	sequence24:250480..251271(-)	partial			WP_003112560.1	IS3 family transposase	72.2	67.9	97.9
MGA_3064	LOCUS_30350	sequence24:258090..258503(+)	partial			WP_011035718.1	virulence RhuM family protein	59.1	24.1	48.1
MGA_3089	LOCUS_30600	sequence24:286605..286736(+)	partial			WP_010895643.1	hypothetical protein	100.0	27.0	100.0
MGA_3131	LOCUS_31020	sequence24:327629..328219(+)	partial			WP_003091000.1	hypothetical protein	54.6	76.4	100.0
MGA_3165	LOCUS_31360	sequence24:364063..364380(+)	partial			WP_003119864.1	hypothetical protein	100.0	71.9	100.0
MGA_3208	LOCUS_31780	sequence24:406375..406512(-)	partial			WP_003090889.1	PA2816 family glutamine-rich protein	66.7	23.8	100.0
MGA_3256	LOCUS_32260	sequence24:447847..448068(+)	partial			WP_003143767.1	hypothetical protein	100.0	55.3	94.5
MGA_3275	LOCUS_32450	sequence24:461352..461654(+)	partial			WP_003122559.1	hypothetical protein	100.0	69.4	98.0
MGA_3303	LOCUS_32730	sequence24:479708..480016(-)	frameshift,internal_stop_codon	480064..480066(-)	480027	WP_164689163.1	IS3 family transposase	80.4	23.2	37.8
MGA_3304	LOCUS_32740	sequence24:480529..482235(+)	partial			WP_011459236.1	DUF3578 domain-containing protein	62.7	34.7	34.3
MGA_3305	LOCUS_32750	sequence24:482232..483809(+)	partial			WP_010876141.1	DUF2357 domain-containing protein	52.8	50.3	28.3
MGA_3306	LOCUS_32760	sequence24:483795..487721(-)	partial			WP_052729532.1	DNA methyltransferase	36.9	57.9	34.4
MGA_3307	LOCUS_32770	sequence24:487907..488491(+)	partial			WP_012583655.1	DEAD/DEAH box helicase family protein	91.2	16.1	35.0
MGA_3309	LOCUS_32790	sequence24:488791..489972(-)	partial			WP_167355291.1	hypothetical protein	39.4	23.7	26.8
MGA_3311	LOCUS_32810	sequence24:490465..490857(+)	frameshift		490689	WP_003112560.1	IS3 family transposase	57.7	26.8	100.0
MGA_3312	LOCUS_32820	sequence24:490793..491308(+)	frameshift		490689	WP_003112560.1	IS3 family transposase	100.0	61.1	95.9
MGA_3315	LOCUS_32850	sequence24:493270..499566(-)	partial			WP_046463281.1	WGR domain-containing protein	25.8	29.0	31.4
MGA_3382	LOCUS_33520	sequence24:566995..567261(-)	partial			WP_011035581.1	YfeK family protein	97.7	69.6	50.6
MGA_3555	LOCUS_35250	sequence24:768544..769458(-)	frameshift		769348	WP_010895622.1	LysR substrate-binding domain-containing protein	88.5	77.5	98.1
MGA_3557	LOCUS_35270	sequence24:770838..771506(-)	partial			WP_003113001.1	TolC family protein	98.2	46.3	93.6
MGA_3586	LOCUS_35560	sequence24:799901..>801891(-)	partial			WP_011267592.1	RHS repeat-associated core domain-containing protein	83.1	61.6	49.8
MGA_3617	LOCUS_35860	sequence25:26601..27167(+)	internal_stop_codon	27165..27167(+)		WP_003114092.1	alpha/beta hydrolase	100.0	63.5	97.9
MGA_3618	LOCUS_35870	sequence25:27201..27491(+)	internal_stop_codon	27165..27167(+)		WP_003114092.1	alpha/beta hydrolase	100.0	32.4	93.8
MGA_3769	LOCUS_37380	sequence25:188913..189047(+)	partial			WP_004528349.1	DUF2165 domain-containing protein	68.2	18.4	80.0
MGA_3791	LOCUS_37600	sequence25:212876..213751(-)	frameshift,internal_stop_codon	213988..213990(-)	213777	WP_089600859.1	IS3 family transposase	100.0	75.9	61.5
MGA_3792	LOCUS_37610	sequence25:213748..213975(-)	frameshift,internal_stop_codon	213988..213990(-)	213780	WP_157861812.1	IS3 family transposase	96.0	18.8	59.7
MGA_3928	LOCUS_38970	sequence25:361736..362638(+)	frameshift		361614	WP_010895661.1	peptide chain release factor 2	100.0	82.4	96.3
MGA_4351	LOCUS_43170	sequence26:89428..89745(+)	partial			WP_003098240.1	transcriptional regulator SutA	70.5	70.5	94.6
MGA_4373	LOCUS_43390	sequence26:113023..113646(+)	partial			WP_003120367.1	hypothetical protein	100.0	64.1	97.6
MGA_4384	LOCUS_43500	sequence26:123670..124779(+)	frameshift		124740,124870,124743,124876,125023	WP_003115263.1	alginate regulator AlgP	36.0	37.8	95.5
MGA_4413	LOCUS_43790	sequence26:155848..156057(-)	partial			WP_003123689.1	TIGR02449 family protein	100.0	67.0	92.8
MGA_4526	LOCUS_44920	sequence26:278375..278866(-)	partial			WP_003114472.1	helix-turn-helix domain-containing protein	49.7	57.4	92.6
MGA_4574	LOCUS_45400	sequence26:334655..335083(-)	partial			WP_003115042.1	Sec-independent protein translocase protein TatB	63.4	63.8	95.6
MGA_4583	LOCUS_45490	sequence26:340210..341139(+)	frameshift,internal_stop_codon	340350..340352(+),341266..341268(+),341137..341139(+)	341121,341140,340196,341174,340361,340619,340445	WP_003146415.1	phasin family protein	44.7	44.7	94.9
MGA_4626	LOCUS_45920	sequence26:398203..400008(-)	frameshift		400139	WP_003114559.1	phosphodiesterase DipA	100.0	66.9	99.0
MGA_4627	LOCUS_45930	sequence26:400062..400904(-)	frameshift		400139	WP_003114559.1	phosphodiesterase DipA	91.8	28.6	98.4
MGA_4774	LOCUS_47400	sequence26:572223..572513(+)	partial			WP_003095479.1	PsiF family protein	99.0	70.3	88.7
MGA_4860	LOCUS_48250	sequence27:20673..20924(+)	partial			WP_003120837.1	hypothetical protein	100.0	36.4	98.8
MGA_5120	LOCUS_50850	sequence27:301103..301387(+)	partial			WP_005769278.1	PP0621 family protein	84.0	73.1	44.3
MGA_5161	LOCUS_51260	sequence27:343821..344198(+)	partial			WP_003107850.1	hypothetical protein	68.8	68.8	90.7
MGA_5204	LOCUS_51690	sequence27:394420..>395927(-)	partial			WP_003148161.1	two-partner secretion system adhesin CdrA	100.0	23.3	92.0
MGA_5231	LOCUS_51950	sequence28:28109..28312(-)	partial			WP_003113684.1	cyanide-forming glycine dehydrogenase subunit HcnA	100.0	64.4	98.5
MGA_5233	LOCUS_51970	sequence28:28659..28886(+)	partial			WP_011102274.1	alpha-glucosidase	68.0	10.5	57.9
MGA_5293	LOCUS_52570	sequence28:87893..88282(-)	partial			WP_003120287.1	response regulator	100.0	72.5	99.2
MGA_5361	LOCUS_53250	sequence28:160690..160965(-)	partial			WP_003114860.1	nitrilase family protein	71.4	24.1	81.5
MGA_5479	LOCUS_54410	sequence29:34533..35546(+)	partial			WP_011263060.1	GNAT family N-acetyltransferase	57.3	63.7	51.3
MGA_5484	LOCUS_54460	sequence29:52183..52695(-)	partial			WP_010895615.1	Bro-N domain-containing protein	100.0	64.4	94.1
MGA_5515	LOCUS_54740	sequence29:82774..95184(+)	partial			WP_010895613.1	non-ribosomal peptide synthetase	74.0	59.3	69.1
MGA_5558	LOCUS_55170	sequence29:163161..163427(+)	partial			WP_010895608.1	hypothetical protein	100.0	68.2	100.0
MGA_5693	LOCUS_56500	sequence30:75795..76385(+)	internal_stop_codon	76383..76385(+)		WP_023187660.1	LysE family translocator	100.0	79.0	95.4
MGA_5708	LOCUS_56650	sequence30:94058..95488(-)	frameshift		93845,93902	WP_010895670.1	cytochrome c oxidase accessory protein CcoG	100.0	83.1	93.7
MGA_5740	LOCUS_56970	sequence30:130150..130554(+)	partial			WP_003088835.1	DUF2790 domain-containing protein	45.5	76.2	49.2
