# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_14	LOCUS_00140	sequence1:19589..20179(+)	internal_stop_codon	20177..20179(+)		WP_011070438.1	Xaa-Pro dipeptidase	100.0	44.6	93.9
MGA_15	LOCUS_00150	sequence1:20195..20911(+)	internal_stop_codon	20177..20179(+)		WP_011070438.1	Xaa-Pro dipeptidase	99.6	54.0	92.4
MGA_60	LOCUS_00580	sequence1:69565..70545(+)	partial			WP_012870355.1	glycosyltransferase	35.3	35.3	30.4
MGA_110	LOCUS_01080	sequence1:128884..130140(-)	frameshift		129105	WP_011074228.1	two-component system sensor histidine kinase EnvZ	82.5	78.8	92.8
MGA_117	LOCUS_01150	sequence1:138226..138801(+)	partial			WP_164925802.1	ComF family protein	100.0	72.9	82.2
MGA_124	LOCUS_01220	sequence1:145811..146326(-)	frameshift		145843,145651	WP_011071191.1	transposase	94.2	46.8	95.0
MGA_126	LOCUS_01240	sequence1:146935..147867(-)	partial			WP_169337322.1	IPT/TIG domain-containing protein	71.0	5.2	36.2
MGA_127	LOCUS_01250	sequence1:147855..152537(-)	partial			WP_169337322.1	IPT/TIG domain-containing protein	83.5	39.1	27.0
MGA_208	LOCUS_02030	sequence1:229744..229992(-)	frameshift		230045	WP_011262736.1	fumarate reductase subunit FrdD	98.8	57.9	44.4
MGA_267	LOCUS_02620	sequence1:286692..286877(-)	partial			WP_011074058.1	YceK/YidQ family lipoprotein	100.0	57.0	75.4
MGA_268	LOCUS_02630	sequence1:287773..288645(+)	partial			WP_000904079.1	type VI secretion system immunity protein TsiV2	50.7	62.4	28.4
MGA_278	LOCUS_02730	sequence1:301091..302311(+)	partial			WP_091138101.1	serine protease	46.1	30.2	32.3
MGA_291	LOCUS_02860	sequence1:311573..311848(-)	internal_stop_codon	311849..311851(-)		WP_011074036.1	3-ketoacyl-ACP reductase FabG2	100.0	37.8	96.7
MGA_292	LOCUS_02870	sequence1:311849..312298(-)	internal_stop_codon	311849..311851(-)		WP_011074036.1	3-ketoacyl-ACP reductase FabG2	100.0	61.8	87.2
MGA_298	LOCUS_02930	sequence1:318709..319305(-)	partial			WP_011074030.1	outer membrane lipoprotein carrier protein LolA	100.0	73.2	78.2
MGA_433	LOCUS_04250	sequence1:465408..465920(+)	partial			WP_139685680.1	type II secretion system protein	61.8	59.5	44.4
MGA_471	LOCUS_04630	sequence1:515767..516642(+)	partial			WP_011016055.1	toxin-antitoxin system YwqK family antitoxin	99.0	71.6	36.1
MGA_493	LOCUS_04850	sequence1:543244..544170(-)	partial			WP_013383507.1	HNH endonuclease	46.4	36.3	32.2
MGA_503	LOCUS_04950	sequence1:556707..557417(+)	partial			WP_011073744.1	single-stranded DNA-binding protein	56.4	54.6	92.5
MGA_637	LOCUS_06290	sequence1:709300..710157(+)	partial			WP_022771536.1	DUF1566 domain-containing protein	81.1	14.1	27.5
MGA_640	LOCUS_06320	sequence1:711091..711327(-)	partial			WP_003688619.1	helix-turn-helix transcriptional regulator	82.1	60.4	43.8
MGA_644	LOCUS_06360	sequence1:715844..716647(-)	partial			WP_107272294.1	HNH endonuclease	34.8	42.4	33.0
MGA_648	LOCUS_06400	sequence1:719669..723772(+)	partial			WP_169337322.1	IPT/TIG domain-containing protein	91.4	38.8	27.3
MGA_649	LOCUS_06410	sequence1:723794..724570(+)	partial			WP_169337322.1	IPT/TIG domain-containing protein	67.8	4.8	39.7
MGA_656	LOCUS_06480	sequence1:730194..730802(-)	partial			WP_000087610.1	HNH endonuclease	56.9	51.3	50.0
MGA_658	LOCUS_06500	sequence1:732138..732323(+)	frameshift,internal_stop_codon	732057..732059(+)	732284	WP_001118645.1	IS5 family transposase	91.8	18.2	58.9
MGA_711	LOCUS_07030	sequence1:785943..786200(+)	frameshift		785950	WP_011073594.1	SirB2 family protein	97.6	63.4	97.6
MGA_729	LOCUS_07210	sequence1:802743..803084(+)	frameshift		803063	WP_011073580.1	porin family protein	93.8	54.5	66.0
MGA_730	LOCUS_07220	sequence1:803110..803319(+)	frameshift		803063	WP_011073580.1	porin family protein	100.0	36.9	81.2
MGA_739	LOCUS_07310	sequence1:811029..814907(-)	partial			WP_011072016.1	S8 family serine peptidase	57.9	64.5	30.8
MGA_815	LOCUS_08070	sequence1:898556..898789(+)	frameshift		898479	WP_011071246.1	hypothetical protein	100.0	56.6	77.9
MGA_865	LOCUS_08570	sequence1:960692..961315(+)	frameshift,internal_stop_codon	960614..960616(+),960515..960517(+)	960841,960670,960510	WP_011074156.1	transposase	76.8	48.9	88.1
MGA_939	LOCUS_09270	sequence1:1039774..1040022(+)	frameshift		1039730,1040087,1039805,1040018	WP_011072286.1	IS630-like element ISSod10 family transposase	89.0	21.4	75.3
MGA_940	LOCUS_09280	sequence1:1040086..1040625(+)	frameshift		1040016,1040085	WP_011072286.1	IS630-like element ISSod10 family transposase	97.8	53.7	73.2
MGA_1004	LOCUS_09920	sequence1:1118057..1118608(+)	internal_stop_codon	1118606..1118608(+)		WP_011071487.1	gamma-glutamyl-gamma-aminobutyrate hydrolase family protein	100.0	72.3	88.5
MGA_1005	LOCUS_09930	sequence1:1118621..1118818(+)	internal_stop_codon	1118606..1118608(+)		WP_011071487.1	gamma-glutamyl-gamma-aminobutyrate hydrolase family protein	100.0	25.7	87.7
MGA_1065	LOCUS_10530	sequence1:1186464..1186691(+)	partial			WP_164925647.1	protein YgfX	85.3	42.1	65.6
MGA_1078	LOCUS_10660	sequence1:1198065..1198481(+)	frameshift		1198478	WP_011071562.1	DUF962 domain-containing protein	100.0	78.9	73.9
MGA_1112	LOCUS_11000	sequence1:1234809..1235003(+)	partial			WP_011071594.1	HD domain-containing protein	68.8	10.6	72.7
MGA_1125	LOCUS_11130	sequence1:1248431..1248739(+)	partial			WP_010938934.1	metalloregulator ArsR/SmtB family transcription factor	81.4	72.8	51.8
MGA_1129	LOCUS_11170	sequence1:1251229..1252122(+)	partial			WP_011674076.1	type I-E CRISPR-associated endoribonuclease Cas2e	51.5	51.5	35.9
MGA_1149	LOCUS_11370	sequence1:1270278..1271759(-)	partial			WP_010942354.1	site-specific integrase	67.3	58.8	26.3
MGA_1156	LOCUS_11440	sequence1:1276410..1277651(+)	frameshift		1277522	WP_164925657.1	GGDEF domain-containing protein	97.3	69.3	48.8
MGA_1157	LOCUS_11450	sequence1:1277599..1278144(+)	frameshift		1277528	WP_164925657.1	GGDEF domain-containing protein	98.3	30.7	80.3
MGA_1159	LOCUS_11470	sequence1:1280234..1281706(-)	internal_stop_codon	1281947..1281949(-)		WP_011071669.1	TonB-dependent receptor	100.0	60.0	84.1
MGA_1160	LOCUS_11480	sequence1:1281947..1282678(-)	internal_stop_codon	1281947..1281949(-)		WP_011071669.1	TonB-dependent receptor	98.8	29.2	81.7
MGA_1187	LOCUS_11750	sequence1:1321865..1323043(-)	partial			WP_052846270.1	proteasome-activating nucleotidase	38.5	43.6	30.1
MGA_1227	LOCUS_12150	sequence1:1371926..1372084(-)	frameshift		1372115	WP_011071744.1	DUF2461 domain-containing protein	100.0	22.1	80.8
MGA_1228	LOCUS_12160	sequence1:1372098..1372640(-)	frameshift		1372115	WP_011071744.1	DUF2461 domain-containing protein	92.8	71.1	86.8
MGA_1245	LOCUS_12330	sequence1:1390809..1392359(-)	frameshift		1392358	WP_172966575.1	beta-ketoacyl synthase N-terminal-like domain-containing protein	100.0	25.7	84.7
MGA_1246	LOCUS_12340	sequence1:1392284..1396765(-)	frameshift		1392361	WP_172966575.1	beta-ketoacyl synthase N-terminal-like domain-containing protein	98.1	74.2	71.6
MGA_1248	LOCUS_12360	sequence1:1399026..1407251(-)	partial			WP_011071759.1	type I polyketide synthase	63.3	65.2	66.5
MGA_1267	LOCUS_12550	sequence1:1421473..1423404(+)	partial			WP_012582875.1	HD-GYP domain-containing protein	29.4	48.6	46.6
MGA_1332	LOCUS_13200	sequence1:1502138..1502329(-)	internal_stop_codon	1502564..1502566(-),1502342..1502344(-)		WP_011071191.1	transposase	79.4	14.5	98.0
MGA_1333	LOCUS_13210	sequence1:1502564..1502776(-)	internal_stop_codon	1502564..1502566(-),1502342..1502344(-)		WP_011071843.1	transposase	98.6	19.8	94.2
MGA_1361	LOCUS_13490	sequence1:1534083..1535522(+)	frameshift		1535465	WP_130624425.1	choline BCCT transporter BetT	95.8	69.0	65.2
MGA_1362	LOCUS_13500	sequence1:1535510..1536061(+)	frameshift		1535471	WP_130624425.1	choline BCCT transporter BetT	95.1	27.1	35.6
MGA_1453	LOCUS_14410	sequence1:1642306..1642665(+)	frameshift		1642614	WP_011072762.1	SMC family ATPase	86.6	10.1	87.4
MGA_1542	LOCUS_15300	sequence1:1740122..1741285(+)	partial			WP_002209756.1	DUF4401 domain-containing protein	84.8	46.7	21.0
MGA_1589	LOCUS_15760	sequence1:1791023..1791787(-)	frameshift		1791882	WP_011072047.1	gamma-glutamyltransferase	100.0	43.9	90.2
MGA_1590	LOCUS_15770	sequence1:1791787..1792761(-)	frameshift		1791888	WP_011072047.1	gamma-glutamyltransferase	90.4	50.6	85.7
MGA_1714	LOCUS_17010	sequence1:1926764..1927183(+)	partial			WP_004523328.1	PRC-barrel domain-containing protein	82.7	70.6	55.7
MGA_1721	LOCUS_17080	sequence1:1934482..1934922(+)	partial			WP_011014990.1	DUF4274 domain-containing protein	30.8	29.6	42.2
MGA_1740	LOCUS_17270	sequence1:1961108..1963834(-)	partial			WP_013531683.1	phage/plasmid primase, P4 family	37.2	74.5	32.7
MGA_1742	LOCUS_17290	sequence1:1964851..1965249(+)	internal_stop_codon	1965247..1965249(+)		WP_164925653.1	DUF86 domain-containing protein	99.2	47.5	95.4
MGA_1743	LOCUS_17300	sequence1:1965265..1965693(+)	internal_stop_codon	1965247..1965249(+)		WP_164925653.1	DUF86 domain-containing protein	97.9	50.4	89.9
MGA_1745	LOCUS_17320	sequence1:1966327..1966809(+)	partial			WP_011073923.1	DNA repair protein RadC	77.5	55.1	67.7
MGA_1752	LOCUS_17390	sequence1:1969590..1970795(+)	partial			WP_011269081.1	ImmA/IrrE family metallo-endopeptidase	51.1	71.3	34.0
MGA_1849	LOCUS_18330	sequence1:2090826..2091311(+)	partial			WP_028173083.1	nitrate reductase cytochrome c-type subunit	70.8	73.1	64.9
MGA_1851	LOCUS_18350	sequence1:2092052..2092432(+)	partial			WP_164922434.1	DUF1801 domain-containing protein	58.7	75.5	44.4
MGA_1860	LOCUS_18440	sequence1:2102043..2102792(-)	partial			WP_011122515.1	AraC family transcriptional regulator	31.3	31.4	41.0
MGA_1863	LOCUS_18470	sequence1:2105362..2108448(+)	partial			WP_011070706.1	EAL domain-containing protein	66.6	44.5	35.3
MGA_1865	LOCUS_18490	sequence1:2109158..2109652(+)	partial			WP_014640192.1	tRNA-uridine aminocarboxypropyltransferase	92.7	65.1	36.4
MGA_1876	LOCUS_18600	sequence1:2120295..2121491(+)	partial			WP_011072414.1	putative metalloprotease CJM1_0395 family protein	92.5	54.5	46.8
MGA_1960	LOCUS_19430	sequence1:2214179..2216065(-)	partial			WP_011031707.1	family 43 glycosylhydrolase	54.1	69.0	36.3
MGA_1963	LOCUS_19460	sequence1:2218798..2219340(+)	frameshift		2219313	WP_010964837.1	family 43 glycosylhydrolase	95.0	52.3	55.6
MGA_1964	LOCUS_19470	sequence1:2219369..2219746(+)	frameshift		2219319	WP_010964837.1	family 43 glycosylhydrolase	98.4	37.6	61.0
MGA_1986	LOCUS_19690	sequence1:2247903..2248295(+)	partial			WP_011072394.1	class I ribonucleotide reductase maintenance protein YfaE	69.2	62.5	78.9
MGA_1995	LOCUS_19780	sequence1:2260748..2261092(-)	frameshift		2261084	WP_011072167.1	FAD:protein FMN transferase	99.1	37.7	81.4
MGA_1996	LOCUS_19790	sequence1:2261034..2261657(-)	frameshift		2261090	WP_011072167.1	FAD:protein FMN transferase	89.9	62.0	65.6
MGA_2012	LOCUS_19950	sequence1:2281410..2282567(-)	partial			WP_011072118.1	cation diffusion facilitator family transporter	41.8	40.9	87.0
MGA_2070	LOCUS_20530	sequence1:2346825..2348888(+)	internal_stop_codon	2348886..2348888(+)		WP_011072267.1	transcription-repair coupling factor	100.0	58.8	88.6
MGA_2071	LOCUS_20540	sequence1:2348907..2350313(+)	internal_stop_codon	2348886..2348888(+)		WP_011072267.1	transcription-repair coupling factor	100.0	40.5	94.7
MGA_2077	LOCUS_20600	sequence1:2358065..2358787(+)	frameshift		2358721	WP_011071694.1	IS91-like element ISSod25 family transposase	91.7	59.1	93.2
MGA_2078	LOCUS_20610	sequence1:2358756..2359181(+)	frameshift		2358721	WP_011071694.1	IS91-like element ISSod25 family transposase	100.0	37.9	87.2
MGA_2118	LOCUS_21010	sequence1:2410580..2411062(+)	partial			WP_011072554.1	paraquat-inducible protein A	97.5	73.9	84.6
MGA_2148	LOCUS_21310	sequence1:2441904..2442158(+)	internal_stop_codon	2442156..2442158(+)		WP_011072583.1	cupin domain-containing protein	91.7	20.3	80.5
MGA_2149	LOCUS_21320	sequence1:2442168..2443064(+)	internal_stop_codon	2442156..2442158(+)		WP_011072583.1	cupin domain-containing protein	100.0	78.4	81.2
MGA_2165	LOCUS_21480	sequence1:2462633..2465188(-)	partial			WP_011072046.1	invasin	94.1	70.0	30.7
MGA_2189	LOCUS_21720	sequence1:2489234..2491126(+)	frameshift		2491102	WP_011072023.1	efflux RND transporter permease subunit	99.2	57.3	89.6
MGA_2190	LOCUS_21730	sequence1:2491086..2492486(+)	frameshift		2491108	WP_011072023.1	efflux RND transporter permease subunit	98.1	41.9	84.7
MGA_2239	LOCUS_22220	sequence1:2537832..2539097(-)	partial			WP_001107728.1	integrase domain-containing protein	48.5	48.8	28.5
MGA_2254	LOCUS_22370	sequence1:2548390..2548668(+)	partial			WP_011072907.1	hypothetical protein	87.0	72.2	57.8
MGA_2256	LOCUS_22390	sequence1:2548944..2549492(+)	partial			WP_013087213.1	hypothetical protein	46.2	79.4	41.4
MGA_2258	LOCUS_22410	sequence1:2549801..2550985(+)	partial			WP_000741454.1	site-specific integrase	53.3	49.7	29.1
MGA_2302	LOCUS_22850	sequence1:2594026..2594412(+)	frameshift		2594343	WP_011072674.1	glucan biosynthesis protein G	93.8	22.5	49.2
MGA_2303	LOCUS_22860	sequence1:2594414..2595616(+)	frameshift		2594343	WP_011072674.1	glucan biosynthesis protein G	100.0	75.8	87.2
MGA_2338	LOCUS_23190	sequence1:2649718..2650200(+)	frameshift		2650164	WP_011072813.1	methyltransferase	96.2	43.1	75.3
MGA_2339	LOCUS_23200	sequence1:2650346..2650798(+)	frameshift		2650173	WP_011072813.1	methyltransferase	98.7	41.5	85.1
MGA_2504	LOCUS_24850	sequence1:2861241..2862215(-)	partial			WP_011461005.1	glycosyltransferase	70.7	28.8	34.5
MGA_2505	LOCUS_24860	sequence1:2862510..2863235(-)	partial			WP_055064620.1	acyltransferase	59.8	74.2	31.8
MGA_2582	LOCUS_25630	sequence1:2940417..2941262(-)	partial			WP_011202934.1	LicD family protein	30.6	36.4	34.0
MGA_2667	LOCUS_26480	sequence1:3033184..3033840(-)	frameshift		3033833	WP_011073246.1	cyclopropane-fatty-acyl-phospholipid synthase family protein	96.3	50.2	86.7
MGA_2668	LOCUS_26490	sequence1:3033723..3034439(-)	frameshift		3033836	WP_011073246.1	cyclopropane-fatty-acyl-phospholipid synthase family protein	84.9	48.3	85.1
MGA_2852	LOCUS_28330	sequence1:3248044..3248280(+)	partial			WP_174847485.1	tyrosine-type recombinase/integrase	74.4	17.2	51.7
MGA_2878	LOCUS_28590	sequence1:3277899..3278324(-)	frameshift		3278358	WP_011071694.1	IS91-like element ISSod25 family transposase	100.0	37.9	87.2
MGA_2879	LOCUS_28600	sequence1:3278293..3279015(-)	frameshift		3278358	WP_011071694.1	IS91-like element ISSod25 family transposase	91.7	59.1	93.2
MGA_2881	LOCUS_28620	sequence1:3279896..3280375(+)	frameshift		3280372	WP_011072111.1	integron integrase	90.6	45.1	95.8
MGA_2882	LOCUS_28630	sequence1:3280354..3280605(+)	frameshift		3280372	WP_011072111.1	integron integrase	91.6	23.8	97.4
MGA_2927	LOCUS_29080	sequence1:3329241..3329696(+)	partial			WP_028730510.1	FRG domain-containing protein	58.9	17.6	42.9
MGA_2954	LOCUS_29350	sequence1:3363017..3363409(-)	frameshift		3363097	WP_164925634.1	GNAT family N-acetyltransferase	69.2	56.6	58.9
MGA_2964	LOCUS_29450	sequence1:3370547..3370708(-)	partial			WP_011071691.1	glyoxalase superfamily protein	100.0	43.8	73.6
MGA_2980	LOCUS_29610	sequence1:3386474..3386713(+)	partial			WP_011071262.1	DUF2846 domain-containing protein	100.0	54.1	88.6
MGA_3030	LOCUS_30110	sequence1:3454695..3455144(+)	internal_stop_codon	3455142..3455144(+)		WP_164925911.1	TIGR04211 family SH3 domain-containing protein	93.3	76.4	72.7
MGA_3091	LOCUS_30720	sequence1:3537099..3537758(+)	partial			WP_011071126.1	SprT family zinc-dependent metalloprotease	73.5	78.2	78.9
MGA_3100	LOCUS_30810	sequence1:3547073..3547321(-)	partial			WP_011815910.1	sensor domain-containing diguanylate cyclase	81.7	20.3	45.6
MGA_3114	LOCUS_30950	sequence1:3566537..3566839(-)	partial			WP_011071103.1	DUF3622 domain-containing protein	69.0	68.3	92.8
MGA_3140	LOCUS_31210	sequence1:3592397..3593344(-)	partial			WP_235841049.1	hypothetical protein	70.8	70.3	25.0
MGA_3197	LOCUS_31780	sequence1:3656368..3656790(-)	partial			WP_011073741.1	HTH-type transcriptional regulator YidZ	100.0	43.6	90.7
MGA_3220	LOCUS_32010	sequence1:3681393..3681920(+)	frameshift		3681848	WP_011070924.1	mechanosensitive ion channel	86.9	14.2	78.9
MGA_3230	LOCUS_32110	sequence1:3694038..3697649(-)	partial			WP_011071149.1	PAS domain S-box protein	54.6	36.8	41.1
MGA_3297	LOCUS_32780	sequence1:3768084..3768380(+)	partial			WP_011038926.1	helix-hairpin-helix domain-containing protein	94.9	72.7	52.7
MGA_3354	LOCUS_33350	sequence1:3843768..3843977(+)	partial			WP_011070771.1	DNA gyrase inhibitor YacG	71.0	71.0	91.8
MGA_3405	LOCUS_33860	sequence1:3888431..3889312(+)	partial			WP_000922504.1	FliM/FliN family flagellar motor switch protein	66.6	80.6	23.2
MGA_3427	LOCUS_34080	sequence1:3907344..3908048(-)	frameshift		3908022	WP_011073971.1	class I adenylate cyclase	96.6	28.1	88.1
MGA_3428	LOCUS_34090	sequence1:3907999..3909759(-)	frameshift		3908025	WP_011073971.1	class I adenylate cyclase	98.8	72.0	85.7
MGA_3433	LOCUS_34140	sequence1:3914471..3919828(+)	frameshift		3919819	WP_011707240.1	retention module-containing protein	95.5	34.4	57.5
MGA_3434	LOCUS_34150	sequence1:3919848..3924272(+)	partial			WP_011073976.1	retention module-containing protein	81.2	42.7	32.2
MGA_3439	LOCUS_34200	sequence1:3929981..3930334(+)	frameshift		3930325	WP_011073981.1	transglutaminase-like cysteine peptidase	97.4	48.5	82.5
MGA_3440	LOCUS_34210	sequence1:3930318..3930692(+)	frameshift		3930325	WP_011073981.1	transglutaminase-like cysteine peptidase	99.2	52.3	92.7
MGA_3462	LOCUS_34430	sequence1:3960512..3961150(+)	partial			WP_010871028.1	DEAD/DEAH box helicase	88.2	23.8	43.2
MGA_3577	LOCUS_35560	sequence1:4102890..4104065(-)	partial			WP_011070577.1	sulfotransferase family protein	64.2	66.9	37.8
MGA_3578	LOCUS_35570	sequence1:4104065..4105147(-)	partial			WP_011070576.1	phytanoyl-CoA dioxygenase family protein	92.5	50.2	74.9
MGA_3764	LOCUS_37410	sequence1:4313589..4314008(-)	partial			WP_010940509.1	HPP family protein	95.0	72.6	51.9
