# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_11	LOCUS_00100	sequence01:6607..7401(-)	internal_stop_codon	7411..7413(-)		WP_005461424.1	DNA protecting protein DprA	99.2	67.3	66.0
MGA_12	LOCUS_00110	sequence01:7411..7749(-)	internal_stop_codon	7411..7413(-)		WP_011262883.1	DNA processing protein DprA	98.2	30.1	45.0
MGA_24	LOCUS_00230	sequence01:20527..20676(-)	internal_stop_codon	20677..20679(-)		WP_005481190.1	ATP-dependent protease	100.0	9.7	83.7
MGA_59	LOCUS_00580	sequence01:59424..60059(-)	internal_stop_codon	60060..60062(-)		WP_005459829.1	potassium channel protein	95.7	58.5	47.5
MGA_60	LOCUS_00590	sequence01:60060..60470(-)	internal_stop_codon	60060..60062(-)		WP_005459829.1	potassium channel protein	100.0	39.5	48.9
MGA_107	LOCUS_01060	sequence02:599..2194(-)	partial			WP_011262918.1	chitin-binding protein	62.1	83.4	43.0
MGA_113	LOCUS_01120	sequence02:8312..9175(+)	internal_stop_codon	9173..9175(+)		WP_015365759.1	alkyl sulfatase	100.0	43.5	76.0
MGA_114	LOCUS_01130	sequence02:9215..10291(+)	internal_stop_codon	9173..9175(+)		WP_015365759.1	alkyl sulfatase	100.0	54.4	80.2
MGA_171	LOCUS_01700	sequence02:76215..76445(+)	partial			WP_011261384.1	hypothetical protein	94.7	67.9	61.1
MGA_173	LOCUS_01720	sequence02:78649..79089(+)	partial			WP_011106045.1	hypothetical protein	93.8	73.0	45.3
MGA_175	LOCUS_01740	sequence02:80078..81088(-)	internal_stop_codon	81170..81172(-)		WP_000833026.1	chitinase	99.7	39.6	79.7
MGA_176	LOCUS_01750	sequence02:81170..81406(-)	internal_stop_codon	81170..81172(-),81641..81643(-)		WP_005479039.1	chitinase	100.0	9.2	57.7
MGA_177	LOCUS_01760	sequence02:81641..82621(-)	internal_stop_codon	81641..81643(-)		WP_011261385.1	chitinase	100.0	38.5	51.5
MGA_187	LOCUS_01860	sequence03:157..1173(+)	partial			WP_005417604.1	sigma-54-dependent Fis family transcriptional regulator	98.2	73.9	52.7
MGA_220	LOCUS_02190	sequence03:42180..42704(-)	partial			WP_011707638.1	helix-turn-helix transcriptional regulator	78.2	60.3	41.2
MGA_223	LOCUS_02220	sequence03:46270..47070(+)	internal_stop_codon	47068..47070(+)		WP_005482602.1	hypothetical protein	99.6	26.5	39.3
MGA_224	LOCUS_02230	sequence03:47308..48417(+)	partial			WP_011261170.1	MSHA biogenesis protein MshQ	97.8	34.9	32.1
MGA_259	LOCUS_02580	sequence03:82196..83116(-)	partial			WP_011706160.1	GGDEF domain-containing protein	99.0	52.9	30.9
MGA_260	LOCUS_02590	sequence04:1..1183(+)	partial			Q87N45	30S ribosomal protein S1	100.0	70.7	90.8
MGA_299	LOCUS_02980	sequence04:40802..41191(-)	frameshift,internal_stop_codon	41200..41202(-),41227..41229(-)	41211	WP_001881490.1	hypothetical protein	93.0	78.5	35.2
MGA_333	LOCUS_03320	sequence05:201..509(+)	partial			WP_005467215.1	UDP-glucose 6-dehydrogenase	100.0	26.3	83.3
MGA_422	LOCUS_04210	sequence06:25975..26805(+)	frameshift		25951	WP_005419628.1	transcriptional regulator CysB	99.6	84.9	60.4
MGA_434	LOCUS_04330	sequence06:38252..39403(-)	partial			WP_011263106.1	phosphoethanolamine transferase	98.4	69.4	57.3
MGA_454	LOCUS_04530	sequence06:57986..58507(+)	partial			WP_000047148.1	hypothetical protein	65.9	63.1	41.0
MGA_455	LOCUS_04540	sequence06:58760..59179(+)	partial			WP_011261749.1	hypothetical protein	97.1	71.1	52.6
MGA_457	LOCUS_04560	sequence06:59727..59984(+)	partial			WP_011072730.1	glutaredoxin	90.6	64.4	46.8
MGA_521	LOCUS_05190	sequence07:62785..63774(-)	frameshift		63772	WP_005417767.1	cytosine deaminase	99.7	77.2	85.7
MGA_522	LOCUS_05200	sequence07:63767..64057(-)	frameshift		63772	WP_001180693.1	cytosine deaminase	97.9	22.5	62.5
MGA_523	LOCUS_05210	sequence07:64092..64688(-)	partial			WP_005477307.1	cytosine permease	87.4	41.5	80.3
MGA_557	LOCUS_05550	sequence08:32509..32784(+)	internal_stop_codon	32782..32784(+)		WP_011261364.1	type IV pilus biogenesis/stability protein PilW	82.4	35.7	57.3
MGA_584	LOCUS_05820	sequence08:60882..61553(+)	partial			WP_011706239.1	SM-20 protein	74.9	72.3	50.0
MGA_588	LOCUS_05850	sequence09:122..379(-)	partial			WP_011459236.1	ATPase	94.1	9.0	41.2
MGA_589	LOCUS_05860	sequence09:728..1849(-)	partial			WP_013227417.1	hypothetical protein	67.0	68.0	29.9
MGA_595	LOCUS_05920	sequence09:6167..6760(+)	partial			WP_011073961.1	iron-sulfur cluster repair di-iron protein	82.7	65.7	49.7
MGA_606	LOCUS_06030	sequence09:15755..15970(-)	partial			WP_005482874.1	3-methyladenine DNA glycosylase	67.6	10.5	68.8
MGA_627	LOCUS_06240	sequence09:38930..40390(-)	frameshift		40434	WP_011106088.1	fimbrial protein	100.0	83.0	73.0
MGA_632	LOCUS_06290	sequence09:42564..43337(-)	frameshift,internal_stop_codon	42564..42566(-)	43326	WP_000520444.1	pilus assembly protein PilM	96.1	71.6	50.6
MGA_633	LOCUS_06300	sequence09:43255..43497(-)	frameshift		43326	WP_000520444.1	pilus assembly protein PilM	85.0	19.2	55.9
MGA_663	LOCUS_06600	sequence10:21049..21294(+)	partial			WP_001143718.1	CidA/LrgA family protein	90.1	53.7	58.9
MGA_669	LOCUS_06660	sequence10:25769..26053(-)	partial			WP_010895592.1	hypothetical protein	72.3	28.3	52.9
MGA_674	LOCUS_06710	sequence10:29324..29836(+)	partial			WP_011074162.1	LysR family transcriptional regulator	95.9	50.8	74.8
MGA_676	LOCUS_06730	sequence10:31902..32438(+)	partial			WP_011074162.1	LysR family transcriptional regulator	90.4	50.2	65.8
MGA_680	LOCUS_06770	sequence10:34536..35345(-)	partial			WP_010990036.1	AraC family transcriptional regulator	26.8	26.9	45.8
MGA_702	LOCUS_06980	sequence11:115..1014(-)	partial			WP_005482342.1	AMP-dependent synthetase	93.0	48.9	66.9
MGA_781	LOCUS_07760	sequence12:28013..28606(+)	partial			WP_011263173.1	ATP-dependent Zn protease	81.7	74.2	55.3
MGA_802	LOCUS_07960	sequence13:1686..2870(-)	frameshift,internal_stop_codon	1666..1668(-)	1690,3055	WP_014205995.1	type I restriction-modification system subunit M	99.5	75.3	60.9
MGA_847	LOCUS_08410	sequence14:1348..1662(+)	frameshift		1653	Q5E6Y3	2-dehydropantoate 2-reductase	98.1	33.2	45.1
MGA_848	LOCUS_08420	sequence14:1643..2251(+)	frameshift		1653	Q87M95	2-dehydropantoate 2-reductase	98.5	67.3	44.5
MGA_851	LOCUS_08450	sequence14:4114..4413(-)	partial			WP_000801254.1	SAM-dependent methyltransferase	94.9	38.0	56.4
MGA_893	LOCUS_08870	sequence14:49229..49876(-)	frameshift		49850	WP_003113742.1	cytochrome c	89.8	43.5	43.0
MGA_894	LOCUS_08880	sequence14:49809..50258(-)	frameshift		49856	WP_003112821.1	cytochrome c	81.9	18.2	50.4
MGA_930	LOCUS_09240	sequence15:49398..49994(-)	partial			Q8EB51	aldehyde dehydrogenase	91.4	38.2	45.9
MGA_1039	LOCUS_10320	sequence18:30516..31079(-)	frameshift,internal_stop_codon	31106..31108(-)	31081	WP_011105745.1	rhombosortase	91.4	83.7	46.8
MGA_1051	LOCUS_10440	sequence18:43493..44497(-)	partial			WP_001881705.1	MFS transporter	97.9	52.2	56.3
MGA_1064	LOCUS_10560	sequence19:16726..16977(-)	frameshift		16740,16743	WP_005483465.1	ferredoxin-type protein NapF	73.5	37.0	49.2
MGA_1090	LOCUS_10820	sequence19:43556..44512(+)	partial			WP_005423059.1	MFS transporter	84.3	68.4	76.1
MGA_1091	LOCUS_10830	sequence20:125..385(-)	partial			Q87LY0	histidine kinase	94.2	7.2	67.9
MGA_1123	LOCUS_11150	sequence20:40577..41479(+)	frameshift		40455	Q5E7P9	peptide chain release factor 2	100.0	82.2	89.3
MGA_1125	LOCUS_11170	sequence20:43336..43665(+)	partial			WP_005417604.1	sigma-54-dependent Fis family transcriptional regulator	99.1	24.0	54.6
MGA_1153	LOCUS_11450	sequence21:28083..29627(+)	partial			WP_010945791.1	GGDEF domain-containing protein	60.1	31.3	39.5
MGA_1166	LOCUS_11580	sequence21:40591..40812(-)	partial			WP_011105608.1	hypothetical protein	100.0	58.2	51.2
MGA_1183	LOCUS_11750	sequence22:21675..22094(-)	partial			WP_001881191.1	hypothetical protein	43.2	46.0	41.7
MGA_1234	LOCUS_12260	sequence23:38719..39825(-)	partial			WP_001881634.1	DNA internalization-related competence protein ComEC/Rec2	99.7	47.7	44.0
MGA_1247	LOCUS_12390	sequence24:14434..14703(+)	frameshift		14398	WP_001909686.1	prepilin-type N-terminal cleavage/methylation domain-containing protein	98.9	59.9	37.0
MGA_1250	LOCUS_12420	sequence24:16939..17706(+)	frameshift		17661	Q9X4G9	type IV pilin assembly protein PilC	90.6	56.6	68.0
MGA_1251	LOCUS_12430	sequence24:17718..18170(+)	frameshift		17664	Q9X4G9	type IV pilin assembly protein PilC	99.3	36.5	74.5
MGA_1257	LOCUS_12490	sequence24:22547..23419(-)	partial			WP_011262661.1	general secretion pathway protein GspB	63.4	79.6	34.7
MGA_1277	LOCUS_12690	sequence25:1676..1894(+)	partial			Q9KLK4	UPF0213 protein	88.9	64.4	75.4
MGA_1317	LOCUS_13090	sequence26:8468..9508(-)	partial			WP_011122386.1	hypothetical protein	75.7	59.3	26.7
MGA_1378	LOCUS_13690	sequence28:176..1474(+)	partial			WP_011067938.1	N-acetyl-beta-hexosaminidase	59.5	36.1	31.1
MGA_1407	LOCUS_13980	sequence29:113..346(-)	internal_stop_codon	374..376(-)		WP_013097822.1	aerobactin synthase IucA	67.5	9.0	53.8
MGA_1408	LOCUS_13990	sequence29:374..1579(-)	internal_stop_codon	374..376(-)		WP_011263059.1	aerobactin siderophore biosynthesis protein IucA	97.3	65.5	30.6
MGA_1440	LOCUS_14300	sequence30:2459..2818(+)	partial			WP_011339292.1	ligand-gated channel	99.2	17.2	48.8
MGA_1455	LOCUS_14450	sequence30:22111..22620(+)	partial			WP_005460890.1	ATP-dependent Zn protease	78.1	58.1	52.3
MGA_1496	LOCUS_14840	sequence31:32566..32718(-)	partial			WP_000110093.1	type I restriction endonuclease EcoAI subunit S	98.0	8.4	49.0
MGA_1497	LOCUS_14850	sequence31:33220..33957(-)	partial			WP_001880867.1	diguanylate cyclase	97.1	34.6	41.7
MGA_1511	LOCUS_14980	sequence32:12925..14382(+)	partial			Q87TC9	type II secretion system protein L	50.7	61.9	45.2
MGA_1518	LOCUS_15050	sequence32:18860..19207(-)	partial			WP_005459005.1	amidophosphoribosyltransferase	99.1	45.2	52.6
MGA_1529	LOCUS_15160	sequence32:31699..32376(-)	partial			WP_012256767.1	peptidase M23	77.8	18.1	38.9
MGA_1562	LOCUS_15490	sequence34:128..1099(-)	partial			WP_001881634.1	DNA internalization-related competence protein ComEC/Rec2	92.6	37.5	35.8
MGA_1582	LOCUS_15690	sequence34:22924..23538(+)	frameshift		23358	WP_011707055.1	patatin family protein	71.1	52.2	52.4
MGA_1587	LOCUS_15740	sequence34:27326..28054(+)	internal_stop_codon	28052..28054(+)		WP_005478185.1	aminotransferase	100.0	51.7	61.7
MGA_1588	LOCUS_15750	sequence34:28100..28732(+)	internal_stop_codon	28052..28054(+)		WP_005478185.1	aminotransferase	98.1	44.2	72.0
MGA_1593	LOCUS_15800	sequence35:1..1296(+)	frameshift		1254	WP_004666649.1	integrase	97.0	82.5	49.4
MGA_1603	LOCUS_15900	sequence35:11915..13069(+)	frameshift,internal_stop_codon	11640..11642(+)	11897	WP_012868917.1	xanthine permease	76.6	65.0	39.8
MGA_1608	LOCUS_15950	sequence35:19209..19430(+)	partial			WP_011106302.1	hypothetical protein	87.7	64.7	53.0
MGA_1624	LOCUS_16100	sequence36:7779..8468(-)	internal_stop_codon	8562..8564(-)		WP_002211868.1	type I-F CRISPR-associated protein Csy2	90.0	65.2	40.2
MGA_1698	LOCUS_16840	sequence39:2160..2591(-)	partial			WP_004552423.1	phage integrase	99.3	68.3	47.9
MGA_1749	LOCUS_17340	sequence41:9128..9934(+)	frameshift		9053	WP_011262922.1	lipoprotein	88.4	44.0	34.2
MGA_1763	LOCUS_17480	sequence42:329..604(+)	partial			WP_011071243.1	transposase	94.5	24.0	83.7
MGA_1769	LOCUS_17540	sequence42:4284..4898(-)	partial			WP_005460549.1	SAM-dependent methyltransferase	95.1	34.5	45.4
MGA_1782	LOCUS_17670	sequence42:18550..18738(-)	partial			WP_011263276.1	hypothetical protein	75.8	72.6	61.7
MGA_1789	LOCUS_17740	sequence42:26956..27252(-)	partial			WP_005462981.1	LuxR family transcriptional regulator	90.8	40.4	62.2
MGA_1800	LOCUS_17850	sequence43:12961..13608(-)	frameshift,internal_stop_codon	13803..13805(-)	13658	WP_005480207.1	serine protease	99.5	28.5	55.0
MGA_1801	LOCUS_17860	sequence43:13803..14849(-)	frameshift,internal_stop_codon	13802..13804(-)	13660,14878	WP_001890383.1	hypothetical protein	98.9	44.9	55.8
MGA_1802	LOCUS_17870	sequence43:14858..15259(-)	frameshift		14878	WP_005480207.1	serine protease	90.2	15.6	59.2
MGA_1814	LOCUS_17980	sequence44:309..626(+)	partial			WP_011070504.1	nucleoside permease	99.0	25.6	78.8
MGA_1815	LOCUS_17990	sequence44:631..963(+)	partial			WP_011263785.1	guanine deaminase	95.5	23.0	48.6
MGA_1842	LOCUS_18260	sequence45:1..616(+)	partial			WP_011104442.1	transposase	95.6	37.6	47.7
MGA_1852	LOCUS_18360	sequence45:8268..8492(-)	partial			WP_005495828.1	cyd operon protein YbgE	98.6	73.0	49.3
MGA_1897	LOCUS_18810	sequence47:8128..8658(-)	frameshift,internal_stop_codon	8707..8709(-)	8130	WP_000545591.1	respiratory nitrate reductase subunit gamma	96.6	75.6	74.7
MGA_1944	LOCUS_19260	sequence49:398..1195(+)	frameshift		308	WP_011070736.1	transposase	98.5	67.6	59.0
MGA_1947	LOCUS_19290	sequence49:3486..3758(+)	frameshift		3746	WP_011103689.1	NAD(P)H dehydrogenase	94.4	42.2	41.9
MGA_1955	LOCUS_19370	sequence49:9654..9863(+)	frameshift		9842	WP_000044451.1	hypothetical protein	88.4	28.4	59.0
MGA_1956	LOCUS_19380	sequence49:9844..10299(+)	frameshift		9845	WP_011263627.1	hypothetical protein	99.3	69.1	42.7
MGA_1963	LOCUS_19450	sequence49:17649..18734(+)	partial			WP_011261927.1	carbohydrate-binding protein	90.9	72.5	37.7
MGA_1964	LOCUS_19460	sequence49:18767..19798(+)	partial			WP_010947421.1	IS630 family transposase	26.5	73.4	64.8
MGA_1965	LOCUS_19470	sequence49:19795..20076(+)	partial			WP_011030596.1	chitinase	54.8	10.3	42.3
MGA_1985	LOCUS_19670	sequence50:20207..20971(+)	partial			WP_011706160.1	GGDEF domain-containing protein	88.6	41.5	38.1
MGA_2001	LOCUS_19830	sequence51:18830..18991(+)	partial			WP_013095031.1	sodium transporter	73.6	12.4	53.8
MGA_2009	LOCUS_19910	sequence52:5974..6774(+)	partial			WP_005480794.1	paraquat-inducible protein A	99.6	63.9	56.6
MGA_2062	LOCUS_20430	sequence54:16615..17229(-)	internal_stop_codon	17236..17238(-)		WP_011263062.1	lysine 6-monooxygenase	91.7	43.3	45.5
MGA_2063	LOCUS_20440	sequence54:17236..17946(-)	internal_stop_codon	17236..17238(-)		WP_011263062.1	lysine 6-monooxygenase	95.8	52.1	50.4
MGA_2064	LOCUS_20450	sequence54:17972..19393(-)	partial			WP_011263060.1	aerobactin siderophore synthesis protein IucB	52.0	77.2	39.0
MGA_2071	LOCUS_20520	sequence55:5687..6166(-)	partial			WP_011261220.1	endonuclease	100.0	63.7	43.8
MGA_2078	LOCUS_20590	sequence55:13252..13860(+)	partial			Q9KVD2	nucleoid occlusion factor SlmA	72.3	74.5	25.3
MGA_2083	LOCUS_20640	sequence55:17212..18066(+)	partial			WP_010938992.1	DEAD/DEAH box helicase	83.8	22.0	64.5
MGA_2087	LOCUS_20670	sequence56:1965..3224(-)	partial			WP_011922229.1	type I restriction modification protein	69.7	69.2	36.1
MGA_2091	LOCUS_20710	sequence56:8256..8486(-)	partial			WP_012546249.1	Mrr restriction system protein	78.9	19.1	45.0
MGA_2095	LOCUS_20750	sequence56:10516..12765(+)	partial			WP_000351437.1	transposase	52.2	54.2	25.4
MGA_2099	LOCUS_20780	sequence57:1..1012(+)	partial			WP_010947421.1	IS630 family transposase	17.0	46.0	66.7
MGA_2103	LOCUS_20820	sequence57:2751..3002(-)	frameshift		3022	Q87T86	UPF0758 protein	97.6	36.2	82.7
MGA_2104	LOCUS_20830	sequence57:2954..3424(-)	frameshift		3022	Q87T86	UPF0758 protein	87.2	60.7	75.0
MGA_2116	LOCUS_20950	sequence58:3073..4299(+)	partial			WP_080510887.1	hypothetical protein	60.3	58.4	27.3
MGA_2119	LOCUS_20980	sequence58:5494..6345(-)	partial			WP_064496597.1	N-glycosylase	43.8	62.1	33.3
MGA_2123	LOCUS_21020	sequence58:10238..11884(+)	partial			WP_011123252.1	ABC transporter	23.7	22.4	34.6
MGA_2124	LOCUS_21030	sequence58:11881..12729(+)	partial			WP_007478815.1	hypothetical protein	59.6	60.0	28.3
MGA_2154	LOCUS_21280	sequence61:7804..8598(-)	partial			WP_011082909.1	hypothetical protein	38.6	21.9	43.3
MGA_2155	LOCUS_21290	sequence61:9237..9548(-)	partial			YP_001702502.1	hypothetical protein	66.0	81.9	52.9
MGA_2158	LOCUS_21310	sequence62:1..871(+)	partial			WP_005766752.1	MBL fold hydrolase	93.4	59.8	51.6
MGA_2161	LOCUS_21340	sequence62:3196..4074(-)	partial			WP_010942156.1	glycosyl transferase	70.2	64.2	34.5
MGA_2163	LOCUS_21360	sequence62:5341..6483(-)	partial			WP_000227804.1	LPS 1,2-N-acetylglucosaminetransferase	70.5	73.4	24.4
MGA_2178	LOCUS_21480	sequence64:838..1761(+)	partial			WP_011070748.1	integrase	98.7	70.6	30.4
MGA_2194	LOCUS_21620	sequence66:147..452(-)	partial			WP_011105937.1	cold-shock protein	42.6	26.2	62.8
MGA_2197	LOCUS_21650	sequence66:1792..2202(-)	partial			WP_011816772.1	dehydrogenase	86.8	46.4	40.7
MGA_2224	LOCUS_21900	sequence69:5668..6102(-)	partial			Q87HJ6	mannose-6-phosphate isomerase	97.9	34.3	58.9
MGA_2252	LOCUS_22110	sequence73:204..635(+)	partial			WP_003112570.1	transposase	99.3	51.6	70.4
MGA_2256	LOCUS_22150	sequence74:379..1020(+)	partial			YP_001704007.1	hypothetical protein	65.3	65.7	38.1
MGA_2259	LOCUS_22180	sequence74:1519..1707(-)	internal_stop_codon	1849..1851(-),1723..1725(-)		WP_010938991.1	metal-dependent hydrolase	98.4	24.7	72.1
MGA_2260	LOCUS_22190	sequence74:1849..2295(-)	internal_stop_codon	1849..1851(-),1723..1725(-)		WP_011038030.1	metal-dependent hydrolase	66.2	38.7	34.7
