# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_4	LOCUS_00040	sequence001:4073..5005(-)	frameshift		4967	WP_014207544.1	alanine/glycine:cation symporter family protein	98.1	61.9	90.8
MGA_5	LOCUS_00050	sequence001:4953..5549(-)	frameshift		4967	WP_014207544.1	alanine/glycine:cation symporter family protein	98.0	39.5	91.8
MGA_15	LOCUS_00150	sequence001:16964..17197(-)	partial			WP_014207553.1	YbaN family protein	100.0	63.1	85.7
MGA_104	LOCUS_01040	sequence001:116762..117781(+)	partial			WP_000558370.1	glycosyltransferase	78.2	42.3	37.5
MGA_110	LOCUS_01100	sequence001:122392..123375(-)	partial			WP_005483478.1	glycosyltransferase	62.4	57.6	30.3
MGA_144	LOCUS_01440	sequence002:3069..4001(-)	partial			WP_014208275.1	pseudouridine synthase	62.9	83.7	94.4
MGA_200	LOCUS_02000	sequence002:71055..72437(+)	partial			WP_014208234.1	AAA family ATPase	33.9	70.9	81.4
MGA_244	LOCUS_02440	sequence002:120172..120819(+)	partial			WP_014208204.1	hypothetical protein	100.0	72.1	87.0
MGA_633	LOCUS_06320	sequence007:13446..14192(+)	frameshift		13459	WP_014207777.1	DMT family transporter	96.0	80.7	95.4
MGA_682	LOCUS_06810	sequence007:64002..64754(+)	frameshift		64718	WP_014207746.1	30S ribosomal protein S3	90.0	84.9	99.1
MGA_705	LOCUS_07040	sequence007:77599..77889(+)	partial			WP_014207739.1	hypothetical protein	96.9	72.1	55.9
MGA_788	LOCUS_07860	sequence009:8835..9083(-)	partial			WP_005455908.1	DUF2061 domain-containing protein	64.6	39.6	47.2
MGA_818	LOCUS_08160	sequence009:40116..40283(+)	partial			WP_014208305.1	ASCH domain-containing protein	96.4	44.2	81.1
MGA_834	LOCUS_08320	sequence009:52442..52804(-)	frameshift,internal_stop_codon	52429..52431(-),52369..52371(-),52435..52437(-)	52486	WP_014208312.1	hypothetical protein	90.8	70.8	70.6
MGA_953	LOCUS_09510	sequence011:29566..30345(-)	partial			WP_010946906.1	Dot/Icm type IV secretion system effector LidL	79.2	41.8	43.8
MGA_1051	LOCUS_10490	sequence013:1895..2539(-)	partial			WP_014208382.1	DMT family transporter	100.0	69.5	95.3
MGA_1067	LOCUS_10650	sequence013:20472..20750(+)	partial			WP_011707247.1	ComEA family DNA-binding protein	80.4	69.8	47.3
MGA_1163	LOCUS_11610	sequence014:56120..56977(+)	partial			WP_014208165.1	YifB family Mg chelatase-like AAA ATPase	98.2	56.6	91.1
MGA_1236	LOCUS_12340	sequence016:25156..25983(-)	partial			WP_014206760.1	energy transducer TonB	55.6	55.6	89.5
MGA_1317	LOCUS_13150	sequence018:3240..3956(+)	partial			WP_014206609.1	energy transducer TonB	42.4	42.6	97.0
MGA_1358	LOCUS_13560	sequence018:40964..41206(-)	partial			WP_014206585.1	hypothetical protein	73.8	83.3	85.0
MGA_1428	LOCUS_14260	sequence020:1168..2418(-)	internal_stop_codon	2491..2493(-)		WP_014207909.1	choline BCCT transporter BetT	100.0	63.5	91.6
MGA_1429	LOCUS_14270	sequence020:2491..3135(-)	internal_stop_codon	2491..2493(-)		WP_014207909.1	choline BCCT transporter BetT	100.0	32.7	95.3
MGA_1566	LOCUS_15620	sequence022:40654..41016(+)	partial			WP_013225580.1	cyclophilin-like fold protein	82.5	66.4	48.5
MGA_1587	LOCUS_15820	sequence023:11856..12521(+)	internal_stop_codon	12519..12521(+)		WP_000081480.1	IclR family transcriptional regulator	100.0	78.9	99.5
MGA_1588	LOCUS_15830	sequence023:12540..12698(+)	internal_stop_codon	12519..12521(+)		WP_000081480.1	IclR family transcriptional regulator	100.0	18.6	98.1
MGA_1634	LOCUS_16290	sequence024:18711..19157(-)	partial			WP_014206313.1	DUF4424 family protein	100.0	46.2	93.9
MGA_1635	LOCUS_16300	sequence024:19298..19612(+)	frameshift		19585,19757	WP_015063811.1	FAD-dependent monooxygenase	88.5	22.4	33.3
MGA_1644	LOCUS_16390	sequence024:27864..28226(-)	partial			WP_012256361.1	CorA family divalent cation transporter	82.5	31.8	45.5
MGA_1646	LOCUS_16410	sequence024:29565..30332(-)	partial			WP_014206293.1	EAL domain-containing protein	97.6	54.2	86.7
MGA_1699	LOCUS_16940	sequence025:42803..>43399(-)	partial			WP_014206203.1	alkyl hydroperoxide reductase subunit F	100.0	37.5	98.0
MGA_1732	LOCUS_17270	sequence026:35014..35697(-)	partial			WP_014208165.1	YifB family Mg chelatase-like AAA ATPase	98.2	45.1	95.5
MGA_1733	LOCUS_17280	sequence026:35822..36274(+)	partial			WP_223862839.1	TnsA endonuclease N-terminal domain-containing protein	90.7	58.4	40.4
MGA_1736	LOCUS_17310	sequence026:39554..40192(+)	partial			WP_011102975.1	TniB family NTP-binding protein	76.9	53.7	41.1
MGA_1739	LOCUS_17340	sequence026:41378..>41934(-)	partial			WP_003813546.1	universal stress protein	97.8	63.4	44.2
MGA_1826	LOCUS_18180	sequence029:11635..12216(+)	partial			WP_005804461.1	single-stranded DNA-binding protein	68.4	67.7	99.2
MGA_1851	LOCUS_18430	sequence029:36841..37203(+)	partial			WP_014207953.1	type VI secretion system Vgr family protein	85.0	9.3	32.7
MGA_1854	LOCUS_18460	sequence029:39356..39499(-)	internal_stop_codon	39356..39358(-)		WP_014207879.1	DUF6500 family protein	100.0	65.3	95.7
MGA_1914	LOCUS_19030	sequence031:18694..19014(+)	partial			WP_010635605.1	membrane protein insertion efficiency factor YidD	61.3	84.1	65.2
MGA_2002	LOCUS_19910	sequence033:31667..32056(-)	partial			WP_010919964.1	PaaI family thioesterase	87.6	73.9	27.6
MGA_2012	LOCUS_20000	sequence034:2639..2935(+)	frameshift		2929	WP_014206937.1	DUF421 domain-containing protein	99.0	43.1	82.5
MGA_2013	LOCUS_20010	sequence034:3039..3317(+)	frameshift		2929	WP_014206937.1	DUF421 domain-containing protein	100.0	40.9	93.5
MGA_2076	LOCUS_20640	sequence035:36414..>37010(-)	partial			WP_014206518.1	alkyl hydroperoxide reductase subunit F	100.0	37.5	99.0
MGA_2089	LOCUS_20770	sequence036:12060..12260(+)	partial			WP_002118955.1	NF038104 family lipoprotein	59.1	75.0	84.6
MGA_2118	LOCUS_21050	sequence037:2006..3664(+)	partial			WP_000204763.1	PBSX family phage terminase large subunit	43.8	52.2	35.7
MGA_2134	LOCUS_21210	sequence037:13643..16255(+)	partial			WP_000990884.1	hypothetical protein	42.2	56.6	36.0
MGA_2149	LOCUS_21360	sequence037:26794..27183(-)	partial			WP_024699234.1	hypothetical protein	90.7	68.2	47.0
MGA_2203	LOCUS_21890	sequence039:10455..12944(-)	partial			WP_010951067.1	phage tail protein	97.6	59.4	39.8
MGA_2206	LOCUS_21920	sequence039:13614..15089(-)	partial			WP_011166707.1	BspA family leucine-rich repeat surface protein	53.8	56.2	38.1
MGA_2210	LOCUS_21960	sequence039:18489..21260(-)	partial			WP_010951073.1	tape measure protein	57.7	52.3	24.0
MGA_2225	LOCUS_22110	sequence039:28691..29503(-)	partial			WP_000184977.1	phage minor head protein	68.9	78.9	34.5
MGA_2232	LOCUS_22170	sequence040:1..3178(+)	partial			WP_118839700.1	DEAD/DEAH box helicase family protein	30.8	41.1	25.5
MGA_2345	LOCUS_23300	sequence043:21509..22579(+)	frameshift		22558	WP_014206684.1	ABC transporter substrate-binding protein	96.3	72.1	98.3
MGA_2346	LOCUS_23310	sequence043:22572..22937(+)	frameshift		22558	WP_014206684.1	ABC transporter substrate-binding protein	100.0	25.4	96.7
MGA_2361	LOCUS_23460	sequence044:5271..5633(-)	partial			WP_029304069.1	copper-binding protein	69.2	69.2	41.0
MGA_2417	LOCUS_24020	sequence046:4293..7532(+)	internal_stop_codon	7530..7532(+)		WP_014208106.1	non-ribosomal peptide synthetase	100.0	81.8	89.0
MGA_2418	LOCUS_24030	sequence046:7611..8252(+)	internal_stop_codon	7530..7532(+)		WP_014208106.1	non-ribosomal peptide synthetase	99.5	16.1	93.4
MGA_2462	LOCUS_24460	sequence047:27051..27671(-)	partial			WP_003704933.1	NeuD/PglB/VioB family sugar acetyltransferase	94.7	47.2	60.5
MGA_2465	LOCUS_24490	sequence047:29556..30497(-)	partial			WP_010965472.1	glycosyltransferase	75.1	72.7	34.0
MGA_2471	LOCUS_24550	sequence048:4161..4496(-)	partial			WP_002121079.1	Rieske (2Fe-2S) protein	72.1	79.4	38.3
MGA_2492	LOCUS_24760	sequence049:1..1293(+)	partial			WP_014206344.1	type VI secretion system Vgr family protein	99.3	40.9	81.7
MGA_2513	LOCUS_24970	sequence049:19548..20186(+)	frameshift		20162	WP_014208096.1	CoA-acylating methylmalonate-semialdehyde dehydrogenase	97.2	40.8	94.7
MGA_2514	LOCUS_24980	sequence049:20173..21063(+)	frameshift		20165	WP_014208096.1	CoA-acylating methylmalonate-semialdehyde dehydrogenase	100.0	58.6	95.3
MGA_2546	LOCUS_25300	sequence051:91..498(-)	frameshift,internal_stop_codon	559..561(-)	150	WP_014208136.1	TetR/AcrR family transcriptional regulator	88.9	63.5	87.5
MGA_2602	LOCUS_25860	sequence053:1..514(+)	partial			WP_014206899.1	3-oxoadipyl-CoA thiolase	100.0	42.1	97.1
MGA_2632	LOCUS_26160	sequence054:1531..2820(+)	partial			WP_011073221.1	type IV pilus twitching motility protein PilT	63.9	73.3	31.3
MGA_2642	LOCUS_26260	sequence054:10597..11481(+)	partial			WP_004466992.1	ParA family protein	68.0	73.5	31.2
MGA_2643	LOCUS_26270	sequence054:11485..12366(+)	partial			WP_038965125.1	ParB/RepB/Spo0J family partition protein	46.4	47.5	29.1
MGA_2646	LOCUS_26300	sequence054:14917..15339(-)	partial			WP_005069871.1	translesion error-prone DNA polymerase V autoproteolytic subunit	92.1	65.5	63.9
MGA_2647	LOCUS_26310	sequence054:15702..17360(-)	partial			WP_000331690.1	LPD5 domain-containing protein	50.7	9.5	33.2
MGA_2651	LOCUS_26350	sequence054:18420..20255(-)	partial			WP_002666722.1	M23 family metallopeptidase	19.0	33.5	36.8
MGA_2674	LOCUS_26570	sequence055:15081..15515(+)	internal_stop_codon	15018..15020(+)		WP_014207048.1	AceI family chlorhexidine efflux PACE transporter	100.0	82.8	95.8
MGA_2729	LOCUS_27090	sequence058:1163..1786(+)	internal_stop_codon	1784..1786(+)		WP_014207712.1	acyl-CoA dehydrogenase family protein	100.0	53.5	95.2
MGA_2730	LOCUS_27100	sequence058:1808..2326(+)	internal_stop_codon	1784..1786(+)		WP_014207712.1	acyl-CoA dehydrogenase family protein	100.0	44.4	98.3
MGA_2756	LOCUS_27360	sequence059:41..733(-)	frameshift		909	WP_188825379.1	IS3 family transposase	97.0	58.8	63.2
MGA_2766	LOCUS_27460	sequence059:11253..11402(-)	partial			WP_002118887.1	lipoprotein	100.0	65.8	65.3
MGA_2872	LOCUS_28510	sequence064:3309..7289(+)	partial			WP_011104844.1	phage tail tape measure protein	56.3	67.3	28.8
MGA_2883	LOCUS_28620	sequence064:18002..18919(-)	partial			WP_015706186.1	tyrosine-type recombinase/integrase	85.9	64.3	33.8
MGA_2889	LOCUS_28680	sequence064:21916..22413(-)	partial			WP_005069871.1	translesion error-prone DNA polymerase V autoproteolytic subunit	84.2	71.4	64.8
MGA_2904	LOCUS_28830	sequence065:15059..15307(-)	partial			WP_014206567.1	hypothetical protein	43.9	78.3	83.3
MGA_2915	LOCUS_28940	sequence065:23579..23929(-)	internal_stop_codon	23975..23977(-)		WP_014206556.1	hypothetical protein	100.0	60.4	87.9
MGA_3066	LOCUS_30420	sequence073:1026..1475(+)	partial			WP_000336721.1	IS3 family transposase	97.3	53.3	51.0
MGA_3068	LOCUS_30440	sequence073:3237..3566(-)	partial			WP_000506893.1	DUF4236 domain-containing protein	68.8	18.4	44.0
MGA_3074	LOCUS_30500	sequence073:9897..11768(-)	partial			WP_002209923.1	primase-like DNA-binding domain-containing protein	23.6	17.4	37.4
MGA_3158	LOCUS_31330	sequence077:8234..8689(+)	internal_stop_codon	8687..8689(+)		WP_014206714.1	AraC family transcriptional regulator	100.0	42.9	96.7
MGA_3159	LOCUS_31340	sequence077:8789..9292(+)	internal_stop_codon	8687..8689(+)		WP_014206714.1	AraC family transcriptional regulator	100.0	47.4	97.0
MGA_3231	LOCUS_32040	sequence082:376..2388(-)	partial			WP_013095179.1	ATP-binding protein	35.4	27.1	32.1
MGA_3248	LOCUS_32210	sequence082:13361..13699(-)	partial			WP_000801427.1	H-NS histone family protein	71.4	71.3	42.5
MGA_3260	LOCUS_32330	sequence083:10359..10670(+)	partial			WP_164925740.1	helix-turn-helix transcriptional regulator	85.4	66.2	39.8
MGA_3290	LOCUS_32620	sequence086:1..782(+)	partial			WP_014207039.1	DNA polymerase III subunit gamma/tau	99.6	38.2	83.2
MGA_3355	LOCUS_33270	sequence091:1..505(+)	partial			WP_014206899.1	3-oxoadipyl-CoA thiolase	100.0	41.3	97.6
MGA_3401	LOCUS_33690	sequence095:957..1181(-)	partial			WP_010974257.1	helix-turn-helix domain-containing protein	93.2	71.9	46.4
MGA_3461	LOCUS_34260	sequence100:5228..6409(-)	partial			WP_012870447.1	ParB/RepB/Spo0J family partition protein	55.0	65.9	30.0
MGA_3476	LOCUS_34390	sequence102:1..1158(+)	partial			WP_014206351.1	type VI secretion system Vgr family protein	99.7	44.9	94.8
MGA_3480	LOCUS_34430	sequence102:5633..6109(+)	frameshift		6088	WP_005304004.1	putative type VI secretion system effector	98.7	60.5	75.0
MGA_3481	LOCUS_34440	sequence102:6123..6416(+)	frameshift		6094	WP_005304004.1	putative type VI secretion system effector	95.9	36.0	78.5
MGA_3483	LOCUS_34460	sequence102:7589..8293(-)	partial			WP_081403079.1	formylglycine-generating enzyme family protein	46.2	66.8	28.7
MGA_3487	LOCUS_34490	sequence103:1189..1698(-)	partial			WP_002222513.1	hypothetical protein	74.6	59.2	29.1
MGA_3513	LOCUS_34740	sequence105:2699..2929(-)	partial			WP_014207661.1	hypothetical protein	76.3	74.4	89.7
MGA_3520	LOCUS_34810	sequence106:1167..1568(-)	partial			WP_011705908.1	hypothetical protein	76.7	73.6	42.9
MGA_3524	LOCUS_34850	sequence106:2205..3167(-)	partial			WP_000086416.1	DnaT-like ssDNA-binding domain-containing protein	50.3	55.2	34.2
MGA_3533	LOCUS_34930	sequence107:1..942(+)	partial			WP_014208422.1	anthranilate synthase component I family protein	100.0	69.6	83.1
MGA_3541	LOCUS_35010	sequence108:1..754(+)	partial			WP_002219732.1	replication initiation protein RepM	77.2	57.5	50.8
MGA_3546	LOCUS_35060	sequence108:5769..5954(+)	partial			WP_005461253.1	AI-2E family transporter	65.6	11.1	75.0
MGA_3567	LOCUS_35260	sequence110:5401..5802(+)	partial			WP_011705908.1	hypothetical protein	51.9	49.3	47.8
MGA_3571	LOCUS_35300	sequence111:42..680(+)	partial			WP_001220164.1	TetR/AcrR family transcriptional regulator	40.1	39.8	28.2
MGA_3612	LOCUS_35710	sequence116:1827..2180(-)	partial			WP_003857248.1	DUF202 domain-containing protein	75.2	72.1	37.8
MGA_3623	LOCUS_35820	sequence117:5213..5851(+)	internal_stop_codon	5849..5851(+)		WP_014206658.1	HRDC domain-containing protein	100.0	56.7	92.9
MGA_3624	LOCUS_35830	sequence117:5852..6337(+)	internal_stop_codon	5849..5851(+)		WP_014206658.1	HRDC domain-containing protein	98.8	42.5	86.8
MGA_3625	LOCUS_35840	sequence118:266..895(+)	partial			WP_011038959.1	hypothetical protein	49.3	35.1	35.0
MGA_3667	LOCUS_36200	sequence125:3015..5255(+)	partial			WP_003244876.1	N-acetylmuramoyl-L-alanine amidase	7.6	18.0	49.1
MGA_3705	LOCUS_36530	sequence134:1124..1732(+)	partial			WP_014206866.1	hypothetical protein	74.3	74.9	31.4
MGA_3724	LOCUS_36690	sequence138:1097..1984(+)	partial			WP_051000362.1	AraC family transcriptional regulator	68.5	61.0	31.7
MGA_3734	LOCUS_36790	sequence140:1743..1919(-)	partial			WP_014206735.1	hypothetical protein	100.0	9.9	94.8
MGA_3735	LOCUS_36800	sequence140:2029..2277(-)	partial			WP_014206735.1	hypothetical protein	32.9	4.6	96.3
MGA_3739	LOCUS_36830	sequence141:483..1139(+)	frameshift		1133	WP_014207062.1	minor capsid protein	99.5	59.0	68.7
MGA_3740	LOCUS_36840	sequence141:1327..1590(+)	frameshift		1136	WP_014207062.1	minor capsid protein	100.0	23.6	81.6
MGA_3746	LOCUS_36900	sequence142:896..1696(+)	partial			WP_011261955.1	DUF2971 domain-containing protein	41.7	58.6	40.5
MGA_3763	LOCUS_37030	sequence146:310..849(-)	partial			WP_013531251.1	CmlA/FloR family chloramphenicol efflux MFS transporter	81.6	36.7	47.3
MGA_3779	LOCUS_37150	sequence151:5..832(+)	partial			WP_005787233.1	RsiV family protein	36.7	37.0	35.2
MGA_3788	LOCUS_37210	sequence153:449..1564(+)	partial			WP_054186121.1	TniQ family protein	48.0	47.8	29.4
MGA_3792	LOCUS_37230	sequence154:1257..1805(-)	frameshift,internal_stop_codon	1844..1846(-)	1891	WP_014206869.1	TetR/AcrR family transcriptional regulator	98.9	82.1	76.7
MGA_3799	LOCUS_37300	sequence156:1706..>2709(-)	partial			WP_011073024.1	ABC transporter ATP-binding protein	100.0	54.0	76.6
MGA_3803	LOCUS_37330	sequence158:960..1601(-)	partial			WP_002115248.1	ATP-binding protein	100.0	72.7	88.7
MGA_3804	LOCUS_37340	sequence158:1520..2074(-)	partial			WP_003233883.1	ATP-dependent helicase	84.8	25.9	66.0
MGA_3812	LOCUS_37400	sequence161:1..556(+)	partial			WP_005066014.1	DNA-binding transcriptional regulator HcaR	96.7	59.1	37.1
MGA_3823	LOCUS_37480	sequence166:61..372(-)	frameshift		102	WP_188825379.1	IS3 family transposase	85.4	23.2	96.6
MGA_3824	LOCUS_37490	sequence166:425..718(-)	partial			WP_002063889.1	AAA family ATPase	89.7	48.3	100.0
MGA_3835	LOCUS_37570	sequence169:171..1016(+)	partial			WP_011707856.1	porin OmpA	44.5	33.2	36.0
MGA_3840	LOCUS_37600	sequence171:26..1756(-)	partial			WP_015040403.1	retention module-containing protein	71.5	22.0	28.5
MGA_3850	LOCUS_37690	sequence176:487..1059(-)	frameshift		1069	WP_014206869.1	TetR/AcrR family transcriptional regulator	94.7	82.1	73.9
MGA_3892	LOCUS_37890	sequence200:140..460(-)	frameshift		690,557	WP_014207949.1	haloacid dehalogenase-like hydrolase	83.0	40.4	90.9
MGA_3940	LOCUS_38200	sequence222:29802..30164(+)	frameshift,internal_stop_codon	30175..30177(+),30235..30237(+),30169..30171(+)	30119	WP_014208312.1	hypothetical protein	90.8	70.8	70.6
MGA_3981	LOCUS_38610	sequence224:6934..7182(-)	partial			WP_014206567.1	hypothetical protein	43.9	78.3	83.3
MGA_3992	LOCUS_38720	sequence224:15454..15804(-)	internal_stop_codon	15850..15852(-)		WP_014206556.1	hypothetical protein	100.0	60.4	87.9
MGA_4012	LOCUS_38910	sequence226:2383..3042(+)	partial			WP_013531251.1	CmlA/FloR family chloramphenicol efflux MFS transporter	79.5	43.7	49.4
MGA_4018	LOCUS_38970	sequence227:1524..1709(-)	partial			WP_005461253.1	AI-2E family transporter	65.6	11.1	75.0
MGA_4034	LOCUS_39110	sequence230:1747..2757(-)	partial			WP_011073024.1	ABC transporter ATP-binding protein	100.0	54.5	76.2
MGA_4036	LOCUS_39130	sequence231:1001..1642(-)	partial			WP_002115248.1	ATP-binding protein	100.0	72.7	88.7
MGA_4037	LOCUS_39140	sequence231:1561..2115(-)	partial			WP_003233883.1	ATP-dependent helicase	84.8	25.9	66.0
MGA_4043	LOCUS_39180	sequence233:956..1249(+)	partial			WP_002063889.1	AAA family ATPase	89.7	48.3	100.0
MGA_4044	LOCUS_39190	sequence233:1302..1613(+)	frameshift		1571	WP_188825379.1	IS3 family transposase	85.4	23.2	96.6
