# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_88	LOCUS_00030	sequence085:31..150(-)	frameshift		179	WP_011475483.1	IS200/IS605 family transposase	92.3	23.2	80.6
MGA_89	LOCUS_00040	sequence085:141..494(-)	frameshift		179	WP_011475483.1	IS200/IS605 family transposase	90.6	68.4	88.7
MGA_107	LOCUS_00090	sequence098:139..408(+)	frameshift		496,81,381,75,141	WP_003642759.1	glucose-6-phosphate isomerase	89.9	17.8	73.8
MGA_113	LOCUS_00110	sequence100:84..434(+)	frameshift		404	WP_100190734.1	IS3 family transposase	82.8	18.4	39.2
MGA_128	LOCUS_00230	sequence103:8715..9806(+)	partial			WP_028730510.1	FRG domain-containing protein	32.0	23.1	35.3
MGA_138	LOCUS_00290	sequence106:29..445(-)	partial			WP_001274758.1	LexA family transcriptional regulator	99.3	57.8	92.0
MGA_139	LOCUS_00300	sequence106:546..977(+)	partial			WP_000185503.1	replication protein	83.9	40.1	100.0
MGA_141	LOCUS_00310	sequence106:4113..4241(-)	partial			WP_015038860.1	conjugative transfer ATPase	76.2	3.3	78.1
MGA_142	LOCUS_00320	sequence106:4329..4592(+)	partial			WP_013087128.1	site-specific integrase	60.9	20.5	77.4
MGA_151	LOCUS_00400	sequence107:3109..3648(+)	partial			WP_010905374.1	phage terminase small subunit P27 family	62.0	73.3	39.6
MGA_155	LOCUS_00440	sequence107:6908..8815(+)	partial			WP_010905379.1	phage major capsid protein	54.5	78.5	56.9
MGA_169	LOCUS_00570	sequence107:20278..20787(+)	partial			WP_010966366.1	Ig-like domain-containing protein	78.7	19.5	32.4
MGA_197	LOCUS_00830	sequence107:33872..34402(+)	partial			WP_001173389.1	DUF669 domain-containing protein	62.5	64.4	30.9
MGA_218	LOCUS_01040	sequence108:2019..5027(+)	internal_stop_codon	1935..1937(+)		WP_011836594.1	SEC10/PgrA surface exclusion domain-containing protein	72.6	75.8	20.7
MGA_249	LOCUS_01320	sequence108:42158..42751(+)	frameshift		42652	WP_011101332.1	FGGY family carbohydrate kinase	84.3	32.5	49.4
MGA_250	LOCUS_01330	sequence108:42646..43746(+)	frameshift		42673	WP_003563002.1	gluconokinase	90.7	64.0	49.1
MGA_281	LOCUS_01630	sequence108:76553..77107(+)	partial			WP_011101020.1	DNA-directed RNA polymerase subunit delta	63.0	56.8	72.4
MGA_313	LOCUS_01950	sequence108:114501..114821(+)	partial			WP_015705465.1	nitronate monooxygenase	88.7	28.9	35.1
MGA_419	LOCUS_03000	sequence109:110577..110732(+)	internal_stop_codon	110730..110732(+)		WP_000998260.1	glycosyltransferase	90.2	6.6	43.5
MGA_420	LOCUS_03010	sequence109:110874..111773(+)	internal_stop_codon	110730..110732(+)		WP_000998260.1	glycosyltransferase	99.3	43.1	32.5
MGA_422	LOCUS_03030	sequence109:113664..115457(-)	partial			WP_002326842.1	LTA synthase family protein	97.3	64.1	40.6
MGA_450	LOCUS_03300	sequence109:147188..148030(+)	partial			WP_003641072.1	CdaR family protein	81.8	70.8	39.6
MGA_463	LOCUS_03430	sequence109:162153..163118(-)	partial			WP_002679604.1	Rpn family recombination-promoting nuclease/putative transposase	67.9	84.6	31.7
MGA_495	LOCUS_03740	sequence109:195791..196009(+)	partial			WP_000052064.1	F0F1 ATP synthase subunit C	73.6	73.6	58.5
MGA_514	LOCUS_03930	sequence109:213536..214210(+)	frameshift		214183	WP_005808874.1	group II intron reverse transcriptase/maturase	78.6	37.5	55.7
MGA_515	LOCUS_03940	sequence109:214188..214925(+)	frameshift		214201	WP_010966780.1	group II intron reverse transcriptase/maturase	96.3	50.2	45.8
MGA_517	LOCUS_03960	sequence109:215851..216672(-)	frameshift		216844,216709	WP_011102220.1	GntR family transcriptional regulator	96.7	73.7	51.5
MGA_518	LOCUS_03970	sequence109:216600..216842(-)	frameshift		216844,216709	WP_011102220.1	GntR family transcriptional regulator	55.0	12.0	81.8
MGA_553	LOCUS_04320	sequence109:258906..259451(+)	frameshift		259385	WP_011101707.1	DNA mismatch repair endonuclease MutL	88.4	23.3	68.1
MGA_554	LOCUS_04330	sequence109:259474..260955(+)	frameshift		259391	WP_011101707.1	DNA mismatch repair endonuclease MutL	97.6	74.0	52.4
MGA_575	LOCUS_04540	sequence109:279774..280205(+)	partial			WP_002357316.1	DUF948 domain-containing protein	71.3	76.2	37.6
MGA_582	LOCUS_04610	sequence109:285148..285663(+)	partial			WP_011475746.1	competence type IV pilus assembly protein ComGB	94.2	45.1	33.5
MGA_596	LOCUS_04740	sequence110:2157..4766(+)	internal_stop_codon	2148..2150(+)		WP_010890786.1	MMPL family transporter	96.1	82.9	31.3
MGA_599	LOCUS_04770	sequence110:7962..8963(+)	partial			WP_002287681.1	Fe-S cluster assembly protein SufD	81.1	72.2	22.3
MGA_627	LOCUS_05030	sequence110:38927..39982(+)	partial			WP_011836915.1	glucosaminidase domain-containing protein	47.6	72.4	47.6
MGA_725	LOCUS_05970	sequence110:125924..126214(+)	partial			WP_003547938.1	exodeoxyribonuclease VII small subunit	69.8	83.8	53.7
MGA_780	LOCUS_06500	sequence110:171800..172456(+)	partial			WP_000031367.1	ERF family protein	62.4	66.7	59.1
MGA_782	LOCUS_06520	sequence110:173117..173965(+)	partial			WP_011860882.1	conserved phage C-terminal domain-containing protein	33.7	21.4	35.8
MGA_797	LOCUS_06670	sequence110:181316..181999(+)	frameshift,internal_stop_codon	181208..181210(+)	181658,181636	WP_011674653.1	PBSX family phage terminase large subunit	88.5	49.6	29.4
MGA_809	LOCUS_06790	sequence110:189916..193953(+)	partial			WP_011475661.1	tape measure protein	31.4	31.3	34.3
MGA_810	LOCUS_06800	sequence110:194271..194936(+)	partial			WP_011475956.1	phage tail family protein	76.9	56.8	38.0
MGA_811	LOCUS_06810	sequence110:194933..197173(+)	partial			WP_011475663.1	phage tail protein	40.2	38.4	38.7
MGA_812	LOCUS_06820	sequence110:197185..198570(+)	partial			WP_013389917.1	GH25 family lysozyme	51.4	66.9	35.4
MGA_822	LOCUS_06920	sequence110:204754..205848(+)	partial			WP_010774154.1	GH25 family lysozyme	57.1	52.2	45.6
MGA_824	LOCUS_06940	sequence110:206469..206999(+)	partial			WP_000117962.1	tail fiber protein	83.5	21.6	34.9
MGA_831	LOCUS_07000	sequence110:210660..211322(+)	partial			WP_011475497.1	matrixin family metalloprotease	70.0	70.0	56.5
MGA_832	LOCUS_07010	sequence110:211406..212677(-)	frameshift		212763	WP_011475563.1	heavy metal translocating P-type ATPase	98.8	68.9	66.5
MGA_833	LOCUS_07020	sequence110:212758..213225(-)	frameshift		212766	WP_011475563.1	heavy metal translocating P-type ATPase	98.7	25.5	66.9
MGA_848	LOCUS_07170	sequence110:228899..229108(+)	internal_stop_codon	229106..229108(+)		WP_012972583.1	sugar transferase	100.0	20.8	43.7
MGA_849	LOCUS_07180	sequence110:229357..229797(+)	frameshift,internal_stop_codon	229106..229108(+)	229390,229735	WP_001263776.1	sugar transferase	78.8	34.0	33.1
MGA_944	LOCUS_08100	sequence111:66141..67706(+)	partial			WP_011101661.1	DNA internalization-related competence protein ComEC/Rec2	98.1	67.8	39.6
MGA_968	LOCUS_08330	sequence111:94475..95623(+)	partial			WP_000072627.1	restriction endonuclease subunit S	55.0	50.4	42.5
MGA_974	LOCUS_08370	sequence111:101743..102375(-)	partial			WP_011948401.1	restriction endonuclease subunit S	85.7	47.2	38.7
MGA_1036	LOCUS_08990	sequence111:168254..168922(+)	partial			WP_004255026.1	amino acid ABC transporter permease	91.4	70.2	32.5
MGA_1058	LOCUS_09190	sequence111:188036..188254(+)	partial			WP_011101154.1	argininosuccinate lyase	97.2	15.0	55.7
MGA_1127	LOCUS_09860	sequence111:261587..262072(+)	partial			WP_012583929.1	DUF438 domain-containing protein	72.0	28.6	31.9
MGA_1141	LOCUS_09990	sequence111:273235..273630(-)	internal_stop_codon	273772..273774(-)		WP_011254160.1	LysR family transcriptional regulator	91.6	41.0	45.8
MGA_1142	LOCUS_10000	sequence111:273772..273933(-)	internal_stop_codon	273772..273774(-)		WP_011254160.1	LysR family transcriptional regulator	100.0	18.1	73.6
MGA_1144	LOCUS_10020	sequence111:274167..274298(+)	frameshift		274253	WP_002288289.1	alpha/beta hydrolase	72.1	9.6	71.0
MGA_1145	LOCUS_10030	sequence111:274300..275130(+)	frameshift		274253	WP_002288289.1	alpha/beta hydrolase	100.0	84.3	62.3
MGA_1154	LOCUS_10120	sequence111:284911..285201(+)	frameshift		285177	WP_011674828.1	MDR family MFS transporter	82.3	16.3	35.4
MGA_1155	LOCUS_10130	sequence111:285324..286121(+)	frameshift,internal_stop_codon	286120..286122(+)	285177	WP_003733258.1	cholic acid efflux MFS transporter MdrT	100.0	53.5	45.3
MGA_1163	LOCUS_10200	sequence111:292616..293341(-)	frameshift,internal_stop_codon	293412..293414(-)	293327	WP_011101922.1	LysR family transcriptional regulator	98.3	80.9	45.5
MGA_1165	LOCUS_10220	sequence111:293650..294252(+)	internal_stop_codon	294250..294252(+)		WP_003547290.1	aldo/keto reductase	100.0	70.3	68.7
MGA_1166	LOCUS_10230	sequence111:294331..294471(+)	internal_stop_codon	294250..294252(+)		WP_003547290.1	aldo/keto reductase	95.7	15.4	86.4
MGA_1173	LOCUS_10290	sequence111:299289..299651(+)	internal_stop_codon	299879..299881(+)		WP_025080575.1	alpha/beta hydrolase	65.8	26.5	53.2
MGA_1175	LOCUS_10310	sequence111:300432..300977(+)	internal_stop_codon	300975..300977(+)		WP_011836955.1	alpha/beta hydrolase	92.3	60.9	49.7
MGA_1176	LOCUS_10320	sequence111:301020..301337(+)	internal_stop_codon	300975..300977(+)		WP_172824466.1	alpha/beta hydrolase	81.0	30.2	62.4
MGA_1239	LOCUS_10910	sequence111:372544..373680(+)	frameshift		372523	WP_162038636.1	IS110 family transposase	95.2	83.5	49.7
MGA_1240	LOCUS_10920	sequence111:374186..374902(-)	frameshift		374864	WP_000547977.1	aldo/keto reductase	89.9	78.5	44.2
MGA_1247	LOCUS_10990	sequence111:379929..380378(-)	partial			WP_011101131.1	GH25 family lysozyme	50.3	19.4	36.0
MGA_1248	LOCUS_11000	sequence111:380541..380846(-)	internal_stop_codon	380541..380543(-)		WP_013389917.1	GH25 family lysozyme	75.2	21.3	51.3
MGA_1252	LOCUS_11040	sequence111:384173..384634(+)	partial			WP_002286319.1	LysR family transcriptional regulator	85.0	45.1	27.6
MGA_1255	LOCUS_11070	sequence111:386528..387175(+)	partial			WP_003564898.1	hypothetical protein	82.3	70.7	33.1
MGA_1265	LOCUS_11160	sequence111:395487..395798(-)	partial			WP_011084122.1	glucose 1-dehydrogenase	82.5	34.0	42.9
MGA_1270	LOCUS_11210	sequence111:398624..402145(-)	partial			WP_041272308.1	DEAD/DEAH box helicase	58.8	65.0	40.0
MGA_1275	LOCUS_11250	sequence111:404807..405013(+)	frameshift		405004	WP_125607117.1	IS30 family transposase	79.4	17.6	55.6
MGA_1278	LOCUS_11270	sequence111:408017..408994(-)	partial			WP_011922118.1	glycosyltransferase family 2 protein	67.4	64.4	37.2
MGA_1310	LOCUS_11580	sequence112:34912..35202(-)	frameshift		35290	WP_003130468.1	deoxyribose-phosphate aldolase	96.9	42.3	69.9
MGA_1311	LOCUS_11590	sequence112:35282..35581(-)	frameshift		35290	WP_011949107.1	deoxyribose-phosphate aldolase	91.9	42.9	60.4
MGA_1333	LOCUS_11810	sequence112:59703..62738(-)	internal_stop_codon	62766..62768(-)		WP_011476621.1	LPXTG cell wall anchor domain-containing protein	18.4	37.7	31.2
MGA_1335	LOCUS_11830	sequence112:63171..66941(+)	partial			WP_011101323.1	MucBP domain-containing protein	35.4	37.4	24.6
MGA_1339	LOCUS_11870	sequence112:70440..71006(-)	partial			WP_011101897.1	PAS domain-containing protein	98.4	42.9	46.5
MGA_1343	LOCUS_11910	sequence112:75896..76297(+)	partial			WP_071742188.1	hypothetical protein	69.9	84.0	33.3
MGA_1357	LOCUS_12050	sequence112:90010..90327(-)	partial			WP_011102010.1	hypothetical protein	98.1	74.5	41.0
MGA_1379	LOCUS_12270	sequence112:118492..119358(+)	partial			WP_011837699.1	DUF4097 family beta strand repeat-containing protein	35.4	29.5	31.4
MGA_1380	LOCUS_12280	sequence112:119468..119812(-)	frameshift		119771	WP_003644879.1	iron-containing alcohol dehydrogenase	87.7	25.9	69.3
MGA_1381	LOCUS_12290	sequence112:119766..120641(-)	frameshift		119771	WP_003644879.1	iron-containing alcohol dehydrogenase	98.3	73.3	77.3
MGA_1382	LOCUS_12300	sequence112:120782..121330(-)	partial			WP_013229998.1	NAD(P)H-dependent oxidoreductase	80.2	44.0	41.5
MGA_1383	LOCUS_12310	sequence112:121552..123996(-)	partial			WP_207215633.1	MucBP domain-containing protein	43.4	29.1	25.3
MGA_1427	LOCUS_12720	sequence112:167827..168195(+)	frameshift		167605	WP_003644005.1	biotin--[acetyl-CoA-carboxylase] ligase	91.0	34.3	30.1
MGA_1438	LOCUS_12830	sequence112:181836..182393(-)	partial			WP_003550024.1	PepSY domain-containing protein	78.4	72.3	45.6
MGA_1446	LOCUS_12910	sequence112:189937..190395(-)	partial			WP_003548090.1	EAL domain-containing protein	100.0	57.7	40.3
MGA_1464	LOCUS_13080	sequence112:207614..208312(+)	partial			WP_011084101.1	RibD family protein	47.4	44.9	31.8
MGA_1471	LOCUS_13150	sequence112:211894..212646(-)	frameshift		212864	WP_003547400.1	5-methyltetrahydropteroyltriglutamate--homocysteine S-methyltransferase	99.6	66.9	70.3
MGA_1474	LOCUS_13170	sequence112:215008..215934(-)	internal_stop_codon	216025..216027(-)		WP_011674806.1	C69 family dipeptidase	100.0	64.4	68.8
MGA_1475	LOCUS_13180	sequence112:216025..216438(-)	internal_stop_codon	216025..216027(-)		WP_011674806.1	C69 family dipeptidase	98.5	28.4	78.5
MGA_1476	LOCUS_13190	sequence112:216521..217234(-)	partial			WP_002357427.1	response regulator transcription factor	74.3	73.3	37.3
MGA_1484	LOCUS_13270	sequence112:224616..225164(+)	frameshift,internal_stop_codon	224586..224588(+)	225149	WP_003644782.1	MFS transporter	96.2	41.8	66.3
MGA_1485	LOCUS_13280	sequence112:225187..225798(+)	frameshift		225149	WP_003644782.1	MFS transporter	98.0	47.8	68.8
MGA_1497	LOCUS_13400	sequence112:238003..238359(-)	partial			WP_002321425.1	metalloregulator ArsR/SmtB family transcription factor	73.7	75.0	44.8
MGA_1498	LOCUS_13410	sequence112:238449..240407(-)	partial			WP_010706701.1	autolysin	73.9	66.9	35.3
MGA_1505	LOCUS_13480	sequence112:246749..247390(-)	partial			WP_164924808.1	NAD(P)H-hydrate dehydratase	95.8	39.6	37.2
MGA_1575	LOCUS_14150	sequence112:318482..318901(-)	partial			WP_011100921.1	energy-coupling factor transporter transmembrane component T	99.3	63.0	53.6
MGA_1582	LOCUS_14220	sequence112:326241..326954(-)	frameshift,internal_stop_codon	326240..326242(-)	327052	WP_011101835.1	LTA synthase family protein	98.3	32.4	61.4
MGA_1583	LOCUS_14230	sequence112:326966..328423(-)	frameshift		327052	WP_011101835.1	LTA synthase family protein	93.8	63.2	66.4
MGA_1588	LOCUS_14280	sequence112:332694..333152(-)	partial			WP_000675241.1	DNA-binding domain-containing protein	98.0	53.8	34.2
MGA_1592	LOCUS_14310	sequence112:338307..339419(+)	frameshift		339386	WP_010966780.1	group II intron reverse transcriptase/maturase	98.1	78.3	47.7
MGA_1635	LOCUS_14740	sequence112:392879..393295(+)	partial			WP_003641117.1	hypothetical protein	28.3	23.1	69.2
MGA_1642	LOCUS_14800	sequence112:401213..401398(+)	partial			WP_003546918.1	CsbD family protein	55.7	59.6	67.6
MGA_1656	LOCUS_14920	sequence112:418263..418430(+)	internal_stop_codon	418428..418430(+)		WP_003817429.1	GyrI-like domain-containing protein	100.0	40.3	37.9
MGA_1657	LOCUS_14930	sequence112:418497..418808(+)	internal_stop_codon	418428..418430(+)		WP_003548076.1	GyrI-like domain-containing protein	98.1	48.6	64.4
MGA_1665	LOCUS_15000	sequence112:426804..427484(+)	partial			WP_001259486.1	matrixin family metalloprotease	78.8	71.6	31.9
MGA_1675	LOCUS_15100	sequence112:436964..437557(+)	partial			WP_012258317.1	class I SAM-dependent methyltransferase	59.9	49.6	30.1
MGA_1678	LOCUS_15130	sequence112:440054..441040(-)	frameshift		440059	WP_011475486.1	ABC-F type ribosomal protection protein	96.6	63.7	48.7
MGA_1681	LOCUS_15160	sequence112:443216..444907(+)	partial			WP_011836786.1	CshA/CshB family fibrillar adhesin-related protein	50.3	11.2	29.5
MGA_1689	LOCUS_15240	sequence112:453668..454231(-)	partial			WP_135794525.1	serine hydrolase	95.7	66.3	40.1
MGA_1694	LOCUS_15280	sequence112:458827..460365(+)	partial			WP_011123196.1	helix-turn-helix domain-containing protein	28.1	50.7	29.9
MGA_1719	LOCUS_15530	sequence112:489981..490310(-)	partial			WP_011101188.1	transporter substrate-binding domain-containing protein	98.2	38.5	74.8
MGA_1785	LOCUS_16170	sequence112:548210..548839(+)	partial			WP_003703028.1	glycoside hydrolase family 73 protein	71.8	67.9	59.6
MGA_1802	LOCUS_16320	sequence112:568524..570860(-)	partial			WP_011030338.1	phage/plasmid primase, P4 family	39.6	40.2	28.8
MGA_1815	LOCUS_16440	sequence112:584255..585265(+)	partial			WP_023905931.1	Abi family protein	74.7	74.3	27.6
MGA_1819	LOCUS_16480	sequence112:590179..590403(-)	partial			WP_225852596.1	recombinase family protein	100.0	22.6	64.9
MGA_1831	LOCUS_16580	sequence112:600847..602373(+)	partial			WP_019318694.1	bifunctional glutamate--cysteine ligase GshA/glutathione synthetase GshB	92.3	60.1	31.6
MGA_1837	LOCUS_16640	sequence112:607303..607914(+)	partial			WP_002262616.1	helix-turn-helix transcriptional regulator	41.9	68.1	42.4
MGA_1839	LOCUS_16660	sequence112:609275..609868(-)	frameshift		609918	WP_011475480.1	Rpn family recombination-promoting nuclease/putative transposase	77.2	60.4	29.9
MGA_1845	LOCUS_16720	sequence112:614694..615053(+)	partial			WP_000125656.1	type II toxin-antitoxin system PemK/MazF family toxin	73.1	75.2	49.4
MGA_1859	LOCUS_16860	sequence112:626181..628013(+)	partial			WP_011476414.1	KxYKxGKxW signal peptide domain-containing protein	76.6	52.7	38.9
MGA_1863	LOCUS_16900	sequence112:631347..633461(-)	partial			WP_010964394.1	hypothetical protein	54.0	13.1	38.9
MGA_1864	LOCUS_16910	sequence112:633644..635767(+)	partial			WP_010964394.1	hypothetical protein	66.8	16.4	34.7
MGA_1869	LOCUS_16940	sequence112:642600..643313(+)	partial			WP_011017006.1	sugar phosphate nucleotidyltransferase	95.4	41.9	40.9
MGA_1880	LOCUS_17030	sequence112:657081..659699(+)	partial			WP_010964394.1	hypothetical protein	72.5	21.1	33.5
MGA_1881	LOCUS_17040	sequence112:659814..661820(+)	partial			WP_010964394.1	hypothetical protein	53.0	13.5	34.1
MGA_1882	LOCUS_17050	sequence112:662029..663333(+)	partial			WP_000728266.1	phosphorylcholine esterase CbpE	51.6	33.8	35.6
MGA_1884	LOCUS_17070	sequence112:664020..664997(+)	partial			WP_011254543.1	DUF4767 domain-containing protein	40.3	39.9	36.8
MGA_1886	LOCUS_17090	sequence112:666959..669103(+)	partial			WP_010964394.1	hypothetical protein	73.9	19.8	31.2
MGA_1887	LOCUS_17100	sequence112:669214..670422(+)	partial			WP_000757725.1	endo-beta-N-acetylglucosaminidase	70.6	39.0	31.0
MGA_1895	LOCUS_17170	sequence112:677182..678495(+)	frameshift		677048	WP_002326842.1	LTA synthase family protein	98.4	47.3	46.5
