# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_39	LOCUS_00380	sequence01:37460..38698(+)	partial			WP_025163903.1	DUF262 domain-containing protein	21.4	23.5	33.7
MGA_62	LOCUS_00600	sequence02:1334..6457(+)	partial			WP_015942796.1	InlB B-repeat-containing protein	11.5	13.6	28.4
MGA_75	LOCUS_00730	sequence02:20695..21024(+)	internal_stop_codon	20641..20643(+),21022..21024(+)		WP_011109309.1	ATP-binding protein	98.2	23.5	37.8
MGA_76	LOCUS_00740	sequence02:21055..21663(+)	internal_stop_codon	21022..21024(+)		WP_011109309.1	ATP-binding protein	91.6	38.7	34.2
MGA_81	LOCUS_00790	sequence02:25295..26476(-)	partial			WP_010979427.1	GTP 3',8-cyclase MoaA	47.8	60.7	25.8
MGA_86	LOCUS_00840	sequence02:30285..30467(+)	partial			WP_011861202.1	ABC-F family ATP-binding cassette domain-containing protein	95.0	8.9	45.6
MGA_87	LOCUS_00850	sequence02:30502..31152(+)	frameshift		30446	WP_000411125.1	ABC transporter ATP-binding protein	98.1	71.7	31.2
MGA_89	LOCUS_00870	sequence02:31889..32404(+)	partial			WP_002893678.1	LytTR family DNA-binding domain-containing protein	52.0	61.5	37.4
MGA_97	LOCUS_00940	sequence03:4419..5426(+)	partial			WP_000364967.1	ThiF family adenylyltransferase	82.7	74.7	38.1
MGA_101	LOCUS_00980	sequence03:7441..7728(-)	frameshift		7466,7739	WP_000837499.1	XRE/MutR family transcriptional regulator	100.0	37.3	50.9
MGA_104	LOCUS_01010	sequence03:9530..10522(+)	partial			WP_013226635.1	ATP-grasp domain-containing protein	80.3	62.2	25.3
MGA_107	LOCUS_01040	sequence03:12094..13008(+)	frameshift		12987	WP_000238677.1	ATP-grasp domain-containing protein	82.2	59.9	34.5
MGA_153	LOCUS_01480	sequence07:626..892(-)	partial			WP_001262593.1	virulence RhuM family protein	98.9	26.6	81.6
MGA_156	LOCUS_01500	sequence08:1..1439(+)	partial			WP_002352261.1	restriction endonuclease subunit S	100.0	73.6	42.5
MGA_175	LOCUS_01640	sequence11:10854..11909(+)	frameshift		10863	WP_000701298.1	peptidase domain-containing ABC transporter	91.7	46.7	29.3
MGA_209	LOCUS_01980	sequence11:45313..45504(+)	frameshift,internal_stop_codon	45502..45504(+)	45525,45622	WP_014636518.1	radical SAM protein	96.8	14.8	44.3
MGA_210	LOCUS_01990	sequence11:45787..46371(+)	partial			WP_012027878.1	ABC transporter ATP-binding protein	42.3	15.6	62.2
MGA_226	LOCUS_02150	sequence11:61472..61636(+)	internal_stop_codon	61460..61462(+),61634..61636(+)		WP_011166415.1	Eco47II family restriction endonuclease	100.0	21.3	64.8
MGA_227	LOCUS_02160	sequence11:61715..62194(+)	internal_stop_codon	61460..61462(+),61634..61636(+)		WP_011166415.1	Eco47II family restriction endonuclease	92.5	55.9	46.4
MGA_302	LOCUS_02910	sequence11:147797..148288(+)	partial			WP_002405593.1	thioredoxin domain-containing protein	66.9	67.7	39.6
MGA_308	LOCUS_02970	sequence11:153443..155797(-)	partial			WP_002399687.1	DNA polymerase	58.3	70.1	47.6
MGA_313	LOCUS_03020	sequence11:158397..160682(+)	partial			WP_003903975.1	phage/plasmid primase, P4 family	46.0	73.5	31.5
MGA_317	LOCUS_03060	sequence11:163322..163687(+)	partial			WP_011072872.1	HNH endonuclease signature motif containing protein	64.5	71.6	52.6
MGA_323	LOCUS_03120	sequence11:167868..168629(+)	internal_stop_codon	168627..168629(+)		WP_165443313.1	terminase large subunit	93.3	41.1	37.3
MGA_324	LOCUS_03130	sequence11:168944..169447(+)	frameshift		168950	WP_009936861.1	terminase large subunit	83.8	28.9	38.4
MGA_326	LOCUS_03150	sequence11:169772..170032(+)	frameshift		169966	WP_011476321.1	type II toxin-antitoxin system death-on-curing family toxin	74.4	52.0	60.9
MGA_327	LOCUS_03160	sequence11:170011..170142(+)	frameshift		169966	WP_011476321.1	type II toxin-antitoxin system death-on-curing family toxin	100.0	35.0	62.8
MGA_330	LOCUS_03190	sequence11:171770..172468(+)	partial			WP_225426975.1	Clp protease ClpP	75.0	73.1	43.3
MGA_331	LOCUS_03200	sequence11:172481..173659(+)	partial			WP_011975494.1	phage major capsid protein	77.0	69.1	28.8
MGA_341	LOCUS_03300	sequence11:180029..184195(+)	internal_stop_codon	184193..184195(+)		WP_001880132.1	phage tail spike protein	39.5	41.1	46.7
MGA_345	LOCUS_03340	sequence11:185549..187018(+)	partial			WP_010922095.1	glucosaminidase domain-containing protein	32.9	37.8	32.9
MGA_346	LOCUS_03350	sequence11:187242..188483(+)	partial			WP_011461951.1	recombinase family protein	80.6	64.2	43.2
MGA_347	LOCUS_03360	sequence11:188428..189732(+)	partial			WP_000301254.1	recombinase family protein	84.8	70.0	50.5
MGA_352	LOCUS_03410	sequence11:192966..194426(+)	partial			WP_010979803.1	S9 family peptidase	47.5	45.0	28.2
MGA_354	LOCUS_03430	sequence11:194702..196027(+)	partial			WP_127742798.1	class III lanthionine synthetase LanKC	91.8	51.8	25.2
MGA_363	LOCUS_03520	sequence11:208265..208534(+)	frameshift,internal_stop_codon	208527..208529(+)	208456	WP_000056777.1	zinc ribbon domain-containing protein YjdM	73.0	62.4	82.4
MGA_384	LOCUS_03730	sequence11:228971..230203(+)	partial			WP_001042403.1	McrB family protein	98.0	59.7	43.8
MGA_387	LOCUS_03760	sequence11:232838..235444(-)	partial			WP_000700451.1	pneumococcal histidine triad protein PhtA	46.0	42.8	46.9
MGA_398	LOCUS_03870	sequence11:245613..246704(+)	partial			WP_025163903.1	DUF262 domain-containing protein	38.8	40.9	29.9
MGA_404	LOCUS_03930	sequence11:254729..255205(-)	partial			WP_010979815.1	YncE family protein	79.1	29.5	29.6
MGA_418	LOCUS_04070	sequence11:267020..267184(+)	internal_stop_codon	266987..266989(+)		WP_011222005.1	protein rep	98.1	16.9	55.6
MGA_432	LOCUS_04210	sequence11:278322..278804(-)	internal_stop_codon	278820..278822(-)		WP_000274751.1	DNA repair protein RadC	98.8	69.9	73.4
MGA_433	LOCUS_04220	sequence11:278820..279008(-)	internal_stop_codon	278820..278822(-)		WP_000274751.1	DNA repair protein RadC	98.4	27.0	67.2
MGA_450	LOCUS_04390	sequence11:297251..298327(-)	frameshift		297259	WP_001202979.1	pyrimidine-nucleoside phosphorylase	99.2	83.5	74.9
MGA_473	LOCUS_04620	sequence11:317453..317743(+)	frameshift		317816,317444,317708,317750	WP_000891067.1	GTP pyrophosphokinase	90.6	47.0	62.1
MGA_499	LOCUS_04880	sequence11:345830..347212(-)	partial			WP_002936357.1	sugar transferase	61.7	61.7	48.1
MGA_529	LOCUS_05170	sequence11:381351..381866(-)	partial			WP_002984923.1	hypothetical protein	77.8	74.7	50.4
MGA_557	LOCUS_05450	sequence11:413848..414270(-)	internal_stop_codon	413848..413850(-)		WP_000599739.1	Fic family protein	100.0	69.2	61.4
MGA_562	LOCUS_05500	sequence11:417787..418614(-)	partial			WP_074016730.1	GIY-YIG nuclease family protein	62.2	59.0	36.0
MGA_580	LOCUS_05680	sequence11:436997..437155(-)	partial			WP_000602601.1	DUF1146 family protein	88.5	60.5	47.8
MGA_638	LOCUS_06260	sequence11:492188..492838(-)	partial			WP_127742798.1	class III lanthionine synthetase LanKC	48.6	12.2	38.7
MGA_671	LOCUS_06560	sequence14:7672..7806(-)	partial			WP_002885866.1	50S ribosomal protein L34	59.1	59.1	100.0
MGA_682	LOCUS_06670	sequence14:18873..19892(-)	frameshift		19920	WP_000153754.1	ABC-F type ribosomal protection protein	94.7	59.4	31.8
MGA_683	LOCUS_06680	sequence14:19885..20250(-)	frameshift		19920,19911	WP_011100919.1	ABC-F family ATP-binding cassette domain-containing protein	90.9	21.5	33.6
MGA_708	LOCUS_06930	sequence14:42625..42843(-)	frameshift,internal_stop_codon	43040..43042(-)	42820	WP_000564846.1	ISAs1-like element IS1548 family transposase	93.1	17.8	85.1
MGA_709	LOCUS_06940	sequence14:43040..43432(-)	frameshift,internal_stop_codon	43040..43042(-)	43457,42820	WP_010922786.1	ISAs1-like element IS1548 family transposase	95.4	32.9	69.4
MGA_710	LOCUS_06950	sequence14:43413..43712(-)	frameshift		43457	WP_000564846.1	ISAs1-like element IS1548 family transposase	91.9	24.1	68.1
MGA_711	LOCUS_06960	sequence14:43870..44760(+)	partial			WP_012774872.1	primase C-terminal domain-containing protein	94.9	56.7	73.7
MGA_712	LOCUS_06970	sequence14:44700..45161(+)	frameshift		44718,45143	WP_012774872.1	primase C-terminal domain-containing protein	94.1	29.0	62.5
MGA_718	LOCUS_07030	sequence14:48602..48826(-)	frameshift		48604	WP_012775182.1	MFS transporter	87.8	15.4	56.9
MGA_721	LOCUS_07060	sequence14:50506..52470(+)	partial			WP_092529862.1	class III lanthionine synthetase LanKC	49.2	38.7	25.9
MGA_805	LOCUS_07900	sequence14:145407..145601(-)	partial			WP_150880979.1	ISL3 family transposase	96.9	15.2	77.4
MGA_806	LOCUS_07910	sequence14:145727..145996(+)	frameshift,internal_stop_codon	145994..145996(+),146282..146284(+)	145667	WP_012027845.1	M50 family metallopeptidase	100.0	21.2	66.3
MGA_807	LOCUS_07920	sequence14:146057..146284(+)	internal_stop_codon	145994..145996(+),146282..146284(+)		WP_011837532.1	RIP metalloprotease RseP	97.3	17.5	49.3
MGA_808	LOCUS_07930	sequence14:146333..146515(+)	internal_stop_codon	146282..146284(+)		WP_000900660.1	RIP metalloprotease RseP	98.3	14.1	81.4
MGA_809	LOCUS_07940	sequence14:146543..147397(+)	frameshift		147373	WP_012027844.1	proline--tRNA ligase	97.5	44.7	92.1
MGA_810	LOCUS_07950	sequence14:147391..148401(+)	frameshift		147376	WP_012027844.1	proline--tRNA ligase	98.8	53.5	89.8
MGA_817	LOCUS_08020	sequence14:151767..152216(+)	partial			WP_012027838.1	PolC-type DNA polymerase III	57.7	5.9	57.0
MGA_818	LOCUS_08030	sequence14:152293..153027(+)	partial			WP_010921776.1	SH3 domain-containing protein	89.8	58.8	51.8
MGA_825	LOCUS_08090	sequence15:9227..9430(-)	partial			WP_011837540.1	TIM barrel protein	76.1	20.6	56.9
MGA_868	LOCUS_08520	sequence15:56272..57075(-)	frameshift		56358	WP_011837191.1	glycosyltransferase	92.5	77.1	46.2
MGA_881	LOCUS_08650	sequence15:70922..71101(-)	partial			WP_000048058.1	30S ribosomal protein S21	72.9	74.1	100.0
MGA_883	LOCUS_08670	sequence15:73017..73997(-)	partial			WP_011285736.1	hypothetical protein	11.3	42.0	70.3
MGA_929	LOCUS_09130	sequence15:124211..124936(-)	frameshift,internal_stop_codon	124257..124259(-)	124290,124181,124303	WP_000794285.1	site-specific DNA-methyltransferase	87.1	79.8	88.1
MGA_936	LOCUS_09200	sequence15:129879..130199(-)	internal_stop_codon	129879..129881(-)		WP_002263615.1	ASCH domain-containing protein	84.0	59.9	55.3
MGA_941	LOCUS_09250	sequence15:132299..133423(-)	frameshift		133424	WP_001239259.1	DEAD/DEAH box helicase family protein	99.2	36.7	42.6
MGA_942	LOCUS_09260	sequence15:133374..135338(-)	frameshift		133424	WP_001239259.1	DEAD/DEAH box helicase family protein	97.6	63.1	60.3
MGA_970	LOCUS_09540	sequence16:9126..10151(+)	partial			WP_000823931.1	DNA/RNA non-specific endonuclease	61.6	59.3	58.6
MGA_993	LOCUS_09770	sequence16:30966..31286(-)	frameshift,internal_stop_codon	31457..31459(-)	30995,31306,31275	WP_012027843.1	MIP/aquaporin family protein	93.4	42.8	58.4
MGA_1049	LOCUS_10330	sequence16:88410..88571(-)	partial			WP_011836441.1	mevalonate kinase	86.8	15.8	71.7
MGA_1056	LOCUS_10400	sequence16:94362..94565(-)	partial			WP_011962425.1	aminotransferase class I/II-fold pyridoxal phosphate-dependent enzyme	86.6	14.4	46.6
MGA_1058	LOCUS_10420	sequence16:95343..95885(-)	frameshift		95381	WP_003130693.1	iron-containing alcohol dehydrogenase family protein	87.8	44.1	33.1
MGA_1084	LOCUS_10680	sequence16:122533..123897(+)	partial			WP_003232562.1	serine protease Isp	58.6	67.1	30.3
MGA_1085	LOCUS_10690	sequence16:123984..125840(+)	partial			WP_000866454.1	choline binding-anchored murein hydrolase CbpD	52.3	76.3	38.2
MGA_1087	LOCUS_10710	sequence16:126541..128331(+)	partial			WP_011101863.1	SH3 domain-containing protein	52.9	36.9	33.5
MGA_1091	LOCUS_10750	sequence16:132063..132737(+)	partial			WP_010932831.1	N-6 DNA methylase	69.2	69.2	39.5
MGA_1111	LOCUS_10940	sequence17:13741..13884(-)	frameshift		14034,13911	WP_011836643.1	pseudouridine synthase	100.0	19.5	59.6
MGA_1112	LOCUS_10950	sequence17:13963..14478(-)	frameshift		14025,13911	WP_011922181.1	pseudouridine synthase	92.4	66.4	55.1
MGA_1120	LOCUS_11030	sequence17:23129..24814(-)	internal_stop_codon	24857..24859(-)		WP_034260979.1	DEAD/DEAH box helicase family protein	97.5	61.8	34.3
MGA_1121	LOCUS_11040	sequence17:24857..25753(-)	internal_stop_codon	24857..24859(-)		WP_034260979.1	DEAD/DEAH box helicase family protein	97.7	33.7	42.6
MGA_1147	LOCUS_11300	sequence17:52687..55122(-)	partial			WP_011964235.1	N-6 DNA methylase	70.7	75.3	29.5
MGA_1149	LOCUS_11320	sequence17:56172..56660(-)	partial			WP_000039971.1	YtxH domain-containing protein	66.7	75.5	59.3
MGA_1163	LOCUS_11460	sequence17:68427..68705(-)	frameshift		68749	WP_011837126.1	HD domain-containing protein	96.7	45.4	49.4
MGA_1164	LOCUS_11470	sequence17:68723..69004(-)	frameshift		68749	WP_011837126.1	HD domain-containing protein	89.2	42.9	60.7
MGA_1167	LOCUS_11500	sequence17:71153..74023(-)	partial			WP_000503026.1	non-ribosomal peptide synthetase	53.5	24.4	27.6
MGA_1190	LOCUS_11730	sequence17:100589..100990(-)	partial			WP_012027034.1	XRE family transcriptional regulator	66.9	31.2	43.8
MGA_1201	LOCUS_11840	sequence17:108549..111581(-)	partial			WP_010905924.1	phage tail protein	48.5	84.5	40.4
MGA_1203	LOCUS_11860	sequence17:113132..117595(-)	partial			WP_010905386.1	tape measure protein	73.0	82.3	27.9
MGA_1226	LOCUS_12090	sequence17:129700..130425(-)	partial			WP_001231960.1	ERF family protein	61.8	66.5	43.6
MGA_1243	LOCUS_12250	sequence18:2431..3204(-)	partial			WP_010905121.1	TMEM175 family protein	93.8	72.8	27.4
MGA_1255	LOCUS_12370	sequence18:14651..15169(-)	frameshift		15237	WP_011964246.1	type II restriction endonuclease	65.7	38.3	38.6
MGA_1267	LOCUS_12490	sequence18:25702..26643(-)	partial			WP_164921634.1	alpha/beta hydrolase fold domain-containing protein	86.6	71.7	34.9
MGA_1286	LOCUS_12680	sequence18:45324..45479(-)	frameshift,internal_stop_codon	45706..45708(-)	45594,45461,45654,45551	WP_002900516.1	UDP-glucose 4-epimerase GalE	86.3	13.5	53.3
MGA_1287	LOCUS_12690	sequence18:45828..46025(-)	frameshift,internal_stop_codon	45827..45829(-)	45554,45763,45654,45594,46063	WP_011476382.1	UDP-glucose 4-epimerase GalE	96.9	19.1	65.1
MGA_1347	LOCUS_13290	sequence18:111288..111677(-)	frameshift,internal_stop_codon	111720..111722(-),111254..111256(-)	111335	WP_000650743.1	hypothetical protein	86.8	16.8	64.3
MGA_1348	LOCUS_13300	sequence18:111682..112083(-)	frameshift		112139,112109	WP_000403526.1	ABC transporter ATP-binding protein	81.2	35.0	55.6
MGA_1399	LOCUS_13810	sequence19:15820..16902(-)	partial			WP_002262067.1	FtsQ-type POTRA domain-containing protein	63.6	61.2	49.3
MGA_1410	LOCUS_13920	sequence19:25527..25757(-)	partial			WP_128834060.1	IS3-like element ISSmu1 family transposase	97.4	16.5	71.6
MGA_1411	LOCUS_13930	sequence19:25842..26072(-)	partial			WP_000456288.1	hypothetical protein	98.7	47.9	60.3
MGA_1412	LOCUS_13940	sequence19:26634..26765(-)	frameshift,internal_stop_codon	26634..26636(-),26463..26465(-)	26498,26546,26579,26486,26426	WP_165694720.1	IS3-like element IS861 family transposase	100.0	9.6	69.8
MGA_1428	LOCUS_14100	sequence19:42900..43214(-)	partial			WP_004194153.1	DNA-directed RNA polymerase subunit omega	70.2	70.2	91.8
MGA_1464	LOCUS_14460	sequence19:80994..81368(-)	internal_stop_codon	80994..80996(-)		WP_000219921.1	DegV family protein	82.3	36.3	59.8
MGA_1487	LOCUS_14690	sequence19:104787..105341(-)	frameshift		105329,105458	WP_000710515.1	DUF2207 domain-containing protein	91.8	26.5	38.5
MGA_1518	LOCUS_15000	sequence20:11009..11245(-)	partial			WP_002985700.1	preprotein translocase subunit SecG	74.4	74.4	74.1
MGA_1560	LOCUS_15420	sequence20:52221..52412(+)	frameshift,internal_stop_codon	52410..52412(+)	52210	WP_010964791.1	DUF554 domain-containing protein	100.0	26.0	54.0
MGA_1563	LOCUS_15450	sequence20:54139..54351(-)	frameshift,internal_stop_codon	54396..54398(-),54600..54602(-)	54371	WP_002262692.1	methylated-DNA--[protein]-cysteine S-methyltransferase	88.6	37.8	51.6
MGA_1602	LOCUS_15840	sequence20:92607..>93843(-)	partial			WP_001247520.1	GBS Bsp-like repeat-containing protein	65.0	31.4	52.6
MGA_1610	LOCUS_15920	sequence21:12919..13359(+)	partial			WP_011202637.1	carboxymuconolactone decarboxylase family protein	93.2	48.9	57.4
MGA_1619	LOCUS_16010	sequence21:20730..20954(+)	internal_stop_codon	20721..20723(+),20517..20519(+)		WP_000939892.1	ABC transporter ATP-binding protein	94.6	35.9	50.0
MGA_1624	LOCUS_16060	sequence21:24333..24695(-)	frameshift		24769	WP_032910596.1	bifunctional glutamate--cysteine ligase GshA/glutathione synthetase GshB	97.5	15.6	73.5
MGA_1625	LOCUS_16070	sequence21:24689..25987(-)	frameshift		24771,26004	WP_000582678.1	bifunctional glutamate--cysteine ligase GshA/glutathione synthetase GshB	95.6	55.1	63.4
MGA_1626	LOCUS_16080	sequence21:25984..26286(-)	frameshift,internal_stop_codon	26296..26298(-)	26004	WP_000582678.1	bifunctional glutamate--cysteine ligase GshA/glutathione synthetase GshB	94.0	12.5	55.3
MGA_1627	LOCUS_16090	sequence21:26296..26508(-)	internal_stop_codon	26296..26298(-)		WP_019318694.1	bifunctional glutamate--cysteine ligase GshA/glutathione synthetase GshB	100.0	9.3	60.6
MGA_1638	LOCUS_16200	sequence21:35837..36259(+)	partial			WP_002263441.1	competence type IV pilus minor pilin ComGG	74.3	82.9	46.7
MGA_1642	LOCUS_16240	sequence21:39390..40073(+)	frameshift		40064	WP_011837496.1	ABC transporter ATP-binding protein	99.1	80.6	67.6
