# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_3	LOCUS_00030	sequence01:3024..4796(+)	partial			WP_009994769.1	RNA-directed DNA polymerase	58.8	61.9	25.5
MGA_56	LOCUS_00540	sequence03:49261..51507(+)	frameshift		51480,51447	WP_001060462.1	MSCRAMM family adhesin SdrC	96.0	75.2	87.9
MGA_58	LOCUS_00560	sequence03:52128..52502(+)	frameshift		52216	WP_000610259.1	MSCRAMM family adhesin SdrE	54.0	5.9	85.1
MGA_59	LOCUS_00570	sequence03:52860..56366(+)	frameshift		56345,56333	WP_000934467.1	MSCRAMM family adhesin SdrD	93.2	78.5	86.1
MGA_60	LOCUS_00580	sequence03:56293..56721(+)	frameshift		56345,56333	WP_000610259.1	MSCRAMM family adhesin SdrE	48.6	6.0	81.2
MGA_61	LOCUS_00590	sequence03:57197..60160(+)	frameshift,internal_stop_codon	60146..60148(+)	60136,60145,60206	WP_000610259.1	MSCRAMM family adhesin SdrE	94.7	81.9	79.1
MGA_62	LOCUS_00600	sequence03:60178..60672(+)	frameshift		60206,60127	WP_000610259.1	MSCRAMM family adhesin SdrE	41.5	6.0	82.4
MGA_220	LOCUS_02150	sequence05:119801..120274(+)	partial			WP_000470932.1	AAA family ATPase	87.3	20.5	40.3
MGA_221	LOCUS_02160	sequence05:120319..121638(+)	partial			WP_000181735.1	ATP-dependent helicase	99.3	72.2	35.1
MGA_284	LOCUS_02660	sequence21:1..521(+)	partial			WP_001181101.1	replication initiator protein A	100.0	53.5	94.3
MGA_300	LOCUS_02820	sequence23:14726..15490(-)	frameshift		15548	WP_000199066.1	acetyl-CoA C-acetyltransferase	100.0	64.6	93.7
MGA_301	LOCUS_02830	sequence23:15525..15899(-)	frameshift		15581	WP_000199066.1	acetyl-CoA C-acetyltransferase	84.7	26.7	96.2
MGA_364	LOCUS_03430	sequence26:339..833(-)	frameshift		392	WP_126475239.1	IS1182 family transposase	87.2	26.2	94.4
MGA_428	LOCUS_04070	sequence26:73717..73932(+)	partial			WP_000093025.1	hypothetical protein	91.5	48.1	60.0
MGA_542	LOCUS_05210	sequence26:201391..202824(+)	partial			WP_000915238.1	lipoteichoic acid-specific glycosyltransferase YfhO	100.0	55.0	77.4
MGA_563	LOCUS_05330	sequence36:7965..8591(+)	partial			WP_001549718.1	YdcF family protein	99.5	64.3	83.1
MGA_696	LOCUS_06660	sequence36:151883..152053(-)	partial			WP_001795286.1	hypothetical protein	100.0	72.7	83.9
MGA_761	LOCUS_07270	sequence39:67095..67652(+)	partial			WP_005808295.1	TetR/AcrR family transcriptional regulator	33.5	30.4	51.6
MGA_792	LOCUS_07580	sequence39:108910..109818(-)	partial			WP_001796914.1	ABC transporter permease	100.0	61.4	86.1
MGA_833	LOCUS_07990	sequence39:161791..162348(-)	partial			WP_002294234.1	chorismate mutase	48.6	32.9	48.4
MGA_845	LOCUS_08110	sequence39:175425..175619(-)	partial			WP_000469833.1	XRE family transcriptional regulator	100.0	16.4	96.9
MGA_885	LOCUS_08510	sequence39:220881..221231(+)	internal_stop_codon	221229..221231(+)		WP_000291840.1	oleate hydratase	100.0	19.6	94.8
MGA_886	LOCUS_08520	sequence39:221304..222656(+)	internal_stop_codon	221229..221231(+)		WP_000291840.1	oleate hydratase	100.0	76.1	95.6
MGA_891	LOCUS_08570	sequence39:230271..230948(-)	frameshift		230315	WP_000826312.1	tandem-type lipoprotein	93.8	82.7	87.2
MGA_908	LOCUS_08740	sequence39:243153..244679(-)	partial			WP_211850673.1	RNA-directed DNA polymerase	31.3	27.2	30.2
MGA_911	LOCUS_08760	sequence39:246603..247871(-)	partial			WP_003899494.1	type III-A CRISPR-associated CARF protein Csm6	49.5	49.6	31.9
MGA_919	LOCUS_08840	sequence39:255159..255785(+)	partial			WP_164926902.1	restriction endonuclease subunit S	97.6	44.5	26.3
MGA_920	LOCUS_08850	sequence39:256040..256783(+)	frameshift,internal_stop_codon	255905..255907(+)	256741	WP_002858356.1	type I restriction endonuclease subunit R	96.0	23.3	50.2
MGA_921	LOCUS_08860	sequence39:256771..257880(+)	frameshift,internal_stop_codon	257879..257881(+)	256741	WP_012257687.1	type I restriction endonuclease subunit R	98.1	33.9	51.5
MGA_922	LOCUS_08870	sequence39:258154..258399(+)	partial			WP_126475239.1	IS1182 family transposase	76.5	11.4	93.5
MGA_924	LOCUS_08890	sequence39:259578..259949(-)	partial			WP_003114208.1	HNH endonuclease	81.3	37.0	47.0
MGA_926	LOCUS_08910	sequence39:260202..261206(+)	frameshift,internal_stop_codon	261111..261113(+)	261107	WP_002485357.1	persulfide dioxygenase-sulfurtransferase CstB	91.3	69.0	95.7
MGA_927	LOCUS_08920	sequence39:261143..261457(+)	frameshift,internal_stop_codon	261111..261113(+)	261110	WP_002485357.1	persulfide dioxygenase-sulfurtransferase CstB	100.0	23.5	89.4
MGA_942	LOCUS_09050	sequence41:479..823(+)	frameshift,internal_stop_codon	437..439(+)	261	WP_126475239.1	IS1182 family transposase	99.1	20.7	99.1
MGA_967	LOCUS_09300	sequence41:27289..27492(+)	partial			WP_001548522.1	TM2 domain-containing protein	100.0	72.8	92.5
MGA_1060	LOCUS_10230	sequence41:126377..127288(+)	frameshift		126375	WP_001548380.1	heme A synthase	99.7	84.8	92.7
MGA_1099	LOCUS_10620	sequence41:168507..169043(+)	partial			WP_000273253.1	energy-coupling factor transporter transmembrane protein EcfT	100.0	66.4	91.0
MGA_1134	LOCUS_10970	sequence41:208903..209220(-)	frameshift		209326	WP_000620949.1	GNAT family N-acetyltransferase	100.0	57.4	84.8
MGA_1135	LOCUS_10980	sequence41:209315..209455(-)	frameshift		209326	WP_000620949.1	GNAT family N-acetyltransferase	93.5	23.5	76.7
MGA_1136	LOCUS_10990	sequence41:209620..209832(+)	partial			WP_001788574.1	NINE protein	100.0	72.9	82.9
MGA_1285	LOCUS_12480	sequence41:362966..365944(-)	partial			WP_001056195.1	MSCRAMM family adhesin clumping factor ClfA	57.3	56.5	70.4
MGA_1287	LOCUS_12500	sequence41:366981..367805(-)	partial			WP_011087810.1	N-acyl homoserine lactonase family protein	72.6	65.9	25.1
MGA_1292	LOCUS_12550	sequence41:372085..372234(-)	frameshift		372302	WP_000159787.1	transposase	83.7	45.6	75.6
MGA_1349	LOCUS_13120	sequence41:438352..438606(-)	partial			WP_001617169.1	hypothetical protein	40.5	73.5	77.8
MGA_1384	LOCUS_13470	sequence41:475050..475232(+)	internal_stop_codon	474978..474980(+),474927..474929(+)		WP_001801730.1	hypothetical protein	100.0	52.2	76.7
MGA_1445	LOCUS_14080	sequence41:538353..539345(+)	partial			WP_024666576.1	YqcI/YcgG family protein	54.8	70.0	23.9
MGA_1459	LOCUS_14220	sequence41:550838..551251(+)	internal_stop_codon	551249..551251(+)		WP_001557159.1	DMT family transporter	100.0	44.3	81.8
MGA_1460	LOCUS_14230	sequence41:551270..551767(+)	internal_stop_codon	551249..551251(+)		WP_001557159.1	DMT family transporter	87.9	46.9	79.3
MGA_1483	LOCUS_14460	sequence41:574586..574927(-)	partial			WP_000798967.1	DUF1450 domain-containing protein	69.0	69.0	100.0
MGA_1528	LOCUS_14910	sequence42:41373..41915(-)	partial			WP_000835971.1	tandem-type lipoprotein	100.0	69.2	74.4
MGA_1541	LOCUS_15040	sequence42:53301..54560(-)	frameshift		54589	WP_000028663.1	type I restriction-modification system subunit M	100.0	80.9	98.3
MGA_1542	LOCUS_15050	sequence42:54557..54847(-)	frameshift		54589	WP_000028663.1	type I restriction-modification system subunit M	85.4	15.8	98.8
MGA_1558	LOCUS_15210	sequence42:67350..67553(-)	frameshift,internal_stop_codon	67335..67337(-)	67355	WP_001293076.1	terminase small subunit	85.1	30.2	87.7
MGA_1689	LOCUS_16500	sequence44:116201..116449(+)	frameshift		116147	WP_001791980.1	hypothetical protein	98.8	74.3	71.6
MGA_1696	LOCUS_16570	sequence44:124021..124707(-)	partial			WP_003894962.1	MBL fold metallo-hydrolase	68.4	77.9	29.6
MGA_1710	LOCUS_16710	sequence44:141321..141548(-)	partial			WP_000160701.1	AAA family ATPase	98.7	27.3	87.8
MGA_1711	LOCUS_16720	sequence44:141589..141924(+)	partial			WP_126475239.1	IS1182 family transposase	89.2	18.2	96.0
MGA_1721	LOCUS_16820	sequence44:150193..153045(-)	partial			WP_000745891.1	MSCRAMM family adhesin clumping factor ClfB	60.3	62.9	84.5
MGA_1746	LOCUS_17070	sequence44:187661..188053(-)	partial			WP_000044547.1	serine-rich repeat glycoprotein adhesin SasA	80.0	4.3	50.0
MGA_1747	LOCUS_17080	sequence44:187950..188294(+)	internal_stop_codon	188292..188294(+),188562..188564(+),187944..187946(+)		WP_002485492.1	hypothetical protein	91.2	19.6	41.9
MGA_1749	LOCUS_17100	sequence44:188598..189218(+)	internal_stop_codon	188562..188564(+),189216..189218(+)		WP_235601755.1	hypothetical protein	99.5	20.5	40.7
MGA_1750	LOCUS_17110	sequence44:189402..190136(+)	internal_stop_codon	190314..190316(+),190134..190136(+),189216..189218(+),190284..190286(+),190212..190214(+)		WP_002485492.1	hypothetical protein	68.0	33.5	39.4
MGA_1752	LOCUS_17130	sequence44:190722..191390(+)	internal_stop_codon	191388..191390(+),191520..191522(+),190650..190652(+)		WP_002485492.1	hypothetical protein	89.2	35.4	39.0
MGA_1753	LOCUS_17140	sequence44:191652..192176(+)	internal_stop_codon	191388..191390(+),191520..191522(+),192174..192176(+)		WP_002485492.1	hypothetical protein	67.8	20.3	38.9
MGA_1760	LOCUS_17210	sequence44:198968..199177(+)	partial			WP_001260044.1	hypothetical protein	66.7	46.0	65.2
MGA_1762	LOCUS_17230	sequence44:200145..202238(+)	partial			WP_001260044.1	hypothetical protein	10.3	72.0	94.4
MGA_1776	LOCUS_17370	sequence44:215147..215779(-)	frameshift		215790	WP_000592610.1	imidazole glycerol phosphate synthase subunit HisF	100.0	45.5	95.2
MGA_1817	LOCUS_17780	sequence44:252356..252493(-)	partial			WP_000240855.1	50S ribosomal protein L34	60.0	60.0	100.0
MGA_1845	LOCUS_18060	sequence44:289995..290162(+)	partial			WP_020444595.1	hydroxymethylglutaryl-CoA synthase	100.0	42.6	100.0
MGA_1849	LOCUS_18100	sequence44:294339..295325(+)	partial			WP_000952923.1	beta-lactam sensor/signal transducer MecR1	96.3	54.0	100.0
MGA_1884	LOCUS_18450	sequence45:33305..33466(-)	frameshift,internal_stop_codon	33304..33306(-),33535..33537(-)	33546	WP_084146450.1	carboxylesterase/lipase family protein	100.0	10.7	41.9
MGA_1928	LOCUS_18890	sequence45:77983..78183(-)	partial			WP_000671712.1	MAP domain-containing protein	100.0	68.8	59.1
MGA_1929	LOCUS_18900	sequence45:78304..79398(-)	internal_stop_codon	78304..78306(-)		WP_001557458.1	extracellular adherence protein Eap/Map	98.9	76.3	57.6
MGA_1946	LOCUS_19070	sequence45:96530..96670(-)	partial			WP_072050172.1	Ig-like domain-containing protein	100.0	62.2	97.8
MGA_1963	LOCUS_19240	sequence45:105858..106046(-)	partial			WP_000195784.1	DUF1381 domain-containing protein	79.0	72.1	91.8
MGA_1967	LOCUS_19280	sequence45:107668..108015(-)	partial			WP_072467505.1	acetyltransferase	36.5	35.5	69.0
MGA_1977	LOCUS_19380	sequence45:112745..113206(-)	internal_stop_codon	113318..113320(-)		WP_000700557.1	AAA family ATPase	100.0	23.6	93.5
MGA_1978	LOCUS_19390	sequence45:113318..114694(-)	internal_stop_codon	113318..113320(-)		WP_000700554.1	AAA family ATPase	99.6	70.5	95.2
MGA_2000	LOCUS_19610	sequence45:129778..130053(+)	frameshift,internal_stop_codon	129764..129766(+),129779..129781(+),129695..129697(+)	129808	WP_000179343.1	tyrosine-type recombinase/integrase	69.2	15.6	58.7
MGA_2004	LOCUS_19650	sequence45:133027..134247(-)	partial			WP_000120296.1	SdrH family protein	55.9	54.7	80.2
MGA_2031	LOCUS_19920	sequence45:162273..162566(+)	frameshift		162533	WP_000531823.1	3-isopropylmalate dehydratase large subunit	94.8	20.2	94.6
MGA_2032	LOCUS_19930	sequence45:162568..163644(+)	frameshift		162533	WP_000531823.1	3-isopropylmalate dehydratase large subunit	100.0	78.5	95.3
MGA_2113	LOCUS_20700	sequence46:40148..40483(-)	frameshift,internal_stop_codon	40148..40150(-)	40541	WP_096810449.1	site-specific integrase	99.1	31.0	33.6
MGA_2114	LOCUS_20710	sequence46:40497..40808(-)	frameshift		40828,40519	WP_000857191.1	site-specific integrase	93.2	27.8	30.2
MGA_2120	LOCUS_20770	sequence46:43707..45053(-)	partial			WP_011860984.1	DUF4041 domain-containing protein	86.8	70.8	33.5
MGA_2122	LOCUS_20790	sequence46:47500..47775(+)	internal_stop_codon	47431..47433(+)		WP_000782463.1	bi-component leukocidin LukED subunit D	85.7	23.9	87.2
MGA_2125	LOCUS_20820	sequence46:49349..49591(+)	partial			WP_000586140.1	hypothetical protein	100.0	34.5	90.0
MGA_2130	LOCUS_20870	sequence46:54308..55918(-)	partial			WP_009933212.1	hypothetical protein	30.2	46.2	29.6
MGA_2131	LOCUS_20880	sequence46:55956..56408(+)	partial			WP_000755747.1	DUF1433 domain-containing protein	70.7	77.2	30.8
MGA_2168	LOCUS_21250	sequence46:87751..88488(+)	frameshift		88389	WP_001159037.1	3,4-dihydroxy-2-butanone-4-phosphate synthase	86.9	54.2	89.7
MGA_2169	LOCUS_21260	sequence46:88428..88904(+)	frameshift		88401	WP_001159037.1	3,4-dihydroxy-2-butanone-4-phosphate synthase	100.0	40.2	92.4
MGA_2213	LOCUS_21700	sequence46:150042..150506(+)	partial			WP_126475239.1	IS1182 family transposase	90.3	26.2	90.2
MGA_2243	LOCUS_22000	sequence46:187082..188041(+)	partial			WP_000849428.1	hypothetical protein	99.4	64.0	89.0
MGA_2244	LOCUS_22010	sequence46:188238..188687(-)	frameshift		188769	WP_055164393.1	IS30 family transposase	87.9	42.7	39.3
MGA_2263	LOCUS_22200	sequence46:202552..203073(+)	partial			WP_000849428.1	hypothetical protein	100.0	34.9	81.5
MGA_2267	LOCUS_22240	sequence46:207929..208150(+)	frameshift,internal_stop_codon	208430..208432(+),208148..208150(+)	207930	WP_126475239.1	IS1182 family transposase	97.3	13.0	88.7
MGA_2268	LOCUS_22250	sequence46:208241..208432(+)	frameshift,internal_stop_codon	208430..208432(+),208708..208710(+),208148..208150(+)	208596,208692	WP_126475239.1	IS1182 family transposase	100.0	11.6	98.4
MGA_2293	LOCUS_22500	sequence46:237026..237496(+)	partial			WP_000261115.1	A24 family peptidase	100.0	66.4	61.5
MGA_2369	LOCUS_23260	sequence46:311740..311916(+)	partial			WP_000048060.1	30S ribosomal protein S21	74.1	74.1	100.0
MGA_2435	LOCUS_23920	sequence46:371436..372032(+)	partial			WP_001283968.1	winged helix-turn-helix transcriptional regulator	97.0	51.3	33.9
MGA_2455	LOCUS_24120	sequence46:390243..390473(+)	frameshift		390461	WP_001557355.1	DUF1672 domain-containing protein	96.1	23.7	95.9
MGA_2456	LOCUS_24130	sequence46:390560..391108(+)	frameshift		390461	WP_001557355.1	DUF1672 domain-containing protein	100.0	59.1	95.6
MGA_2457	LOCUS_24140	sequence46:391543..391797(+)	frameshift		391782	WP_000476865.1	DUF1672 domain-containing protein	90.5	25.2	90.8
MGA_2458	LOCUS_24150	sequence46:391736..392455(+)	frameshift		391782	WP_000476346.1	DUF1672 domain-containing protein	89.1	71.5	75.6
MGA_2459	LOCUS_24160	sequence46:392565..392726(+)	frameshift		392690	WP_000913243.1	DUF1672 domain-containing protein	83.0	13.8	84.1
MGA_2460	LOCUS_24170	sequence46:392692..393393(+)	frameshift		392690	WP_000913243.1	DUF1672 domain-containing protein	97.0	71.1	93.4
MGA_2510	LOCUS_24670	sequence46:447763..461148(+)	partial			WP_080388512.1	hyperosmolarity resistance protein Ebh	99.9	44.9	36.1
MGA_2538	LOCUS_24930	sequence48:20678..21322(-)	partial			WP_001059647.1	ISL3 family transposase	99.5	48.4	45.1
MGA_2540	LOCUS_24950	sequence48:21850..22920(+)	frameshift,internal_stop_codon	21780..21782(+)	21854	WP_016117864.1	ATP-binding protein	98.3	62.3	31.7
MGA_2543	LOCUS_24980	sequence48:23823..24767(+)	frameshift		24746	WP_016117865.1	TnsD family Tn7-like transposition protein	92.4	46.3	28.9
MGA_2544	LOCUS_24990	sequence48:24764..25288(+)	frameshift		24749	WP_016117865.1	TnsD family Tn7-like transposition protein	90.8	25.9	29.9
MGA_2549	LOCUS_25040	sequence48:27279..27581(+)	partial			WP_158908668.1	HsdR family type I site-specific deoxyribonuclease	92.0	15.0	48.9
MGA_2566	LOCUS_25200	sequence48:43879..44274(+)	partial			WP_000667269.1	deoxyribose-phosphate aldolase	100.0	59.5	93.9
