# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_7	LOCUS_00050	sequence1:7830..8873(+)	frameshift		7785	WP_009901597.1	PTS cellobiose transporter subunit IIC	99.7	80.9	35.7
MGA_24	LOCUS_00220	sequence1:32086..34803(+)	partial			WP_002681765.1	leucine-rich repeat domain-containing protein	24.6	33.9	32.6
MGA_92	LOCUS_00900	sequence1:114808..115092(-)	partial			WP_002287688.1	tyrosine-type recombinase/integrase	92.6	21.8	58.6
MGA_93	LOCUS_00910	sequence1:115188..116033(-)	frameshift		116077	WP_099434174.1	IS3-like element ISEfa8 family transposase	98.9	71.8	75.9
MGA_94	LOCUS_00920	sequence1:116069..116359(-)	frameshift		116083	WP_086956687.1	IS3 family transposase	97.9	24.3	84.0
MGA_108	LOCUS_01060	sequence1:127225..127563(-)	partial			WP_016381870.1	hypothetical protein	92.9	61.3	47.1
MGA_121	LOCUS_01190	sequence1:137735..138934(+)	partial			WP_002299473.1	hypothetical protein	56.4	84.6	22.4
MGA_145	LOCUS_01430	sequence1:163035..164015(+)	internal_stop_codon	162837..162839(+)		WP_002285820.1	ISL3 family transposase	89.3	72.6	60.5
MGA_157	LOCUS_01550	sequence1:178828..179454(+)	partial			WP_002286012.1	DUF624 domain-containing protein	72.6	65.7	35.1
MGA_205	LOCUS_02030	sequence1:226955..228703(+)	partial			WP_003233292.1	multidrug resistance ABC transporter ATP-binding protein/permease BmrD	86.6	74.9	46.5
MGA_256	LOCUS_02540	sequence1:275019..275183(+)	partial			WP_002358151.1	hypothetical protein	87.0	70.1	55.3
MGA_264	LOCUS_02620	sequence1:283531..283770(+)	partial			WP_002289017.1	preprotein translocase subunit SecG	73.4	74.4	74.1
MGA_269	LOCUS_02670	sequence1:288878..289090(+)	partial			WP_002356552.1	ATP synthase F0 subunit C	77.1	74.0	74.1
MGA_280	LOCUS_02780	sequence1:298265..299011(+)	partial			WP_003733142.1	resuscitation-promoting factor	42.3	24.8	55.6
MGA_302	LOCUS_03000	sequence1:318867..319100(+)	partial			WP_002294972.1	PspC domain-containing protein	75.3	54.7	69.0
MGA_313	LOCUS_03110	sequence1:326086..326676(-)	partial			WP_002382413.1	lipoprotein	70.9	68.5	65.5
MGA_374	LOCUS_03720	sequence1:381861..383216(+)	partial			WP_002295400.1	LCP family protein	71.0	76.2	54.4
MGA_383	LOCUS_03810	sequence1:395373..395663(+)	frameshift		395648	WP_086956687.1	IS3 family transposase	97.9	24.3	84.0
MGA_384	LOCUS_03820	sequence1:395699..396544(+)	frameshift		395654	WP_099434174.1	IS3-like element ISEfa8 family transposase	98.9	71.8	75.9
MGA_398	LOCUS_03960	sequence1:408480..409022(+)	partial			WP_011403943.1	HNH endonuclease	25.6	27.7	47.8
MGA_426	LOCUS_04240	sequence1:433275..433865(+)	frameshift		433862	WP_021721377.1	flavodoxin	79.1	70.1	58.7
MGA_427	LOCUS_04250	sequence1:433862..434032(+)	frameshift		433862	WP_021721377.1	flavodoxin	96.4	24.4	50.0
MGA_441	LOCUS_04390	sequence1:445143..445418(+)	partial			WP_012546378.1	helix-turn-helix transcriptional regulator	90.1	64.6	40.5
MGA_450	LOCUS_04480	sequence1:454504..454830(+)	internal_stop_codon	454828..454830(+)		WP_002311258.1	helix-turn-helix domain-containing protein	100.0	21.0	47.3
MGA_451	LOCUS_04490	sequence1:454837..456039(+)	internal_stop_codon	454828..454830(+)		WP_002311258.1	helix-turn-helix domain-containing protein	96.8	74.6	49.4
MGA_471	LOCUS_04690	sequence1:478116..478382(-)	partial			WP_003138385.1	IS256-like element IS905 family transposase	96.6	21.7	64.7
MGA_476	LOCUS_04740	sequence1:481478..482119(+)	partial			WP_002355000.1	peptidase C39 family protein	85.0	72.5	34.6
MGA_538	LOCUS_05360	sequence1:540755..541063(+)	frameshift		540701	WP_011109521.1	class I SAM-dependent methyltransferase	97.1	61.2	59.6
MGA_546	LOCUS_05440	sequence1:549744..551525(+)	partial			WP_010922467.1	hypothetical protein	59.2	67.4	38.5
MGA_560	LOCUS_05580	sequence1:558012..562757(+)	partial			WP_012047792.1	phage tail tape measure protein	28.7	46.3	36.8
MGA_561	LOCUS_05590	sequence1:562773..563465(+)	partial			WP_004398548.1	LysM peptidoglycan-binding domain-containing protein	59.6	62.1	34.8
MGA_573	LOCUS_05710	sequence1:571077..572054(+)	partial			WP_004399108.1	N-acetylmuramoyl-L-alanine amidase BlyA	60.6	61.3	29.3
MGA_586	LOCUS_05840	sequence1:585853..586206(+)	frameshift		586134	WP_002379592.1	hypothetical protein	75.2	27.4	35.2
MGA_621	LOCUS_06190	sequence1:617327..619327(+)	partial			WP_012256471.1	carbohydrate-binding domain-containing protein	46.1	53.9	38.4
MGA_624	LOCUS_06220	sequence1:620584..621450(+)	internal_stop_codon	620542..620544(+)		WP_002286064.1	HAMP domain-containing sensor histidine kinase	99.3	64.6	41.0
MGA_713	LOCUS_07110	sequence1:718254..719321(+)	partial			WP_002289045.1	DUF58 domain-containing protein	74.6	80.5	25.5
MGA_798	LOCUS_07960	sequence1:811684..812697(+)	partial			WP_211157632.1	Ltp family lipoprotein	26.4	46.4	46.1
MGA_861	LOCUS_08590	sequence1:874533..874667(-)	internal_stop_codon	874533..874535(-)		WP_011222020.1	metalloregulator ArsR/SmtB family transcription factor	95.5	34.5	57.1
MGA_871	LOCUS_08690	sequence1:882900..883967(-)	partial			WP_011027879.1	serine hydrolase	64.8	73.6	31.5
MGA_888	LOCUS_08860	sequence1:901248..902735(-)	partial			WP_002287092.1	glucose PTS transporter subunit IIA	96.2	72.6	54.9
MGA_891	LOCUS_08890	sequence1:904871..905560(-)	partial			WP_010906017.1	ABC transporter ATP-binding protein	92.6	39.1	45.1
MGA_924	LOCUS_09220	sequence1:935968..936912(+)	partial			WP_002287386.1	NlpC/P60 family protein	88.2	48.9	36.4
MGA_976	LOCUS_09740	sequence1:991698..992543(-)	frameshift		992587	WP_099434174.1	IS3-like element ISEfa8 family transposase	98.9	71.8	75.9
MGA_977	LOCUS_09750	sequence1:992579..992869(-)	frameshift		992593	WP_086956687.1	IS3 family transposase	97.9	24.3	84.0
MGA_979	LOCUS_09770	sequence1:993450..994367(-)	partial			WP_011963749.1	glycosyltransferase	74.8	73.2	28.3
MGA_984	LOCUS_09820	sequence1:999321..1000268(-)	partial			WP_000998260.1	glycosyltransferase	68.6	32.1	41.8
MGA_1005	LOCUS_10030	sequence1:1019553..1021058(+)	partial			WP_001035315.1	pneumococcal surface protein A	50.1	39.7	38.9
MGA_1010	LOCUS_10080	sequence1:1025216..1027366(+)	frameshift,internal_stop_codon	1027364..1027366(+)	1027360,1027432,1027435,1027405,1027357,1027423	WP_010964394.1	hypothetical protein	57.8	15.1	32.9
MGA_1011	LOCUS_10090	sequence1:1027383..1028969(+)	frameshift		1027360	WP_001035315.1	pneumococcal surface protein A	41.7	35.1	41.4
MGA_1013	LOCUS_10110	sequence1:1030127..1033336(-)	partial			WP_001035315.1	pneumococcal surface protein A	38.2	71.9	29.6
MGA_1030	LOCUS_10280	sequence1:1052024..1052482(-)	frameshift		1052574	WP_002356883.1	TetR/AcrR family transcriptional regulator	98.7	78.9	52.0
MGA_1083	LOCUS_10810	sequence1:1102142..1102987(-)	frameshift		1103031	WP_099434174.1	IS3-like element ISEfa8 family transposase	98.9	71.8	75.5
MGA_1084	LOCUS_10820	sequence1:1103023..1103313(-)	frameshift		1103037	WP_086956687.1	IS3 family transposase	97.9	24.3	84.0
MGA_1085	LOCUS_10830	sequence1:1104846..1105691(-)	frameshift		1105735	WP_099434174.1	IS3-like element ISEfa8 family transposase	98.9	71.8	75.9
MGA_1086	LOCUS_10840	sequence1:1105727..1106017(-)	frameshift		1105741	WP_086956687.1	IS3 family transposase	97.9	24.3	84.0
MGA_1148	LOCUS_11430	sequence2:26881..27129(+)	partial			WP_000946120.1	ABC transporter ATP-binding protein	72.0	11.8	47.5
MGA_1207	LOCUS_12020	sequence2:86377..87072(-)	partial			WP_003566834.1	class A sortase	72.7	70.8	33.5
MGA_1227	LOCUS_12220	sequence2:108533..109474(+)	partial			WP_011023368.1	ribosome small subunit-dependent GTPase A	85.6	72.4	44.1
MGA_1239	LOCUS_12340	sequence2:119558..121798(+)	partial			WP_012582581.1	glycosyl hydrolase	57.8	42.9	26.3
MGA_1241	LOCUS_12360	sequence2:122801..124249(-)	partial			WP_010937845.1	sigma-54 dependent transcriptional regulator	34.0	35.1	31.7
MGA_1251	LOCUS_12460	sequence2:136968..140045(+)	partial			WP_010886437.1	rhamnogalacturonan exolyase	40.0	62.3	42.1
MGA_1252	LOCUS_12470	sequence2:140145..140681(+)	frameshift		140686	WP_012582581.1	glycosyl hydrolase	57.9	10.2	46.6
MGA_1254	LOCUS_12490	sequence2:143437..147024(+)	partial			WP_013225532.1	glycosyl hydrolase 115 family protein	69.7	83.9	32.0
MGA_1285	LOCUS_12800	sequence2:182280..183128(-)	partial			WP_010964372.1	arginase	67.4	63.5	39.5
MGA_1299	LOCUS_12940	sequence2:194757..198071(+)	partial			WP_010990018.1	SpaA isopeptide-forming pilin-related protein	14.5	9.9	29.2
MGA_1300	LOCUS_12950	sequence2:198073..200196(+)	partial			WP_011674874.1	pilin N-terminal domain-containing protein	49.6	77.5	30.8
MGA_1316	LOCUS_13110	sequence2:217879..219834(+)	partial			WP_010989386.1	class 1 internalin InlH	37.5	41.1	29.4
MGA_1330	LOCUS_13250	sequence2:234782..235909(+)	partial			WP_002379219.1	tRNA lysidine(34) synthetase TilS	57.1	48.7	40.2
MGA_1341	LOCUS_13330	sequence2:252584..253699(-)	partial			WP_011674942.1	sensor histidine kinase	63.1	78.5	57.1
MGA_1406	LOCUS_13980	sequence2:322177..325641(+)	partial			WP_140834635.1	Ig-like domain-containing protein	64.9	34.0	32.2
MGA_1409	LOCUS_14010	sequence2:328250..328792(+)	partial			WP_041272775.1	polysaccharide deacetylase family protein	46.7	23.8	38.4
MGA_1410	LOCUS_14020	sequence2:328981..329787(-)	partial			WP_002932053.1	AraC family transcriptional regulator	36.9	33.8	32.3
MGA_1448	LOCUS_14400	sequence2:370647..370823(+)	partial			WP_002356740.1	30S ribosomal protein S21	74.1	74.1	100.0
MGA_1476	LOCUS_14680	sequence2:401404..401913(+)	partial			WP_005814144.1	methylated-DNA--[protein]-cysteine S-methyltransferase	68.6	68.0	55.6
MGA_1481	LOCUS_14730	sequence2:405631..406281(-)	internal_stop_codon	406330..406332(-)		WP_011101137.1	DNA/RNA non-specific endonuclease	68.1	44.9	66.0
MGA_1502	LOCUS_14940	sequence2:426811..426990(-)	partial			WP_000340579.1	winged helix-turn-helix transcriptional regulator	98.3	46.0	63.8
MGA_1516	LOCUS_15080	sequence2:443964..444563(+)	partial			WP_011964264.1	virulence RhuM family protein	84.4	48.8	56.5
MGA_1523	LOCUS_15150	sequence2:449202..450515(+)	partial			WP_002285885.1	ABC transporter ATP-binding protein	99.5	73.9	76.1
MGA_1563	LOCUS_15550	sequence2:491072..492187(+)	frameshift		492178	WP_011673957.1	ABC transporter ATP-binding protein	96.0	66.0	27.0
MGA_1564	LOCUS_15560	sequence2:492223..492636(+)	frameshift		492181	WP_002680518.1	ABC transporter ATP-binding protein	98.5	26.7	33.8
MGA_1635	LOCUS_16270	sequence2:568003..568824(+)	partial			WP_002355904.1	cell division protein DivIVA	71.4	83.7	63.1
MGA_1728	LOCUS_17200	sequence3:106490..106780(+)	frameshift		106765	WP_086956687.1	IS3 family transposase	97.9	24.3	84.0
MGA_1729	LOCUS_17210	sequence3:106816..107661(+)	frameshift		106771	WP_099434174.1	IS3-like element ISEfa8 family transposase	98.9	71.8	75.5
MGA_1741	LOCUS_17330	sequence3:117093..117407(+)	partial			WP_002295743.1	IS982-like element ISEfm1 family transposase	98.1	33.8	49.0
MGA_1747	LOCUS_17390	sequence3:123465..124046(-)	partial			WP_168722861.1	IS3 family transposase	98.4	72.3	47.6
MGA_1867	LOCUS_18590	sequence3:240081..240959(+)	partial			WP_003234977.1	bacillibactin transport transcriptional regulator Btr	54.1	28.9	29.7
MGA_1893	LOCUS_18850	sequence3:265768..268179(+)	partial			WP_199567761.1	glycoside hydrolase family 2 TIM barrel-domain containing protein	94.9	33.7	28.4
MGA_1956	LOCUS_19480	sequence4:16783..17514(+)	partial			WP_011109477.1	endocarditis and biofilm-associated pilus major subunit EbpC	74.1	28.5	34.8
MGA_1962	LOCUS_19540	sequence4:23459..23815(+)	partial			WP_025481136.1	type IA DNA topoisomerase	99.2	15.9	65.8
MGA_1964	LOCUS_19560	sequence4:25572..26441(-)	partial			WP_002287807.1	ABC transporter permease/substrate binding protein	98.6	48.7	47.9
MGA_1992	LOCUS_19840	sequence4:50022..50312(+)	frameshift		50297	WP_086956687.1	IS3 family transposase	97.9	24.3	84.0
MGA_1993	LOCUS_19850	sequence4:50348..51193(+)	frameshift		50303	WP_099434174.1	IS3-like element ISEfa8 family transposase	98.9	71.8	75.9
