# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_17	LOCUS_00050	sequence011:4680..6953(-)	partial			WP_007052353.1	CHAP domain-containing protein	12.2	28.9	53.8
MGA_24	LOCUS_00120	sequence011:13457..14434(-)	partial			WP_011860781.1	replication initiator protein A	57.5	68.3	36.1
MGA_41	LOCUS_00290	sequence011:33040..33435(-)	partial			WP_003428415.1	transcription antitermination factor NusB	78.6	62.5	42.5
MGA_45	LOCUS_00330	sequence011:35935..36174(-)	partial			WP_002294955.1	YneF family protein	65.8	70.3	57.7
MGA_58	LOCUS_00460	sequence011:47595..49622(-)	partial			WP_011963674.1	AAA family ATPase	72.0	84.2	25.0
MGA_84	LOCUS_00600	sequence022:6712..7281(+)	partial			WP_012775077.1	class I SAM-dependent methyltransferase	95.2	71.7	47.8
MGA_102	LOCUS_00780	sequence022:24700..25866(+)	partial			WP_001097917.1	AraC family transcriptional regulator	35.8	35.0	32.9
MGA_107	LOCUS_00830	sequence022:30588..30950(+)	frameshift,internal_stop_codon	31053..31055(+),30999..31001(+),31035..31037(+),30948..30950(+)	31124	WP_011861353.1	DUF6017 domain-containing protein	82.5	29.5	72.7
MGA_124	LOCUS_01000	sequence022:42568..43293(-)	frameshift,internal_stop_codon	43343..43345(-),43361..43363(-)	43336	WP_011017159.1	PDDEXK nuclease domain-containing protein	97.1	68.0	47.4
MGA_125	LOCUS_01010	sequence022:43361..43618(-)	frameshift,internal_stop_codon	43343..43345(-),43361..43363(-)	43336	WP_011017159.1	PDDEXK nuclease domain-containing protein	89.4	22.0	50.0
MGA_126	LOCUS_01020	sequence022:43951..44808(+)	frameshift		44778	WP_000031832.1	recombinase family protein	96.8	49.4	71.0
MGA_139	LOCUS_01050	sequence033:1794..2426(+)	partial			WP_000413738.1	transcriptional repressor LexA	62.4	65.5	44.9
MGA_168	LOCUS_01340	sequence033:37363..38592(+)	partial			WP_002382901.1	polysaccharide deacetylase family protein	51.3	39.5	39.5
MGA_255	LOCUS_01940	sequence055:11741..11956(+)	partial			WP_011241744.1	type II toxin-antitoxin system PemK/MazF family toxin	98.6	63.2	55.6
MGA_256	LOCUS_01950	sequence055:12117..12365(+)	internal_stop_codon	12363..12365(+)		WP_011016217.1	putative DNA binding domain-containing protein	100.0	17.4	55.4
MGA_257	LOCUS_01960	sequence055:12706..12933(+)	internal_stop_codon	12700..12702(+)		WP_011861367.1	DEAD/DEAH box helicase family protein	88.0	2.2	93.9
MGA_258	LOCUS_01970	sequence055:13080..13718(+)	partial			WP_004802604.1	DNA-binding protein	67.9	68.0	74.5
MGA_261	LOCUS_02000	sequence055:15346..15675(-)	partial			WP_011860793.1	relaxase/mobilization nuclease domain-containing protein	100.0	24.6	82.6
MGA_262	LOCUS_02010	sequence055:15769..16323(-)	partial			WP_011020063.1	IS21-like element ISMac3 family helper ATPase IstB	81.0	58.0	51.0
MGA_263	LOCUS_02020	sequence055:16374..16553(+)	frameshift		16532	WP_209421102.1	IS3 family transposase	93.2	12.1	60.0
MGA_264	LOCUS_02030	sequence055:16588..16887(+)	frameshift		16881,16532	WP_211260004.1	IS3 family transposase	88.9	19.4	47.7
MGA_265	LOCUS_02040	sequence055:16995..17774(+)	frameshift,internal_stop_codon	16885..16887(+)	16890	WP_211260004.1	IS3 family transposase	98.1	53.5	52.0
MGA_266	LOCUS_02050	sequence055:17843..18823(-)	partial			WP_011837284.1	sensor histidine kinase	64.7	64.7	48.1
MGA_270	LOCUS_02090	sequence055:21450..22277(-)	partial			WP_000022803.1	protein jag	58.2	74.6	40.0
MGA_276	LOCUS_02150	sequence055:27741..34247(+)	partial			WP_000278319.1	CshA/CshB family fibrillar adhesin-related protein	73.5	39.1	26.2
MGA_289	LOCUS_02180	sequence066:1..890(+)	partial			WP_010976587.1	choline binding-anchored murein hydrolase LytC	91.5	58.5	32.5
MGA_290	LOCUS_02190	sequence066:928..2643(+)	partial			WP_011836393.1	GBS Bsp-like repeat-containing protein	29.2	17.3	36.9
MGA_294	LOCUS_02230	sequence066:4915..6216(-)	partial			WP_001125236.1	serine hydrolase	74.6	81.3	61.0
MGA_306	LOCUS_02350	sequence066:23744..24721(-)	partial			WP_196835716.1	adenine-specific methyltransferase EcoRI family protein	92.3	73.6	39.3
MGA_320	LOCUS_02430	sequence073:45..239(+)	partial			WP_010989279.1	formate dehydrogenase N subunit alpha, selenocysteine-containing	100.0	9.0	98.4
MGA_326	LOCUS_02450	sequence077:1570..4623(-)	partial			WP_012775483.1	GAG-binding domain-containing protein	36.0	54.2	24.4
MGA_331	LOCUS_02500	sequence077:8657..9673(-)	partial			WP_002438072.1	transglycosylase family protein	41.7	54.0	57.4
MGA_361	LOCUS_02700	sequence086:125..385(-)	partial			WP_004186182.1	MaoC family dehydratase	91.9	52.0	48.1
MGA_396	LOCUS_02900	sequence099:1410..2045(-)	partial			WP_002390108.1	class A sortase	58.8	58.7	28.7
MGA_463	LOCUS_03430	sequence111:8501..9364(-)	partial			WP_001034334.1	Rha family transcriptional regulator	32.1	58.8	34.7
MGA_465	LOCUS_03450	sequence111:9816..10523(+)	partial			WP_010906223.1	helix-turn-helix transcriptional regulator	34.9	34.9	46.3
MGA_476	LOCUS_03560	sequence111:23467..23754(-)	frameshift,internal_stop_codon	23466..23468(-)	23765	WP_000103844.1	CopY/TcrY family copper transport repressor	100.0	64.2	89.5
MGA_477	LOCUS_03570	sequence111:23706..23858(-)	frameshift,internal_stop_codon	23466..23468(-)	23765	WP_000103844.1	CopY/TcrY family copper transport repressor	82.0	29.1	65.1
MGA_480	LOCUS_03600	sequence111:24963..25268(-)	frameshift,internal_stop_codon	24963..24965(-)	24851	WP_105158881.1	replication initiator protein A	94.1	34.9	63.2
MGA_483	LOCUS_03630	sequence111:27431..27706(-)	internal_stop_codon	27431..27433(-),27779..27781(-)		WP_000103844.1	CopY/TcrY family copper transport repressor	100.0	61.5	90.1
MGA_484	LOCUS_03640	sequence111:28452..29279(+)	frameshift,internal_stop_codon	28324..28326(+),28405..28407(+)	28401	WP_011837676.1	site-specific integrase	99.3	64.8	68.5
MGA_515	LOCUS_03950	sequence111:62249..62908(+)	partial			WP_010965992.1	TIGR01906 family membrane protein	70.8	66.1	26.2
MGA_516	LOCUS_03960	sequence111:62957..63502(+)	partial			WP_000798967.1	DUF1450 domain-containing protein	51.4	82.3	47.3
MGA_524	LOCUS_04040	sequence111:70699..71235(-)	partial			WP_016252543.1	ISL3-like element IS1476 family transposase	86.0	36.8	37.2
MGA_525	LOCUS_04050	sequence111:71408..72148(-)	partial			WP_001059647.1	ISL3 family transposase	98.8	55.7	38.9
MGA_562	LOCUS_04420	sequence111:100041..100853(-)	internal_stop_codon	100950..100952(-)		WP_010932832.1	Eco57I restriction-modification methylase domain-containing protein	99.3	48.5	28.8
MGA_568	LOCUS_04480	sequence111:109971..110138(-)	partial			WP_011861353.1	DUF6017 domain-containing protein	96.4	15.8	75.5
MGA_571	LOCUS_04510	sequence111:112644..114290(-)	partial			WP_001083683.1	AAA family ATPase	54.4	67.8	38.9
MGA_589	LOCUS_04690	sequence111:133045..135225(-)	partial			WP_004398589.1	PBP1A family penicillin-binding protein	89.8	71.3	40.2
MGA_598	LOCUS_04780	sequence111:145930..146511(-)	partial			WP_011922483.1	YdcF family protein	93.8	53.9	65.7
MGA_606	LOCUS_04860	sequence111:153671..153844(-)	partial			WP_000048060.1	30S ribosomal protein S21	75.4	74.1	93.0
MGA_608	LOCUS_04880	sequence111:155009..155716(-)	partial			WP_003229340.1	RDD family protein	56.2	81.7	41.2
MGA_649	LOCUS_05290	sequence111:199160..200080(-)	partial			WP_000014253.1	nucleoside triphosphate pyrophosphohydrolase	98.4	65.0	33.5
MGA_650	LOCUS_05300	sequence111:200207..201232(-)	partial			WP_007052354.1	NlpC/P60 family protein	49.9	69.8	31.1
MGA_653	LOCUS_05330	sequence111:203158..203721(-)	partial			WP_003405093.1	TVP38/TMEM64 family protein	95.2	72.4	42.1
MGA_659	LOCUS_05390	sequence111:210708..>215890(-)	partial			WP_011836870.1	ZmpA/ZmpB/ZmpC family metallo-endopeptidase	99.1	58.3	28.5
MGA_671	LOCUS_05400	sequence122:307..1017(-)	partial			WP_012047975.1	ABC transporter ATP-binding protein	87.7	73.3	33.0
MGA_701	LOCUS_05600	sequence133:146..1138(-)	partial			WP_001044255.1	membrane protein	73.3	54.9	29.5
MGA_714	LOCUS_05730	sequence133:8371..9333(+)	partial			WP_002379597.1	CdaR family protein	88.1	72.4	23.7
MGA_719	LOCUS_05780	sequence133:12986..>19439(-)	partial			WP_011836870.1	ZmpA/ZmpB/ZmpC family metallo-endopeptidase	100.0	73.4	36.5
MGA_731	LOCUS_05800	sequence144:1689..5738(+)	partial			WP_012775522.1	GbpC/Spa domain-containing protein	37.5	31.4	47.1
MGA_740	LOCUS_05890	sequence144:9537..16010(+)	partial			WP_011861367.1	DEAD/DEAH box helicase family protein	77.8	57.8	48.2
MGA_754	LOCUS_05920	sequence155:235..2622(-)	partial			WP_001263850.1	SP_1767 family glycosyltransferase	33.1	66.1	59.3
MGA_819	LOCUS_06340	sequence177:17060..>17890(-)	partial			WP_013399748.1	Rib/alpha-like domain-containing protein	98.9	9.5	31.9
MGA_836	LOCUS_06400	sequence188:6734..10960(-)	partial			WP_011836870.1	ZmpA/ZmpB/ZmpC family metallo-endopeptidase	48.4	23.4	31.2
MGA_867	LOCUS_06570	sequence203:5354..5959(+)	partial			WP_033729412.1	CPBP family intramembrane metalloprotease	76.1	71.0	40.0
MGA_878	LOCUS_06680	sequence203:14307..15047(-)	partial			WP_009039948.1	hypothetical protein	37.4	29.1	44.6
MGA_896	LOCUS_06840	sequence205:126..839(-)	internal_stop_codon	126..128(-)		WP_001831057.1	30S ribosomal protein S1	100.0	56.9	38.0
MGA_932	LOCUS_07200	sequence205:39797..41107(-)	frameshift,internal_stop_codon	41195..41197(-)	39799	WP_011962421.1	TaqI-like C-terminal specificity domain-containing protein	99.8	41.8	31.0
MGA_936	LOCUS_07240	sequence205:43342..44445(-)	frameshift		43785,43346,43761	WP_011962421.1	TaqI-like C-terminal specificity domain-containing protein	95.1	35.3	35.1
MGA_983	LOCUS_07710	sequence205:92355..93269(-)	partial			WP_000301254.1	recombinase family protein	93.1	55.3	40.5
MGA_987	LOCUS_07750	sequence205:94996..95400(-)	partial			WP_003721755.1	holin family protein	76.9	72.9	50.5
MGA_991	LOCUS_07790	sequence205:98881..99441(-)	partial			WP_010869841.1	hypothetical protein	74.7	16.1	32.2
MGA_992	LOCUS_07800	sequence205:99904..100995(-)	frameshift,internal_stop_codon	99904..99906(-)	101071	WP_000140777.1	phage tail tape measure protein	99.2	37.2	33.1
MGA_993	LOCUS_07810	sequence205:101045..101614(-)	frameshift,internal_stop_codon	101077..101079(-)	101080	WP_010905723.1	phage tail tape measure protein	94.2	25.5	35.4
MGA_1001	LOCUS_07890	sequence205:104259..105191(-)	internal_stop_codon	104259..104261(-)		WP_001137336.1	phage major capsid protein	100.0	78.5	24.0
MGA_1002	LOCUS_07900	sequence205:105269..105970(-)	partial			WP_000642728.1	Clp protease ClpP	67.0	63.3	41.0
MGA_1008	LOCUS_07960	sequence205:110444..111883(-)	partial			WP_041272166.1	DNA cytosine methyltransferase	46.3	32.1	49.1
MGA_1019	LOCUS_08070	sequence205:121383..122837(-)	frameshift		121430	WP_002399687.1	DNA polymerase	98.6	73.7	47.5
MGA_1021	LOCUS_08090	sequence205:123516..125924(-)	partial			WP_026138647.1	LysM peptidoglycan-binding domain-containing protein	36.4	46.0	38.1
MGA_1032	LOCUS_08200	sequence205:132133..133977(-)	internal_stop_codon	133993..133995(-)		WP_011459352.1	heavy metal translocating P-type ATPase	99.7	78.1	68.2
MGA_1033	LOCUS_08210	sequence205:133993..134214(-)	internal_stop_codon	133993..133995(-)		WP_002327795.1	heavy metal translocating P-type ATPase	89.0	9.4	56.9
MGA_1035	LOCUS_08230	sequence205:135077..135304(+)	partial			WP_010964810.1	DNA (cytosine-5-)-methyltransferase	88.0	17.6	55.4
MGA_1042	LOCUS_08300	sequence205:140475..140675(-)	partial			WP_000301254.1	recombinase family protein	77.3	9.8	80.4
MGA_1064	LOCUS_08520	sequence205:161729..162499(-)	partial			WP_011202952.1	ABC transporter permease	74.6	52.7	25.8
MGA_1086	LOCUS_08740	sequence205:181656..181982(-)	partial			WP_000257598.1	cell division protein FtsL	82.4	66.9	36.0
MGA_1135	LOCUS_09220	sequence207:9797..10006(+)	frameshift,internal_stop_codon	9728..9730(+),9713..9715(+)	9600,9590	WP_011922516.1	GNAT family N-acetyltransferase	98.6	41.7	55.9
MGA_1171	LOCUS_09470	sequence216:203..3757(-)	partial			WP_012775427.1	LPXTG cell wall anchor domain-containing protein	22.7	35.7	34.7
MGA_1185	LOCUS_09610	sequence216:20810..21556(+)	frameshift		21544	WP_011109350.1	ATP-binding protein	96.4	45.8	43.9
MGA_1186	LOCUS_09620	sequence216:21561..22028(+)	frameshift		21550	WP_011109350.1	ATP-binding protein	99.4	30.0	43.5
MGA_1213	LOCUS_09890	sequence216:47091..48146(-)	partial			WP_009933223.1	hypothetical protein	71.2	77.8	32.2
MGA_1225	LOCUS_10010	sequence216:62103..62681(-)	partial			WP_000182211.1	nucleotide exchange factor GrpE	74.0	68.3	53.5
MGA_1240	LOCUS_10160	sequence216:75876..76142(+)	partial			WP_011030014.1	hypothetical protein	46.6	40.6	63.4
MGA_1243	LOCUS_10190	sequence216:77206..78354(-)	partial			WP_005811634.1	pyruvate kinase	73.6	48.0	40.9
MGA_1247	LOCUS_10230	sequence216:81453..82415(-)	partial			WP_001831275.1	bifunctional lysylphosphatidylglycerol flippase/synthetase MprF	89.7	33.6	31.7
MGA_1265	LOCUS_10410	sequence216:102793..103263(-)	partial			WP_000701483.1	DNA-directed RNA polymerase subunit delta	57.1	50.0	34.8
MGA_1272	LOCUS_10480	sequence216:109224..109343(+)	partial			WP_003077408.1	helix-turn-helix transcriptional regulator	89.7	7.4	94.3
MGA_1301	LOCUS_10770	sequence216:138766..139413(+)	partial			WP_003595964.1	GNAT family N-acetyltransferase	31.2	70.8	44.9
MGA_1314	LOCUS_10900	sequence216:151161..151940(-)	partial			WP_000508996.1	PI-2a pilus assembly sortase SrtC4	80.7	70.7	61.7
MGA_1315	LOCUS_10910	sequence216:152074..152952(-)	partial			WP_001178115.1	SpaA isopeptide-forming pilin-related protein	82.9	8.8	30.4
MGA_1317	LOCUS_10930	sequence216:155218..163023(-)	partial			WP_211477941.1	SpaA isopeptide-forming pilin-related protein	12.0	20.3	24.8
MGA_1324	LOCUS_10940	sequence226:32..>594(-)	partial			WP_001557163.1	ISL3-like element IS1181 family transposase	90.9	39.6	39.7
MGA_1325	LOCUS_10950	sequence227:1..1041(+)	partial			WP_001832683.1	bifunctional (p)ppGpp synthetase/guanosine-3',5'-bis(diphosphate) 3'-pyrophosphohydrolase	99.4	47.3	49.1
MGA_1334	LOCUS_11040	sequence227:5931..6791(+)	partial			WP_020862454.1	DNA polymerase III subunit gamma/tau	84.3	35.0	28.3
MGA_1336	LOCUS_11060	sequence227:7499..7801(+)	frameshift		7500	WP_040804636.1	GIY-YIG nuclease family protein	77.0	23.2	51.9
MGA_1346	LOCUS_11160	sequence227:15048..15305(+)	partial			WP_005775925.1	preprotein translocase subunit YajC	85.9	67.6	39.7
MGA_1377	LOCUS_11470	sequence227:42505..42846(+)	frameshift,internal_stop_codon	42352..42354(+)	42831	WP_011016217.1	putative DNA binding domain-containing protein	96.5	22.9	69.7
MGA_1378	LOCUS_11480	sequence227:42836..43420(+)	frameshift,internal_stop_codon	43418..43420(+)	43633,42831	WP_011016217.1	putative DNA binding domain-containing protein	100.0	40.7	82.0
MGA_1384	LOCUS_11540	sequence227:48027..49976(+)	partial			WP_010990137.1	DNA internalization-related competence protein ComEC/Rec2	60.7	53.5	26.4
MGA_1388	LOCUS_11580	sequence227:51709..52623(+)	partial			WP_000037075.1	YihY/virulence factor BrkB family protein	93.1	69.6	38.2
MGA_1389	LOCUS_11590	sequence227:52627..53115(+)	partial			WP_002672271.1	peptide-methionine (R)-S-oxide reductase MsrB	100.0	45.8	58.6
MGA_1403	LOCUS_11730	sequence227:64059..64631(+)	partial			WP_011015875.1	ribonuclease PH	98.9	44.0	56.8
MGA_1441	LOCUS_12110	sequence227:105494..107374(+)	partial			WP_000525078.1	ATP-dependent DNA helicase DinG	91.9	73.9	22.3
MGA_1470	LOCUS_12400	sequence227:140540..141085(-)	partial			WP_015703827.1	XRE family transcriptional regulator	90.6	35.9	29.1
MGA_1481	LOCUS_12410	sequence238:1..1124(+)	partial			WP_011837563.1	Cna B-type domain-containing protein	86.1	18.0	24.5
MGA_1484	LOCUS_12440	sequence238:4817..5200(+)	internal_stop_codon	5198..5200(+)		WP_064094285.1	oxidoreductase	97.6	58.0	34.4
MGA_1501	LOCUS_12610	sequence238:20624..21499(-)	partial			WP_002288821.1	helix-turn-helix domain-containing protein	72.9	76.0	26.1
MGA_1520	LOCUS_12800	sequence238:41639..42151(+)	frameshift		42145	WP_211260004.1	IS3 family transposase	93.5	35.0	51.6
MGA_1521	LOCUS_12810	sequence238:42259..43038(+)	frameshift,internal_stop_codon	42149..42151(+)	42154	WP_211260004.1	IS3 family transposase	98.1	53.5	51.4
MGA_1572	LOCUS_13320	sequence238:80664..80855(-)	frameshift		80914	WP_000811992.1	phosphorylcholine transferase LicD	92.1	21.7	55.2
MGA_1573	LOCUS_13330	sequence238:80912..81460(-)	frameshift		80926	WP_001199652.1	phosphorylcholine transferase LicD	100.0	67.7	52.7
MGA_1594	LOCUS_13460	sequence246:1..420(+)	partial			WP_005763543.1	efflux RND transporter periplasmic adaptor subunit	100.0	32.9	67.6
MGA_1610	LOCUS_13600	sequence249:15587..16111(-)	partial			WP_000551762.1	CtsR family transcriptional regulator	62.6	73.9	51.3
MGA_1651	LOCUS_14010	sequence249:57610..57903(-)	internal_stop_codon	57940..57942(-)		WP_002935466.1	VOC family protein	94.8	62.6	45.7
MGA_1706	LOCUS_14440	sequence260:11482..11868(-)	frameshift		11502	WP_011016121.1	2-amino-4-hydroxy-6-hydroxymethyldihydropteridine diphosphokinase	83.6	39.1	38.3
MGA_1731	LOCUS_14690	sequence260:40526..45208(+)	partial			WP_012775274.1	pneumococcal-type histidine triad protein	25.6	47.8	36.3
MGA_1749	LOCUS_14870	sequence260:59482..61413(-)	partial			WP_000824615.1	amidase family protein	73.7	70.7	47.3
MGA_1778	LOCUS_15060	sequence271:11341..13641(-)	partial			WP_011460911.1	endopeptidase La	76.5	73.0	52.5
MGA_1801	LOCUS_15290	sequence271:39444..40640(-)	partial			WP_010966553.1	leucine-rich repeat domain-containing protein	74.4	31.2	27.9
MGA_1813	LOCUS_15410	sequence271:55511..56335(+)	partial			WP_011017006.1	sugar phosphate nucleotidyltransferase	79.9	43.1	31.7
MGA_1814	LOCUS_15420	sequence271:56376..56828(-)	partial			WP_003723588.1	LysM peptidoglycan-binding domain-containing protein	74.0	44.8	34.2
MGA_1890	LOCUS_16050	sequence282:36166..41313(-)	partial			WP_011836870.1	ZmpA/ZmpB/ZmpC family metallo-endopeptidase	43.5	26.1	30.7
