# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_61	LOCUS_00610	sequence001:57381..58409(+)	partial			WP_003233473.1	phosphomethylpyrimidine synthase ThiC	95.3	54.7	67.0
MGA_69	LOCUS_00660	sequence003:1905..2204(-)	partial			WP_010706793.1	DNA repair protein RadC	96.0	40.9	55.8
MGA_73	LOCUS_00670	sequence006:792..932(+)	frameshift,internal_stop_codon	715..717(+),718..720(+),712..714(+),598..600(+)	708	WP_126564639.1	site-specific integrase	91.3	10.4	54.8
MGA_84	LOCUS_00700	sequence011:1722..2360(-)	partial			WP_005808204.1	ABC transporter ATP-binding protein	90.1	69.6	32.5
MGA_87	LOCUS_00730	sequence011:3573..4664(-)	partial			WP_011403089.1	NosD domain-containing protein	55.6	45.2	25.8
MGA_92	LOCUS_00780	sequence011:7865..11395(-)	partial			WP_000728853.1	S8 family serine peptidase	72.3	62.7	33.6
MGA_188	LOCUS_01740	sequence012:25610..26245(-)	partial			WP_011029732.1	C40 family peptidase	85.8	64.6	34.0
MGA_193	LOCUS_01790	sequence012:32450..33130(-)	partial			WP_041272276.1	class I SAM-dependent methyltransferase	58.0	60.8	33.6
MGA_208	LOCUS_01940	sequence012:45332..45655(-)	internal_stop_codon	45755..45757(-)		WP_001075809.1	M20 family metallopeptidase	98.1	26.8	75.2
MGA_221	LOCUS_02020	sequence019:1..618(+)	partial			WP_051532688.1	DUF3578 domain-containing protein	84.9	45.8	31.0
MGA_231	LOCUS_02090	sequence020:1212..1385(+)	partial			WP_000136509.1	sugar O-acetyltransferase	93.0	28.6	66.0
MGA_235	LOCUS_02100	sequence023:170..481(+)	partial			WP_010965371.1	sporulation transcription factor Spo0A	99.0	38.4	32.4
MGA_268	LOCUS_02430	sequence023:29210..30214(+)	partial			WP_000069289.1	elastin-binding protein EbpS	82.3	51.9	26.5
MGA_312	LOCUS_02830	sequence026:28404..28790(-)	frameshift		28837	WP_009930903.1	class I SAM-dependent methyltransferase	99.2	63.7	57.8
MGA_313	LOCUS_02840	sequence026:28808..28999(-)	frameshift		28846	WP_002494716.1	class I SAM-dependent methyltransferase	85.7	26.7	59.3
MGA_342	LOCUS_03130	sequence026:53171..53425(-)	frameshift		53420	WP_002261920.1	GIY-YIG nuclease family protein	90.5	22.4	64.5
MGA_360	LOCUS_03280	sequence028:4632..5444(-)	partial			WP_010880556.1	ATP-binding protein	65.6	70.6	27.2
MGA_382	LOCUS_03440	sequence032:10643..10951(-)	frameshift		10684	WP_002457104.1	S1 domain-containing RNA-binding protein	94.1	72.2	76.0
MGA_413	LOCUS_03740	sequence033:8015..8473(-)	partial			WP_000716775.1	restriction endonuclease	92.1	72.0	40.7
MGA_414	LOCUS_03750	sequence033:8470..9768(-)	partial			WP_000431475.1	DUF3991 and TOPRIM domain-containing protein	61.3	79.8	34.3
MGA_417	LOCUS_03780	sequence033:12596..14548(-)	partial			WP_002484931.1	DUF3991 domain-containing protein	70.3	60.5	32.8
MGA_469	LOCUS_04290	sequence034:28644..28982(-)	partial			WP_002305939.1	IS30 family transposase	98.2	34.5	63.6
MGA_509	LOCUS_04670	sequence037:15756..16211(+)	partial			WP_005423733.1	MarR family transcriptional regulator	72.2	67.5	29.4
MGA_520	LOCUS_04780	sequence037:26067..26612(+)	partial			WP_003222575.1	cytochrome c biogenesis protein	97.8	64.1	38.4
MGA_534	LOCUS_04920	sequence037:43588..44109(+)	partial			WP_000351221.1	GNAT family protein	72.8	83.0	37.9
MGA_621	LOCUS_05790	sequence038:22353..22583(+)	partial			WP_001123317.1	YneF family protein	57.9	60.3	75.0
MGA_631	LOCUS_05890	sequence038:30423..30638(-)	partial			WP_000910489.1	large conductance mechanosensitive channel protein MscL	85.9	50.0	59.0
MGA_664	LOCUS_06220	sequence039:20689..21024(+)	frameshift		21006	WP_000701483.1	DNA-directed RNA polymerase subunit delta	91.0	57.4	73.3
MGA_668	LOCUS_06260	sequence039:23582..23932(+)	partial			WP_009888625.1	response regulator transcription factor	99.1	51.7	37.5
MGA_685	LOCUS_06430	sequence039:38197..38550(+)	frameshift,internal_stop_codon	38166..38168(+)	38192	WP_001801792.1	ATP synthase subunit I	100.0	78.0	35.9
MGA_704	LOCUS_06620	sequence040:4194..5009(-)	partial			WP_003244816.1	peptidoglycan endopeptidase LytE	47.2	36.5	40.6
MGA_705	LOCUS_06630	sequence040:5128..5991(-)	frameshift		4932	WP_003244816.1	peptidoglycan endopeptidase LytE	39.4	38.0	34.4
MGA_707	LOCUS_06650	sequence041:238..906(+)	partial			WP_003232562.1	serine protease Isp	81.5	66.1	27.5
MGA_713	LOCUS_06710	sequence041:4723..5601(+)	partial			WP_012774875.1	hypothetical protein	76.4	72.8	32.9
MGA_776	LOCUS_07340	sequence044:6268..6459(+)	internal_stop_codon	6457..6459(+)		WP_002404595.1	AAA family ATPase	90.5	33.3	45.6
MGA_832	LOCUS_07890	sequence045:46678..47670(+)	partial			WP_003733917.1	resuscitation-promoting factor	37.9	48.7	45.2
MGA_833	LOCUS_07900	sequence045:47862..48302(+)	partial			WP_000731644.1	LysM peptidoglycan-binding domain-containing protein	90.4	47.9	41.4
MGA_834	LOCUS_07910	sequence045:48385..48924(+)	partial			WP_011228871.1	TlpA disulfide reductase family protein	52.0	53.4	36.2
MGA_899	LOCUS_08560	sequence046:38782..>39421(-)	partial			WP_000613541.1	PG:teichoic acid D-alanyltransferase DltB	99.5	52.2	61.6
MGA_993	LOCUS_09490	sequence048:45909..46085(-)	partial			WP_000048060.1	30S ribosomal protein S21	74.1	74.1	93.0
MGA_994	LOCUS_09500	sequence048:46202..46753(-)	frameshift		46776	WP_000108668.1	tRNA (N(6)-L-threonylcarbamoyladenosine(37)-C(2))-methylthiotransferase MtaB	98.9	40.4	69.6
MGA_995	LOCUS_09510	sequence048:46747..47547(-)	frameshift		46776	WP_000108668.1	tRNA (N(6)-L-threonylcarbamoyladenosine(37)-C(2))-methylthiotransferase MtaB	97.0	57.6	88.8
MGA_1013	LOCUS_09680	sequence050:6832..8952(-)	partial			WP_000970545.1	glycosyltransferase family A protein	32.9	70.2	25.6
MGA_1016	LOCUS_09710	sequence050:10328..11281(-)	partial			WP_003227930.1	teichoic acids export ABC transporter ATP-binding subunit TagH	82.3	48.8	51.7
MGA_1041	LOCUS_09960	sequence051:17821..19152(+)	internal_stop_codon	17797..17799(+)		WP_000725608.1	hypothetical protein	91.0	81.9	47.3
MGA_1042	LOCUS_09970	sequence051:19167..20852(+)	partial			WP_010964064.1	immune inhibitor A	57.6	40.3	42.9
MGA_1061	LOCUS_10160	sequence051:37293..37592(+)	partial			WP_003246602.1	DUF3817 domain-containing protein	71.7	74.0	62.0
MGA_1062	LOCUS_10170	sequence051:37649..38359(+)	partial			WP_162891890.1	23S rRNA pseudouridine(2604) synthase RluF	96.6	68.9	62.3
MGA_1070	LOCUS_10240	sequence053:367..783(+)	partial			WP_126564639.1	site-specific integrase	96.4	31.2	72.2
MGA_1077	LOCUS_10310	sequence053:7029..8048(+)	partial			WP_164929094.1	YsnF/AvaK domain-containing protein	37.2	42.7	46.0
MGA_1100	LOCUS_10540	sequence053:27102..27392(+)	partial			WP_003228417.1	disulfide oxidoreductase	95.8	66.7	57.6
MGA_1120	LOCUS_10740	sequence054:13774..14778(+)	partial			WP_003234641.1	uroporphyrinogen-III C-methyltransferase	94.0	65.0	40.7
MGA_1133	LOCUS_10860	sequence055:110..1261(-)	partial			WP_009966633.1	bifunctional lytic transglycosylase/C40 family peptidase	49.9	57.8	36.7
MGA_1144	LOCUS_10970	sequence055:15631..18165(-)	partial			WP_002505516.1	isopeptide-forming domain-containing fimbrial protein	83.5	68.2	33.5
MGA_1161	LOCUS_11120	sequence057:652..975(-)	partial			WP_003246525.1	SprT family protein	100.0	74.0	51.4
MGA_1219	LOCUS_11690	sequence060:3066..3512(-)	partial			WP_000805797.1	ArsR family transcriptional regulator	93.9	67.1	38.8
MGA_1226	LOCUS_11760	sequence060:10818..12905(-)	partial			WP_133431295.1	Z1 domain-containing protein	60.0	52.4	22.1
MGA_1229	LOCUS_11790	sequence060:13797..14021(+)	partial			WP_001173201.1	mannose-6-phosphate isomerase, class I	98.6	23.4	38.4
MGA_1237	LOCUS_11870	sequence060:21750..24968(+)	partial			WP_041670058.1	RecQ family ATP-dependent DNA helicase	44.0	26.0	28.9
MGA_1241	LOCUS_11910	sequence060:27637..27969(+)	partial			WP_002296570.1	hypothetical protein	89.1	48.1	49.0
MGA_1249	LOCUS_11990	sequence060:36680..39982(+)	partial			WP_002286055.1	SpaA isopeptide-forming pilin-related protein	53.7	52.9	24.8
MGA_1299	LOCUS_12470	sequence064:18958..19497(+)	frameshift		19482	WP_001831129.1	Y-family DNA polymerase	99.4	42.4	67.4
MGA_1300	LOCUS_12480	sequence064:19484..20227(+)	frameshift		19488	WP_001831129.1	Y-family DNA polymerase	98.8	58.1	59.0
MGA_1304	LOCUS_12520	sequence064:22804..24408(-)	partial			WP_011263411.1	SgrR family transcriptional regulator	55.2	51.8	23.6
MGA_1308	LOCUS_12560	sequence064:27606..27971(-)	partial			WP_011922396.1	DUF3307 domain-containing protein	79.3	38.2	36.8
MGA_1315	LOCUS_12630	sequence064:34609..35418(-)	frameshift		35498	WP_153495214.1	IS3 family transposase	95.9	56.7	46.0
MGA_1316	LOCUS_12640	sequence064:35484..36002(-)	frameshift		35504	WP_129868159.1	IS3 family transposase	70.9	26.0	41.5
MGA_1397	LOCUS_13450	sequence065:141..833(-)	frameshift		146	WP_100190734.1	IS3 family transposase	80.0	35.2	38.9
MGA_1407	LOCUS_13510	sequence069:45..887(-)	frameshift		916	WP_099835063.1	IS3 family transposase	98.2	72.4	69.5
MGA_1408	LOCUS_13520	sequence069:872..1186(-)	frameshift		916	WP_099835063.1	IS3 family transposase	96.2	26.3	64.0
MGA_1410	LOCUS_13540	sequence070:1434..1658(-)	partial			WP_074016730.1	GIY-YIG nuclease family protein	98.6	25.4	42.7
MGA_1421	LOCUS_13650	sequence070:10045..10716(+)	frameshift		10704,10659	WP_181746991.1	IS1182 family transposase	91.5	43.0	54.4
MGA_1422	LOCUS_13660	sequence070:10817..11395(+)	frameshift		10659,10710	WP_083498292.1	IS1182 family transposase	95.3	39.1	53.6
MGA_1448	LOCUS_13920	sequence070:34699..35382(-)	frameshift		35585	WP_211254473.1	IS3 family transposase	89.4	44.9	43.9
MGA_1449	LOCUS_13930	sequence070:35550..36245(-)	frameshift		35576	WP_100190734.1	IS3 family transposase	93.1	41.2	34.4
MGA_1462	LOCUS_14060	sequence070:49480..50253(-)	partial			WP_004254910.1	homoserine O-succinyltransferase	87.5	71.3	41.0
MGA_1520	LOCUS_14630	sequence071:10011..10256(-)	internal_stop_codon	10290..10292(-)		WP_011263649.1	sodium/proline symporter PutP	95.1	15.1	39.0
MGA_1521	LOCUS_14640	sequence071:10290..11543(-)	internal_stop_codon	10290..10292(-)		WP_000957020.1	sodium/proline symporter PutP	97.1	78.9	70.4
MGA_1576	LOCUS_15190	sequence072:42..>762(-)	partial			WP_086953915.1	IS3-like element ISEnfa3 family transposase	96.2	50.9	41.1
MGA_1585	LOCUS_15280	sequence073:7274..10018(-)	partial			WP_000118314.1	DNA translocase FtsK	80.9	58.0	51.8
MGA_1624	LOCUS_15650	sequence076:16..450(+)	partial			WP_011949169.1	site-specific integrase	95.1	74.6	52.5
MGA_1634	LOCUS_15730	sequence077:5141..6103(-)	partial			WP_002439305.1	serine hydrolase domain-containing protein	87.5	72.2	34.9
MGA_1635	LOCUS_15740	sequence077:6164..6643(-)	partial			WP_000598444.1	YutD family protein	60.4	75.6	65.6
MGA_1649	LOCUS_15880	sequence077:17878..19599(-)	partial			WP_011836504.1	phosphodiester glycosidase family protein	29.8	59.4	33.1
MGA_1665	LOCUS_16040	sequence077:28848..29858(-)	partial			WP_011109439.1	NAD+--arginine ADP-ribosyltransferase EFV	63.1	42.3	32.5
MGA_1667	LOCUS_16060	sequence077:31189..32418(-)	partial			WP_010883725.1	PBSX family phage terminase large subunit	56.7	51.3	25.4
MGA_1773	LOCUS_17110	sequence079:40779..41342(+)	internal_stop_codon	41340..41342(+)		WP_000047255.1	hemolysin III family protein	95.2	78.4	55.6
MGA_1783	LOCUS_17210	sequence079:48883..49506(-)	partial			WP_000588494.1	HAD family hydrolase	86.0	71.0	26.5
MGA_1796	LOCUS_17330	sequence081:4992..5609(+)	partial			WP_004399048.1	endonuclease YokF	79.0	54.4	39.9
MGA_1805	LOCUS_17420	sequence082:5865..6053(+)	partial			WP_001794540.1	twin-arginine translocase TatA/TatE family subunit	72.6	62.2	60.9
MGA_1807	LOCUS_17440	sequence082:6937..7638(+)	partial			WP_000141432.1	glycoside hydrolase family 32 protein	85.8	44.1	44.1
MGA_1824	LOCUS_17610	sequence082:21307..22806(+)	partial			WP_010714140.1	DNA primase family protein	86.6	53.9	47.5
MGA_1829	LOCUS_17660	sequence082:26542..26832(+)	partial			WP_010965201.1	HNH endonuclease signature motif containing protein	71.9	68.0	36.5
MGA_1911	LOCUS_18460	sequence086:39233..40120(+)	partial			WP_000342182.1	cell division protein FtsQ/DivIB	93.9	61.7	30.0
MGA_1919	LOCUS_18540	sequence086:45980..46546(+)	partial			WP_001830163.1	DivIVA domain-containing protein	83.5	72.0	58.6
MGA_1964	LOCUS_18960	sequence090:7739..8170(-)	partial			WP_011949169.1	site-specific integrase	93.7	72.9	50.7
MGA_2085	LOCUS_20150	sequence096:5249..5803(+)	partial			WP_003577315.1	phospholipase A2 family protein	42.9	40.5	38.8
MGA_2088	LOCUS_20180	sequence096:6695..7084(-)	partial			WP_001273859.1	recombinase family protein	96.9	67.6	67.2
MGA_2110	LOCUS_20380	sequence099:7663..>8345(-)	partial			WP_011202263.1	glycosyltransferase family 4 protein	78.3	44.5	35.2
MGA_2144	LOCUS_20690	sequence103:34239..35060(-)	partial			WP_005482997.1	cytoskeleton protein RodZ	39.9	34.5	31.2
MGA_2245	LOCUS_21680	sequence106:4519..5835(-)	partial			WP_010714140.1	DNA primase family protein	99.3	54.0	45.7
MGA_2246	LOCUS_21690	sequence106:6036..6902(-)	partial			WP_010714181.1	VapE family protein	49.0	17.1	27.7
MGA_2271	LOCUS_21900	sequence111:11895..12200(+)	partial			WP_011393014.1	sporulation transcription factor Spo0A	86.1	35.2	34.4
MGA_2281	LOCUS_21920	sequence116:994..1116(-)	frameshift,internal_stop_codon	992..994(-),1238..1240(-)	1366,1207	WP_002437604.1	multicopper oxidase domain-containing protein	100.0	8.4	90.0
MGA_2282	LOCUS_21930	sequence116:1358..2539(-)	internal_stop_codon	2558..2560(-)		WP_002437601.1	heavy metal translocating P-type ATPase	85.0	48.6	82.9
MGA_2283	LOCUS_21940	sequence116:2558..3415(-)	internal_stop_codon	2558..2560(-)		WP_002437601.1	heavy metal translocating P-type ATPase	89.8	37.3	84.4
MGA_2284	LOCUS_21950	sequence117:10..>513(-)	partial			WP_002305939.1	IS30 family transposase	97.6	51.1	67.5
MGA_2288	LOCUS_21990	sequence118:3787..4308(-)	frameshift		4361,4318	WP_168488820.1	CDP-glycerol glycerophosphotransferase family protein	90.8	14.6	29.2
MGA_2289	LOCUS_22000	sequence118:4320..5231(-)	frameshift		4322	WP_003227939.1	poly(glucosyl N-acetylgalactosamine 1-phosphate) glucosyltransferase	58.1	20.7	28.1
MGA_2290	LOCUS_22010	sequence118:5245..6351(-)	partial			WP_001832059.1	glycosyltransferase family 2 protein	70.7	71.5	36.2
MGA_2302	LOCUS_22130	sequence118:18209..20998(+)	partial			WP_001074534.1	glucosaminidase domain-containing protein	74.3	57.7	34.2
MGA_2309	LOCUS_22200	sequence118:25931..26794(-)	partial			WP_000414165.1	bifunctional UDP-sugar hydrolase/5'-nucleotidase	97.2	59.8	29.9
MGA_2311	LOCUS_22220	sequence119:187..687(-)	frameshift,internal_stop_codon	147..149(-)	204	WP_012775582.1	glycoside hydrolase family 3 N-terminal domain-containing protein	97.0	27.9	62.1
MGA_2324	LOCUS_22310	sequence122:8401..9252(+)	partial			WP_010921285.1	YgcG family protein	55.5	50.3	31.5
MGA_2360	LOCUS_22670	sequence122:45629..46162(+)	frameshift		46102	WP_000829167.1	citrate synthase	92.7	43.4	66.5
MGA_2361	LOCUS_22680	sequence122:46105..46746(+)	frameshift		46102	WP_011082708.1	citrate synthase	100.0	57.1	78.4
